diff --git "a/metrics.json" "b/metrics.json" new file mode 100755--- /dev/null +++ "b/metrics.json" @@ -0,0 +1,6141 @@ +{"num_parameters": 89682432, "trainable_parameters": 89682432, "step": 0} +{"train_info/time_between_train_steps": 2.4341917037963867, "step": 0} +{"info/global_step": 1, "train_info/time_within_train_step": 12.68381381034851, "step": 1} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 3644.77587890625, "train_info/memory_reserved": 3876.0, "train_info/memory_max_reserved": 3876.0, "_timestamp": 1746343938, "_runtime": 35}, "step": 1} +{"logs": {"train/loss": 8.5381, "train/learning_rate": 2e-06, "train/epoch": 0.0, "_timestamp": 1746343938, "_runtime": 35}, "step": 1} +{"train_info/time_between_train_steps": 0.03000950813293457, "step": 1} +{"info/global_step": 2, "train_info/time_within_train_step": 2.0820062160491943, "step": 2} +{"train_info/time_between_train_steps": 0.0035202503204345703, "step": 2} +{"info/global_step": 3, "train_info/time_within_train_step": 2.080089807510376, "step": 3} +{"train_info/time_between_train_steps": 0.0033354759216308594, "step": 3} +{"info/global_step": 4, "train_info/time_within_train_step": 2.083299160003662, "step": 4} +{"train_info/time_between_train_steps": 0.0033228397369384766, "step": 4} +{"info/global_step": 5, "train_info/time_within_train_step": 2.0807158946990967, "step": 5} +{"train_info/time_between_train_steps": 0.0032091140747070312, "step": 5} +{"info/global_step": 6, "train_info/time_within_train_step": 2.0893595218658447, "step": 6} +{"train_info/time_between_train_steps": 0.0034177303314208984, "step": 6} +{"info/global_step": 7, "train_info/time_within_train_step": 2.089799165725708, "step": 7} +{"train_info/time_between_train_steps": 0.003516674041748047, "step": 7} +{"info/global_step": 8, "train_info/time_within_train_step": 2.08964204788208, "step": 8} +{"train_info/time_between_train_steps": 0.0034182071685791016, "step": 8} +{"info/global_step": 9, "train_info/time_within_train_step": 2.0928685665130615, "step": 9} +{"train_info/time_between_train_steps": 0.0036041736602783203, "step": 9} +{"info/global_step": 10, "train_info/time_within_train_step": 2.0886964797973633, "step": 10} +{"train_info/time_between_train_steps": 0.003746509552001953, "step": 10} +{"info/global_step": 11, "train_info/time_within_train_step": 2.1116576194763184, "step": 11} +{"train_info/time_between_train_steps": 0.003777027130126953, "step": 11} +{"info/global_step": 12, "train_info/time_within_train_step": 2.253317356109619, "step": 12} +{"train_info/time_between_train_steps": 0.0037708282470703125, "step": 12} +{"info/global_step": 13, "train_info/time_within_train_step": 2.287325143814087, "step": 13} +{"train_info/time_between_train_steps": 0.0037794113159179688, "step": 13} +{"info/global_step": 14, "train_info/time_within_train_step": 2.286611318588257, "step": 14} +{"train_info/time_between_train_steps": 0.0036847591400146484, "step": 14} +{"info/global_step": 15, "train_info/time_within_train_step": 2.28690242767334, "step": 15} +{"train_info/time_between_train_steps": 0.0037381649017333984, "step": 15} +{"info/global_step": 16, "train_info/time_within_train_step": 2.2856996059417725, "step": 16} +{"train_info/time_between_train_steps": 0.003682374954223633, "step": 16} +{"info/global_step": 17, "train_info/time_within_train_step": 2.2859585285186768, "step": 17} +{"train_info/time_between_train_steps": 0.0036628246307373047, "step": 17} +{"info/global_step": 18, "train_info/time_within_train_step": 2.2861244678497314, "step": 18} +{"train_info/time_between_train_steps": 0.003766775131225586, "step": 18} +{"info/global_step": 19, "train_info/time_within_train_step": 2.2865419387817383, "step": 19} +{"train_info/time_between_train_steps": 0.003644227981567383, "step": 19} +{"info/global_step": 20, "train_info/time_within_train_step": 2.2857825756073, "step": 20} +{"train_info/time_between_train_steps": 0.0037293434143066406, "step": 20} +{"info/global_step": 21, "train_info/time_within_train_step": 2.286238670349121, "step": 21} +{"train_info/time_between_train_steps": 0.003628253936767578, "step": 21} +{"info/global_step": 22, "train_info/time_within_train_step": 2.285865068435669, "step": 22} +{"train_info/time_between_train_steps": 0.0034775733947753906, "step": 22} +{"info/global_step": 23, "train_info/time_within_train_step": 2.286024808883667, "step": 23} +{"train_info/time_between_train_steps": 0.0034987926483154297, "step": 23} +{"info/global_step": 24, "train_info/time_within_train_step": 2.2862465381622314, "step": 24} +{"train_info/time_between_train_steps": 0.0037109851837158203, "step": 24} +{"info/global_step": 25, "train_info/time_within_train_step": 2.285700798034668, "step": 25} +{"train_info/time_between_train_steps": 0.003598451614379883, "step": 25} +{"info/global_step": 26, "train_info/time_within_train_step": 2.291569232940674, "step": 26} +{"train_info/time_between_train_steps": 0.0034525394439697266, "step": 26} +{"info/global_step": 27, "train_info/time_within_train_step": 2.2862284183502197, "step": 27} +{"train_info/time_between_train_steps": 0.0036172866821289062, "step": 27} +{"info/global_step": 28, "train_info/time_within_train_step": 2.2868809700012207, "step": 28} +{"train_info/time_between_train_steps": 0.003487110137939453, "step": 28} +{"info/global_step": 29, "train_info/time_within_train_step": 2.2867109775543213, "step": 29} +{"train_info/time_between_train_steps": 0.003504514694213867, "step": 29} +{"info/global_step": 30, "train_info/time_within_train_step": 2.2869319915771484, "step": 30} +{"train_info/time_between_train_steps": 0.0035321712493896484, "step": 30} +{"info/global_step": 31, "train_info/time_within_train_step": 2.287548303604126, "step": 31} +{"train_info/time_between_train_steps": 0.0036330223083496094, "step": 31} +{"info/global_step": 32, "train_info/time_within_train_step": 2.287073850631714, "step": 32} +{"train_info/time_between_train_steps": 0.003679513931274414, "step": 32} +{"info/global_step": 33, "train_info/time_within_train_step": 2.286973237991333, "step": 33} +{"train_info/time_between_train_steps": 0.0035631656646728516, "step": 33} +{"info/global_step": 34, "train_info/time_within_train_step": 2.287584066390991, "step": 34} +{"train_info/time_between_train_steps": 0.0035123825073242188, "step": 34} +{"info/global_step": 35, "train_info/time_within_train_step": 2.2873263359069824, "step": 35} +{"train_info/time_between_train_steps": 0.003687143325805664, "step": 35} +{"info/global_step": 36, "train_info/time_within_train_step": 2.2868573665618896, "step": 36} +{"train_info/time_between_train_steps": 0.0035619735717773438, "step": 36} +{"info/global_step": 37, "train_info/time_within_train_step": 2.287187099456787, "step": 37} +{"train_info/time_between_train_steps": 0.0035047531127929688, "step": 37} +{"info/global_step": 38, "train_info/time_within_train_step": 2.286829710006714, "step": 38} +{"train_info/time_between_train_steps": 0.00373077392578125, "step": 38} +{"info/global_step": 39, "train_info/time_within_train_step": 2.287198305130005, "step": 39} +{"train_info/time_between_train_steps": 0.003540515899658203, "step": 39} +{"info/global_step": 40, "train_info/time_within_train_step": 2.286607265472412, "step": 40} +{"train_info/time_between_train_steps": 0.0034627914428710938, "step": 40} +{"info/global_step": 41, "train_info/time_within_train_step": 2.2860934734344482, "step": 41} +{"train_info/time_between_train_steps": 0.0036194324493408203, "step": 41} +{"info/global_step": 42, "train_info/time_within_train_step": 2.285940170288086, "step": 42} +{"train_info/time_between_train_steps": 0.003644227981567383, "step": 42} +{"info/global_step": 43, "train_info/time_within_train_step": 2.2858095169067383, "step": 43} +{"train_info/time_between_train_steps": 0.003661632537841797, "step": 43} +{"info/global_step": 44, "train_info/time_within_train_step": 2.2858245372772217, "step": 44} +{"train_info/time_between_train_steps": 0.003534078598022461, "step": 44} +{"info/global_step": 45, "train_info/time_within_train_step": 2.2858076095581055, "step": 45} +{"train_info/time_between_train_steps": 0.0035352706909179688, "step": 45} +{"info/global_step": 46, "train_info/time_within_train_step": 2.2863035202026367, "step": 46} +{"train_info/time_between_train_steps": 0.003424406051635742, "step": 46} +{"info/global_step": 47, "train_info/time_within_train_step": 2.2866709232330322, "step": 47} +{"train_info/time_between_train_steps": 0.0034186840057373047, "step": 47} +{"info/global_step": 48, "train_info/time_within_train_step": 2.2954483032226562, "step": 48} +{"train_info/time_between_train_steps": 0.003650188446044922, "step": 48} +{"info/global_step": 49, "train_info/time_within_train_step": 2.2858903408050537, "step": 49} +{"train_info/time_between_train_steps": 0.003635883331298828, "step": 49} +{"info/global_step": 50, "train_info/time_within_train_step": 2.286346912384033, "step": 50} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746344049, "_runtime": 146}, "step": 50} +{"logs": {"train/loss": 7.241, "train/learning_rate": 9.999999999999999e-05, "train/epoch": 0.02, "_timestamp": 1746344049, "_runtime": 146}, "step": 50} +{"train_info/time_between_train_steps": 0.0246889591217041, "step": 50} +{"info/global_step": 51, "train_info/time_within_train_step": 2.2879371643066406, "step": 51} +{"train_info/time_between_train_steps": 0.003531217575073242, "step": 51} +{"info/global_step": 52, "train_info/time_within_train_step": 2.6478397846221924, "step": 52} +{"train_info/time_between_train_steps": 0.0033392906188964844, "step": 52} +{"info/global_step": 53, "train_info/time_within_train_step": 2.2859044075012207, "step": 53} +{"train_info/time_between_train_steps": 0.003214120864868164, "step": 53} +{"info/global_step": 54, "train_info/time_within_train_step": 2.285548210144043, "step": 54} +{"train_info/time_between_train_steps": 0.0033783912658691406, "step": 54} +{"info/global_step": 55, "train_info/time_within_train_step": 2.2860898971557617, "step": 55} +{"train_info/time_between_train_steps": 0.003134489059448242, "step": 55} +{"info/global_step": 56, "train_info/time_within_train_step": 2.286452531814575, "step": 56} +{"train_info/time_between_train_steps": 0.003284454345703125, "step": 56} +{"info/global_step": 57, "train_info/time_within_train_step": 2.2861034870147705, "step": 57} +{"train_info/time_between_train_steps": 0.0031480789184570312, "step": 57} +{"info/global_step": 58, "train_info/time_within_train_step": 2.2856178283691406, "step": 58} +{"train_info/time_between_train_steps": 0.0033555030822753906, "step": 58} +{"info/global_step": 59, "train_info/time_within_train_step": 2.285893678665161, "step": 59} +{"train_info/time_between_train_steps": 0.003203868865966797, "step": 59} +{"info/global_step": 60, "train_info/time_within_train_step": 2.285945415496826, "step": 60} +{"train_info/time_between_train_steps": 0.003233671188354492, "step": 60} +{"info/global_step": 61, "train_info/time_within_train_step": 2.2858517169952393, "step": 61} +{"train_info/time_between_train_steps": 0.00341033935546875, "step": 61} +{"info/global_step": 62, "train_info/time_within_train_step": 2.285785436630249, "step": 62} +{"train_info/time_between_train_steps": 0.0033788681030273438, "step": 62} +{"info/global_step": 63, "train_info/time_within_train_step": 2.439946413040161, "step": 63} +{"train_info/time_between_train_steps": 0.0033919811248779297, "step": 63} +{"info/global_step": 64, "train_info/time_within_train_step": 2.2857608795166016, "step": 64} +{"train_info/time_between_train_steps": 0.003408193588256836, "step": 64} +{"info/global_step": 65, "train_info/time_within_train_step": 2.285571575164795, "step": 65} +{"train_info/time_between_train_steps": 0.0034132003784179688, "step": 65} +{"info/global_step": 66, "train_info/time_within_train_step": 2.285238027572632, "step": 66} +{"train_info/time_between_train_steps": 0.0033800601959228516, "step": 66} +{"info/global_step": 67, "train_info/time_within_train_step": 2.2858338356018066, "step": 67} +{"train_info/time_between_train_steps": 0.003383159637451172, "step": 67} +{"info/global_step": 68, "train_info/time_within_train_step": 2.285597085952759, "step": 68} +{"train_info/time_between_train_steps": 0.003187417984008789, "step": 68} +{"info/global_step": 69, "train_info/time_within_train_step": 2.2858564853668213, "step": 69} +{"train_info/time_between_train_steps": 0.003313302993774414, "step": 69} +{"info/global_step": 70, "train_info/time_within_train_step": 2.2864153385162354, "step": 70} +{"train_info/time_between_train_steps": 0.0032236576080322266, "step": 70} +{"info/global_step": 71, "train_info/time_within_train_step": 2.286353588104248, "step": 71} +{"train_info/time_between_train_steps": 0.0034012794494628906, "step": 71} +{"info/global_step": 72, "train_info/time_within_train_step": 2.2863237857818604, "step": 72} +{"train_info/time_between_train_steps": 0.003416776657104492, "step": 72} +{"info/global_step": 73, "train_info/time_within_train_step": 2.2863364219665527, "step": 73} +{"train_info/time_between_train_steps": 0.003203868865966797, "step": 73} +{"info/global_step": 74, "train_info/time_within_train_step": 2.2868731021881104, "step": 74} +{"train_info/time_between_train_steps": 0.0032830238342285156, "step": 74} +{"info/global_step": 75, "train_info/time_within_train_step": 2.2862021923065186, "step": 75} +{"train_info/time_between_train_steps": 0.0033898353576660156, "step": 75} +{"info/global_step": 76, "train_info/time_within_train_step": 2.286127805709839, "step": 76} +{"train_info/time_between_train_steps": 0.0032525062561035156, "step": 76} +{"info/global_step": 77, "train_info/time_within_train_step": 2.286377429962158, "step": 77} +{"train_info/time_between_train_steps": 0.0033125877380371094, "step": 77} +{"info/global_step": 78, "train_info/time_within_train_step": 2.2866618633270264, "step": 78} +{"train_info/time_between_train_steps": 0.0035505294799804688, "step": 78} +{"info/global_step": 79, "train_info/time_within_train_step": 2.287308692932129, "step": 79} +{"train_info/time_between_train_steps": 0.003591299057006836, "step": 79} +{"info/global_step": 80, "train_info/time_within_train_step": 2.287376880645752, "step": 80} +{"train_info/time_between_train_steps": 0.0035343170166015625, "step": 80} +{"info/global_step": 81, "train_info/time_within_train_step": 2.287091016769409, "step": 81} +{"train_info/time_between_train_steps": 0.0036590099334716797, "step": 81} +{"info/global_step": 82, "train_info/time_within_train_step": 2.2868642807006836, "step": 82} +{"train_info/time_between_train_steps": 0.0035333633422851562, "step": 82} +{"info/global_step": 83, "train_info/time_within_train_step": 2.285820245742798, "step": 83} +{"train_info/time_between_train_steps": 0.0035643577575683594, "step": 83} +{"info/global_step": 84, "train_info/time_within_train_step": 2.286267042160034, "step": 84} +{"train_info/time_between_train_steps": 0.0035059452056884766, "step": 84} +{"info/global_step": 85, "train_info/time_within_train_step": 2.2865848541259766, "step": 85} +{"train_info/time_between_train_steps": 0.0035207271575927734, "step": 85} +{"info/global_step": 86, "train_info/time_within_train_step": 2.287356376647949, "step": 86} +{"train_info/time_between_train_steps": 0.0037631988525390625, "step": 86} +{"info/global_step": 87, "train_info/time_within_train_step": 2.286383628845215, "step": 87} +{"train_info/time_between_train_steps": 0.0034797191619873047, "step": 87} +{"info/global_step": 88, "train_info/time_within_train_step": 2.2861366271972656, "step": 88} +{"train_info/time_between_train_steps": 0.003530740737915039, "step": 88} +{"info/global_step": 89, "train_info/time_within_train_step": 2.2868361473083496, "step": 89} +{"train_info/time_between_train_steps": 0.003505229949951172, "step": 89} +{"info/global_step": 90, "train_info/time_within_train_step": 2.6400647163391113, "step": 90} +{"train_info/time_between_train_steps": 0.003392934799194336, "step": 90} +{"info/global_step": 91, "train_info/time_within_train_step": 2.2860324382781982, "step": 91} +{"train_info/time_between_train_steps": 0.003183126449584961, "step": 91} +{"info/global_step": 92, "train_info/time_within_train_step": 2.2909135818481445, "step": 92} +{"train_info/time_between_train_steps": 0.0032911300659179688, "step": 92} +{"info/global_step": 93, "train_info/time_within_train_step": 2.2875921726226807, "step": 93} +{"train_info/time_between_train_steps": 0.003572225570678711, "step": 93} +{"info/global_step": 94, "train_info/time_within_train_step": 2.2881579399108887, "step": 94} +{"train_info/time_between_train_steps": 0.0035467147827148438, "step": 94} +{"info/global_step": 95, "train_info/time_within_train_step": 2.3021047115325928, "step": 95} +{"train_info/time_between_train_steps": 0.0037920475006103516, "step": 95} +{"info/global_step": 96, "train_info/time_within_train_step": 2.287208318710327, "step": 96} +{"train_info/time_between_train_steps": 0.003660917282104492, "step": 96} +{"info/global_step": 97, "train_info/time_within_train_step": 2.287407398223877, "step": 97} +{"train_info/time_between_train_steps": 0.003634214401245117, "step": 97} +{"info/global_step": 98, "train_info/time_within_train_step": 2.2871522903442383, "step": 98} +{"train_info/time_between_train_steps": 0.003465414047241211, "step": 98} +{"info/global_step": 99, "train_info/time_within_train_step": 2.287456512451172, "step": 99} +{"train_info/time_between_train_steps": 0.0035169124603271484, "step": 99} +{"info/global_step": 100, "train_info/time_within_train_step": 2.286973476409912, "step": 100} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746344166, "_runtime": 263}, "step": 100} +{"logs": {"train/loss": 6.3916, "train/learning_rate": 0.00019999999999999998, "train/epoch": 0.03, "_timestamp": 1746344166, "_runtime": 263}, "step": 100} +{"train_info/time_between_train_steps": 11.268674850463867, "step": 100} +{"info/global_step": 101, "train_info/time_within_train_step": 2.1139862537384033, "step": 101} +{"train_info/time_between_train_steps": 0.003579854965209961, "step": 101} +{"info/global_step": 102, "train_info/time_within_train_step": 2.105330228805542, "step": 102} +{"train_info/time_between_train_steps": 0.0036535263061523438, "step": 102} +{"info/global_step": 103, "train_info/time_within_train_step": 2.2546133995056152, "step": 103} +{"train_info/time_between_train_steps": 0.0036644935607910156, "step": 103} +{"info/global_step": 104, "train_info/time_within_train_step": 2.2852256298065186, "step": 104} +{"train_info/time_between_train_steps": 0.0036830902099609375, "step": 104} +{"info/global_step": 105, "train_info/time_within_train_step": 2.284849166870117, "step": 105} +{"train_info/time_between_train_steps": 0.003740549087524414, "step": 105} +{"info/global_step": 106, "train_info/time_within_train_step": 2.28511905670166, "step": 106} +{"train_info/time_between_train_steps": 0.0034613609313964844, "step": 106} +{"info/global_step": 107, "train_info/time_within_train_step": 2.2858047485351562, "step": 107} +{"train_info/time_between_train_steps": 0.0034868717193603516, "step": 107} +{"info/global_step": 108, "train_info/time_within_train_step": 2.2856993675231934, "step": 108} +{"train_info/time_between_train_steps": 0.003648996353149414, "step": 108} +{"info/global_step": 109, "train_info/time_within_train_step": 2.2858095169067383, "step": 109} +{"train_info/time_between_train_steps": 0.0034313201904296875, "step": 109} +{"info/global_step": 110, "train_info/time_within_train_step": 2.28653621673584, "step": 110} +{"train_info/time_between_train_steps": 0.0034470558166503906, "step": 110} +{"info/global_step": 111, "train_info/time_within_train_step": 2.2862682342529297, "step": 111} +{"train_info/time_between_train_steps": 0.0035305023193359375, "step": 111} +{"info/global_step": 112, "train_info/time_within_train_step": 2.2864835262298584, "step": 112} +{"train_info/time_between_train_steps": 0.0035016536712646484, "step": 112} +{"info/global_step": 113, "train_info/time_within_train_step": 2.2864861488342285, "step": 113} +{"train_info/time_between_train_steps": 0.003444194793701172, "step": 113} +{"info/global_step": 114, "train_info/time_within_train_step": 2.287369728088379, "step": 114} +{"train_info/time_between_train_steps": 0.003627300262451172, "step": 114} +{"info/global_step": 115, "train_info/time_within_train_step": 2.287757635116577, "step": 115} +{"train_info/time_between_train_steps": 0.003423452377319336, "step": 115} +{"info/global_step": 116, "train_info/time_within_train_step": 2.287526845932007, "step": 116} +{"train_info/time_between_train_steps": 0.003460407257080078, "step": 116} +{"info/global_step": 117, "train_info/time_within_train_step": 2.287576675415039, "step": 117} +{"train_info/time_between_train_steps": 0.003392934799194336, "step": 117} +{"info/global_step": 118, "train_info/time_within_train_step": 2.300708532333374, "step": 118} +{"train_info/time_between_train_steps": 0.0035762786865234375, "step": 118} +{"info/global_step": 119, "train_info/time_within_train_step": 2.2869625091552734, "step": 119} +{"train_info/time_between_train_steps": 0.003476858139038086, "step": 119} +{"info/global_step": 120, "train_info/time_within_train_step": 2.2875418663024902, "step": 120} +{"train_info/time_between_train_steps": 0.0036163330078125, "step": 120} +{"info/global_step": 121, "train_info/time_within_train_step": 2.2871429920196533, "step": 121} +{"train_info/time_between_train_steps": 0.003636598587036133, "step": 121} +{"info/global_step": 122, "train_info/time_within_train_step": 2.2868306636810303, "step": 122} +{"train_info/time_between_train_steps": 0.003621816635131836, "step": 122} +{"info/global_step": 123, "train_info/time_within_train_step": 2.2871274948120117, "step": 123} +{"train_info/time_between_train_steps": 0.003672361373901367, "step": 123} +{"info/global_step": 124, "train_info/time_within_train_step": 2.286360740661621, "step": 124} +{"train_info/time_between_train_steps": 0.003484487533569336, "step": 124} +{"info/global_step": 125, "train_info/time_within_train_step": 2.286604881286621, "step": 125} +{"train_info/time_between_train_steps": 0.16040897369384766, "step": 125} +{"info/global_step": 126, "train_info/time_within_train_step": 2.2862980365753174, "step": 126} +{"train_info/time_between_train_steps": 0.003313779830932617, "step": 126} +{"info/global_step": 127, "train_info/time_within_train_step": 2.286367416381836, "step": 127} +{"train_info/time_between_train_steps": 0.003360748291015625, "step": 127} +{"info/global_step": 128, "train_info/time_within_train_step": 2.2868740558624268, "step": 128} +{"train_info/time_between_train_steps": 0.0035142898559570312, "step": 128} +{"info/global_step": 129, "train_info/time_within_train_step": 2.286432981491089, "step": 129} +{"train_info/time_between_train_steps": 0.003374338150024414, "step": 129} +{"info/global_step": 130, "train_info/time_within_train_step": 2.285971164703369, "step": 130} +{"train_info/time_between_train_steps": 0.003446340560913086, "step": 130} +{"info/global_step": 131, "train_info/time_within_train_step": 2.286235809326172, "step": 131} +{"train_info/time_between_train_steps": 0.0035407543182373047, "step": 131} +{"info/global_step": 132, "train_info/time_within_train_step": 2.2864246368408203, "step": 132} +{"train_info/time_between_train_steps": 0.003295421600341797, "step": 132} +{"info/global_step": 133, "train_info/time_within_train_step": 2.604337692260742, "step": 133} +{"train_info/time_between_train_steps": 0.003228902816772461, "step": 133} +{"info/global_step": 134, "train_info/time_within_train_step": 2.2864816188812256, "step": 134} +{"train_info/time_between_train_steps": 0.003383159637451172, "step": 134} +{"info/global_step": 135, "train_info/time_within_train_step": 2.286201000213623, "step": 135} +{"train_info/time_between_train_steps": 0.0031518936157226562, "step": 135} +{"info/global_step": 136, "train_info/time_within_train_step": 2.285767078399658, "step": 136} +{"train_info/time_between_train_steps": 0.0032880306243896484, "step": 136} +{"info/global_step": 137, "train_info/time_within_train_step": 2.286149024963379, "step": 137} +{"train_info/time_between_train_steps": 0.0031409263610839844, "step": 137} +{"info/global_step": 138, "train_info/time_within_train_step": 2.2857792377471924, "step": 138} +{"train_info/time_between_train_steps": 0.00325775146484375, "step": 138} +{"info/global_step": 139, "train_info/time_within_train_step": 2.2859177589416504, "step": 139} +{"train_info/time_between_train_steps": 0.0033702850341796875, "step": 139} +{"info/global_step": 140, "train_info/time_within_train_step": 2.285876989364624, "step": 140} +{"train_info/time_between_train_steps": 0.003402233123779297, "step": 140} +{"info/global_step": 141, "train_info/time_within_train_step": 2.2858195304870605, "step": 141} +{"train_info/time_between_train_steps": 0.003370046615600586, "step": 141} +{"info/global_step": 142, "train_info/time_within_train_step": 2.285660982131958, "step": 142} +{"train_info/time_between_train_steps": 0.0032351016998291016, "step": 142} +{"info/global_step": 143, "train_info/time_within_train_step": 2.286034345626831, "step": 143} +{"train_info/time_between_train_steps": 0.003182649612426758, "step": 143} +{"info/global_step": 144, "train_info/time_within_train_step": 2.285822629928589, "step": 144} +{"train_info/time_between_train_steps": 0.0033211708068847656, "step": 144} +{"info/global_step": 145, "train_info/time_within_train_step": 2.285487651824951, "step": 145} +{"train_info/time_between_train_steps": 0.0033538341522216797, "step": 145} +{"info/global_step": 146, "train_info/time_within_train_step": 2.285566568374634, "step": 146} +{"train_info/time_between_train_steps": 0.0033500194549560547, "step": 146} +{"info/global_step": 147, "train_info/time_within_train_step": 2.2952256202697754, "step": 147} +{"train_info/time_between_train_steps": 0.0031681060791015625, "step": 147} +{"info/global_step": 148, "train_info/time_within_train_step": 2.285648822784424, "step": 148} +{"train_info/time_between_train_steps": 0.0031805038452148438, "step": 148} +{"info/global_step": 149, "train_info/time_within_train_step": 2.285449504852295, "step": 149} +{"train_info/time_between_train_steps": 0.003382444381713867, "step": 149} +{"info/global_step": 150, "train_info/time_within_train_step": 2.285499334335327, "step": 150} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746344293, "_runtime": 390}, "step": 150} +{"logs": {"train/loss": 5.8898, "train/learning_rate": 0.0003, "train/epoch": 0.05, "_timestamp": 1746344293, "_runtime": 390}, "step": 150} +{"train_info/time_between_train_steps": 0.02480792999267578, "step": 150} +{"info/global_step": 151, "train_info/time_within_train_step": 2.286653518676758, "step": 151} +{"train_info/time_between_train_steps": 0.003432750701904297, "step": 151} +{"info/global_step": 152, "train_info/time_within_train_step": 2.295876979827881, "step": 152} +{"train_info/time_between_train_steps": 0.0031478404998779297, "step": 152} +{"info/global_step": 153, "train_info/time_within_train_step": 2.2867088317871094, "step": 153} +{"train_info/time_between_train_steps": 0.0033681392669677734, "step": 153} +{"info/global_step": 154, "train_info/time_within_train_step": 2.285867214202881, "step": 154} +{"train_info/time_between_train_steps": 0.0031092166900634766, "step": 154} +{"info/global_step": 155, "train_info/time_within_train_step": 2.286041736602783, "step": 155} +{"train_info/time_between_train_steps": 0.003253936767578125, "step": 155} +{"info/global_step": 156, "train_info/time_within_train_step": 2.285895347595215, "step": 156} +{"train_info/time_between_train_steps": 0.0031905174255371094, "step": 156} +{"info/global_step": 157, "train_info/time_within_train_step": 2.2859249114990234, "step": 157} +{"train_info/time_between_train_steps": 0.003317594528198242, "step": 157} +{"info/global_step": 158, "train_info/time_within_train_step": 2.286094903945923, "step": 158} +{"train_info/time_between_train_steps": 0.003155946731567383, "step": 158} +{"info/global_step": 159, "train_info/time_within_train_step": 2.286184310913086, "step": 159} +{"train_info/time_between_train_steps": 0.003161907196044922, "step": 159} +{"info/global_step": 160, "train_info/time_within_train_step": 2.2855541706085205, "step": 160} +{"train_info/time_between_train_steps": 0.0031807422637939453, "step": 160} +{"info/global_step": 161, "train_info/time_within_train_step": 2.2855944633483887, "step": 161} +{"train_info/time_between_train_steps": 0.003137350082397461, "step": 161} +{"info/global_step": 162, "train_info/time_within_train_step": 2.285947322845459, "step": 162} +{"train_info/time_between_train_steps": 0.003367185592651367, "step": 162} +{"info/global_step": 163, "train_info/time_within_train_step": 2.285498857498169, "step": 163} +{"train_info/time_between_train_steps": 0.0031239986419677734, "step": 163} +{"info/global_step": 164, "train_info/time_within_train_step": 2.285827159881592, "step": 164} +{"train_info/time_between_train_steps": 0.0031859874725341797, "step": 164} +{"info/global_step": 165, "train_info/time_within_train_step": 2.2851061820983887, "step": 165} +{"train_info/time_between_train_steps": 0.003500699996948242, "step": 165} +{"info/global_step": 166, "train_info/time_within_train_step": 2.2853996753692627, "step": 166} +{"train_info/time_between_train_steps": 0.003220796585083008, "step": 166} +{"info/global_step": 167, "train_info/time_within_train_step": 2.2856950759887695, "step": 167} +{"train_info/time_between_train_steps": 0.003294706344604492, "step": 167} +{"info/global_step": 168, "train_info/time_within_train_step": 2.285548686981201, "step": 168} +{"train_info/time_between_train_steps": 0.0031769275665283203, "step": 168} +{"info/global_step": 169, "train_info/time_within_train_step": 2.285492420196533, "step": 169} +{"train_info/time_between_train_steps": 0.0031516551971435547, "step": 169} +{"info/global_step": 170, "train_info/time_within_train_step": 2.285853624343872, "step": 170} +{"train_info/time_between_train_steps": 0.0032606124877929688, "step": 170} +{"info/global_step": 171, "train_info/time_within_train_step": 2.286283016204834, "step": 171} +{"train_info/time_between_train_steps": 0.003153085708618164, "step": 171} +{"info/global_step": 172, "train_info/time_within_train_step": 2.2864480018615723, "step": 172} +{"train_info/time_between_train_steps": 0.0033388137817382812, "step": 172} +{"info/global_step": 173, "train_info/time_within_train_step": 2.2861275672912598, "step": 173} +{"train_info/time_between_train_steps": 0.003391265869140625, "step": 173} +{"info/global_step": 174, "train_info/time_within_train_step": 2.286869764328003, "step": 174} +{"train_info/time_between_train_steps": 0.0031747817993164062, "step": 174} +{"info/global_step": 175, "train_info/time_within_train_step": 2.2865657806396484, "step": 175} +{"train_info/time_between_train_steps": 0.0033676624298095703, "step": 175} +{"info/global_step": 176, "train_info/time_within_train_step": 2.2864389419555664, "step": 176} +{"train_info/time_between_train_steps": 0.003377199172973633, "step": 176} +{"info/global_step": 177, "train_info/time_within_train_step": 2.2860584259033203, "step": 177} +{"train_info/time_between_train_steps": 0.0033180713653564453, "step": 177} +{"info/global_step": 178, "train_info/time_within_train_step": 2.296281099319458, "step": 178} +{"train_info/time_between_train_steps": 0.0032715797424316406, "step": 178} +{"info/global_step": 179, "train_info/time_within_train_step": 2.2861878871917725, "step": 179} +{"train_info/time_between_train_steps": 0.003386259078979492, "step": 179} +{"info/global_step": 180, "train_info/time_within_train_step": 2.2856502532958984, "step": 180} +{"train_info/time_between_train_steps": 0.003165006637573242, "step": 180} +{"info/global_step": 181, "train_info/time_within_train_step": 2.285902261734009, "step": 181} +{"train_info/time_between_train_steps": 0.003391742706298828, "step": 181} +{"info/global_step": 182, "train_info/time_within_train_step": 2.286249876022339, "step": 182} +{"train_info/time_between_train_steps": 0.0032787322998046875, "step": 182} +{"info/global_step": 183, "train_info/time_within_train_step": 2.285639524459839, "step": 183} +{"train_info/time_between_train_steps": 0.003177165985107422, "step": 183} +{"info/global_step": 184, "train_info/time_within_train_step": 2.2850263118743896, "step": 184} +{"train_info/time_between_train_steps": 0.003322124481201172, "step": 184} +{"info/global_step": 185, "train_info/time_within_train_step": 2.2853262424468994, "step": 185} +{"train_info/time_between_train_steps": 0.003376007080078125, "step": 185} +{"info/global_step": 186, "train_info/time_within_train_step": 2.285329580307007, "step": 186} +{"train_info/time_between_train_steps": 0.00333404541015625, "step": 186} +{"info/global_step": 187, "train_info/time_within_train_step": 2.2857439517974854, "step": 187} +{"train_info/time_between_train_steps": 0.0032520294189453125, "step": 187} +{"info/global_step": 188, "train_info/time_within_train_step": 2.4047985076904297, "step": 188} +{"train_info/time_between_train_steps": 0.0032584667205810547, "step": 188} +{"info/global_step": 189, "train_info/time_within_train_step": 2.2856643199920654, "step": 189} +{"train_info/time_between_train_steps": 0.0032126903533935547, "step": 189} +{"info/global_step": 190, "train_info/time_within_train_step": 2.285525321960449, "step": 190} +{"train_info/time_between_train_steps": 0.0032165050506591797, "step": 190} +{"info/global_step": 191, "train_info/time_within_train_step": 2.2858736515045166, "step": 191} +{"train_info/time_between_train_steps": 0.0032558441162109375, "step": 191} +{"info/global_step": 192, "train_info/time_within_train_step": 2.2856273651123047, "step": 192} +{"train_info/time_between_train_steps": 0.0032477378845214844, "step": 192} +{"info/global_step": 193, "train_info/time_within_train_step": 2.2861275672912598, "step": 193} +{"train_info/time_between_train_steps": 0.003371000289916992, "step": 193} +{"info/global_step": 194, "train_info/time_within_train_step": 2.2858855724334717, "step": 194} +{"train_info/time_between_train_steps": 0.0032355785369873047, "step": 194} +{"info/global_step": 195, "train_info/time_within_train_step": 2.286116361618042, "step": 195} +{"train_info/time_between_train_steps": 0.003165006637573242, "step": 195} +{"info/global_step": 196, "train_info/time_within_train_step": 2.285849094390869, "step": 196} +{"train_info/time_between_train_steps": 0.0032057762145996094, "step": 196} +{"info/global_step": 197, "train_info/time_within_train_step": 2.285615921020508, "step": 197} +{"train_info/time_between_train_steps": 0.003297567367553711, "step": 197} +{"info/global_step": 198, "train_info/time_within_train_step": 2.2855498790740967, "step": 198} +{"train_info/time_between_train_steps": 0.003233671188354492, "step": 198} +{"info/global_step": 199, "train_info/time_within_train_step": 2.2999467849731445, "step": 199} +{"train_info/time_between_train_steps": 0.0034284591674804688, "step": 199} +{"info/global_step": 200, "train_info/time_within_train_step": 2.2854530811309814, "step": 200} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746344408, "_runtime": 505}, "step": 200} +{"logs": {"train/loss": 5.5444, "train/learning_rate": 0.00039999999999999996, "train/epoch": 0.07, "_timestamp": 1746344408, "_runtime": 505}, "step": 200} +{"train_info/time_between_train_steps": 11.245414972305298, "step": 200} +{"info/global_step": 201, "train_info/time_within_train_step": 2.1115498542785645, "step": 201} +{"train_info/time_between_train_steps": 0.0033884048461914062, "step": 201} +{"info/global_step": 202, "train_info/time_within_train_step": 2.1000828742980957, "step": 202} +{"train_info/time_between_train_steps": 0.0032706260681152344, "step": 202} +{"info/global_step": 203, "train_info/time_within_train_step": 2.216728687286377, "step": 203} +{"train_info/time_between_train_steps": 0.0033817291259765625, "step": 203} +{"info/global_step": 204, "train_info/time_within_train_step": 2.2848856449127197, "step": 204} +{"train_info/time_between_train_steps": 0.0032792091369628906, "step": 204} +{"info/global_step": 205, "train_info/time_within_train_step": 2.2858853340148926, "step": 205} +{"train_info/time_between_train_steps": 0.0034742355346679688, "step": 205} +{"info/global_step": 206, "train_info/time_within_train_step": 2.2868974208831787, "step": 206} +{"train_info/time_between_train_steps": 0.0031137466430664062, "step": 206} +{"info/global_step": 207, "train_info/time_within_train_step": 2.2858288288116455, "step": 207} +{"train_info/time_between_train_steps": 0.003210306167602539, "step": 207} +{"info/global_step": 208, "train_info/time_within_train_step": 2.5057144165039062, "step": 208} +{"train_info/time_between_train_steps": 0.0034062862396240234, "step": 208} +{"info/global_step": 209, "train_info/time_within_train_step": 2.285647392272949, "step": 209} +{"train_info/time_between_train_steps": 0.003887176513671875, "step": 209} +{"info/global_step": 210, "train_info/time_within_train_step": 2.286492347717285, "step": 210} +{"train_info/time_between_train_steps": 0.0034363269805908203, "step": 210} +{"info/global_step": 211, "train_info/time_within_train_step": 2.2863824367523193, "step": 211} +{"train_info/time_between_train_steps": 0.0031762123107910156, "step": 211} +{"info/global_step": 212, "train_info/time_within_train_step": 2.2865803241729736, "step": 212} +{"train_info/time_between_train_steps": 0.003183603286743164, "step": 212} +{"info/global_step": 213, "train_info/time_within_train_step": 2.286123514175415, "step": 213} +{"train_info/time_between_train_steps": 0.003160715103149414, "step": 213} +{"info/global_step": 214, "train_info/time_within_train_step": 2.2871367931365967, "step": 214} +{"train_info/time_between_train_steps": 0.0033621788024902344, "step": 214} +{"info/global_step": 215, "train_info/time_within_train_step": 2.286653995513916, "step": 215} +{"train_info/time_between_train_steps": 0.0034096240997314453, "step": 215} +{"info/global_step": 216, "train_info/time_within_train_step": 2.286644458770752, "step": 216} +{"train_info/time_between_train_steps": 0.0031991004943847656, "step": 216} +{"info/global_step": 217, "train_info/time_within_train_step": 2.2873375415802, "step": 217} +{"train_info/time_between_train_steps": 0.0032806396484375, "step": 217} +{"info/global_step": 218, "train_info/time_within_train_step": 2.287217855453491, "step": 218} +{"train_info/time_between_train_steps": 0.0033066272735595703, "step": 218} +{"info/global_step": 219, "train_info/time_within_train_step": 2.2880797386169434, "step": 219} +{"train_info/time_between_train_steps": 0.003343343734741211, "step": 219} +{"info/global_step": 220, "train_info/time_within_train_step": 2.286855936050415, "step": 220} +{"train_info/time_between_train_steps": 0.003149271011352539, "step": 220} +{"info/global_step": 221, "train_info/time_within_train_step": 2.2870142459869385, "step": 221} +{"train_info/time_between_train_steps": 0.0031616687774658203, "step": 221} +{"info/global_step": 222, "train_info/time_within_train_step": 2.2872986793518066, "step": 222} +{"train_info/time_between_train_steps": 0.00331878662109375, "step": 222} +{"info/global_step": 223, "train_info/time_within_train_step": 2.287513494491577, "step": 223} +{"train_info/time_between_train_steps": 0.0032777786254882812, "step": 223} +{"info/global_step": 224, "train_info/time_within_train_step": 2.2871909141540527, "step": 224} +{"train_info/time_between_train_steps": 0.0031816959381103516, "step": 224} +{"info/global_step": 225, "train_info/time_within_train_step": 2.287177085876465, "step": 225} +{"train_info/time_between_train_steps": 0.0032324790954589844, "step": 225} +{"info/global_step": 226, "train_info/time_within_train_step": 2.2871248722076416, "step": 226} +{"train_info/time_between_train_steps": 0.0031647682189941406, "step": 226} +{"info/global_step": 227, "train_info/time_within_train_step": 2.2871103286743164, "step": 227} +{"train_info/time_between_train_steps": 0.003410816192626953, "step": 227} +{"info/global_step": 228, "train_info/time_within_train_step": 2.287187337875366, "step": 228} +{"train_info/time_between_train_steps": 0.003186941146850586, "step": 228} +{"info/global_step": 229, "train_info/time_within_train_step": 2.287029266357422, "step": 229} +{"train_info/time_between_train_steps": 0.0033791065216064453, "step": 229} +{"info/global_step": 230, "train_info/time_within_train_step": 2.287071704864502, "step": 230} +{"train_info/time_between_train_steps": 0.003245115280151367, "step": 230} +{"info/global_step": 231, "train_info/time_within_train_step": 2.287341833114624, "step": 231} +{"train_info/time_between_train_steps": 0.0034232139587402344, "step": 231} +{"info/global_step": 232, "train_info/time_within_train_step": 2.2870490550994873, "step": 232} +{"train_info/time_between_train_steps": 0.003258228302001953, "step": 232} +{"info/global_step": 233, "train_info/time_within_train_step": 2.2873592376708984, "step": 233} +{"train_info/time_between_train_steps": 0.0032351016998291016, "step": 233} +{"info/global_step": 234, "train_info/time_within_train_step": 2.286996841430664, "step": 234} +{"train_info/time_between_train_steps": 0.0034203529357910156, "step": 234} +{"info/global_step": 235, "train_info/time_within_train_step": 2.286292552947998, "step": 235} +{"train_info/time_between_train_steps": 0.003348112106323242, "step": 235} +{"info/global_step": 236, "train_info/time_within_train_step": 2.2871315479278564, "step": 236} +{"train_info/time_between_train_steps": 0.003295421600341797, "step": 236} +{"info/global_step": 237, "train_info/time_within_train_step": 2.2864482402801514, "step": 237} +{"train_info/time_between_train_steps": 0.003373384475708008, "step": 237} +{"info/global_step": 238, "train_info/time_within_train_step": 2.2859411239624023, "step": 238} +{"train_info/time_between_train_steps": 0.0033121109008789062, "step": 238} +{"info/global_step": 239, "train_info/time_within_train_step": 2.285956621170044, "step": 239} +{"train_info/time_between_train_steps": 0.003319978713989258, "step": 239} +{"info/global_step": 240, "train_info/time_within_train_step": 2.2857820987701416, "step": 240} +{"train_info/time_between_train_steps": 0.0033254623413085938, "step": 240} +{"info/global_step": 241, "train_info/time_within_train_step": 2.2860629558563232, "step": 241} +{"train_info/time_between_train_steps": 0.0031082630157470703, "step": 241} +{"info/global_step": 242, "train_info/time_within_train_step": 2.285865545272827, "step": 242} +{"train_info/time_between_train_steps": 0.0030961036682128906, "step": 242} +{"info/global_step": 243, "train_info/time_within_train_step": 2.285645008087158, "step": 243} +{"train_info/time_between_train_steps": 0.003156423568725586, "step": 243} +{"info/global_step": 244, "train_info/time_within_train_step": 2.2866482734680176, "step": 244} +{"train_info/time_between_train_steps": 0.0032329559326171875, "step": 244} +{"info/global_step": 245, "train_info/time_within_train_step": 2.28659987449646, "step": 245} +{"train_info/time_between_train_steps": 0.003408193588256836, "step": 245} +{"info/global_step": 246, "train_info/time_within_train_step": 2.287158489227295, "step": 246} +{"train_info/time_between_train_steps": 0.003318309783935547, "step": 246} +{"info/global_step": 247, "train_info/time_within_train_step": 2.2867746353149414, "step": 247} +{"train_info/time_between_train_steps": 0.003237485885620117, "step": 247} +{"info/global_step": 248, "train_info/time_within_train_step": 2.286604166030884, "step": 248} +{"train_info/time_between_train_steps": 0.0031092166900634766, "step": 248} +{"info/global_step": 249, "train_info/time_within_train_step": 2.2867257595062256, "step": 249} +{"train_info/time_between_train_steps": 0.003155946731567383, "step": 249} +{"info/global_step": 250, "train_info/time_within_train_step": 2.628960609436035, "step": 250} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746344535, "_runtime": 632}, "step": 250} +{"logs": {"train/loss": 5.2495, "train/learning_rate": 0.0005, "train/epoch": 0.08, "_timestamp": 1746344535, "_runtime": 632}, "step": 250} +{"train_info/time_between_train_steps": 0.14871525764465332, "step": 250} +{"info/global_step": 251, "train_info/time_within_train_step": 2.2870943546295166, "step": 251} +{"train_info/time_between_train_steps": 0.0032007694244384766, "step": 251} +{"info/global_step": 252, "train_info/time_within_train_step": 2.2965357303619385, "step": 252} +{"train_info/time_between_train_steps": 0.00313568115234375, "step": 252} +{"info/global_step": 253, "train_info/time_within_train_step": 2.286329746246338, "step": 253} +{"train_info/time_between_train_steps": 0.0031366348266601562, "step": 253} +{"info/global_step": 254, "train_info/time_within_train_step": 2.286421537399292, "step": 254} +{"train_info/time_between_train_steps": 0.0031299591064453125, "step": 254} +{"info/global_step": 255, "train_info/time_within_train_step": 2.286329507827759, "step": 255} +{"train_info/time_between_train_steps": 0.003146648406982422, "step": 255} +{"info/global_step": 256, "train_info/time_within_train_step": 2.285841226577759, "step": 256} +{"train_info/time_between_train_steps": 0.0031540393829345703, "step": 256} +{"info/global_step": 257, "train_info/time_within_train_step": 2.2860677242279053, "step": 257} +{"train_info/time_between_train_steps": 0.0031538009643554688, "step": 257} +{"info/global_step": 258, "train_info/time_within_train_step": 2.2867014408111572, "step": 258} +{"train_info/time_between_train_steps": 0.0032067298889160156, "step": 258} +{"info/global_step": 259, "train_info/time_within_train_step": 2.2858808040618896, "step": 259} +{"train_info/time_between_train_steps": 0.0031566619873046875, "step": 259} +{"info/global_step": 260, "train_info/time_within_train_step": 2.2862751483917236, "step": 260} +{"train_info/time_between_train_steps": 0.003114938735961914, "step": 260} +{"info/global_step": 261, "train_info/time_within_train_step": 2.2864580154418945, "step": 261} +{"train_info/time_between_train_steps": 0.003123760223388672, "step": 261} +{"info/global_step": 262, "train_info/time_within_train_step": 2.2862467765808105, "step": 262} +{"train_info/time_between_train_steps": 0.003132343292236328, "step": 262} +{"info/global_step": 263, "train_info/time_within_train_step": 2.2864186763763428, "step": 263} +{"train_info/time_between_train_steps": 0.003168344497680664, "step": 263} +{"info/global_step": 264, "train_info/time_within_train_step": 2.2860679626464844, "step": 264} +{"train_info/time_between_train_steps": 0.0031571388244628906, "step": 264} +{"info/global_step": 265, "train_info/time_within_train_step": 2.2872815132141113, "step": 265} +{"train_info/time_between_train_steps": 0.0031614303588867188, "step": 265} +{"info/global_step": 266, "train_info/time_within_train_step": 2.2864720821380615, "step": 266} +{"train_info/time_between_train_steps": 0.0031430721282958984, "step": 266} +{"info/global_step": 267, "train_info/time_within_train_step": 2.2865166664123535, "step": 267} +{"train_info/time_between_train_steps": 0.0031266212463378906, "step": 267} +{"info/global_step": 268, "train_info/time_within_train_step": 2.2963926792144775, "step": 268} +{"train_info/time_between_train_steps": 0.0031270980834960938, "step": 268} +{"info/global_step": 269, "train_info/time_within_train_step": 2.3060953617095947, "step": 269} +{"train_info/time_between_train_steps": 0.0031282901763916016, "step": 269} +{"info/global_step": 270, "train_info/time_within_train_step": 2.2870919704437256, "step": 270} +{"train_info/time_between_train_steps": 0.003113269805908203, "step": 270} +{"info/global_step": 271, "train_info/time_within_train_step": 2.2870264053344727, "step": 271} +{"train_info/time_between_train_steps": 0.003126859664916992, "step": 271} +{"info/global_step": 272, "train_info/time_within_train_step": 2.2864811420440674, "step": 272} +{"train_info/time_between_train_steps": 0.003155231475830078, "step": 272} +{"info/global_step": 273, "train_info/time_within_train_step": 2.2859389781951904, "step": 273} +{"train_info/time_between_train_steps": 0.003154754638671875, "step": 273} +{"info/global_step": 274, "train_info/time_within_train_step": 2.2861196994781494, "step": 274} +{"train_info/time_between_train_steps": 0.0031409263610839844, "step": 274} +{"info/global_step": 275, "train_info/time_within_train_step": 2.286360740661621, "step": 275} +{"train_info/time_between_train_steps": 0.0031309127807617188, "step": 275} +{"info/global_step": 276, "train_info/time_within_train_step": 2.28684663772583, "step": 276} +{"train_info/time_between_train_steps": 0.003162860870361328, "step": 276} +{"info/global_step": 277, "train_info/time_within_train_step": 2.2862868309020996, "step": 277} +{"train_info/time_between_train_steps": 0.0031349658966064453, "step": 277} +{"info/global_step": 278, "train_info/time_within_train_step": 2.295485258102417, "step": 278} +{"train_info/time_between_train_steps": 0.0031211376190185547, "step": 278} +{"info/global_step": 279, "train_info/time_within_train_step": 2.2858707904815674, "step": 279} +{"train_info/time_between_train_steps": 0.0031054019927978516, "step": 279} +{"info/global_step": 280, "train_info/time_within_train_step": 2.285719871520996, "step": 280} +{"train_info/time_between_train_steps": 0.0032265186309814453, "step": 280} +{"info/global_step": 281, "train_info/time_within_train_step": 2.285767078399658, "step": 281} +{"train_info/time_between_train_steps": 0.0031371116638183594, "step": 281} +{"info/global_step": 282, "train_info/time_within_train_step": 2.285433292388916, "step": 282} +{"train_info/time_between_train_steps": 0.003168821334838867, "step": 282} +{"info/global_step": 283, "train_info/time_within_train_step": 2.2858998775482178, "step": 283} +{"train_info/time_between_train_steps": 0.0031042098999023438, "step": 283} +{"info/global_step": 284, "train_info/time_within_train_step": 2.2859902381896973, "step": 284} +{"train_info/time_between_train_steps": 0.0033342838287353516, "step": 284} +{"info/global_step": 285, "train_info/time_within_train_step": 2.2863848209381104, "step": 285} +{"train_info/time_between_train_steps": 0.0031113624572753906, "step": 285} +{"info/global_step": 286, "train_info/time_within_train_step": 2.2860794067382812, "step": 286} +{"train_info/time_between_train_steps": 0.003094911575317383, "step": 286} +{"info/global_step": 287, "train_info/time_within_train_step": 2.2869889736175537, "step": 287} +{"train_info/time_between_train_steps": 0.003184080123901367, "step": 287} +{"info/global_step": 288, "train_info/time_within_train_step": 2.2861053943634033, "step": 288} +{"train_info/time_between_train_steps": 0.003148794174194336, "step": 288} +{"info/global_step": 289, "train_info/time_within_train_step": 2.286973476409912, "step": 289} +{"train_info/time_between_train_steps": 0.0031669139862060547, "step": 289} +{"info/global_step": 290, "train_info/time_within_train_step": 2.2868103981018066, "step": 290} +{"train_info/time_between_train_steps": 0.003124713897705078, "step": 290} +{"info/global_step": 291, "train_info/time_within_train_step": 2.287753105163574, "step": 291} +{"train_info/time_between_train_steps": 0.003222227096557617, "step": 291} +{"info/global_step": 292, "train_info/time_within_train_step": 2.536792039871216, "step": 292} +{"train_info/time_between_train_steps": 0.003254413604736328, "step": 292} +{"info/global_step": 293, "train_info/time_within_train_step": 2.2874526977539062, "step": 293} +{"train_info/time_between_train_steps": 0.003412485122680664, "step": 293} +{"info/global_step": 294, "train_info/time_within_train_step": 2.288477659225464, "step": 294} +{"train_info/time_between_train_steps": 0.0035037994384765625, "step": 294} +{"info/global_step": 295, "train_info/time_within_train_step": 2.2873153686523438, "step": 295} +{"train_info/time_between_train_steps": 0.0034842491149902344, "step": 295} +{"info/global_step": 296, "train_info/time_within_train_step": 2.2872469425201416, "step": 296} +{"train_info/time_between_train_steps": 0.003505706787109375, "step": 296} +{"info/global_step": 297, "train_info/time_within_train_step": 2.2872848510742188, "step": 297} +{"train_info/time_between_train_steps": 0.0034551620483398438, "step": 297} +{"info/global_step": 298, "train_info/time_within_train_step": 2.2920026779174805, "step": 298} +{"train_info/time_between_train_steps": 0.0034334659576416016, "step": 298} +{"info/global_step": 299, "train_info/time_within_train_step": 2.286780595779419, "step": 299} +{"train_info/time_between_train_steps": 0.003449678421020508, "step": 299} +{"info/global_step": 300, "train_info/time_within_train_step": 2.285857677459717, "step": 300} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746344651, "_runtime": 748}, "step": 300} +{"logs": {"train/loss": 5.0361, "train/learning_rate": 0.0006, "train/epoch": 0.1, "_timestamp": 1746344651, "_runtime": 748}, "step": 300} +{"train_info/time_between_train_steps": 12.309519529342651, "step": 300} +{"info/global_step": 301, "train_info/time_within_train_step": 2.1156630516052246, "step": 301} +{"train_info/time_between_train_steps": 0.003551006317138672, "step": 301} +{"info/global_step": 302, "train_info/time_within_train_step": 2.1002731323242188, "step": 302} +{"train_info/time_between_train_steps": 0.003507852554321289, "step": 302} +{"info/global_step": 303, "train_info/time_within_train_step": 2.2189152240753174, "step": 303} +{"train_info/time_between_train_steps": 0.003534555435180664, "step": 303} +{"info/global_step": 304, "train_info/time_within_train_step": 2.2853052616119385, "step": 304} +{"train_info/time_between_train_steps": 0.003488302230834961, "step": 304} +{"info/global_step": 305, "train_info/time_within_train_step": 2.2856597900390625, "step": 305} +{"train_info/time_between_train_steps": 0.0035419464111328125, "step": 305} +{"info/global_step": 306, "train_info/time_within_train_step": 2.286318778991699, "step": 306} +{"train_info/time_between_train_steps": 0.003515005111694336, "step": 306} +{"info/global_step": 307, "train_info/time_within_train_step": 2.2863757610321045, "step": 307} +{"train_info/time_between_train_steps": 0.003455638885498047, "step": 307} +{"info/global_step": 308, "train_info/time_within_train_step": 2.286161422729492, "step": 308} +{"train_info/time_between_train_steps": 0.003535747528076172, "step": 308} +{"info/global_step": 309, "train_info/time_within_train_step": 2.286135673522949, "step": 309} +{"train_info/time_between_train_steps": 0.0035004615783691406, "step": 309} +{"info/global_step": 310, "train_info/time_within_train_step": 2.28719162940979, "step": 310} +{"train_info/time_between_train_steps": 0.003566265106201172, "step": 310} +{"info/global_step": 311, "train_info/time_within_train_step": 2.2874937057495117, "step": 311} +{"train_info/time_between_train_steps": 0.0035140514373779297, "step": 311} +{"info/global_step": 312, "train_info/time_within_train_step": 2.287537097930908, "step": 312} +{"train_info/time_between_train_steps": 0.003523111343383789, "step": 312} +{"info/global_step": 313, "train_info/time_within_train_step": 2.4622390270233154, "step": 313} +{"train_info/time_between_train_steps": 0.0033156871795654297, "step": 313} +{"info/global_step": 314, "train_info/time_within_train_step": 2.2870073318481445, "step": 314} +{"train_info/time_between_train_steps": 0.0033140182495117188, "step": 314} +{"info/global_step": 315, "train_info/time_within_train_step": 2.2860312461853027, "step": 315} +{"train_info/time_between_train_steps": 0.0033190250396728516, "step": 315} +{"info/global_step": 316, "train_info/time_within_train_step": 2.2865102291107178, "step": 316} +{"train_info/time_between_train_steps": 0.003278017044067383, "step": 316} +{"info/global_step": 317, "train_info/time_within_train_step": 2.286144495010376, "step": 317} +{"train_info/time_between_train_steps": 0.00333404541015625, "step": 317} +{"info/global_step": 318, "train_info/time_within_train_step": 2.2863519191741943, "step": 318} +{"train_info/time_between_train_steps": 0.0032958984375, "step": 318} +{"info/global_step": 319, "train_info/time_within_train_step": 2.2864928245544434, "step": 319} +{"train_info/time_between_train_steps": 0.003305196762084961, "step": 319} +{"info/global_step": 320, "train_info/time_within_train_step": 2.2867627143859863, "step": 320} +{"train_info/time_between_train_steps": 0.0032820701599121094, "step": 320} +{"info/global_step": 321, "train_info/time_within_train_step": 2.2862343788146973, "step": 321} +{"train_info/time_between_train_steps": 0.003374814987182617, "step": 321} +{"info/global_step": 322, "train_info/time_within_train_step": 2.2866756916046143, "step": 322} +{"train_info/time_between_train_steps": 0.003410816192626953, "step": 322} +{"info/global_step": 323, "train_info/time_within_train_step": 2.286652088165283, "step": 323} +{"train_info/time_between_train_steps": 0.003313302993774414, "step": 323} +{"info/global_step": 324, "train_info/time_within_train_step": 2.2865257263183594, "step": 324} +{"train_info/time_between_train_steps": 0.0032956600189208984, "step": 324} +{"info/global_step": 325, "train_info/time_within_train_step": 2.2867977619171143, "step": 325} +{"train_info/time_between_train_steps": 0.0033180713653564453, "step": 325} +{"info/global_step": 326, "train_info/time_within_train_step": 2.2870121002197266, "step": 326} +{"train_info/time_between_train_steps": 0.003302335739135742, "step": 326} +{"info/global_step": 327, "train_info/time_within_train_step": 2.2869503498077393, "step": 327} +{"train_info/time_between_train_steps": 0.003187417984008789, "step": 327} +{"info/global_step": 328, "train_info/time_within_train_step": 2.2872378826141357, "step": 328} +{"train_info/time_between_train_steps": 0.0032923221588134766, "step": 328} +{"info/global_step": 329, "train_info/time_within_train_step": 2.2871997356414795, "step": 329} +{"train_info/time_between_train_steps": 0.0033333301544189453, "step": 329} +{"info/global_step": 330, "train_info/time_within_train_step": 2.287407159805298, "step": 330} +{"train_info/time_between_train_steps": 0.003359556198120117, "step": 330} +{"info/global_step": 331, "train_info/time_within_train_step": 2.2875499725341797, "step": 331} +{"train_info/time_between_train_steps": 0.003323793411254883, "step": 331} +{"info/global_step": 332, "train_info/time_within_train_step": 2.28769588470459, "step": 332} +{"train_info/time_between_train_steps": 0.003354310989379883, "step": 332} +{"info/global_step": 333, "train_info/time_within_train_step": 2.287604570388794, "step": 333} +{"train_info/time_between_train_steps": 0.0032329559326171875, "step": 333} +{"info/global_step": 334, "train_info/time_within_train_step": 2.2873454093933105, "step": 334} +{"train_info/time_between_train_steps": 0.003316640853881836, "step": 334} +{"info/global_step": 335, "train_info/time_within_train_step": 2.286924362182617, "step": 335} +{"train_info/time_between_train_steps": 0.003335714340209961, "step": 335} +{"info/global_step": 336, "train_info/time_within_train_step": 2.286576509475708, "step": 336} +{"train_info/time_between_train_steps": 0.0032787322998046875, "step": 336} +{"info/global_step": 337, "train_info/time_within_train_step": 2.2866311073303223, "step": 337} +{"train_info/time_between_train_steps": 0.0033876895904541016, "step": 337} +{"info/global_step": 338, "train_info/time_within_train_step": 2.2863028049468994, "step": 338} +{"train_info/time_between_train_steps": 0.003262758255004883, "step": 338} +{"info/global_step": 339, "train_info/time_within_train_step": 2.286328077316284, "step": 339} +{"train_info/time_between_train_steps": 0.003245830535888672, "step": 339} +{"info/global_step": 340, "train_info/time_within_train_step": 2.2860565185546875, "step": 340} +{"train_info/time_between_train_steps": 0.0032837390899658203, "step": 340} +{"info/global_step": 341, "train_info/time_within_train_step": 2.285862684249878, "step": 341} +{"train_info/time_between_train_steps": 0.0032830238342285156, "step": 341} +{"info/global_step": 342, "train_info/time_within_train_step": 2.2863893508911133, "step": 342} +{"train_info/time_between_train_steps": 0.0033032894134521484, "step": 342} +{"info/global_step": 343, "train_info/time_within_train_step": 2.2861645221710205, "step": 343} +{"train_info/time_between_train_steps": 0.0032541751861572266, "step": 343} +{"info/global_step": 344, "train_info/time_within_train_step": 2.2863097190856934, "step": 344} +{"train_info/time_between_train_steps": 0.003270387649536133, "step": 344} +{"info/global_step": 345, "train_info/time_within_train_step": 2.2862629890441895, "step": 345} +{"train_info/time_between_train_steps": 0.0032868385314941406, "step": 345} +{"info/global_step": 346, "train_info/time_within_train_step": 2.286836862564087, "step": 346} +{"train_info/time_between_train_steps": 0.003256559371948242, "step": 346} +{"info/global_step": 347, "train_info/time_within_train_step": 2.2865774631500244, "step": 347} +{"train_info/time_between_train_steps": 0.003289937973022461, "step": 347} +{"info/global_step": 348, "train_info/time_within_train_step": 2.28688645362854, "step": 348} +{"train_info/time_between_train_steps": 0.003291606903076172, "step": 348} +{"info/global_step": 349, "train_info/time_within_train_step": 2.2868220806121826, "step": 349} +{"train_info/time_between_train_steps": 0.003283262252807617, "step": 349} +{"info/global_step": 350, "train_info/time_within_train_step": 2.286627769470215, "step": 350} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746344779, "_runtime": 876}, "step": 350} +{"logs": {"train/loss": 4.8976, "train/learning_rate": 0.0005888888888888889, "train/epoch": 0.12, "_timestamp": 1746344779, "_runtime": 876}, "step": 350} +{"train_info/time_between_train_steps": 0.024029970169067383, "step": 350} +{"info/global_step": 351, "train_info/time_within_train_step": 2.287203788757324, "step": 351} +{"train_info/time_between_train_steps": 0.003363370895385742, "step": 351} +{"info/global_step": 352, "train_info/time_within_train_step": 2.286475419998169, "step": 352} +{"train_info/time_between_train_steps": 0.0033235549926757812, "step": 352} +{"info/global_step": 353, "train_info/time_within_train_step": 2.2867794036865234, "step": 353} +{"train_info/time_between_train_steps": 0.003277301788330078, "step": 353} +{"info/global_step": 354, "train_info/time_within_train_step": 2.286595344543457, "step": 354} +{"train_info/time_between_train_steps": 0.003300189971923828, "step": 354} +{"info/global_step": 355, "train_info/time_within_train_step": 2.2861828804016113, "step": 355} +{"train_info/time_between_train_steps": 0.0033316612243652344, "step": 355} +{"info/global_step": 356, "train_info/time_within_train_step": 2.2865395545959473, "step": 356} +{"train_info/time_between_train_steps": 0.003301382064819336, "step": 356} +{"info/global_step": 357, "train_info/time_within_train_step": 2.2863945960998535, "step": 357} +{"train_info/time_between_train_steps": 0.0032835006713867188, "step": 357} +{"info/global_step": 358, "train_info/time_within_train_step": 2.2863144874572754, "step": 358} +{"train_info/time_between_train_steps": 0.003346681594848633, "step": 358} +{"info/global_step": 359, "train_info/time_within_train_step": 2.2857420444488525, "step": 359} +{"train_info/time_between_train_steps": 0.003308534622192383, "step": 359} +{"info/global_step": 360, "train_info/time_within_train_step": 2.2865869998931885, "step": 360} +{"train_info/time_between_train_steps": 0.0033020973205566406, "step": 360} +{"info/global_step": 361, "train_info/time_within_train_step": 2.285897731781006, "step": 361} +{"train_info/time_between_train_steps": 0.0033147335052490234, "step": 361} +{"info/global_step": 362, "train_info/time_within_train_step": 2.285980463027954, "step": 362} +{"train_info/time_between_train_steps": 0.0033376216888427734, "step": 362} +{"info/global_step": 363, "train_info/time_within_train_step": 2.286003351211548, "step": 363} +{"train_info/time_between_train_steps": 0.0033788681030273438, "step": 363} +{"info/global_step": 364, "train_info/time_within_train_step": 2.286348581314087, "step": 364} +{"train_info/time_between_train_steps": 0.0033111572265625, "step": 364} +{"info/global_step": 365, "train_info/time_within_train_step": 2.2854459285736084, "step": 365} +{"train_info/time_between_train_steps": 0.0032806396484375, "step": 365} +{"info/global_step": 366, "train_info/time_within_train_step": 2.2860546112060547, "step": 366} +{"train_info/time_between_train_steps": 0.0032737255096435547, "step": 366} +{"info/global_step": 367, "train_info/time_within_train_step": 2.285999298095703, "step": 367} +{"train_info/time_between_train_steps": 0.003286600112915039, "step": 367} +{"info/global_step": 368, "train_info/time_within_train_step": 2.286473512649536, "step": 368} +{"train_info/time_between_train_steps": 0.003226041793823242, "step": 368} +{"info/global_step": 369, "train_info/time_within_train_step": 2.2854011058807373, "step": 369} +{"train_info/time_between_train_steps": 0.0032885074615478516, "step": 369} +{"info/global_step": 370, "train_info/time_within_train_step": 2.2865259647369385, "step": 370} +{"train_info/time_between_train_steps": 0.0033283233642578125, "step": 370} +{"info/global_step": 371, "train_info/time_within_train_step": 2.286416530609131, "step": 371} +{"train_info/time_between_train_steps": 0.003389596939086914, "step": 371} +{"info/global_step": 372, "train_info/time_within_train_step": 2.604247808456421, "step": 372} +{"train_info/time_between_train_steps": 0.003186941146850586, "step": 372} +{"info/global_step": 373, "train_info/time_within_train_step": 2.285781145095825, "step": 373} +{"train_info/time_between_train_steps": 0.0032079219818115234, "step": 373} +{"info/global_step": 374, "train_info/time_within_train_step": 2.2860732078552246, "step": 374} +{"train_info/time_between_train_steps": 0.0031669139862060547, "step": 374} +{"info/global_step": 375, "train_info/time_within_train_step": 2.2857604026794434, "step": 375} +{"train_info/time_between_train_steps": 0.12479639053344727, "step": 375} +{"info/global_step": 376, "train_info/time_within_train_step": 2.3093719482421875, "step": 376} +{"train_info/time_between_train_steps": 0.0031981468200683594, "step": 376} +{"info/global_step": 377, "train_info/time_within_train_step": 2.285937786102295, "step": 377} +{"train_info/time_between_train_steps": 0.0031952857971191406, "step": 377} +{"info/global_step": 378, "train_info/time_within_train_step": 2.294886589050293, "step": 378} +{"train_info/time_between_train_steps": 0.003197193145751953, "step": 378} +{"info/global_step": 379, "train_info/time_within_train_step": 2.2859792709350586, "step": 379} +{"train_info/time_between_train_steps": 0.003177642822265625, "step": 379} +{"info/global_step": 380, "train_info/time_within_train_step": 2.2854692935943604, "step": 380} +{"train_info/time_between_train_steps": 0.0031626224517822266, "step": 380} +{"info/global_step": 381, "train_info/time_within_train_step": 2.285933017730713, "step": 381} +{"train_info/time_between_train_steps": 0.0032606124877929688, "step": 381} +{"info/global_step": 382, "train_info/time_within_train_step": 2.2857472896575928, "step": 382} +{"train_info/time_between_train_steps": 0.0031719207763671875, "step": 382} +{"info/global_step": 383, "train_info/time_within_train_step": 2.285784959793091, "step": 383} +{"train_info/time_between_train_steps": 0.0031943321228027344, "step": 383} +{"info/global_step": 384, "train_info/time_within_train_step": 2.28548002243042, "step": 384} +{"train_info/time_between_train_steps": 0.0031692981719970703, "step": 384} +{"info/global_step": 385, "train_info/time_within_train_step": 2.2995107173919678, "step": 385} +{"train_info/time_between_train_steps": 0.0031812191009521484, "step": 385} +{"info/global_step": 386, "train_info/time_within_train_step": 2.2852516174316406, "step": 386} +{"train_info/time_between_train_steps": 0.003162860870361328, "step": 386} +{"info/global_step": 387, "train_info/time_within_train_step": 2.2847564220428467, "step": 387} +{"train_info/time_between_train_steps": 0.0031592845916748047, "step": 387} +{"info/global_step": 388, "train_info/time_within_train_step": 2.28489089012146, "step": 388} +{"train_info/time_between_train_steps": 0.003181934356689453, "step": 388} +{"info/global_step": 389, "train_info/time_within_train_step": 2.285107135772705, "step": 389} +{"train_info/time_between_train_steps": 0.003164052963256836, "step": 389} +{"info/global_step": 390, "train_info/time_within_train_step": 2.2852532863616943, "step": 390} +{"train_info/time_between_train_steps": 0.0031630992889404297, "step": 390} +{"info/global_step": 391, "train_info/time_within_train_step": 2.2854888439178467, "step": 391} +{"train_info/time_between_train_steps": 0.003217935562133789, "step": 391} +{"info/global_step": 392, "train_info/time_within_train_step": 2.299556255340576, "step": 392} +{"train_info/time_between_train_steps": 0.0031752586364746094, "step": 392} +{"info/global_step": 393, "train_info/time_within_train_step": 2.2857449054718018, "step": 393} +{"train_info/time_between_train_steps": 0.0032112598419189453, "step": 393} +{"info/global_step": 394, "train_info/time_within_train_step": 2.2862181663513184, "step": 394} +{"train_info/time_between_train_steps": 0.003171205520629883, "step": 394} +{"info/global_step": 395, "train_info/time_within_train_step": 2.285810708999634, "step": 395} +{"train_info/time_between_train_steps": 0.0031778812408447266, "step": 395} +{"info/global_step": 396, "train_info/time_within_train_step": 2.2858941555023193, "step": 396} +{"train_info/time_between_train_steps": 0.0031557083129882812, "step": 396} +{"info/global_step": 397, "train_info/time_within_train_step": 2.2853305339813232, "step": 397} +{"train_info/time_between_train_steps": 0.0031557083129882812, "step": 397} +{"info/global_step": 398, "train_info/time_within_train_step": 2.286156415939331, "step": 398} +{"train_info/time_between_train_steps": 0.0031533241271972656, "step": 398} +{"info/global_step": 399, "train_info/time_within_train_step": 2.285953998565674, "step": 399} +{"train_info/time_between_train_steps": 0.003175020217895508, "step": 399} +{"info/global_step": 400, "train_info/time_within_train_step": 2.2856662273406982, "step": 400} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746344895, "_runtime": 992}, "step": 400} +{"logs": {"train/loss": 4.8056, "train/learning_rate": 0.0005777777777777776, "train/epoch": 0.13, "_timestamp": 1746344895, "_runtime": 992}, "step": 400} +{"train_info/time_between_train_steps": 17.3736515045166, "step": 400} +{"info/global_step": 401, "train_info/time_within_train_step": 2.1167454719543457, "step": 401} +{"train_info/time_between_train_steps": 0.0031201839447021484, "step": 401} +{"info/global_step": 402, "train_info/time_within_train_step": 2.099668264389038, "step": 402} +{"train_info/time_between_train_steps": 0.003154277801513672, "step": 402} +{"info/global_step": 403, "train_info/time_within_train_step": 2.134308338165283, "step": 403} +{"train_info/time_between_train_steps": 0.0032196044921875, "step": 403} +{"info/global_step": 404, "train_info/time_within_train_step": 2.2827343940734863, "step": 404} +{"train_info/time_between_train_steps": 0.003170490264892578, "step": 404} +{"info/global_step": 405, "train_info/time_within_train_step": 2.284076690673828, "step": 405} +{"train_info/time_between_train_steps": 0.0031507015228271484, "step": 405} +{"info/global_step": 406, "train_info/time_within_train_step": 2.2838263511657715, "step": 406} +{"train_info/time_between_train_steps": 0.0032320022583007812, "step": 406} +{"info/global_step": 407, "train_info/time_within_train_step": 2.285350799560547, "step": 407} +{"train_info/time_between_train_steps": 0.0031859874725341797, "step": 407} +{"info/global_step": 408, "train_info/time_within_train_step": 2.2864065170288086, "step": 408} +{"train_info/time_between_train_steps": 0.003192424774169922, "step": 408} +{"info/global_step": 409, "train_info/time_within_train_step": 2.2858800888061523, "step": 409} +{"train_info/time_between_train_steps": 0.0031936168670654297, "step": 409} +{"info/global_step": 410, "train_info/time_within_train_step": 2.285991907119751, "step": 410} +{"train_info/time_between_train_steps": 0.003187894821166992, "step": 410} +{"info/global_step": 411, "train_info/time_within_train_step": 2.2862911224365234, "step": 411} +{"train_info/time_between_train_steps": 0.003138303756713867, "step": 411} +{"info/global_step": 412, "train_info/time_within_train_step": 2.2867724895477295, "step": 412} +{"train_info/time_between_train_steps": 0.0031859874725341797, "step": 412} +{"info/global_step": 413, "train_info/time_within_train_step": 2.2867305278778076, "step": 413} +{"train_info/time_between_train_steps": 0.0031969547271728516, "step": 413} +{"info/global_step": 414, "train_info/time_within_train_step": 2.2862398624420166, "step": 414} +{"train_info/time_between_train_steps": 0.0031986236572265625, "step": 414} +{"info/global_step": 415, "train_info/time_within_train_step": 2.2867136001586914, "step": 415} +{"train_info/time_between_train_steps": 0.0031752586364746094, "step": 415} +{"info/global_step": 416, "train_info/time_within_train_step": 2.2873945236206055, "step": 416} +{"train_info/time_between_train_steps": 0.003217458724975586, "step": 416} +{"info/global_step": 417, "train_info/time_within_train_step": 2.287273645401001, "step": 417} +{"train_info/time_between_train_steps": 0.003206014633178711, "step": 417} +{"info/global_step": 418, "train_info/time_within_train_step": 2.286929130554199, "step": 418} +{"train_info/time_between_train_steps": 0.003205537796020508, "step": 418} +{"info/global_step": 419, "train_info/time_within_train_step": 2.2871620655059814, "step": 419} +{"train_info/time_between_train_steps": 0.003214597702026367, "step": 419} +{"info/global_step": 420, "train_info/time_within_train_step": 2.2873363494873047, "step": 420} +{"train_info/time_between_train_steps": 0.0031957626342773438, "step": 420} +{"info/global_step": 421, "train_info/time_within_train_step": 2.287693738937378, "step": 421} +{"train_info/time_between_train_steps": 0.003202199935913086, "step": 421} +{"info/global_step": 422, "train_info/time_within_train_step": 2.2872607707977295, "step": 422} +{"train_info/time_between_train_steps": 0.0032210350036621094, "step": 422} +{"info/global_step": 423, "train_info/time_within_train_step": 2.2877371311187744, "step": 423} +{"train_info/time_between_train_steps": 0.0031871795654296875, "step": 423} +{"info/global_step": 424, "train_info/time_within_train_step": 2.287684917449951, "step": 424} +{"train_info/time_between_train_steps": 0.0031824111938476562, "step": 424} +{"info/global_step": 425, "train_info/time_within_train_step": 2.2883780002593994, "step": 425} +{"train_info/time_between_train_steps": 0.003225088119506836, "step": 425} +{"info/global_step": 426, "train_info/time_within_train_step": 2.2872695922851562, "step": 426} +{"train_info/time_between_train_steps": 0.0031633377075195312, "step": 426} +{"info/global_step": 427, "train_info/time_within_train_step": 2.2877588272094727, "step": 427} +{"train_info/time_between_train_steps": 0.003152608871459961, "step": 427} +{"info/global_step": 428, "train_info/time_within_train_step": 2.2878434658050537, "step": 428} +{"train_info/time_between_train_steps": 0.0031516551971435547, "step": 428} +{"info/global_step": 429, "train_info/time_within_train_step": 2.2876877784729004, "step": 429} +{"train_info/time_between_train_steps": 0.003171205520629883, "step": 429} +{"info/global_step": 430, "train_info/time_within_train_step": 2.287602663040161, "step": 430} +{"train_info/time_between_train_steps": 0.003238201141357422, "step": 430} +{"info/global_step": 431, "train_info/time_within_train_step": 2.2872135639190674, "step": 431} +{"train_info/time_between_train_steps": 0.003211498260498047, "step": 431} +{"info/global_step": 432, "train_info/time_within_train_step": 2.287283182144165, "step": 432} +{"train_info/time_between_train_steps": 0.003176450729370117, "step": 432} +{"info/global_step": 433, "train_info/time_within_train_step": 2.28672456741333, "step": 433} +{"train_info/time_between_train_steps": 0.0031690597534179688, "step": 433} +{"info/global_step": 434, "train_info/time_within_train_step": 2.2872142791748047, "step": 434} +{"train_info/time_between_train_steps": 0.0031647682189941406, "step": 434} +{"info/global_step": 435, "train_info/time_within_train_step": 2.2870771884918213, "step": 435} +{"train_info/time_between_train_steps": 0.003144979476928711, "step": 435} +{"info/global_step": 436, "train_info/time_within_train_step": 2.2867090702056885, "step": 436} +{"train_info/time_between_train_steps": 0.0031681060791015625, "step": 436} +{"info/global_step": 437, "train_info/time_within_train_step": 2.5289669036865234, "step": 437} +{"train_info/time_between_train_steps": 0.003243684768676758, "step": 437} +{"info/global_step": 438, "train_info/time_within_train_step": 2.409118413925171, "step": 438} +{"train_info/time_between_train_steps": 0.0032265186309814453, "step": 438} +{"info/global_step": 439, "train_info/time_within_train_step": 2.2869393825531006, "step": 439} +{"train_info/time_between_train_steps": 0.003160238265991211, "step": 439} +{"info/global_step": 440, "train_info/time_within_train_step": 2.286426305770874, "step": 440} +{"train_info/time_between_train_steps": 0.0032036304473876953, "step": 440} +{"info/global_step": 441, "train_info/time_within_train_step": 2.286778688430786, "step": 441} +{"train_info/time_between_train_steps": 0.0031540393829345703, "step": 441} +{"info/global_step": 442, "train_info/time_within_train_step": 2.2870612144470215, "step": 442} +{"train_info/time_between_train_steps": 0.0031402111053466797, "step": 442} +{"info/global_step": 443, "train_info/time_within_train_step": 2.2870404720306396, "step": 443} +{"train_info/time_between_train_steps": 0.0031986236572265625, "step": 443} +{"info/global_step": 444, "train_info/time_within_train_step": 2.2871880531311035, "step": 444} +{"train_info/time_between_train_steps": 0.003138303756713867, "step": 444} +{"info/global_step": 445, "train_info/time_within_train_step": 2.286479949951172, "step": 445} +{"train_info/time_between_train_steps": 0.003168821334838867, "step": 445} +{"info/global_step": 446, "train_info/time_within_train_step": 2.286700487136841, "step": 446} +{"train_info/time_between_train_steps": 0.0031626224517822266, "step": 446} +{"info/global_step": 447, "train_info/time_within_train_step": 2.2870430946350098, "step": 447} +{"train_info/time_between_train_steps": 0.003148794174194336, "step": 447} +{"info/global_step": 448, "train_info/time_within_train_step": 2.2868473529815674, "step": 448} +{"train_info/time_between_train_steps": 0.003174304962158203, "step": 448} +{"info/global_step": 449, "train_info/time_within_train_step": 2.286860704421997, "step": 449} +{"train_info/time_between_train_steps": 0.003131389617919922, "step": 449} +{"info/global_step": 450, "train_info/time_within_train_step": 2.286912202835083, "step": 450} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746345028, "_runtime": 1125}, "step": 450} +{"logs": {"train/loss": 4.7468, "train/learning_rate": 0.0005666666666666666, "train/epoch": 0.15, "_timestamp": 1746345028, "_runtime": 1125}, "step": 450} +{"train_info/time_between_train_steps": 0.02398824691772461, "step": 450} +{"info/global_step": 451, "train_info/time_within_train_step": 2.286007881164551, "step": 451} +{"train_info/time_between_train_steps": 0.003131866455078125, "step": 451} +{"info/global_step": 452, "train_info/time_within_train_step": 2.2861580848693848, "step": 452} +{"train_info/time_between_train_steps": 0.0031599998474121094, "step": 452} +{"info/global_step": 453, "train_info/time_within_train_step": 2.286132335662842, "step": 453} +{"train_info/time_between_train_steps": 0.0032057762145996094, "step": 453} +{"info/global_step": 454, "train_info/time_within_train_step": 2.2862679958343506, "step": 454} +{"train_info/time_between_train_steps": 0.003232717514038086, "step": 454} +{"info/global_step": 455, "train_info/time_within_train_step": 2.28631854057312, "step": 455} +{"train_info/time_between_train_steps": 0.0031766891479492188, "step": 455} +{"info/global_step": 456, "train_info/time_within_train_step": 2.295585870742798, "step": 456} +{"train_info/time_between_train_steps": 0.0032219886779785156, "step": 456} +{"info/global_step": 457, "train_info/time_within_train_step": 2.2856807708740234, "step": 457} +{"train_info/time_between_train_steps": 0.00315093994140625, "step": 457} +{"info/global_step": 458, "train_info/time_within_train_step": 2.2866621017456055, "step": 458} +{"train_info/time_between_train_steps": 0.003202199935913086, "step": 458} +{"info/global_step": 459, "train_info/time_within_train_step": 2.2860586643218994, "step": 459} +{"train_info/time_between_train_steps": 0.0031456947326660156, "step": 459} +{"info/global_step": 460, "train_info/time_within_train_step": 2.3001646995544434, "step": 460} +{"train_info/time_between_train_steps": 0.0031473636627197266, "step": 460} +{"info/global_step": 461, "train_info/time_within_train_step": 2.286878824234009, "step": 461} +{"train_info/time_between_train_steps": 0.003206968307495117, "step": 461} +{"info/global_step": 462, "train_info/time_within_train_step": 2.2867588996887207, "step": 462} +{"train_info/time_between_train_steps": 0.0032196044921875, "step": 462} +{"info/global_step": 463, "train_info/time_within_train_step": 2.2876951694488525, "step": 463} +{"train_info/time_between_train_steps": 0.0031766891479492188, "step": 463} +{"info/global_step": 464, "train_info/time_within_train_step": 2.286717176437378, "step": 464} +{"train_info/time_between_train_steps": 0.003162860870361328, "step": 464} +{"info/global_step": 465, "train_info/time_within_train_step": 2.286156177520752, "step": 465} +{"train_info/time_between_train_steps": 0.0031964778900146484, "step": 465} +{"info/global_step": 466, "train_info/time_within_train_step": 2.2865309715270996, "step": 466} +{"train_info/time_between_train_steps": 0.003173351287841797, "step": 466} +{"info/global_step": 467, "train_info/time_within_train_step": 2.286874771118164, "step": 467} +{"train_info/time_between_train_steps": 0.0031974315643310547, "step": 467} +{"info/global_step": 468, "train_info/time_within_train_step": 2.2866501808166504, "step": 468} +{"train_info/time_between_train_steps": 0.003192424774169922, "step": 468} +{"info/global_step": 469, "train_info/time_within_train_step": 2.286689281463623, "step": 469} +{"train_info/time_between_train_steps": 0.003223896026611328, "step": 469} +{"info/global_step": 470, "train_info/time_within_train_step": 2.2866733074188232, "step": 470} +{"train_info/time_between_train_steps": 0.0031752586364746094, "step": 470} +{"info/global_step": 471, "train_info/time_within_train_step": 2.2861878871917725, "step": 471} +{"train_info/time_between_train_steps": 0.0031719207763671875, "step": 471} +{"info/global_step": 472, "train_info/time_within_train_step": 2.2864978313446045, "step": 472} +{"train_info/time_between_train_steps": 0.0031549930572509766, "step": 472} +{"info/global_step": 473, "train_info/time_within_train_step": 2.2864279747009277, "step": 473} +{"train_info/time_between_train_steps": 0.003170013427734375, "step": 473} +{"info/global_step": 474, "train_info/time_within_train_step": 2.286020040512085, "step": 474} +{"train_info/time_between_train_steps": 0.0031626224517822266, "step": 474} +{"info/global_step": 475, "train_info/time_within_train_step": 2.2863707542419434, "step": 475} +{"train_info/time_between_train_steps": 0.0031392574310302734, "step": 475} +{"info/global_step": 476, "train_info/time_within_train_step": 2.286205768585205, "step": 476} +{"train_info/time_between_train_steps": 0.0031850337982177734, "step": 476} +{"info/global_step": 477, "train_info/time_within_train_step": 2.2867443561553955, "step": 477} +{"train_info/time_between_train_steps": 0.0031740665435791016, "step": 477} +{"info/global_step": 478, "train_info/time_within_train_step": 2.2866392135620117, "step": 478} +{"train_info/time_between_train_steps": 0.003216981887817383, "step": 478} +{"info/global_step": 479, "train_info/time_within_train_step": 2.2861478328704834, "step": 479} +{"train_info/time_between_train_steps": 0.0031578540802001953, "step": 479} +{"info/global_step": 480, "train_info/time_within_train_step": 2.286764144897461, "step": 480} +{"train_info/time_between_train_steps": 0.003153085708618164, "step": 480} +{"info/global_step": 481, "train_info/time_within_train_step": 2.2866358757019043, "step": 481} +{"train_info/time_between_train_steps": 0.0031561851501464844, "step": 481} +{"info/global_step": 482, "train_info/time_within_train_step": 2.2963948249816895, "step": 482} +{"train_info/time_between_train_steps": 0.003154277801513672, "step": 482} +{"info/global_step": 483, "train_info/time_within_train_step": 2.2870092391967773, "step": 483} +{"train_info/time_between_train_steps": 0.0031578540802001953, "step": 483} +{"info/global_step": 484, "train_info/time_within_train_step": 2.2871851921081543, "step": 484} +{"train_info/time_between_train_steps": 0.0031621456146240234, "step": 484} +{"info/global_step": 485, "train_info/time_within_train_step": 2.287080764770508, "step": 485} +{"train_info/time_between_train_steps": 0.003163576126098633, "step": 485} +{"info/global_step": 486, "train_info/time_within_train_step": 2.300523281097412, "step": 486} +{"train_info/time_between_train_steps": 0.0031502246856689453, "step": 486} +{"info/global_step": 487, "train_info/time_within_train_step": 2.2874093055725098, "step": 487} +{"train_info/time_between_train_steps": 0.003169536590576172, "step": 487} +{"info/global_step": 488, "train_info/time_within_train_step": 2.2868592739105225, "step": 488} +{"train_info/time_between_train_steps": 0.0031747817993164062, "step": 488} +{"info/global_step": 489, "train_info/time_within_train_step": 2.5276505947113037, "step": 489} +{"train_info/time_between_train_steps": 0.003158092498779297, "step": 489} +{"info/global_step": 490, "train_info/time_within_train_step": 2.286928415298462, "step": 490} +{"train_info/time_between_train_steps": 0.003206014633178711, "step": 490} +{"info/global_step": 491, "train_info/time_within_train_step": 2.2862250804901123, "step": 491} +{"train_info/time_between_train_steps": 0.003154277801513672, "step": 491} +{"info/global_step": 492, "train_info/time_within_train_step": 2.2861101627349854, "step": 492} +{"train_info/time_between_train_steps": 0.0031991004943847656, "step": 492} +{"info/global_step": 493, "train_info/time_within_train_step": 2.286355972290039, "step": 493} +{"train_info/time_between_train_steps": 0.0031685829162597656, "step": 493} +{"info/global_step": 494, "train_info/time_within_train_step": 2.2862377166748047, "step": 494} +{"train_info/time_between_train_steps": 0.003149271011352539, "step": 494} +{"info/global_step": 495, "train_info/time_within_train_step": 2.286621332168579, "step": 495} +{"train_info/time_between_train_steps": 0.003139019012451172, "step": 495} +{"info/global_step": 496, "train_info/time_within_train_step": 2.2859485149383545, "step": 496} +{"train_info/time_between_train_steps": 0.0031354427337646484, "step": 496} +{"info/global_step": 497, "train_info/time_within_train_step": 2.286003828048706, "step": 497} +{"train_info/time_between_train_steps": 0.0031032562255859375, "step": 497} +{"info/global_step": 498, "train_info/time_within_train_step": 2.2859108448028564, "step": 498} +{"train_info/time_between_train_steps": 0.0031273365020751953, "step": 498} +{"info/global_step": 499, "train_info/time_within_train_step": 2.2858681678771973, "step": 499} +{"train_info/time_between_train_steps": 0.003099679946899414, "step": 499} +{"info/global_step": 500, "train_info/time_within_train_step": 2.5711863040924072, "step": 500} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746345144, "_runtime": 1241}, "step": 500} +{"logs": {"train/loss": 4.6888, "train/learning_rate": 0.0005555555555555556, "train/epoch": 0.17, "_timestamp": 1746345144, "_runtime": 1241}, "step": 500} +{"train_info/time_between_train_steps": 16.478650331497192, "step": 500} +{"info/global_step": 501, "train_info/time_within_train_step": 2.115143060684204, "step": 501} +{"train_info/time_between_train_steps": 0.0031747817993164062, "step": 501} +{"info/global_step": 502, "train_info/time_within_train_step": 2.0951876640319824, "step": 502} +{"train_info/time_between_train_steps": 0.0031681060791015625, "step": 502} +{"info/global_step": 503, "train_info/time_within_train_step": 2.157630205154419, "step": 503} +{"train_info/time_between_train_steps": 0.0032029151916503906, "step": 503} +{"info/global_step": 504, "train_info/time_within_train_step": 2.2857043743133545, "step": 504} +{"train_info/time_between_train_steps": 0.003171205520629883, "step": 504} +{"info/global_step": 505, "train_info/time_within_train_step": 2.2863729000091553, "step": 505} +{"train_info/time_between_train_steps": 0.0031321048736572266, "step": 505} +{"info/global_step": 506, "train_info/time_within_train_step": 2.28598690032959, "step": 506} +{"train_info/time_between_train_steps": 0.003125429153442383, "step": 506} +{"info/global_step": 507, "train_info/time_within_train_step": 2.287038564682007, "step": 507} +{"train_info/time_between_train_steps": 0.0031244754791259766, "step": 507} +{"info/global_step": 508, "train_info/time_within_train_step": 2.287238359451294, "step": 508} +{"train_info/time_between_train_steps": 0.003184080123901367, "step": 508} +{"info/global_step": 509, "train_info/time_within_train_step": 2.2881786823272705, "step": 509} +{"train_info/time_between_train_steps": 0.0031595230102539062, "step": 509} +{"info/global_step": 510, "train_info/time_within_train_step": 2.28757381439209, "step": 510} +{"train_info/time_between_train_steps": 0.003172159194946289, "step": 510} +{"info/global_step": 511, "train_info/time_within_train_step": 2.288205146789551, "step": 511} +{"train_info/time_between_train_steps": 0.003205537796020508, "step": 511} +{"info/global_step": 512, "train_info/time_within_train_step": 2.2882680892944336, "step": 512} +{"train_info/time_between_train_steps": 0.003153085708618164, "step": 512} +{"info/global_step": 513, "train_info/time_within_train_step": 2.2886757850646973, "step": 513} +{"train_info/time_between_train_steps": 0.0032095909118652344, "step": 513} +{"info/global_step": 514, "train_info/time_within_train_step": 2.288525342941284, "step": 514} +{"train_info/time_between_train_steps": 0.003172159194946289, "step": 514} +{"info/global_step": 515, "train_info/time_within_train_step": 2.2884156703948975, "step": 515} +{"train_info/time_between_train_steps": 0.0032036304473876953, "step": 515} +{"info/global_step": 516, "train_info/time_within_train_step": 2.288114070892334, "step": 516} +{"train_info/time_between_train_steps": 0.003165721893310547, "step": 516} +{"info/global_step": 517, "train_info/time_within_train_step": 2.2887001037597656, "step": 517} +{"train_info/time_between_train_steps": 0.0032036304473876953, "step": 517} +{"info/global_step": 518, "train_info/time_within_train_step": 2.289628267288208, "step": 518} +{"train_info/time_between_train_steps": 0.0031957626342773438, "step": 518} +{"info/global_step": 519, "train_info/time_within_train_step": 2.2881059646606445, "step": 519} +{"train_info/time_between_train_steps": 0.0031981468200683594, "step": 519} +{"info/global_step": 520, "train_info/time_within_train_step": 2.2879478931427, "step": 520} +{"train_info/time_between_train_steps": 0.0031702518463134766, "step": 520} +{"info/global_step": 521, "train_info/time_within_train_step": 2.2883293628692627, "step": 521} +{"train_info/time_between_train_steps": 0.003138303756713867, "step": 521} +{"info/global_step": 522, "train_info/time_within_train_step": 2.288437843322754, "step": 522} +{"train_info/time_between_train_steps": 0.003161907196044922, "step": 522} +{"info/global_step": 523, "train_info/time_within_train_step": 2.2883660793304443, "step": 523} +{"train_info/time_between_train_steps": 0.0031919479370117188, "step": 523} +{"info/global_step": 524, "train_info/time_within_train_step": 2.287883758544922, "step": 524} +{"train_info/time_between_train_steps": 0.0031404495239257812, "step": 524} +{"info/global_step": 525, "train_info/time_within_train_step": 2.2876498699188232, "step": 525} +{"train_info/time_between_train_steps": 0.0031769275665283203, "step": 525} +{"info/global_step": 526, "train_info/time_within_train_step": 2.2876996994018555, "step": 526} +{"train_info/time_between_train_steps": 0.0031576156616210938, "step": 526} +{"info/global_step": 527, "train_info/time_within_train_step": 2.296901226043701, "step": 527} +{"train_info/time_between_train_steps": 0.0031578540802001953, "step": 527} +{"info/global_step": 528, "train_info/time_within_train_step": 2.2877416610717773, "step": 528} +{"train_info/time_between_train_steps": 0.0031960010528564453, "step": 528} +{"info/global_step": 529, "train_info/time_within_train_step": 2.2880072593688965, "step": 529} +{"train_info/time_between_train_steps": 0.003147602081298828, "step": 529} +{"info/global_step": 530, "train_info/time_within_train_step": 2.288029193878174, "step": 530} +{"train_info/time_between_train_steps": 0.0031135082244873047, "step": 530} +{"info/global_step": 531, "train_info/time_within_train_step": 2.2877798080444336, "step": 531} +{"train_info/time_between_train_steps": 0.0031325817108154297, "step": 531} +{"info/global_step": 532, "train_info/time_within_train_step": 2.2887914180755615, "step": 532} +{"train_info/time_between_train_steps": 0.003136157989501953, "step": 532} +{"info/global_step": 533, "train_info/time_within_train_step": 2.287943124771118, "step": 533} +{"train_info/time_between_train_steps": 0.003145933151245117, "step": 533} +{"info/global_step": 534, "train_info/time_within_train_step": 2.2883365154266357, "step": 534} +{"train_info/time_between_train_steps": 0.0031538009643554688, "step": 534} +{"info/global_step": 535, "train_info/time_within_train_step": 2.288465976715088, "step": 535} +{"train_info/time_between_train_steps": 0.003168344497680664, "step": 535} +{"info/global_step": 536, "train_info/time_within_train_step": 2.288503408432007, "step": 536} +{"train_info/time_between_train_steps": 0.0031876564025878906, "step": 536} +{"info/global_step": 537, "train_info/time_within_train_step": 2.2881829738616943, "step": 537} +{"train_info/time_between_train_steps": 0.0031948089599609375, "step": 537} +{"info/global_step": 538, "train_info/time_within_train_step": 2.287992238998413, "step": 538} +{"train_info/time_between_train_steps": 0.003144979476928711, "step": 538} +{"info/global_step": 539, "train_info/time_within_train_step": 2.2874646186828613, "step": 539} +{"train_info/time_between_train_steps": 0.0031273365020751953, "step": 539} +{"info/global_step": 540, "train_info/time_within_train_step": 2.2878170013427734, "step": 540} +{"train_info/time_between_train_steps": 0.0032606124877929688, "step": 540} +{"info/global_step": 541, "train_info/time_within_train_step": 2.288723945617676, "step": 541} +{"train_info/time_between_train_steps": 0.0033349990844726562, "step": 541} +{"info/global_step": 542, "train_info/time_within_train_step": 2.2880051136016846, "step": 542} +{"train_info/time_between_train_steps": 0.0031707286834716797, "step": 542} +{"info/global_step": 543, "train_info/time_within_train_step": 2.288043260574341, "step": 543} +{"train_info/time_between_train_steps": 0.003137350082397461, "step": 543} +{"info/global_step": 544, "train_info/time_within_train_step": 2.288473129272461, "step": 544} +{"train_info/time_between_train_steps": 0.003152608871459961, "step": 544} +{"info/global_step": 545, "train_info/time_within_train_step": 2.2874209880828857, "step": 545} +{"train_info/time_between_train_steps": 0.0031249523162841797, "step": 545} +{"info/global_step": 546, "train_info/time_within_train_step": 2.286778211593628, "step": 546} +{"train_info/time_between_train_steps": 0.003112316131591797, "step": 546} +{"info/global_step": 547, "train_info/time_within_train_step": 2.2871854305267334, "step": 547} +{"train_info/time_between_train_steps": 0.003145933151245117, "step": 547} +{"info/global_step": 548, "train_info/time_within_train_step": 2.287728786468506, "step": 548} +{"train_info/time_between_train_steps": 0.0032434463500976562, "step": 548} +{"info/global_step": 549, "train_info/time_within_train_step": 2.287405252456665, "step": 549} +{"train_info/time_between_train_steps": 0.0031528472900390625, "step": 549} +{"info/global_step": 550, "train_info/time_within_train_step": 2.2879669666290283, "step": 550} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746345275, "_runtime": 1372}, "step": 550} +{"logs": {"train/loss": 4.6127, "train/learning_rate": 0.0005444444444444444, "train/epoch": 0.18, "_timestamp": 1746345275, "_runtime": 1372}, "step": 550} +{"train_info/time_between_train_steps": 0.023983478546142578, "step": 550} +{"info/global_step": 551, "train_info/time_within_train_step": 2.2875990867614746, "step": 551} +{"train_info/time_between_train_steps": 0.0031538009643554688, "step": 551} +{"info/global_step": 552, "train_info/time_within_train_step": 2.287182569503784, "step": 552} +{"train_info/time_between_train_steps": 0.0031571388244628906, "step": 552} +{"info/global_step": 553, "train_info/time_within_train_step": 2.2979209423065186, "step": 553} +{"train_info/time_between_train_steps": 0.0031652450561523438, "step": 553} +{"info/global_step": 554, "train_info/time_within_train_step": 2.2879297733306885, "step": 554} +{"train_info/time_between_train_steps": 0.003139019012451172, "step": 554} +{"info/global_step": 555, "train_info/time_within_train_step": 2.287454843521118, "step": 555} +{"train_info/time_between_train_steps": 0.003156423568725586, "step": 555} +{"info/global_step": 556, "train_info/time_within_train_step": 2.2878129482269287, "step": 556} +{"train_info/time_between_train_steps": 0.0031402111053466797, "step": 556} +{"info/global_step": 557, "train_info/time_within_train_step": 2.2884204387664795, "step": 557} +{"train_info/time_between_train_steps": 0.003191709518432617, "step": 557} +{"info/global_step": 558, "train_info/time_within_train_step": 2.2875702381134033, "step": 558} +{"train_info/time_between_train_steps": 0.003199338912963867, "step": 558} +{"info/global_step": 559, "train_info/time_within_train_step": 2.536106824874878, "step": 559} +{"train_info/time_between_train_steps": 0.0031774044036865234, "step": 559} +{"info/global_step": 560, "train_info/time_within_train_step": 2.287421941757202, "step": 560} +{"train_info/time_between_train_steps": 0.0031270980834960938, "step": 560} +{"info/global_step": 561, "train_info/time_within_train_step": 2.287648916244507, "step": 561} +{"train_info/time_between_train_steps": 0.0033936500549316406, "step": 561} +{"info/global_step": 562, "train_info/time_within_train_step": 2.288550615310669, "step": 562} +{"train_info/time_between_train_steps": 0.0031480789184570312, "step": 562} +{"info/global_step": 563, "train_info/time_within_train_step": 2.4323830604553223, "step": 563} +{"train_info/time_between_train_steps": 0.0031626224517822266, "step": 563} +{"info/global_step": 564, "train_info/time_within_train_step": 2.28772234916687, "step": 564} +{"train_info/time_between_train_steps": 0.0031554698944091797, "step": 564} +{"info/global_step": 565, "train_info/time_within_train_step": 2.286362648010254, "step": 565} +{"train_info/time_between_train_steps": 0.003195047378540039, "step": 565} +{"info/global_step": 566, "train_info/time_within_train_step": 2.2880711555480957, "step": 566} +{"train_info/time_between_train_steps": 0.0031507015228271484, "step": 566} +{"info/global_step": 567, "train_info/time_within_train_step": 2.2872653007507324, "step": 567} +{"train_info/time_between_train_steps": 0.003130197525024414, "step": 567} +{"info/global_step": 568, "train_info/time_within_train_step": 2.287024736404419, "step": 568} +{"train_info/time_between_train_steps": 0.0031557083129882812, "step": 568} +{"info/global_step": 569, "train_info/time_within_train_step": 2.2868001461029053, "step": 569} +{"train_info/time_between_train_steps": 0.0031561851501464844, "step": 569} +{"info/global_step": 570, "train_info/time_within_train_step": 2.287715196609497, "step": 570} +{"train_info/time_between_train_steps": 0.003224611282348633, "step": 570} +{"info/global_step": 571, "train_info/time_within_train_step": 2.2872610092163086, "step": 571} +{"train_info/time_between_train_steps": 0.003130674362182617, "step": 571} +{"info/global_step": 572, "train_info/time_within_train_step": 2.287449359893799, "step": 572} +{"train_info/time_between_train_steps": 0.0032165050506591797, "step": 572} +{"info/global_step": 573, "train_info/time_within_train_step": 2.2871105670928955, "step": 573} +{"train_info/time_between_train_steps": 0.003188610076904297, "step": 573} +{"info/global_step": 574, "train_info/time_within_train_step": 2.287142276763916, "step": 574} +{"train_info/time_between_train_steps": 0.0032007694244384766, "step": 574} +{"info/global_step": 575, "train_info/time_within_train_step": 2.2869770526885986, "step": 575} +{"train_info/time_between_train_steps": 0.003170013427734375, "step": 575} +{"info/global_step": 576, "train_info/time_within_train_step": 2.287278175354004, "step": 576} +{"train_info/time_between_train_steps": 0.003153562545776367, "step": 576} +{"info/global_step": 577, "train_info/time_within_train_step": 2.2871618270874023, "step": 577} +{"train_info/time_between_train_steps": 0.0031280517578125, "step": 577} +{"info/global_step": 578, "train_info/time_within_train_step": 2.296297550201416, "step": 578} +{"train_info/time_between_train_steps": 0.003111124038696289, "step": 578} +{"info/global_step": 579, "train_info/time_within_train_step": 2.2874507904052734, "step": 579} +{"train_info/time_between_train_steps": 0.003129243850708008, "step": 579} +{"info/global_step": 580, "train_info/time_within_train_step": 2.287447929382324, "step": 580} +{"train_info/time_between_train_steps": 0.0031571388244628906, "step": 580} +{"info/global_step": 581, "train_info/time_within_train_step": 2.28688645362854, "step": 581} +{"train_info/time_between_train_steps": 0.003194093704223633, "step": 581} +{"info/global_step": 582, "train_info/time_within_train_step": 2.2873942852020264, "step": 582} +{"train_info/time_between_train_steps": 0.0031397342681884766, "step": 582} +{"info/global_step": 583, "train_info/time_within_train_step": 2.28725004196167, "step": 583} +{"train_info/time_between_train_steps": 0.003159046173095703, "step": 583} +{"info/global_step": 584, "train_info/time_within_train_step": 2.288123369216919, "step": 584} +{"train_info/time_between_train_steps": 0.003121614456176758, "step": 584} +{"info/global_step": 585, "train_info/time_within_train_step": 2.28732967376709, "step": 585} +{"train_info/time_between_train_steps": 0.003133058547973633, "step": 585} +{"info/global_step": 586, "train_info/time_within_train_step": 2.2873799800872803, "step": 586} +{"train_info/time_between_train_steps": 0.003147602081298828, "step": 586} +{"info/global_step": 587, "train_info/time_within_train_step": 2.286990165710449, "step": 587} +{"train_info/time_between_train_steps": 0.003189563751220703, "step": 587} +{"info/global_step": 588, "train_info/time_within_train_step": 2.2871499061584473, "step": 588} +{"train_info/time_between_train_steps": 0.0032129287719726562, "step": 588} +{"info/global_step": 589, "train_info/time_within_train_step": 2.28678035736084, "step": 589} +{"train_info/time_between_train_steps": 0.0031969547271728516, "step": 589} +{"info/global_step": 590, "train_info/time_within_train_step": 2.2867889404296875, "step": 590} +{"train_info/time_between_train_steps": 0.0031659603118896484, "step": 590} +{"info/global_step": 591, "train_info/time_within_train_step": 2.2868435382843018, "step": 591} +{"train_info/time_between_train_steps": 0.0031659603118896484, "step": 591} +{"info/global_step": 592, "train_info/time_within_train_step": 2.2869913578033447, "step": 592} +{"train_info/time_between_train_steps": 0.0031664371490478516, "step": 592} +{"info/global_step": 593, "train_info/time_within_train_step": 2.2871053218841553, "step": 593} +{"train_info/time_between_train_steps": 0.003137826919555664, "step": 593} +{"info/global_step": 594, "train_info/time_within_train_step": 2.2868504524230957, "step": 594} +{"train_info/time_between_train_steps": 0.003195524215698242, "step": 594} +{"info/global_step": 595, "train_info/time_within_train_step": 2.287384271621704, "step": 595} +{"train_info/time_between_train_steps": 0.0031325817108154297, "step": 595} +{"info/global_step": 596, "train_info/time_within_train_step": 2.2864530086517334, "step": 596} +{"train_info/time_between_train_steps": 0.0032265186309814453, "step": 596} +{"info/global_step": 597, "train_info/time_within_train_step": 2.2867016792297363, "step": 597} +{"train_info/time_between_train_steps": 0.003192424774169922, "step": 597} +{"info/global_step": 598, "train_info/time_within_train_step": 2.287325859069824, "step": 598} +{"train_info/time_between_train_steps": 0.003199338912963867, "step": 598} +{"info/global_step": 599, "train_info/time_within_train_step": 2.2872300148010254, "step": 599} +{"train_info/time_between_train_steps": 0.0031461715698242188, "step": 599} +{"info/global_step": 600, "train_info/time_within_train_step": 2.2873497009277344, "step": 600} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746345391, "_runtime": 1488}, "step": 600} +{"logs": {"train/loss": 4.5206, "train/learning_rate": 0.0005333333333333333, "train/epoch": 0.2, "_timestamp": 1746345391, "_runtime": 1488}, "step": 600} +{"train_info/time_between_train_steps": 11.381881713867188, "step": 600} +{"info/global_step": 601, "train_info/time_within_train_step": 2.1163079738616943, "step": 601} +{"train_info/time_between_train_steps": 0.003185749053955078, "step": 601} +{"info/global_step": 602, "train_info/time_within_train_step": 2.104153871536255, "step": 602} +{"train_info/time_between_train_steps": 0.0031690597534179688, "step": 602} +{"info/global_step": 603, "train_info/time_within_train_step": 2.215461254119873, "step": 603} +{"train_info/time_between_train_steps": 0.0031654834747314453, "step": 603} +{"info/global_step": 604, "train_info/time_within_train_step": 2.285670280456543, "step": 604} +{"train_info/time_between_train_steps": 0.0031278133392333984, "step": 604} +{"info/global_step": 605, "train_info/time_within_train_step": 2.286295175552368, "step": 605} +{"train_info/time_between_train_steps": 0.003177642822265625, "step": 605} +{"info/global_step": 606, "train_info/time_within_train_step": 2.286235809326172, "step": 606} +{"train_info/time_between_train_steps": 0.003164529800415039, "step": 606} +{"info/global_step": 607, "train_info/time_within_train_step": 2.2860004901885986, "step": 607} +{"train_info/time_between_train_steps": 0.003125429153442383, "step": 607} +{"info/global_step": 608, "train_info/time_within_train_step": 2.285191774368286, "step": 608} +{"train_info/time_between_train_steps": 0.0032682418823242188, "step": 608} +{"info/global_step": 609, "train_info/time_within_train_step": 2.2864580154418945, "step": 609} +{"train_info/time_between_train_steps": 0.0031583309173583984, "step": 609} +{"info/global_step": 610, "train_info/time_within_train_step": 2.287365674972534, "step": 610} +{"train_info/time_between_train_steps": 0.0031533241271972656, "step": 610} +{"info/global_step": 611, "train_info/time_within_train_step": 2.2872190475463867, "step": 611} +{"train_info/time_between_train_steps": 0.003159046173095703, "step": 611} +{"info/global_step": 612, "train_info/time_within_train_step": 2.287088394165039, "step": 612} +{"train_info/time_between_train_steps": 0.003136157989501953, "step": 612} +{"info/global_step": 613, "train_info/time_within_train_step": 2.287959575653076, "step": 613} +{"train_info/time_between_train_steps": 0.00316619873046875, "step": 613} +{"info/global_step": 614, "train_info/time_within_train_step": 2.287299871444702, "step": 614} +{"train_info/time_between_train_steps": 0.0031862258911132812, "step": 614} +{"info/global_step": 615, "train_info/time_within_train_step": 2.2867729663848877, "step": 615} +{"train_info/time_between_train_steps": 0.0031409263610839844, "step": 615} +{"info/global_step": 616, "train_info/time_within_train_step": 2.287260055541992, "step": 616} +{"train_info/time_between_train_steps": 0.0031478404998779297, "step": 616} +{"info/global_step": 617, "train_info/time_within_train_step": 2.5378973484039307, "step": 617} +{"train_info/time_between_train_steps": 0.0032265186309814453, "step": 617} +{"info/global_step": 618, "train_info/time_within_train_step": 2.28763747215271, "step": 618} +{"train_info/time_between_train_steps": 0.003194570541381836, "step": 618} +{"info/global_step": 619, "train_info/time_within_train_step": 2.288041591644287, "step": 619} +{"train_info/time_between_train_steps": 0.003168344497680664, "step": 619} +{"info/global_step": 620, "train_info/time_within_train_step": 2.288145065307617, "step": 620} +{"train_info/time_between_train_steps": 0.003189563751220703, "step": 620} +{"info/global_step": 621, "train_info/time_within_train_step": 2.2884252071380615, "step": 621} +{"train_info/time_between_train_steps": 0.0031461715698242188, "step": 621} +{"info/global_step": 622, "train_info/time_within_train_step": 2.287809371948242, "step": 622} +{"train_info/time_between_train_steps": 0.0031828880310058594, "step": 622} +{"info/global_step": 623, "train_info/time_within_train_step": 2.28853178024292, "step": 623} +{"train_info/time_between_train_steps": 0.0031766891479492188, "step": 623} +{"info/global_step": 624, "train_info/time_within_train_step": 2.287754535675049, "step": 624} +{"train_info/time_between_train_steps": 0.0032014846801757812, "step": 624} +{"info/global_step": 625, "train_info/time_within_train_step": 2.2881720066070557, "step": 625} +{"train_info/time_between_train_steps": 0.12412762641906738, "step": 625} +{"info/global_step": 626, "train_info/time_within_train_step": 2.321791887283325, "step": 626} +{"train_info/time_between_train_steps": 0.00316619873046875, "step": 626} +{"info/global_step": 627, "train_info/time_within_train_step": 2.2880754470825195, "step": 627} +{"train_info/time_between_train_steps": 0.0031752586364746094, "step": 627} +{"info/global_step": 628, "train_info/time_within_train_step": 2.286795139312744, "step": 628} +{"train_info/time_between_train_steps": 0.003146648406982422, "step": 628} +{"info/global_step": 629, "train_info/time_within_train_step": 2.287095785140991, "step": 629} +{"train_info/time_between_train_steps": 0.0031800270080566406, "step": 629} +{"info/global_step": 630, "train_info/time_within_train_step": 2.301354169845581, "step": 630} +{"train_info/time_between_train_steps": 0.0031409263610839844, "step": 630} +{"info/global_step": 631, "train_info/time_within_train_step": 2.287262439727783, "step": 631} +{"train_info/time_between_train_steps": 0.003127574920654297, "step": 631} +{"info/global_step": 632, "train_info/time_within_train_step": 2.286785364151001, "step": 632} +{"train_info/time_between_train_steps": 0.0031909942626953125, "step": 632} +{"info/global_step": 633, "train_info/time_within_train_step": 2.303041696548462, "step": 633} +{"train_info/time_between_train_steps": 0.0032148361206054688, "step": 633} +{"info/global_step": 634, "train_info/time_within_train_step": 2.287142753601074, "step": 634} +{"train_info/time_between_train_steps": 0.003171682357788086, "step": 634} +{"info/global_step": 635, "train_info/time_within_train_step": 2.2873358726501465, "step": 635} +{"train_info/time_between_train_steps": 0.0031952857971191406, "step": 635} +{"info/global_step": 636, "train_info/time_within_train_step": 2.2872023582458496, "step": 636} +{"train_info/time_between_train_steps": 0.0031800270080566406, "step": 636} +{"info/global_step": 637, "train_info/time_within_train_step": 2.2870278358459473, "step": 637} +{"train_info/time_between_train_steps": 0.0031614303588867188, "step": 637} +{"info/global_step": 638, "train_info/time_within_train_step": 2.2870304584503174, "step": 638} +{"train_info/time_between_train_steps": 0.0031325817108154297, "step": 638} +{"info/global_step": 639, "train_info/time_within_train_step": 2.2873053550720215, "step": 639} +{"train_info/time_between_train_steps": 0.0031359195709228516, "step": 639} +{"info/global_step": 640, "train_info/time_within_train_step": 2.2877180576324463, "step": 640} +{"train_info/time_between_train_steps": 0.003180265426635742, "step": 640} +{"info/global_step": 641, "train_info/time_within_train_step": 2.28688645362854, "step": 641} +{"train_info/time_between_train_steps": 0.0031614303588867188, "step": 641} +{"info/global_step": 642, "train_info/time_within_train_step": 2.288032054901123, "step": 642} +{"train_info/time_between_train_steps": 0.0031495094299316406, "step": 642} +{"info/global_step": 643, "train_info/time_within_train_step": 2.2870194911956787, "step": 643} +{"train_info/time_between_train_steps": 0.0031414031982421875, "step": 643} +{"info/global_step": 644, "train_info/time_within_train_step": 2.2873375415802, "step": 644} +{"train_info/time_between_train_steps": 0.003156900405883789, "step": 644} +{"info/global_step": 645, "train_info/time_within_train_step": 2.2878432273864746, "step": 645} +{"train_info/time_between_train_steps": 0.0031294822692871094, "step": 645} +{"info/global_step": 646, "train_info/time_within_train_step": 2.2878611087799072, "step": 646} +{"train_info/time_between_train_steps": 0.003148317337036133, "step": 646} +{"info/global_step": 647, "train_info/time_within_train_step": 2.287668228149414, "step": 647} +{"train_info/time_between_train_steps": 0.003165006637573242, "step": 647} +{"info/global_step": 648, "train_info/time_within_train_step": 2.287822723388672, "step": 648} +{"train_info/time_between_train_steps": 0.0032329559326171875, "step": 648} +{"info/global_step": 649, "train_info/time_within_train_step": 2.287335157394409, "step": 649} +{"train_info/time_between_train_steps": 0.0031881332397460938, "step": 649} +{"info/global_step": 650, "train_info/time_within_train_step": 2.2875561714172363, "step": 650} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746345518, "_runtime": 1615}, "step": 650} +{"logs": {"train/loss": 4.4185, "train/learning_rate": 0.0005222222222222222, "train/epoch": 0.22, "_timestamp": 1746345518, "_runtime": 1615}, "step": 650} +{"train_info/time_between_train_steps": 0.024737119674682617, "step": 650} +{"info/global_step": 651, "train_info/time_within_train_step": 2.2879691123962402, "step": 651} +{"train_info/time_between_train_steps": 0.0031762123107910156, "step": 651} +{"info/global_step": 652, "train_info/time_within_train_step": 2.3201847076416016, "step": 652} +{"train_info/time_between_train_steps": 0.003161191940307617, "step": 652} +{"info/global_step": 653, "train_info/time_within_train_step": 2.287271738052368, "step": 653} +{"train_info/time_between_train_steps": 0.0031676292419433594, "step": 653} +{"info/global_step": 654, "train_info/time_within_train_step": 2.288377523422241, "step": 654} +{"train_info/time_between_train_steps": 0.0031545162200927734, "step": 654} +{"info/global_step": 655, "train_info/time_within_train_step": 2.2873966693878174, "step": 655} +{"train_info/time_between_train_steps": 0.003187417984008789, "step": 655} +{"info/global_step": 656, "train_info/time_within_train_step": 2.3013529777526855, "step": 656} +{"train_info/time_between_train_steps": 0.0031919479370117188, "step": 656} +{"info/global_step": 657, "train_info/time_within_train_step": 2.28726863861084, "step": 657} +{"train_info/time_between_train_steps": 0.0032317638397216797, "step": 657} +{"info/global_step": 658, "train_info/time_within_train_step": 2.2874820232391357, "step": 658} +{"train_info/time_between_train_steps": 0.003204345703125, "step": 658} +{"info/global_step": 659, "train_info/time_within_train_step": 2.3017642498016357, "step": 659} +{"train_info/time_between_train_steps": 0.00318145751953125, "step": 659} +{"info/global_step": 660, "train_info/time_within_train_step": 2.2874250411987305, "step": 660} +{"train_info/time_between_train_steps": 0.003170013427734375, "step": 660} +{"info/global_step": 661, "train_info/time_within_train_step": 2.287806272506714, "step": 661} +{"train_info/time_between_train_steps": 0.003161907196044922, "step": 661} +{"info/global_step": 662, "train_info/time_within_train_step": 2.2873473167419434, "step": 662} +{"train_info/time_between_train_steps": 0.003161907196044922, "step": 662} +{"info/global_step": 663, "train_info/time_within_train_step": 2.2885947227478027, "step": 663} +{"train_info/time_between_train_steps": 0.0031609535217285156, "step": 663} +{"info/global_step": 664, "train_info/time_within_train_step": 2.2874367237091064, "step": 664} +{"train_info/time_between_train_steps": 0.0031943321228027344, "step": 664} +{"info/global_step": 665, "train_info/time_within_train_step": 2.2875733375549316, "step": 665} +{"train_info/time_between_train_steps": 0.003164529800415039, "step": 665} +{"info/global_step": 666, "train_info/time_within_train_step": 2.288259744644165, "step": 666} +{"train_info/time_between_train_steps": 0.0031747817993164062, "step": 666} +{"info/global_step": 667, "train_info/time_within_train_step": 2.2876670360565186, "step": 667} +{"train_info/time_between_train_steps": 0.0032129287719726562, "step": 667} +{"info/global_step": 668, "train_info/time_within_train_step": 2.2877180576324463, "step": 668} +{"train_info/time_between_train_steps": 0.003183603286743164, "step": 668} +{"info/global_step": 669, "train_info/time_within_train_step": 2.5433707237243652, "step": 669} +{"train_info/time_between_train_steps": 0.0032041072845458984, "step": 669} +{"info/global_step": 670, "train_info/time_within_train_step": 2.2871651649475098, "step": 670} +{"train_info/time_between_train_steps": 0.0031349658966064453, "step": 670} +{"info/global_step": 671, "train_info/time_within_train_step": 2.2873599529266357, "step": 671} +{"train_info/time_between_train_steps": 0.003186941146850586, "step": 671} +{"info/global_step": 672, "train_info/time_within_train_step": 2.28765869140625, "step": 672} +{"train_info/time_between_train_steps": 0.0031545162200927734, "step": 672} +{"info/global_step": 673, "train_info/time_within_train_step": 2.2873973846435547, "step": 673} +{"train_info/time_between_train_steps": 0.0031585693359375, "step": 673} +{"info/global_step": 674, "train_info/time_within_train_step": 2.2875757217407227, "step": 674} +{"train_info/time_between_train_steps": 0.003184080123901367, "step": 674} +{"info/global_step": 675, "train_info/time_within_train_step": 2.2874879837036133, "step": 675} +{"train_info/time_between_train_steps": 0.0031538009643554688, "step": 675} +{"info/global_step": 676, "train_info/time_within_train_step": 2.2878150939941406, "step": 676} +{"train_info/time_between_train_steps": 0.00313568115234375, "step": 676} +{"info/global_step": 677, "train_info/time_within_train_step": 2.286970376968384, "step": 677} +{"train_info/time_between_train_steps": 0.003154754638671875, "step": 677} +{"info/global_step": 678, "train_info/time_within_train_step": 2.2869489192962646, "step": 678} +{"train_info/time_between_train_steps": 0.003117799758911133, "step": 678} +{"info/global_step": 679, "train_info/time_within_train_step": 2.2874486446380615, "step": 679} +{"train_info/time_between_train_steps": 0.003193378448486328, "step": 679} +{"info/global_step": 680, "train_info/time_within_train_step": 2.2871081829071045, "step": 680} +{"train_info/time_between_train_steps": 0.0032050609588623047, "step": 680} +{"info/global_step": 681, "train_info/time_within_train_step": 2.2872560024261475, "step": 681} +{"train_info/time_between_train_steps": 0.0031838417053222656, "step": 681} +{"info/global_step": 682, "train_info/time_within_train_step": 2.2870798110961914, "step": 682} +{"train_info/time_between_train_steps": 0.0031440258026123047, "step": 682} +{"info/global_step": 683, "train_info/time_within_train_step": 2.2871103286743164, "step": 683} +{"train_info/time_between_train_steps": 0.003143787384033203, "step": 683} +{"info/global_step": 684, "train_info/time_within_train_step": 2.287233829498291, "step": 684} +{"train_info/time_between_train_steps": 0.003124713897705078, "step": 684} +{"info/global_step": 685, "train_info/time_within_train_step": 2.287656545639038, "step": 685} +{"train_info/time_between_train_steps": 0.0031194686889648438, "step": 685} +{"info/global_step": 686, "train_info/time_within_train_step": 2.2871150970458984, "step": 686} +{"train_info/time_between_train_steps": 0.003144979476928711, "step": 686} +{"info/global_step": 687, "train_info/time_within_train_step": 2.2868738174438477, "step": 687} +{"train_info/time_between_train_steps": 0.0032129287719726562, "step": 687} +{"info/global_step": 688, "train_info/time_within_train_step": 2.410083055496216, "step": 688} +{"train_info/time_between_train_steps": 0.0031969547271728516, "step": 688} +{"info/global_step": 689, "train_info/time_within_train_step": 2.287533760070801, "step": 689} +{"train_info/time_between_train_steps": 0.0031843185424804688, "step": 689} +{"info/global_step": 690, "train_info/time_within_train_step": 2.287846326828003, "step": 690} +{"train_info/time_between_train_steps": 0.003202676773071289, "step": 690} +{"info/global_step": 691, "train_info/time_within_train_step": 2.2875113487243652, "step": 691} +{"train_info/time_between_train_steps": 0.0031523704528808594, "step": 691} +{"info/global_step": 692, "train_info/time_within_train_step": 2.288011074066162, "step": 692} +{"train_info/time_between_train_steps": 0.0031609535217285156, "step": 692} +{"info/global_step": 693, "train_info/time_within_train_step": 2.2881786823272705, "step": 693} +{"train_info/time_between_train_steps": 0.003136873245239258, "step": 693} +{"info/global_step": 694, "train_info/time_within_train_step": 2.2880399227142334, "step": 694} +{"train_info/time_between_train_steps": 0.003174304962158203, "step": 694} +{"info/global_step": 695, "train_info/time_within_train_step": 2.2873921394348145, "step": 695} +{"train_info/time_between_train_steps": 0.0031538009643554688, "step": 695} +{"info/global_step": 696, "train_info/time_within_train_step": 2.288020610809326, "step": 696} +{"train_info/time_between_train_steps": 0.003184795379638672, "step": 696} +{"info/global_step": 697, "train_info/time_within_train_step": 2.2878315448760986, "step": 697} +{"train_info/time_between_train_steps": 0.0031430721282958984, "step": 697} +{"info/global_step": 698, "train_info/time_within_train_step": 2.2873306274414062, "step": 698} +{"train_info/time_between_train_steps": 0.003152132034301758, "step": 698} +{"info/global_step": 699, "train_info/time_within_train_step": 2.2868030071258545, "step": 699} +{"train_info/time_between_train_steps": 0.0031404495239257812, "step": 699} +{"info/global_step": 700, "train_info/time_within_train_step": 2.2867064476013184, "step": 700} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746345634, "_runtime": 1731}, "step": 700} +{"logs": {"train/loss": 4.3261, "train/learning_rate": 0.0005111111111111111, "train/epoch": 0.23, "_timestamp": 1746345634, "_runtime": 1731}, "step": 700} +{"train_info/time_between_train_steps": 12.627620458602905, "step": 700} +{"info/global_step": 701, "train_info/time_within_train_step": 2.113818645477295, "step": 701} +{"train_info/time_between_train_steps": 0.0031626224517822266, "step": 701} +{"info/global_step": 702, "train_info/time_within_train_step": 2.0991053581237793, "step": 702} +{"train_info/time_between_train_steps": 0.003249645233154297, "step": 702} +{"info/global_step": 703, "train_info/time_within_train_step": 2.1986801624298096, "step": 703} +{"train_info/time_between_train_steps": 0.0032377243041992188, "step": 703} +{"info/global_step": 704, "train_info/time_within_train_step": 2.285125255584717, "step": 704} +{"train_info/time_between_train_steps": 0.0031862258911132812, "step": 704} +{"info/global_step": 705, "train_info/time_within_train_step": 2.2857272624969482, "step": 705} +{"train_info/time_between_train_steps": 0.003173351287841797, "step": 705} +{"info/global_step": 706, "train_info/time_within_train_step": 2.285918951034546, "step": 706} +{"train_info/time_between_train_steps": 0.0032176971435546875, "step": 706} +{"info/global_step": 707, "train_info/time_within_train_step": 2.286201238632202, "step": 707} +{"train_info/time_between_train_steps": 0.0031461715698242188, "step": 707} +{"info/global_step": 708, "train_info/time_within_train_step": 2.286386251449585, "step": 708} +{"train_info/time_between_train_steps": 0.0031480789184570312, "step": 708} +{"info/global_step": 709, "train_info/time_within_train_step": 2.2871007919311523, "step": 709} +{"train_info/time_between_train_steps": 0.0031719207763671875, "step": 709} +{"info/global_step": 710, "train_info/time_within_train_step": 2.287480115890503, "step": 710} +{"train_info/time_between_train_steps": 0.0031478404998779297, "step": 710} +{"info/global_step": 711, "train_info/time_within_train_step": 2.287508249282837, "step": 711} +{"train_info/time_between_train_steps": 0.003186941146850586, "step": 711} +{"info/global_step": 712, "train_info/time_within_train_step": 2.2871696949005127, "step": 712} +{"train_info/time_between_train_steps": 0.003171682357788086, "step": 712} +{"info/global_step": 713, "train_info/time_within_train_step": 2.287367105484009, "step": 713} +{"train_info/time_between_train_steps": 0.0031630992889404297, "step": 713} +{"info/global_step": 714, "train_info/time_within_train_step": 2.2868869304656982, "step": 714} +{"train_info/time_between_train_steps": 0.0031785964965820312, "step": 714} +{"info/global_step": 715, "train_info/time_within_train_step": 2.5455524921417236, "step": 715} +{"train_info/time_between_train_steps": 0.0031518936157226562, "step": 715} +{"info/global_step": 716, "train_info/time_within_train_step": 2.2868430614471436, "step": 716} +{"train_info/time_between_train_steps": 0.003180265426635742, "step": 716} +{"info/global_step": 717, "train_info/time_within_train_step": 2.2866604328155518, "step": 717} +{"train_info/time_between_train_steps": 0.0031332969665527344, "step": 717} +{"info/global_step": 718, "train_info/time_within_train_step": 2.2868306636810303, "step": 718} +{"train_info/time_between_train_steps": 0.003165721893310547, "step": 718} +{"info/global_step": 719, "train_info/time_within_train_step": 2.286181926727295, "step": 719} +{"train_info/time_between_train_steps": 0.0032110214233398438, "step": 719} +{"info/global_step": 720, "train_info/time_within_train_step": 2.2874133586883545, "step": 720} +{"train_info/time_between_train_steps": 0.0032203197479248047, "step": 720} +{"info/global_step": 721, "train_info/time_within_train_step": 2.286100149154663, "step": 721} +{"train_info/time_between_train_steps": 0.003186941146850586, "step": 721} +{"info/global_step": 722, "train_info/time_within_train_step": 2.2865636348724365, "step": 722} +{"train_info/time_between_train_steps": 0.0031561851501464844, "step": 722} +{"info/global_step": 723, "train_info/time_within_train_step": 2.2872817516326904, "step": 723} +{"train_info/time_between_train_steps": 0.0031075477600097656, "step": 723} +{"info/global_step": 724, "train_info/time_within_train_step": 2.2865793704986572, "step": 724} +{"train_info/time_between_train_steps": 0.003148794174194336, "step": 724} +{"info/global_step": 725, "train_info/time_within_train_step": 2.2873287200927734, "step": 725} +{"train_info/time_between_train_steps": 0.0031194686889648438, "step": 725} +{"info/global_step": 726, "train_info/time_within_train_step": 2.2868409156799316, "step": 726} +{"train_info/time_between_train_steps": 0.003161191940307617, "step": 726} +{"info/global_step": 727, "train_info/time_within_train_step": 2.2870395183563232, "step": 727} +{"train_info/time_between_train_steps": 0.0031747817993164062, "step": 727} +{"info/global_step": 728, "train_info/time_within_train_step": 2.2874109745025635, "step": 728} +{"train_info/time_between_train_steps": 0.00318145751953125, "step": 728} +{"info/global_step": 729, "train_info/time_within_train_step": 2.2884035110473633, "step": 729} +{"train_info/time_between_train_steps": 0.003145456314086914, "step": 729} +{"info/global_step": 730, "train_info/time_within_train_step": 2.2876667976379395, "step": 730} +{"train_info/time_between_train_steps": 0.003167390823364258, "step": 730} +{"info/global_step": 731, "train_info/time_within_train_step": 2.2874817848205566, "step": 731} +{"train_info/time_between_train_steps": 0.003185272216796875, "step": 731} +{"info/global_step": 732, "train_info/time_within_train_step": 2.287015914916992, "step": 732} +{"train_info/time_between_train_steps": 0.003108501434326172, "step": 732} +{"info/global_step": 733, "train_info/time_within_train_step": 2.2878918647766113, "step": 733} +{"train_info/time_between_train_steps": 0.0031366348266601562, "step": 733} +{"info/global_step": 734, "train_info/time_within_train_step": 2.2868711948394775, "step": 734} +{"train_info/time_between_train_steps": 0.0032117366790771484, "step": 734} +{"info/global_step": 735, "train_info/time_within_train_step": 2.286717414855957, "step": 735} +{"train_info/time_between_train_steps": 0.0031936168670654297, "step": 735} +{"info/global_step": 736, "train_info/time_within_train_step": 2.2873125076293945, "step": 736} +{"train_info/time_between_train_steps": 0.0031566619873046875, "step": 736} +{"info/global_step": 737, "train_info/time_within_train_step": 2.287445306777954, "step": 737} +{"train_info/time_between_train_steps": 0.0031440258026123047, "step": 737} +{"info/global_step": 738, "train_info/time_within_train_step": 2.2866342067718506, "step": 738} +{"train_info/time_between_train_steps": 0.0031321048736572266, "step": 738} +{"info/global_step": 739, "train_info/time_within_train_step": 2.2871153354644775, "step": 739} +{"train_info/time_between_train_steps": 0.0031266212463378906, "step": 739} +{"info/global_step": 740, "train_info/time_within_train_step": 2.287193775177002, "step": 740} +{"train_info/time_between_train_steps": 0.003136873245239258, "step": 740} +{"info/global_step": 741, "train_info/time_within_train_step": 2.286557197570801, "step": 741} +{"train_info/time_between_train_steps": 0.0031850337982177734, "step": 741} +{"info/global_step": 742, "train_info/time_within_train_step": 2.2866663932800293, "step": 742} +{"train_info/time_between_train_steps": 0.0032196044921875, "step": 742} +{"info/global_step": 743, "train_info/time_within_train_step": 2.286569595336914, "step": 743} +{"train_info/time_between_train_steps": 0.0032944679260253906, "step": 743} +{"info/global_step": 744, "train_info/time_within_train_step": 2.2876155376434326, "step": 744} +{"train_info/time_between_train_steps": 0.003521442413330078, "step": 744} +{"info/global_step": 745, "train_info/time_within_train_step": 2.287710428237915, "step": 745} +{"train_info/time_between_train_steps": 0.0037221908569335938, "step": 745} +{"info/global_step": 746, "train_info/time_within_train_step": 2.287222146987915, "step": 746} +{"train_info/time_between_train_steps": 0.0035011768341064453, "step": 746} +{"info/global_step": 747, "train_info/time_within_train_step": 2.2869510650634766, "step": 747} +{"train_info/time_between_train_steps": 0.003457307815551758, "step": 747} +{"info/global_step": 748, "train_info/time_within_train_step": 2.287458896636963, "step": 748} +{"train_info/time_between_train_steps": 0.0035181045532226562, "step": 748} +{"info/global_step": 749, "train_info/time_within_train_step": 2.287374496459961, "step": 749} +{"train_info/time_between_train_steps": 0.0035200119018554688, "step": 749} +{"info/global_step": 750, "train_info/time_within_train_step": 2.5909109115600586, "step": 750} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746345763, "_runtime": 1860}, "step": 750} +{"logs": {"train/loss": 4.2372, "train/learning_rate": 0.0005, "train/epoch": 0.25, "_timestamp": 1746345763, "_runtime": 1860}, "step": 750} +{"train_info/time_between_train_steps": 0.14646029472351074, "step": 750} +{"info/global_step": 751, "train_info/time_within_train_step": 2.2872376441955566, "step": 751} +{"train_info/time_between_train_steps": 0.0032880306243896484, "step": 751} +{"info/global_step": 752, "train_info/time_within_train_step": 2.320772647857666, "step": 752} +{"train_info/time_between_train_steps": 0.003302335739135742, "step": 752} +{"info/global_step": 753, "train_info/time_within_train_step": 2.2873613834381104, "step": 753} +{"train_info/time_between_train_steps": 0.0033206939697265625, "step": 753} +{"info/global_step": 754, "train_info/time_within_train_step": 2.287524700164795, "step": 754} +{"train_info/time_between_train_steps": 0.003278970718383789, "step": 754} +{"info/global_step": 755, "train_info/time_within_train_step": 2.2875280380249023, "step": 755} +{"train_info/time_between_train_steps": 0.003320455551147461, "step": 755} +{"info/global_step": 756, "train_info/time_within_train_step": 2.287621259689331, "step": 756} +{"train_info/time_between_train_steps": 0.003259420394897461, "step": 756} +{"info/global_step": 757, "train_info/time_within_train_step": 2.287978172302246, "step": 757} +{"train_info/time_between_train_steps": 0.003358125686645508, "step": 757} +{"info/global_step": 758, "train_info/time_within_train_step": 2.28849458694458, "step": 758} +{"train_info/time_between_train_steps": 0.0034842491149902344, "step": 758} +{"info/global_step": 759, "train_info/time_within_train_step": 2.2896854877471924, "step": 759} +{"train_info/time_between_train_steps": 0.0035932064056396484, "step": 759} +{"info/global_step": 760, "train_info/time_within_train_step": 2.288754463195801, "step": 760} +{"train_info/time_between_train_steps": 0.0037555694580078125, "step": 760} +{"info/global_step": 761, "train_info/time_within_train_step": 2.2881083488464355, "step": 761} +{"train_info/time_between_train_steps": 0.0036416053771972656, "step": 761} +{"info/global_step": 762, "train_info/time_within_train_step": 2.287836790084839, "step": 762} +{"train_info/time_between_train_steps": 0.003679513931274414, "step": 762} +{"info/global_step": 763, "train_info/time_within_train_step": 2.2879722118377686, "step": 763} +{"train_info/time_between_train_steps": 0.0036787986755371094, "step": 763} +{"info/global_step": 764, "train_info/time_within_train_step": 2.2877750396728516, "step": 764} +{"train_info/time_between_train_steps": 0.0036818981170654297, "step": 764} +{"info/global_step": 765, "train_info/time_within_train_step": 2.287543296813965, "step": 765} +{"train_info/time_between_train_steps": 0.0035653114318847656, "step": 765} +{"info/global_step": 766, "train_info/time_within_train_step": 2.2872726917266846, "step": 766} +{"train_info/time_between_train_steps": 0.003663778305053711, "step": 766} +{"info/global_step": 767, "train_info/time_within_train_step": 2.286637783050537, "step": 767} +{"train_info/time_between_train_steps": 0.0035877227783203125, "step": 767} +{"info/global_step": 768, "train_info/time_within_train_step": 2.287642240524292, "step": 768} +{"train_info/time_between_train_steps": 0.0035631656646728516, "step": 768} +{"info/global_step": 769, "train_info/time_within_train_step": 2.2875993251800537, "step": 769} +{"train_info/time_between_train_steps": 0.0035583972930908203, "step": 769} +{"info/global_step": 770, "train_info/time_within_train_step": 2.287447929382324, "step": 770} +{"train_info/time_between_train_steps": 0.0035305023193359375, "step": 770} +{"info/global_step": 771, "train_info/time_within_train_step": 2.287977933883667, "step": 771} +{"train_info/time_between_train_steps": 0.003598451614379883, "step": 771} +{"info/global_step": 772, "train_info/time_within_train_step": 2.2879738807678223, "step": 772} +{"train_info/time_between_train_steps": 0.0036041736602783203, "step": 772} +{"info/global_step": 773, "train_info/time_within_train_step": 2.2883856296539307, "step": 773} +{"train_info/time_between_train_steps": 0.003581523895263672, "step": 773} +{"info/global_step": 774, "train_info/time_within_train_step": 2.288179397583008, "step": 774} +{"train_info/time_between_train_steps": 0.0036094188690185547, "step": 774} +{"info/global_step": 775, "train_info/time_within_train_step": 2.2878596782684326, "step": 775} +{"train_info/time_between_train_steps": 0.0035758018493652344, "step": 775} +{"info/global_step": 776, "train_info/time_within_train_step": 2.2876806259155273, "step": 776} +{"train_info/time_between_train_steps": 0.003509998321533203, "step": 776} +{"info/global_step": 777, "train_info/time_within_train_step": 2.2881581783294678, "step": 777} +{"train_info/time_between_train_steps": 0.003523588180541992, "step": 777} +{"info/global_step": 778, "train_info/time_within_train_step": 2.320094108581543, "step": 778} +{"train_info/time_between_train_steps": 0.003548145294189453, "step": 778} +{"info/global_step": 779, "train_info/time_within_train_step": 2.288135051727295, "step": 779} +{"train_info/time_between_train_steps": 0.0035626888275146484, "step": 779} +{"info/global_step": 780, "train_info/time_within_train_step": 2.306748867034912, "step": 780} +{"train_info/time_between_train_steps": 0.0030875205993652344, "step": 780} +{"info/global_step": 781, "train_info/time_within_train_step": 2.2864584922790527, "step": 781} +{"train_info/time_between_train_steps": 0.0030944347381591797, "step": 781} +{"info/global_step": 782, "train_info/time_within_train_step": 2.286295175552368, "step": 782} +{"train_info/time_between_train_steps": 0.003003835678100586, "step": 782} +{"info/global_step": 783, "train_info/time_within_train_step": 2.2864573001861572, "step": 783} +{"train_info/time_between_train_steps": 0.0030019283294677734, "step": 783} +{"info/global_step": 784, "train_info/time_within_train_step": 2.2852885723114014, "step": 784} +{"train_info/time_between_train_steps": 0.0030210018157958984, "step": 784} +{"info/global_step": 785, "train_info/time_within_train_step": 2.2858827114105225, "step": 785} +{"train_info/time_between_train_steps": 0.003020763397216797, "step": 785} +{"info/global_step": 786, "train_info/time_within_train_step": 2.2856740951538086, "step": 786} +{"train_info/time_between_train_steps": 0.003062725067138672, "step": 786} +{"info/global_step": 787, "train_info/time_within_train_step": 2.285029888153076, "step": 787} +{"train_info/time_between_train_steps": 0.002989530563354492, "step": 787} +{"info/global_step": 788, "train_info/time_within_train_step": 2.2851929664611816, "step": 788} +{"train_info/time_between_train_steps": 0.003125905990600586, "step": 788} +{"info/global_step": 789, "train_info/time_within_train_step": 2.2853198051452637, "step": 789} +{"train_info/time_between_train_steps": 0.003114938735961914, "step": 789} +{"info/global_step": 790, "train_info/time_within_train_step": 2.2869484424591064, "step": 790} +{"train_info/time_between_train_steps": 0.0031855106353759766, "step": 790} +{"info/global_step": 791, "train_info/time_within_train_step": 2.286890745162964, "step": 791} +{"train_info/time_between_train_steps": 0.003152132034301758, "step": 791} +{"info/global_step": 792, "train_info/time_within_train_step": 2.2864949703216553, "step": 792} +{"train_info/time_between_train_steps": 0.003144502639770508, "step": 792} +{"info/global_step": 793, "train_info/time_within_train_step": 2.2861573696136475, "step": 793} +{"train_info/time_between_train_steps": 0.003137826919555664, "step": 793} +{"info/global_step": 794, "train_info/time_within_train_step": 2.286515712738037, "step": 794} +{"train_info/time_between_train_steps": 0.0031278133392333984, "step": 794} +{"info/global_step": 795, "train_info/time_within_train_step": 2.2863657474517822, "step": 795} +{"train_info/time_between_train_steps": 0.003150463104248047, "step": 795} +{"info/global_step": 796, "train_info/time_within_train_step": 2.287018299102783, "step": 796} +{"train_info/time_between_train_steps": 0.0030739307403564453, "step": 796} +{"info/global_step": 797, "train_info/time_within_train_step": 2.286937713623047, "step": 797} +{"train_info/time_between_train_steps": 0.0031325817108154297, "step": 797} +{"info/global_step": 798, "train_info/time_within_train_step": 2.2867119312286377, "step": 798} +{"train_info/time_between_train_steps": 0.0031185150146484375, "step": 798} +{"info/global_step": 799, "train_info/time_within_train_step": 2.286844253540039, "step": 799} +{"train_info/time_between_train_steps": 0.0030813217163085938, "step": 799} +{"info/global_step": 800, "train_info/time_within_train_step": 2.286761522293091, "step": 800} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746345878, "_runtime": 1975}, "step": 800} +{"logs": {"train/loss": 4.1649, "train/learning_rate": 0.0004888888888888889, "train/epoch": 0.27, "_timestamp": 1746345878, "_runtime": 1975}, "step": 800} +{"train_info/time_between_train_steps": 11.632420539855957, "step": 800} +{"info/global_step": 801, "train_info/time_within_train_step": 2.111112594604492, "step": 801} +{"train_info/time_between_train_steps": 0.0030677318572998047, "step": 801} +{"info/global_step": 802, "train_info/time_within_train_step": 2.1000561714172363, "step": 802} +{"train_info/time_between_train_steps": 0.0031261444091796875, "step": 802} +{"info/global_step": 803, "train_info/time_within_train_step": 2.2316548824310303, "step": 803} +{"train_info/time_between_train_steps": 0.003086566925048828, "step": 803} +{"info/global_step": 804, "train_info/time_within_train_step": 2.5955238342285156, "step": 804} +{"train_info/time_between_train_steps": 0.0029554367065429688, "step": 804} +{"info/global_step": 805, "train_info/time_within_train_step": 2.283848524093628, "step": 805} +{"train_info/time_between_train_steps": 0.002881288528442383, "step": 805} +{"info/global_step": 806, "train_info/time_within_train_step": 2.284209966659546, "step": 806} +{"train_info/time_between_train_steps": 0.0028908252716064453, "step": 806} +{"info/global_step": 807, "train_info/time_within_train_step": 2.284507989883423, "step": 807} +{"train_info/time_between_train_steps": 0.003108978271484375, "step": 807} +{"info/global_step": 808, "train_info/time_within_train_step": 2.2855257987976074, "step": 808} +{"train_info/time_between_train_steps": 0.0031518936157226562, "step": 808} +{"info/global_step": 809, "train_info/time_within_train_step": 2.2850911617279053, "step": 809} +{"train_info/time_between_train_steps": 0.0031468868255615234, "step": 809} +{"info/global_step": 810, "train_info/time_within_train_step": 2.2851362228393555, "step": 810} +{"train_info/time_between_train_steps": 0.003070831298828125, "step": 810} +{"info/global_step": 811, "train_info/time_within_train_step": 2.2853617668151855, "step": 811} +{"train_info/time_between_train_steps": 0.0031266212463378906, "step": 811} +{"info/global_step": 812, "train_info/time_within_train_step": 2.2864370346069336, "step": 812} +{"train_info/time_between_train_steps": 0.003131389617919922, "step": 812} +{"info/global_step": 813, "train_info/time_within_train_step": 2.2853212356567383, "step": 813} +{"train_info/time_between_train_steps": 0.0030884742736816406, "step": 813} +{"info/global_step": 814, "train_info/time_within_train_step": 2.2861099243164062, "step": 814} +{"train_info/time_between_train_steps": 0.0030493736267089844, "step": 814} +{"info/global_step": 815, "train_info/time_within_train_step": 2.28564453125, "step": 815} +{"train_info/time_between_train_steps": 0.003083467483520508, "step": 815} +{"info/global_step": 816, "train_info/time_within_train_step": 2.2857234477996826, "step": 816} +{"train_info/time_between_train_steps": 0.0031032562255859375, "step": 816} +{"info/global_step": 817, "train_info/time_within_train_step": 2.28599214553833, "step": 817} +{"train_info/time_between_train_steps": 0.003051280975341797, "step": 817} +{"info/global_step": 818, "train_info/time_within_train_step": 2.286419153213501, "step": 818} +{"train_info/time_between_train_steps": 0.003101825714111328, "step": 818} +{"info/global_step": 819, "train_info/time_within_train_step": 2.286595344543457, "step": 819} +{"train_info/time_between_train_steps": 0.003091096878051758, "step": 819} +{"info/global_step": 820, "train_info/time_within_train_step": 2.287177801132202, "step": 820} +{"train_info/time_between_train_steps": 0.0031042098999023438, "step": 820} +{"info/global_step": 821, "train_info/time_within_train_step": 2.2868447303771973, "step": 821} +{"train_info/time_between_train_steps": 0.0029981136322021484, "step": 821} +{"info/global_step": 822, "train_info/time_within_train_step": 2.2865922451019287, "step": 822} +{"train_info/time_between_train_steps": 0.0029921531677246094, "step": 822} +{"info/global_step": 823, "train_info/time_within_train_step": 2.286438226699829, "step": 823} +{"train_info/time_between_train_steps": 0.0030319690704345703, "step": 823} +{"info/global_step": 824, "train_info/time_within_train_step": 2.2872087955474854, "step": 824} +{"train_info/time_between_train_steps": 0.003060579299926758, "step": 824} +{"info/global_step": 825, "train_info/time_within_train_step": 2.2871510982513428, "step": 825} +{"train_info/time_between_train_steps": 0.0030744075775146484, "step": 825} +{"info/global_step": 826, "train_info/time_within_train_step": 2.2862019538879395, "step": 826} +{"train_info/time_between_train_steps": 0.003076791763305664, "step": 826} +{"info/global_step": 827, "train_info/time_within_train_step": 2.2859671115875244, "step": 827} +{"train_info/time_between_train_steps": 0.0030498504638671875, "step": 827} +{"info/global_step": 828, "train_info/time_within_train_step": 2.285515546798706, "step": 828} +{"train_info/time_between_train_steps": 0.0030443668365478516, "step": 828} +{"info/global_step": 829, "train_info/time_within_train_step": 2.2864558696746826, "step": 829} +{"train_info/time_between_train_steps": 0.0031223297119140625, "step": 829} +{"info/global_step": 830, "train_info/time_within_train_step": 2.286206007003784, "step": 830} +{"train_info/time_between_train_steps": 0.0029838085174560547, "step": 830} +{"info/global_step": 831, "train_info/time_within_train_step": 2.286017894744873, "step": 831} +{"train_info/time_between_train_steps": 0.0029840469360351562, "step": 831} +{"info/global_step": 832, "train_info/time_within_train_step": 2.286255359649658, "step": 832} +{"train_info/time_between_train_steps": 0.003027200698852539, "step": 832} +{"info/global_step": 833, "train_info/time_within_train_step": 2.285681962966919, "step": 833} +{"train_info/time_between_train_steps": 0.003053426742553711, "step": 833} +{"info/global_step": 834, "train_info/time_within_train_step": 2.286541700363159, "step": 834} +{"train_info/time_between_train_steps": 0.003056049346923828, "step": 834} +{"info/global_step": 835, "train_info/time_within_train_step": 2.2860376834869385, "step": 835} +{"train_info/time_between_train_steps": 0.002966642379760742, "step": 835} +{"info/global_step": 836, "train_info/time_within_train_step": 2.2864768505096436, "step": 836} +{"train_info/time_between_train_steps": 0.0030355453491210938, "step": 836} +{"info/global_step": 837, "train_info/time_within_train_step": 2.285923719406128, "step": 837} +{"train_info/time_between_train_steps": 0.002940654754638672, "step": 837} +{"info/global_step": 838, "train_info/time_within_train_step": 2.287135124206543, "step": 838} +{"train_info/time_between_train_steps": 0.00298309326171875, "step": 838} +{"info/global_step": 839, "train_info/time_within_train_step": 2.2866523265838623, "step": 839} +{"train_info/time_between_train_steps": 0.002993345260620117, "step": 839} +{"info/global_step": 840, "train_info/time_within_train_step": 2.2868356704711914, "step": 840} +{"train_info/time_between_train_steps": 0.003071308135986328, "step": 840} +{"info/global_step": 841, "train_info/time_within_train_step": 2.286116361618042, "step": 841} +{"train_info/time_between_train_steps": 0.00299835205078125, "step": 841} +{"info/global_step": 842, "train_info/time_within_train_step": 2.286505699157715, "step": 842} +{"train_info/time_between_train_steps": 0.0030565261840820312, "step": 842} +{"info/global_step": 843, "train_info/time_within_train_step": 2.287794828414917, "step": 843} +{"train_info/time_between_train_steps": 0.0029900074005126953, "step": 843} +{"info/global_step": 844, "train_info/time_within_train_step": 2.2861149311065674, "step": 844} +{"train_info/time_between_train_steps": 0.0031104087829589844, "step": 844} +{"info/global_step": 845, "train_info/time_within_train_step": 2.286015510559082, "step": 845} +{"train_info/time_between_train_steps": 0.0029757022857666016, "step": 845} +{"info/global_step": 846, "train_info/time_within_train_step": 2.2860610485076904, "step": 846} +{"train_info/time_between_train_steps": 0.003000020980834961, "step": 846} +{"info/global_step": 847, "train_info/time_within_train_step": 2.2857065200805664, "step": 847} +{"train_info/time_between_train_steps": 0.0030107498168945312, "step": 847} +{"info/global_step": 848, "train_info/time_within_train_step": 2.286013126373291, "step": 848} +{"train_info/time_between_train_steps": 0.002971172332763672, "step": 848} +{"info/global_step": 849, "train_info/time_within_train_step": 2.285212755203247, "step": 849} +{"train_info/time_between_train_steps": 0.0030171871185302734, "step": 849} +{"info/global_step": 850, "train_info/time_within_train_step": 2.2855141162872314, "step": 850} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746346005, "_runtime": 2102}, "step": 850} +{"logs": {"train/loss": 4.1126, "train/learning_rate": 0.0004777777777777777, "train/epoch": 0.28, "_timestamp": 1746346005, "_runtime": 2102}, "step": 850} +{"train_info/time_between_train_steps": 0.024573564529418945, "step": 850} +{"info/global_step": 851, "train_info/time_within_train_step": 2.285752773284912, "step": 851} +{"train_info/time_between_train_steps": 0.003087759017944336, "step": 851} +{"info/global_step": 852, "train_info/time_within_train_step": 2.286266326904297, "step": 852} +{"train_info/time_between_train_steps": 0.0029840469360351562, "step": 852} +{"info/global_step": 853, "train_info/time_within_train_step": 2.2855045795440674, "step": 853} +{"train_info/time_between_train_steps": 0.002967357635498047, "step": 853} +{"info/global_step": 854, "train_info/time_within_train_step": 2.2857720851898193, "step": 854} +{"train_info/time_between_train_steps": 0.0030069351196289062, "step": 854} +{"info/global_step": 855, "train_info/time_within_train_step": 2.2852554321289062, "step": 855} +{"train_info/time_between_train_steps": 0.00315093994140625, "step": 855} +{"info/global_step": 856, "train_info/time_within_train_step": 2.2869114875793457, "step": 856} +{"train_info/time_between_train_steps": 0.0029981136322021484, "step": 856} +{"info/global_step": 857, "train_info/time_within_train_step": 2.286187171936035, "step": 857} +{"train_info/time_between_train_steps": 0.003004312515258789, "step": 857} +{"info/global_step": 858, "train_info/time_within_train_step": 2.2857770919799805, "step": 858} +{"train_info/time_between_train_steps": 0.002971172332763672, "step": 858} +{"info/global_step": 859, "train_info/time_within_train_step": 2.2864785194396973, "step": 859} +{"train_info/time_between_train_steps": 0.002966165542602539, "step": 859} +{"info/global_step": 860, "train_info/time_within_train_step": 2.286608934402466, "step": 860} +{"train_info/time_between_train_steps": 0.0030624866485595703, "step": 860} +{"info/global_step": 861, "train_info/time_within_train_step": 2.286404609680176, "step": 861} +{"train_info/time_between_train_steps": 0.0030357837677001953, "step": 861} +{"info/global_step": 862, "train_info/time_within_train_step": 2.4984629154205322, "step": 862} +{"train_info/time_between_train_steps": 0.002960681915283203, "step": 862} +{"info/global_step": 863, "train_info/time_within_train_step": 2.2858896255493164, "step": 863} +{"train_info/time_between_train_steps": 0.00290679931640625, "step": 863} +{"info/global_step": 864, "train_info/time_within_train_step": 2.286109447479248, "step": 864} +{"train_info/time_between_train_steps": 0.002904176712036133, "step": 864} +{"info/global_step": 865, "train_info/time_within_train_step": 2.285984754562378, "step": 865} +{"train_info/time_between_train_steps": 0.0028944015502929688, "step": 865} +{"info/global_step": 866, "train_info/time_within_train_step": 2.285395860671997, "step": 866} +{"train_info/time_between_train_steps": 0.0028738975524902344, "step": 866} +{"info/global_step": 867, "train_info/time_within_train_step": 2.2852699756622314, "step": 867} +{"train_info/time_between_train_steps": 0.002901315689086914, "step": 867} +{"info/global_step": 868, "train_info/time_within_train_step": 2.285374879837036, "step": 868} +{"train_info/time_between_train_steps": 0.0028753280639648438, "step": 868} +{"info/global_step": 869, "train_info/time_within_train_step": 2.286428451538086, "step": 869} +{"train_info/time_between_train_steps": 0.002882719039916992, "step": 869} +{"info/global_step": 870, "train_info/time_within_train_step": 2.2844927310943604, "step": 870} +{"train_info/time_between_train_steps": 0.002873659133911133, "step": 870} +{"info/global_step": 871, "train_info/time_within_train_step": 2.284963607788086, "step": 871} +{"train_info/time_between_train_steps": 0.002948760986328125, "step": 871} +{"info/global_step": 872, "train_info/time_within_train_step": 2.2855193614959717, "step": 872} +{"train_info/time_between_train_steps": 0.002875804901123047, "step": 872} +{"info/global_step": 873, "train_info/time_within_train_step": 2.285191059112549, "step": 873} +{"train_info/time_between_train_steps": 0.002911090850830078, "step": 873} +{"info/global_step": 874, "train_info/time_within_train_step": 2.2858726978302, "step": 874} +{"train_info/time_between_train_steps": 0.0028908252716064453, "step": 874} +{"info/global_step": 875, "train_info/time_within_train_step": 2.285127878189087, "step": 875} +{"train_info/time_between_train_steps": 0.002900838851928711, "step": 875} +{"info/global_step": 876, "train_info/time_within_train_step": 2.2856032848358154, "step": 876} +{"train_info/time_between_train_steps": 0.002866029739379883, "step": 876} +{"info/global_step": 877, "train_info/time_within_train_step": 2.285491466522217, "step": 877} +{"train_info/time_between_train_steps": 0.002857685089111328, "step": 877} +{"info/global_step": 878, "train_info/time_within_train_step": 2.2863998413085938, "step": 878} +{"train_info/time_between_train_steps": 0.0028886795043945312, "step": 878} +{"info/global_step": 879, "train_info/time_within_train_step": 2.285637378692627, "step": 879} +{"train_info/time_between_train_steps": 0.002859830856323242, "step": 879} +{"info/global_step": 880, "train_info/time_within_train_step": 2.285297155380249, "step": 880} +{"train_info/time_between_train_steps": 0.0028934478759765625, "step": 880} +{"info/global_step": 881, "train_info/time_within_train_step": 2.2860374450683594, "step": 881} +{"train_info/time_between_train_steps": 0.0028808116912841797, "step": 881} +{"info/global_step": 882, "train_info/time_within_train_step": 2.286795139312744, "step": 882} +{"train_info/time_between_train_steps": 0.0029392242431640625, "step": 882} +{"info/global_step": 883, "train_info/time_within_train_step": 2.2859480381011963, "step": 883} +{"train_info/time_between_train_steps": 0.0028710365295410156, "step": 883} +{"info/global_step": 884, "train_info/time_within_train_step": 2.285595417022705, "step": 884} +{"train_info/time_between_train_steps": 0.0029191970825195312, "step": 884} +{"info/global_step": 885, "train_info/time_within_train_step": 2.285715103149414, "step": 885} +{"train_info/time_between_train_steps": 0.002853870391845703, "step": 885} +{"info/global_step": 886, "train_info/time_within_train_step": 2.286099910736084, "step": 886} +{"train_info/time_between_train_steps": 0.002856731414794922, "step": 886} +{"info/global_step": 887, "train_info/time_within_train_step": 2.286043167114258, "step": 887} +{"train_info/time_between_train_steps": 0.0028848648071289062, "step": 887} +{"info/global_step": 888, "train_info/time_within_train_step": 2.2859179973602295, "step": 888} +{"train_info/time_between_train_steps": 0.0029921531677246094, "step": 888} +{"info/global_step": 889, "train_info/time_within_train_step": 2.2850635051727295, "step": 889} +{"train_info/time_between_train_steps": 0.0028853416442871094, "step": 889} +{"info/global_step": 890, "train_info/time_within_train_step": 2.285283088684082, "step": 890} +{"train_info/time_between_train_steps": 0.0028929710388183594, "step": 890} +{"info/global_step": 891, "train_info/time_within_train_step": 2.2854745388031006, "step": 891} +{"train_info/time_between_train_steps": 0.0029370784759521484, "step": 891} +{"info/global_step": 892, "train_info/time_within_train_step": 2.2851433753967285, "step": 892} +{"train_info/time_between_train_steps": 0.002900838851928711, "step": 892} +{"info/global_step": 893, "train_info/time_within_train_step": 2.284327983856201, "step": 893} +{"train_info/time_between_train_steps": 0.002866029739379883, "step": 893} +{"info/global_step": 894, "train_info/time_within_train_step": 2.284752607345581, "step": 894} +{"train_info/time_between_train_steps": 0.0028738975524902344, "step": 894} +{"info/global_step": 895, "train_info/time_within_train_step": 2.2844958305358887, "step": 895} +{"train_info/time_between_train_steps": 0.002890348434448242, "step": 895} +{"info/global_step": 896, "train_info/time_within_train_step": 2.284909963607788, "step": 896} +{"train_info/time_between_train_steps": 0.0028715133666992188, "step": 896} +{"info/global_step": 897, "train_info/time_within_train_step": 2.284686326980591, "step": 897} +{"train_info/time_between_train_steps": 0.00292205810546875, "step": 897} +{"info/global_step": 898, "train_info/time_within_train_step": 2.2846853733062744, "step": 898} +{"train_info/time_between_train_steps": 0.002868175506591797, "step": 898} +{"info/global_step": 899, "train_info/time_within_train_step": 2.2846577167510986, "step": 899} +{"train_info/time_between_train_steps": 0.0028514862060546875, "step": 899} +{"info/global_step": 900, "train_info/time_within_train_step": 2.2856130599975586, "step": 900} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746346121, "_runtime": 2218}, "step": 900} +{"logs": {"train/loss": 4.0515, "train/learning_rate": 0.0004666666666666666, "train/epoch": 0.3, "_timestamp": 1746346121, "_runtime": 2218}, "step": 900} +{"train_info/time_between_train_steps": 11.390202760696411, "step": 900} +{"info/global_step": 901, "train_info/time_within_train_step": 2.1347620487213135, "step": 901} +{"train_info/time_between_train_steps": 0.0028922557830810547, "step": 901} +{"info/global_step": 902, "train_info/time_within_train_step": 2.244244337081909, "step": 902} +{"train_info/time_between_train_steps": 0.003447294235229492, "step": 902} +{"info/global_step": 903, "train_info/time_within_train_step": 2.2071452140808105, "step": 903} +{"train_info/time_between_train_steps": 0.003001689910888672, "step": 903} +{"info/global_step": 904, "train_info/time_within_train_step": 2.283853530883789, "step": 904} +{"train_info/time_between_train_steps": 0.0028815269470214844, "step": 904} +{"info/global_step": 905, "train_info/time_within_train_step": 2.2832815647125244, "step": 905} +{"train_info/time_between_train_steps": 0.0028731822967529297, "step": 905} +{"info/global_step": 906, "train_info/time_within_train_step": 2.284043073654175, "step": 906} +{"train_info/time_between_train_steps": 0.002889871597290039, "step": 906} +{"info/global_step": 907, "train_info/time_within_train_step": 2.285810947418213, "step": 907} +{"train_info/time_between_train_steps": 0.0029137134552001953, "step": 907} +{"info/global_step": 908, "train_info/time_within_train_step": 2.284986972808838, "step": 908} +{"train_info/time_between_train_steps": 0.0028934478759765625, "step": 908} +{"info/global_step": 909, "train_info/time_within_train_step": 2.2859745025634766, "step": 909} +{"train_info/time_between_train_steps": 0.0029413700103759766, "step": 909} +{"info/global_step": 910, "train_info/time_within_train_step": 2.2850840091705322, "step": 910} +{"train_info/time_between_train_steps": 0.002963542938232422, "step": 910} +{"info/global_step": 911, "train_info/time_within_train_step": 2.2854666709899902, "step": 911} +{"train_info/time_between_train_steps": 0.0029392242431640625, "step": 911} +{"info/global_step": 912, "train_info/time_within_train_step": 2.2850730419158936, "step": 912} +{"train_info/time_between_train_steps": 0.002946615219116211, "step": 912} +{"info/global_step": 913, "train_info/time_within_train_step": 2.284961700439453, "step": 913} +{"train_info/time_between_train_steps": 0.002910614013671875, "step": 913} +{"info/global_step": 914, "train_info/time_within_train_step": 2.285288095474243, "step": 914} +{"train_info/time_between_train_steps": 0.002912759780883789, "step": 914} +{"info/global_step": 915, "train_info/time_within_train_step": 2.28593111038208, "step": 915} +{"train_info/time_between_train_steps": 0.0028934478759765625, "step": 915} +{"info/global_step": 916, "train_info/time_within_train_step": 2.285815477371216, "step": 916} +{"train_info/time_between_train_steps": 0.0028939247131347656, "step": 916} +{"info/global_step": 917, "train_info/time_within_train_step": 2.2853875160217285, "step": 917} +{"train_info/time_between_train_steps": 0.0059642791748046875, "step": 917} +{"info/global_step": 918, "train_info/time_within_train_step": 2.2854485511779785, "step": 918} +{"train_info/time_between_train_steps": 0.0029027462005615234, "step": 918} +{"info/global_step": 919, "train_info/time_within_train_step": 2.2842559814453125, "step": 919} +{"train_info/time_between_train_steps": 0.0029320716857910156, "step": 919} +{"info/global_step": 920, "train_info/time_within_train_step": 2.2849056720733643, "step": 920} +{"train_info/time_between_train_steps": 0.002928495407104492, "step": 920} +{"info/global_step": 921, "train_info/time_within_train_step": 2.2851462364196777, "step": 921} +{"train_info/time_between_train_steps": 0.0029387474060058594, "step": 921} +{"info/global_step": 922, "train_info/time_within_train_step": 2.286458730697632, "step": 922} +{"train_info/time_between_train_steps": 0.0028924942016601562, "step": 922} +{"info/global_step": 923, "train_info/time_within_train_step": 2.2858331203460693, "step": 923} +{"train_info/time_between_train_steps": 0.0029125213623046875, "step": 923} +{"info/global_step": 924, "train_info/time_within_train_step": 2.2855136394500732, "step": 924} +{"train_info/time_between_train_steps": 0.0028717517852783203, "step": 924} +{"info/global_step": 925, "train_info/time_within_train_step": 2.285386800765991, "step": 925} +{"train_info/time_between_train_steps": 0.0028896331787109375, "step": 925} +{"info/global_step": 926, "train_info/time_within_train_step": 2.285957098007202, "step": 926} +{"train_info/time_between_train_steps": 0.0029382705688476562, "step": 926} +{"info/global_step": 927, "train_info/time_within_train_step": 2.2861521244049072, "step": 927} +{"train_info/time_between_train_steps": 0.0028874874114990234, "step": 927} +{"info/global_step": 928, "train_info/time_within_train_step": 2.285978078842163, "step": 928} +{"train_info/time_between_train_steps": 0.0028803348541259766, "step": 928} +{"info/global_step": 929, "train_info/time_within_train_step": 2.28505802154541, "step": 929} +{"train_info/time_between_train_steps": 0.0028705596923828125, "step": 929} +{"info/global_step": 930, "train_info/time_within_train_step": 2.286045789718628, "step": 930} +{"train_info/time_between_train_steps": 0.002935171127319336, "step": 930} +{"info/global_step": 931, "train_info/time_within_train_step": 2.286194324493408, "step": 931} +{"train_info/time_between_train_steps": 0.002857208251953125, "step": 931} +{"info/global_step": 932, "train_info/time_within_train_step": 2.2852678298950195, "step": 932} +{"train_info/time_between_train_steps": 0.0028815269470214844, "step": 932} +{"info/global_step": 933, "train_info/time_within_train_step": 2.2857306003570557, "step": 933} +{"train_info/time_between_train_steps": 0.0029172897338867188, "step": 933} +{"info/global_step": 934, "train_info/time_within_train_step": 2.2857747077941895, "step": 934} +{"train_info/time_between_train_steps": 0.0029256343841552734, "step": 934} +{"info/global_step": 935, "train_info/time_within_train_step": 2.285871744155884, "step": 935} +{"train_info/time_between_train_steps": 0.0028815269470214844, "step": 935} +{"info/global_step": 936, "train_info/time_within_train_step": 2.2852325439453125, "step": 936} +{"train_info/time_between_train_steps": 0.002900362014770508, "step": 936} +{"info/global_step": 937, "train_info/time_within_train_step": 2.2856264114379883, "step": 937} +{"train_info/time_between_train_steps": 0.002849102020263672, "step": 937} +{"info/global_step": 938, "train_info/time_within_train_step": 2.2851572036743164, "step": 938} +{"train_info/time_between_train_steps": 0.0028641223907470703, "step": 938} +{"info/global_step": 939, "train_info/time_within_train_step": 2.285259485244751, "step": 939} +{"train_info/time_between_train_steps": 0.002878904342651367, "step": 939} +{"info/global_step": 940, "train_info/time_within_train_step": 2.2848610877990723, "step": 940} +{"train_info/time_between_train_steps": 0.0028624534606933594, "step": 940} +{"info/global_step": 941, "train_info/time_within_train_step": 2.4067933559417725, "step": 941} +{"train_info/time_between_train_steps": 0.0029556751251220703, "step": 941} +{"info/global_step": 942, "train_info/time_within_train_step": 2.2851719856262207, "step": 942} +{"train_info/time_between_train_steps": 0.0028569698333740234, "step": 942} +{"info/global_step": 943, "train_info/time_within_train_step": 2.2853972911834717, "step": 943} +{"train_info/time_between_train_steps": 0.0028786659240722656, "step": 943} +{"info/global_step": 944, "train_info/time_within_train_step": 2.28534197807312, "step": 944} +{"train_info/time_between_train_steps": 0.0028731822967529297, "step": 944} +{"info/global_step": 945, "train_info/time_within_train_step": 2.2851271629333496, "step": 945} +{"train_info/time_between_train_steps": 0.002853870391845703, "step": 945} +{"info/global_step": 946, "train_info/time_within_train_step": 2.2858335971832275, "step": 946} +{"train_info/time_between_train_steps": 0.002900838851928711, "step": 946} +{"info/global_step": 947, "train_info/time_within_train_step": 2.285515069961548, "step": 947} +{"train_info/time_between_train_steps": 0.0028998851776123047, "step": 947} +{"info/global_step": 948, "train_info/time_within_train_step": 2.2852230072021484, "step": 948} +{"train_info/time_between_train_steps": 0.0028743743896484375, "step": 948} +{"info/global_step": 949, "train_info/time_within_train_step": 2.2861578464508057, "step": 949} +{"train_info/time_between_train_steps": 0.0028884410858154297, "step": 949} +{"info/global_step": 950, "train_info/time_within_train_step": 2.286133050918579, "step": 950} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746346248, "_runtime": 2345}, "step": 950} +{"logs": {"train/loss": 4.001, "train/learning_rate": 0.00045555555555555556, "train/epoch": 0.32, "_timestamp": 1746346248, "_runtime": 2345}, "step": 950} +{"train_info/time_between_train_steps": 0.023247718811035156, "step": 950} +{"info/global_step": 951, "train_info/time_within_train_step": 2.285740852355957, "step": 951} +{"train_info/time_between_train_steps": 0.00287628173828125, "step": 951} +{"info/global_step": 952, "train_info/time_within_train_step": 2.3173627853393555, "step": 952} +{"train_info/time_between_train_steps": 0.0028645992279052734, "step": 952} +{"info/global_step": 953, "train_info/time_within_train_step": 2.303805112838745, "step": 953} +{"train_info/time_between_train_steps": 0.0028319358825683594, "step": 953} +{"info/global_step": 954, "train_info/time_within_train_step": 2.2847840785980225, "step": 954} +{"train_info/time_between_train_steps": 0.002866029739379883, "step": 954} +{"info/global_step": 955, "train_info/time_within_train_step": 2.285221815109253, "step": 955} +{"train_info/time_between_train_steps": 0.002923727035522461, "step": 955} +{"info/global_step": 956, "train_info/time_within_train_step": 2.285402297973633, "step": 956} +{"train_info/time_between_train_steps": 0.002859830856323242, "step": 956} +{"info/global_step": 957, "train_info/time_within_train_step": 2.285571336746216, "step": 957} +{"train_info/time_between_train_steps": 0.0029044151306152344, "step": 957} +{"info/global_step": 958, "train_info/time_within_train_step": 2.2847158908843994, "step": 958} +{"train_info/time_between_train_steps": 0.002923727035522461, "step": 958} +{"info/global_step": 959, "train_info/time_within_train_step": 2.285097599029541, "step": 959} +{"train_info/time_between_train_steps": 0.002935171127319336, "step": 959} +{"info/global_step": 960, "train_info/time_within_train_step": 2.285223960876465, "step": 960} +{"train_info/time_between_train_steps": 0.0028619766235351562, "step": 960} +{"info/global_step": 961, "train_info/time_within_train_step": 2.2848875522613525, "step": 961} +{"train_info/time_between_train_steps": 0.0028760433197021484, "step": 961} +{"info/global_step": 962, "train_info/time_within_train_step": 2.284977436065674, "step": 962} +{"train_info/time_between_train_steps": 0.0028524398803710938, "step": 962} +{"info/global_step": 963, "train_info/time_within_train_step": 2.2850444316864014, "step": 963} +{"train_info/time_between_train_steps": 0.002889394760131836, "step": 963} +{"info/global_step": 964, "train_info/time_within_train_step": 2.285437822341919, "step": 964} +{"train_info/time_between_train_steps": 0.0028619766235351562, "step": 964} +{"info/global_step": 965, "train_info/time_within_train_step": 2.285527229309082, "step": 965} +{"train_info/time_between_train_steps": 0.002865314483642578, "step": 965} +{"info/global_step": 966, "train_info/time_within_train_step": 2.285614252090454, "step": 966} +{"train_info/time_between_train_steps": 0.0029218196868896484, "step": 966} +{"info/global_step": 967, "train_info/time_within_train_step": 2.2856791019439697, "step": 967} +{"train_info/time_between_train_steps": 0.0029087066650390625, "step": 967} +{"info/global_step": 968, "train_info/time_within_train_step": 2.2851767539978027, "step": 968} +{"train_info/time_between_train_steps": 0.002872943878173828, "step": 968} +{"info/global_step": 969, "train_info/time_within_train_step": 2.2853047847747803, "step": 969} +{"train_info/time_between_train_steps": 0.002963542938232422, "step": 969} +{"info/global_step": 970, "train_info/time_within_train_step": 2.2860326766967773, "step": 970} +{"train_info/time_between_train_steps": 0.0028612613677978516, "step": 970} +{"info/global_step": 971, "train_info/time_within_train_step": 2.2855875492095947, "step": 971} +{"train_info/time_between_train_steps": 0.002876758575439453, "step": 971} +{"info/global_step": 972, "train_info/time_within_train_step": 2.2852330207824707, "step": 972} +{"train_info/time_between_train_steps": 0.002898693084716797, "step": 972} +{"info/global_step": 973, "train_info/time_within_train_step": 2.2855286598205566, "step": 973} +{"train_info/time_between_train_steps": 0.00287628173828125, "step": 973} +{"info/global_step": 974, "train_info/time_within_train_step": 2.28532075881958, "step": 974} +{"train_info/time_between_train_steps": 0.0028803348541259766, "step": 974} +{"info/global_step": 975, "train_info/time_within_train_step": 2.285409450531006, "step": 975} +{"train_info/time_between_train_steps": 0.0028464794158935547, "step": 975} +{"info/global_step": 976, "train_info/time_within_train_step": 2.285099744796753, "step": 976} +{"train_info/time_between_train_steps": 0.0028905868530273438, "step": 976} +{"info/global_step": 977, "train_info/time_within_train_step": 2.2844982147216797, "step": 977} +{"train_info/time_between_train_steps": 0.0028808116912841797, "step": 977} +{"info/global_step": 978, "train_info/time_within_train_step": 2.3175461292266846, "step": 978} +{"train_info/time_between_train_steps": 0.002907276153564453, "step": 978} +{"info/global_step": 979, "train_info/time_within_train_step": 2.3035709857940674, "step": 979} +{"train_info/time_between_train_steps": 0.002863645553588867, "step": 979} +{"info/global_step": 980, "train_info/time_within_train_step": 2.284595012664795, "step": 980} +{"train_info/time_between_train_steps": 0.002864837646484375, "step": 980} +{"info/global_step": 981, "train_info/time_within_train_step": 2.2848918437957764, "step": 981} +{"train_info/time_between_train_steps": 0.002882242202758789, "step": 981} +{"info/global_step": 982, "train_info/time_within_train_step": 2.2843215465545654, "step": 982} +{"train_info/time_between_train_steps": 0.0029256343841552734, "step": 982} +{"info/global_step": 983, "train_info/time_within_train_step": 2.285417079925537, "step": 983} +{"train_info/time_between_train_steps": 0.002873659133911133, "step": 983} +{"info/global_step": 984, "train_info/time_within_train_step": 2.284850597381592, "step": 984} +{"train_info/time_between_train_steps": 0.0028786659240722656, "step": 984} +{"info/global_step": 985, "train_info/time_within_train_step": 2.2855684757232666, "step": 985} +{"train_info/time_between_train_steps": 0.002873659133911133, "step": 985} +{"info/global_step": 986, "train_info/time_within_train_step": 2.28528094291687, "step": 986} +{"train_info/time_between_train_steps": 0.002858400344848633, "step": 986} +{"info/global_step": 987, "train_info/time_within_train_step": 2.285074234008789, "step": 987} +{"train_info/time_between_train_steps": 0.0028972625732421875, "step": 987} +{"info/global_step": 988, "train_info/time_within_train_step": 2.28547739982605, "step": 988} +{"train_info/time_between_train_steps": 0.0028672218322753906, "step": 988} +{"info/global_step": 989, "train_info/time_within_train_step": 2.2856457233428955, "step": 989} +{"train_info/time_between_train_steps": 0.0029151439666748047, "step": 989} +{"info/global_step": 990, "train_info/time_within_train_step": 2.2863283157348633, "step": 990} +{"train_info/time_between_train_steps": 0.002886533737182617, "step": 990} +{"info/global_step": 991, "train_info/time_within_train_step": 2.2855637073516846, "step": 991} +{"train_info/time_between_train_steps": 0.0029020309448242188, "step": 991} +{"info/global_step": 992, "train_info/time_within_train_step": 2.2860090732574463, "step": 992} +{"train_info/time_between_train_steps": 0.0028753280639648438, "step": 992} +{"info/global_step": 993, "train_info/time_within_train_step": 2.285632848739624, "step": 993} +{"train_info/time_between_train_steps": 0.0028836727142333984, "step": 993} +{"info/global_step": 994, "train_info/time_within_train_step": 2.2854630947113037, "step": 994} +{"train_info/time_between_train_steps": 0.002851247787475586, "step": 994} +{"info/global_step": 995, "train_info/time_within_train_step": 2.2850685119628906, "step": 995} +{"train_info/time_between_train_steps": 0.002871274948120117, "step": 995} +{"info/global_step": 996, "train_info/time_within_train_step": 2.2851433753967285, "step": 996} +{"train_info/time_between_train_steps": 0.0028870105743408203, "step": 996} +{"info/global_step": 997, "train_info/time_within_train_step": 2.2855453491210938, "step": 997} +{"train_info/time_between_train_steps": 0.002911090850830078, "step": 997} +{"info/global_step": 998, "train_info/time_within_train_step": 2.2851545810699463, "step": 998} +{"train_info/time_between_train_steps": 0.0029375553131103516, "step": 998} +{"info/global_step": 999, "train_info/time_within_train_step": 2.2852578163146973, "step": 999} +{"train_info/time_between_train_steps": 0.002892732620239258, "step": 999} +{"info/global_step": 1000, "train_info/time_within_train_step": 2.621251106262207, "step": 1000} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 4588.0, "train_info/memory_max_reserved": 4588.0, "_timestamp": 1746346364, "_runtime": 2461}, "step": 1000} +{"logs": {"train/loss": 3.9562, "train/learning_rate": 0.00044444444444444436, "train/epoch": 0.33, "_timestamp": 1746346364, "_runtime": 2461}, "step": 1000} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746346369, "_runtime": 2466}, "step": 1000} +{"logs": {"eval/loss": 4.205341815948486, "eval/runtime": 5.6372, "eval/samples_per_second": 43.284, "eval/steps_per_second": 1.419, "train/epoch": 0.33, "_timestamp": 1746346369, "_runtime": 2466}, "step": 1000} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746346370, "_runtime": 2467}, "step": 1000} +{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.205341815948486, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 67.04351029119135, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.6372, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 43.284, "train/epoch": 0.33, "_timestamp": 1746346370, "_runtime": 2467}, "step": 1000} +{"train_info/time_between_train_steps": 21.61821460723877, "step": 1000} +{"info/global_step": 1001, "train_info/time_within_train_step": 2.114335060119629, "step": 1001} +{"train_info/time_between_train_steps": 0.0030107498168945312, "step": 1001} +{"info/global_step": 1002, "train_info/time_within_train_step": 2.100193738937378, "step": 1002} +{"train_info/time_between_train_steps": 0.002916574478149414, "step": 1002} +{"info/global_step": 1003, "train_info/time_within_train_step": 2.1937501430511475, "step": 1003} +{"train_info/time_between_train_steps": 0.0029184818267822266, "step": 1003} +{"info/global_step": 1004, "train_info/time_within_train_step": 2.284675121307373, "step": 1004} +{"train_info/time_between_train_steps": 0.00295257568359375, "step": 1004} +{"info/global_step": 1005, "train_info/time_within_train_step": 2.285310745239258, "step": 1005} +{"train_info/time_between_train_steps": 0.0028848648071289062, "step": 1005} +{"info/global_step": 1006, "train_info/time_within_train_step": 2.285696029663086, "step": 1006} +{"train_info/time_between_train_steps": 0.002885580062866211, "step": 1006} +{"info/global_step": 1007, "train_info/time_within_train_step": 2.286538600921631, "step": 1007} +{"train_info/time_between_train_steps": 0.0028929710388183594, "step": 1007} +{"info/global_step": 1008, "train_info/time_within_train_step": 2.2861905097961426, "step": 1008} +{"train_info/time_between_train_steps": 0.0028672218322753906, "step": 1008} +{"info/global_step": 1009, "train_info/time_within_train_step": 2.2857916355133057, "step": 1009} +{"train_info/time_between_train_steps": 0.002885103225708008, "step": 1009} +{"info/global_step": 1010, "train_info/time_within_train_step": 2.2858479022979736, "step": 1010} +{"train_info/time_between_train_steps": 0.002863645553588867, "step": 1010} +{"info/global_step": 1011, "train_info/time_within_train_step": 2.2860920429229736, "step": 1011} +{"train_info/time_between_train_steps": 0.0028760433197021484, "step": 1011} +{"info/global_step": 1012, "train_info/time_within_train_step": 2.286336898803711, "step": 1012} +{"train_info/time_between_train_steps": 0.002878427505493164, "step": 1012} +{"info/global_step": 1013, "train_info/time_within_train_step": 2.3700215816497803, "step": 1013} +{"train_info/time_between_train_steps": 0.0028810501098632812, "step": 1013} +{"info/global_step": 1014, "train_info/time_within_train_step": 2.286097764968872, "step": 1014} +{"train_info/time_between_train_steps": 0.002870321273803711, "step": 1014} +{"info/global_step": 1015, "train_info/time_within_train_step": 2.286733627319336, "step": 1015} +{"train_info/time_between_train_steps": 0.002886056900024414, "step": 1015} +{"info/global_step": 1016, "train_info/time_within_train_step": 2.2878448963165283, "step": 1016} +{"train_info/time_between_train_steps": 0.002845287322998047, "step": 1016} +{"info/global_step": 1017, "train_info/time_within_train_step": 2.287163019180298, "step": 1017} +{"train_info/time_between_train_steps": 0.0029175281524658203, "step": 1017} +{"info/global_step": 1018, "train_info/time_within_train_step": 2.2871322631835938, "step": 1018} +{"train_info/time_between_train_steps": 0.00287628173828125, "step": 1018} +{"info/global_step": 1019, "train_info/time_within_train_step": 2.2874648571014404, "step": 1019} +{"train_info/time_between_train_steps": 0.002895355224609375, "step": 1019} +{"info/global_step": 1020, "train_info/time_within_train_step": 2.2875888347625732, "step": 1020} +{"train_info/time_between_train_steps": 0.0028841495513916016, "step": 1020} +{"info/global_step": 1021, "train_info/time_within_train_step": 2.287166118621826, "step": 1021} +{"train_info/time_between_train_steps": 0.0028502941131591797, "step": 1021} +{"info/global_step": 1022, "train_info/time_within_train_step": 2.2876136302948, "step": 1022} +{"train_info/time_between_train_steps": 0.0028641223907470703, "step": 1022} +{"info/global_step": 1023, "train_info/time_within_train_step": 2.2879629135131836, "step": 1023} +{"train_info/time_between_train_steps": 0.0028781890869140625, "step": 1023} +{"info/global_step": 1024, "train_info/time_within_train_step": 2.2880542278289795, "step": 1024} +{"train_info/time_between_train_steps": 0.002877473831176758, "step": 1024} +{"info/global_step": 1025, "train_info/time_within_train_step": 2.2884042263031006, "step": 1025} +{"train_info/time_between_train_steps": 0.002844095230102539, "step": 1025} +{"info/global_step": 1026, "train_info/time_within_train_step": 2.2877869606018066, "step": 1026} +{"train_info/time_between_train_steps": 0.0029168128967285156, "step": 1026} +{"info/global_step": 1027, "train_info/time_within_train_step": 2.2873170375823975, "step": 1027} +{"train_info/time_between_train_steps": 0.0028676986694335938, "step": 1027} +{"info/global_step": 1028, "train_info/time_within_train_step": 2.287449598312378, "step": 1028} +{"train_info/time_between_train_steps": 0.0029082298278808594, "step": 1028} +{"info/global_step": 1029, "train_info/time_within_train_step": 2.2867894172668457, "step": 1029} +{"train_info/time_between_train_steps": 0.002880573272705078, "step": 1029} +{"info/global_step": 1030, "train_info/time_within_train_step": 2.287046194076538, "step": 1030} +{"train_info/time_between_train_steps": 0.002864360809326172, "step": 1030} +{"info/global_step": 1031, "train_info/time_within_train_step": 2.2870612144470215, "step": 1031} +{"train_info/time_between_train_steps": 0.0028481483459472656, "step": 1031} +{"info/global_step": 1032, "train_info/time_within_train_step": 2.286811590194702, "step": 1032} +{"train_info/time_between_train_steps": 0.002833843231201172, "step": 1032} +{"info/global_step": 1033, "train_info/time_within_train_step": 2.28629994392395, "step": 1033} +{"train_info/time_between_train_steps": 0.0028748512268066406, "step": 1033} +{"info/global_step": 1034, "train_info/time_within_train_step": 2.2862448692321777, "step": 1034} +{"train_info/time_between_train_steps": 0.002886533737182617, "step": 1034} +{"info/global_step": 1035, "train_info/time_within_train_step": 2.287465810775757, "step": 1035} +{"train_info/time_between_train_steps": 0.002901315689086914, "step": 1035} +{"info/global_step": 1036, "train_info/time_within_train_step": 2.286761999130249, "step": 1036} +{"train_info/time_between_train_steps": 0.002887248992919922, "step": 1036} +{"info/global_step": 1037, "train_info/time_within_train_step": 2.2872629165649414, "step": 1037} +{"train_info/time_between_train_steps": 0.002871274948120117, "step": 1037} +{"info/global_step": 1038, "train_info/time_within_train_step": 2.2874162197113037, "step": 1038} +{"train_info/time_between_train_steps": 0.00287628173828125, "step": 1038} +{"info/global_step": 1039, "train_info/time_within_train_step": 2.286835193634033, "step": 1039} +{"train_info/time_between_train_steps": 0.0029075145721435547, "step": 1039} +{"info/global_step": 1040, "train_info/time_within_train_step": 2.2872395515441895, "step": 1040} +{"train_info/time_between_train_steps": 0.0028574466705322266, "step": 1040} +{"info/global_step": 1041, "train_info/time_within_train_step": 2.286241292953491, "step": 1041} +{"train_info/time_between_train_steps": 0.002900362014770508, "step": 1041} +{"info/global_step": 1042, "train_info/time_within_train_step": 2.2866740226745605, "step": 1042} +{"train_info/time_between_train_steps": 0.002859830856323242, "step": 1042} +{"info/global_step": 1043, "train_info/time_within_train_step": 2.285895824432373, "step": 1043} +{"train_info/time_between_train_steps": 0.002875804901123047, "step": 1043} +{"info/global_step": 1044, "train_info/time_within_train_step": 2.2862093448638916, "step": 1044} +{"train_info/time_between_train_steps": 0.0028650760650634766, "step": 1044} +{"info/global_step": 1045, "train_info/time_within_train_step": 2.2866227626800537, "step": 1045} +{"train_info/time_between_train_steps": 0.002870321273803711, "step": 1045} +{"info/global_step": 1046, "train_info/time_within_train_step": 2.2864091396331787, "step": 1046} +{"train_info/time_between_train_steps": 0.0028753280639648438, "step": 1046} +{"info/global_step": 1047, "train_info/time_within_train_step": 2.286266326904297, "step": 1047} +{"train_info/time_between_train_steps": 0.002885103225708008, "step": 1047} +{"info/global_step": 1048, "train_info/time_within_train_step": 2.286048650741577, "step": 1048} +{"train_info/time_between_train_steps": 0.002896547317504883, "step": 1048} +{"info/global_step": 1049, "train_info/time_within_train_step": 2.2866384983062744, "step": 1049} +{"train_info/time_between_train_steps": 0.0028607845306396484, "step": 1049} +{"info/global_step": 1050, "train_info/time_within_train_step": 2.286463737487793, "step": 1050} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746346501, "_runtime": 2598}, "step": 1050} +{"logs": {"train/loss": 3.9171, "train/learning_rate": 0.0004333333333333333, "train/epoch": 0.35, "_timestamp": 1746346501, "_runtime": 2598}, "step": 1050} +{"train_info/time_between_train_steps": 0.02440500259399414, "step": 1050} +{"info/global_step": 1051, "train_info/time_within_train_step": 2.287196159362793, "step": 1051} +{"train_info/time_between_train_steps": 0.002864837646484375, "step": 1051} +{"info/global_step": 1052, "train_info/time_within_train_step": 2.286656618118286, "step": 1052} +{"train_info/time_between_train_steps": 0.002877473831176758, "step": 1052} +{"info/global_step": 1053, "train_info/time_within_train_step": 2.2862231731414795, "step": 1053} +{"train_info/time_between_train_steps": 0.0029582977294921875, "step": 1053} +{"info/global_step": 1054, "train_info/time_within_train_step": 2.2869739532470703, "step": 1054} +{"train_info/time_between_train_steps": 0.0028429031372070312, "step": 1054} +{"info/global_step": 1055, "train_info/time_within_train_step": 2.286052942276001, "step": 1055} +{"train_info/time_between_train_steps": 0.0028502941131591797, "step": 1055} +{"info/global_step": 1056, "train_info/time_within_train_step": 2.286473274230957, "step": 1056} +{"train_info/time_between_train_steps": 0.0029332637786865234, "step": 1056} +{"info/global_step": 1057, "train_info/time_within_train_step": 2.28593373298645, "step": 1057} +{"train_info/time_between_train_steps": 0.0029435157775878906, "step": 1057} +{"info/global_step": 1058, "train_info/time_within_train_step": 2.2867584228515625, "step": 1058} +{"train_info/time_between_train_steps": 0.0029430389404296875, "step": 1058} +{"info/global_step": 1059, "train_info/time_within_train_step": 2.286362886428833, "step": 1059} +{"train_info/time_between_train_steps": 0.0029821395874023438, "step": 1059} +{"info/global_step": 1060, "train_info/time_within_train_step": 2.286381483078003, "step": 1060} +{"train_info/time_between_train_steps": 0.002918720245361328, "step": 1060} +{"info/global_step": 1061, "train_info/time_within_train_step": 2.285903215408325, "step": 1061} +{"train_info/time_between_train_steps": 0.0028917789459228516, "step": 1061} +{"info/global_step": 1062, "train_info/time_within_train_step": 2.286273956298828, "step": 1062} +{"train_info/time_between_train_steps": 0.002862215042114258, "step": 1062} +{"info/global_step": 1063, "train_info/time_within_train_step": 2.2859835624694824, "step": 1063} +{"train_info/time_between_train_steps": 0.0028722286224365234, "step": 1063} +{"info/global_step": 1064, "train_info/time_within_train_step": 2.286285161972046, "step": 1064} +{"train_info/time_between_train_steps": 0.0029730796813964844, "step": 1064} +{"info/global_step": 1065, "train_info/time_within_train_step": 2.285445213317871, "step": 1065} +{"train_info/time_between_train_steps": 0.0029494762420654297, "step": 1065} +{"info/global_step": 1066, "train_info/time_within_train_step": 2.2866029739379883, "step": 1066} +{"train_info/time_between_train_steps": 0.0029828548431396484, "step": 1066} +{"info/global_step": 1067, "train_info/time_within_train_step": 2.286729097366333, "step": 1067} +{"train_info/time_between_train_steps": 0.0030651092529296875, "step": 1067} +{"info/global_step": 1068, "train_info/time_within_train_step": 2.286743402481079, "step": 1068} +{"train_info/time_between_train_steps": 0.002889871597290039, "step": 1068} +{"info/global_step": 1069, "train_info/time_within_train_step": 2.286937713623047, "step": 1069} +{"train_info/time_between_train_steps": 0.0029687881469726562, "step": 1069} +{"info/global_step": 1070, "train_info/time_within_train_step": 2.287008285522461, "step": 1070} +{"train_info/time_between_train_steps": 0.002969980239868164, "step": 1070} +{"info/global_step": 1071, "train_info/time_within_train_step": 2.287102460861206, "step": 1071} +{"train_info/time_between_train_steps": 0.002872943878173828, "step": 1071} +{"info/global_step": 1072, "train_info/time_within_train_step": 2.2870450019836426, "step": 1072} +{"train_info/time_between_train_steps": 0.003127574920654297, "step": 1072} +{"info/global_step": 1073, "train_info/time_within_train_step": 2.2866320610046387, "step": 1073} +{"train_info/time_between_train_steps": 0.003056049346923828, "step": 1073} +{"info/global_step": 1074, "train_info/time_within_train_step": 2.2869694232940674, "step": 1074} +{"train_info/time_between_train_steps": 0.0031490325927734375, "step": 1074} +{"info/global_step": 1075, "train_info/time_within_train_step": 2.286707878112793, "step": 1075} +{"train_info/time_between_train_steps": 0.003156900405883789, "step": 1075} +{"info/global_step": 1076, "train_info/time_within_train_step": 2.2863566875457764, "step": 1076} +{"train_info/time_between_train_steps": 0.0030412673950195312, "step": 1076} +{"info/global_step": 1077, "train_info/time_within_train_step": 2.286328077316284, "step": 1077} +{"train_info/time_between_train_steps": 0.0030815601348876953, "step": 1077} +{"info/global_step": 1078, "train_info/time_within_train_step": 2.2870352268218994, "step": 1078} +{"train_info/time_between_train_steps": 0.0030546188354492188, "step": 1078} +{"info/global_step": 1079, "train_info/time_within_train_step": 2.2864913940429688, "step": 1079} +{"train_info/time_between_train_steps": 0.0030722618103027344, "step": 1079} +{"info/global_step": 1080, "train_info/time_within_train_step": 2.286682367324829, "step": 1080} +{"train_info/time_between_train_steps": 0.0032074451446533203, "step": 1080} +{"info/global_step": 1081, "train_info/time_within_train_step": 2.2866783142089844, "step": 1081} +{"train_info/time_between_train_steps": 0.003295421600341797, "step": 1081} +{"info/global_step": 1082, "train_info/time_within_train_step": 2.2871742248535156, "step": 1082} +{"train_info/time_between_train_steps": 0.003063678741455078, "step": 1082} +{"info/global_step": 1083, "train_info/time_within_train_step": 2.2864232063293457, "step": 1083} +{"train_info/time_between_train_steps": 0.003291606903076172, "step": 1083} +{"info/global_step": 1084, "train_info/time_within_train_step": 2.2873480319976807, "step": 1084} +{"train_info/time_between_train_steps": 0.0033178329467773438, "step": 1084} +{"info/global_step": 1085, "train_info/time_within_train_step": 2.287436008453369, "step": 1085} +{"train_info/time_between_train_steps": 0.0032689571380615234, "step": 1085} +{"info/global_step": 1086, "train_info/time_within_train_step": 2.2879674434661865, "step": 1086} +{"train_info/time_between_train_steps": 0.0031991004943847656, "step": 1086} +{"info/global_step": 1087, "train_info/time_within_train_step": 2.287642002105713, "step": 1087} +{"train_info/time_between_train_steps": 0.003351926803588867, "step": 1087} +{"info/global_step": 1088, "train_info/time_within_train_step": 2.2881052494049072, "step": 1088} +{"train_info/time_between_train_steps": 0.003354787826538086, "step": 1088} +{"info/global_step": 1089, "train_info/time_within_train_step": 2.2884745597839355, "step": 1089} +{"train_info/time_between_train_steps": 0.0035638809204101562, "step": 1089} +{"info/global_step": 1090, "train_info/time_within_train_step": 2.2884726524353027, "step": 1090} +{"train_info/time_between_train_steps": 0.003347158432006836, "step": 1090} +{"info/global_step": 1091, "train_info/time_within_train_step": 2.288771152496338, "step": 1091} +{"train_info/time_between_train_steps": 0.003765106201171875, "step": 1091} +{"info/global_step": 1092, "train_info/time_within_train_step": 2.2887091636657715, "step": 1092} +{"train_info/time_between_train_steps": 1.8863434791564941, "step": 1092} +{"info/global_step": 1093, "train_info/time_within_train_step": 2.2854833602905273, "step": 1093} +{"train_info/time_between_train_steps": 0.0031578540802001953, "step": 1093} +{"info/global_step": 1094, "train_info/time_within_train_step": 2.2869837284088135, "step": 1094} +{"train_info/time_between_train_steps": 0.0031311511993408203, "step": 1094} +{"info/global_step": 1095, "train_info/time_within_train_step": 2.286062479019165, "step": 1095} +{"train_info/time_between_train_steps": 0.0031082630157470703, "step": 1095} +{"info/global_step": 1096, "train_info/time_within_train_step": 2.285876750946045, "step": 1096} +{"train_info/time_between_train_steps": 0.0030891895294189453, "step": 1096} +{"info/global_step": 1097, "train_info/time_within_train_step": 2.286713123321533, "step": 1097} +{"train_info/time_between_train_steps": 0.0030908584594726562, "step": 1097} +{"info/global_step": 1098, "train_info/time_within_train_step": 2.2873375415802, "step": 1098} +{"train_info/time_between_train_steps": 0.003093242645263672, "step": 1098} +{"info/global_step": 1099, "train_info/time_within_train_step": 2.3337178230285645, "step": 1099} +{"train_info/time_between_train_steps": 0.0031280517578125, "step": 1099} +{"info/global_step": 1100, "train_info/time_within_train_step": 2.286834239959717, "step": 1100} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746346618, "_runtime": 2715}, "step": 1100} +{"logs": {"train/loss": 3.8806, "train/learning_rate": 0.0004222222222222222, "train/epoch": 1.0, "_timestamp": 1746346618, "_runtime": 2715}, "step": 1100} +{"train_info/time_between_train_steps": 12.067265748977661, "step": 1100} +{"info/global_step": 1101, "train_info/time_within_train_step": 2.112938642501831, "step": 1101} +{"train_info/time_between_train_steps": 0.003101348876953125, "step": 1101} +{"info/global_step": 1102, "train_info/time_within_train_step": 2.102748394012451, "step": 1102} +{"train_info/time_between_train_steps": 0.003117799758911133, "step": 1102} +{"info/global_step": 1103, "train_info/time_within_train_step": 2.2076284885406494, "step": 1103} +{"train_info/time_between_train_steps": 0.0031180381774902344, "step": 1103} +{"info/global_step": 1104, "train_info/time_within_train_step": 2.2848682403564453, "step": 1104} +{"train_info/time_between_train_steps": 0.0030832290649414062, "step": 1104} +{"info/global_step": 1105, "train_info/time_within_train_step": 2.2842507362365723, "step": 1105} +{"train_info/time_between_train_steps": 0.003083944320678711, "step": 1105} +{"info/global_step": 1106, "train_info/time_within_train_step": 2.2853660583496094, "step": 1106} +{"train_info/time_between_train_steps": 0.0030684471130371094, "step": 1106} +{"info/global_step": 1107, "train_info/time_within_train_step": 2.2854955196380615, "step": 1107} +{"train_info/time_between_train_steps": 0.003072977066040039, "step": 1107} +{"info/global_step": 1108, "train_info/time_within_train_step": 2.2862963676452637, "step": 1108} +{"train_info/time_between_train_steps": 0.0031058788299560547, "step": 1108} +{"info/global_step": 1109, "train_info/time_within_train_step": 2.285680055618286, "step": 1109} +{"train_info/time_between_train_steps": 0.003133535385131836, "step": 1109} +{"info/global_step": 1110, "train_info/time_within_train_step": 2.285430908203125, "step": 1110} +{"train_info/time_between_train_steps": 0.0031642913818359375, "step": 1110} +{"info/global_step": 1111, "train_info/time_within_train_step": 2.2861220836639404, "step": 1111} +{"train_info/time_between_train_steps": 0.003119945526123047, "step": 1111} +{"info/global_step": 1112, "train_info/time_within_train_step": 2.285228967666626, "step": 1112} +{"train_info/time_between_train_steps": 0.003262758255004883, "step": 1112} +{"info/global_step": 1113, "train_info/time_within_train_step": 2.2870965003967285, "step": 1113} +{"train_info/time_between_train_steps": 0.003072500228881836, "step": 1113} +{"info/global_step": 1114, "train_info/time_within_train_step": 2.286184310913086, "step": 1114} +{"train_info/time_between_train_steps": 0.003088712692260742, "step": 1114} +{"info/global_step": 1115, "train_info/time_within_train_step": 2.479149103164673, "step": 1115} +{"train_info/time_between_train_steps": 0.0031359195709228516, "step": 1115} +{"info/global_step": 1116, "train_info/time_within_train_step": 2.287609815597534, "step": 1116} +{"train_info/time_between_train_steps": 0.003100872039794922, "step": 1116} +{"info/global_step": 1117, "train_info/time_within_train_step": 2.2868714332580566, "step": 1117} +{"train_info/time_between_train_steps": 0.0031280517578125, "step": 1117} +{"info/global_step": 1118, "train_info/time_within_train_step": 2.287214994430542, "step": 1118} +{"train_info/time_between_train_steps": 0.0031397342681884766, "step": 1118} +{"info/global_step": 1119, "train_info/time_within_train_step": 2.287554979324341, "step": 1119} +{"train_info/time_between_train_steps": 0.003173351287841797, "step": 1119} +{"info/global_step": 1120, "train_info/time_within_train_step": 2.2872374057769775, "step": 1120} +{"train_info/time_between_train_steps": 0.0031549930572509766, "step": 1120} +{"info/global_step": 1121, "train_info/time_within_train_step": 2.2869064807891846, "step": 1121} +{"train_info/time_between_train_steps": 0.0031087398529052734, "step": 1121} +{"info/global_step": 1122, "train_info/time_within_train_step": 2.2871508598327637, "step": 1122} +{"train_info/time_between_train_steps": 0.0030965805053710938, "step": 1122} +{"info/global_step": 1123, "train_info/time_within_train_step": 2.2878286838531494, "step": 1123} +{"train_info/time_between_train_steps": 0.0030798912048339844, "step": 1123} +{"info/global_step": 1124, "train_info/time_within_train_step": 2.2878763675689697, "step": 1124} +{"train_info/time_between_train_steps": 0.0030744075775146484, "step": 1124} +{"info/global_step": 1125, "train_info/time_within_train_step": 2.2873008251190186, "step": 1125} +{"train_info/time_between_train_steps": 0.003116130828857422, "step": 1125} +{"info/global_step": 1126, "train_info/time_within_train_step": 2.287645101547241, "step": 1126} +{"train_info/time_between_train_steps": 0.003134489059448242, "step": 1126} +{"info/global_step": 1127, "train_info/time_within_train_step": 2.287546157836914, "step": 1127} +{"train_info/time_between_train_steps": 0.0031890869140625, "step": 1127} +{"info/global_step": 1128, "train_info/time_within_train_step": 2.286985158920288, "step": 1128} +{"train_info/time_between_train_steps": 0.00308990478515625, "step": 1128} +{"info/global_step": 1129, "train_info/time_within_train_step": 2.286555767059326, "step": 1129} +{"train_info/time_between_train_steps": 0.003085613250732422, "step": 1129} +{"info/global_step": 1130, "train_info/time_within_train_step": 2.2867488861083984, "step": 1130} +{"train_info/time_between_train_steps": 0.0031020641326904297, "step": 1130} +{"info/global_step": 1131, "train_info/time_within_train_step": 2.2871253490448, "step": 1131} +{"train_info/time_between_train_steps": 0.0031342506408691406, "step": 1131} +{"info/global_step": 1132, "train_info/time_within_train_step": 2.2860605716705322, "step": 1132} +{"train_info/time_between_train_steps": 0.0031578540802001953, "step": 1132} +{"info/global_step": 1133, "train_info/time_within_train_step": 2.287040948867798, "step": 1133} +{"train_info/time_between_train_steps": 0.003130674362182617, "step": 1133} +{"info/global_step": 1134, "train_info/time_within_train_step": 2.2866427898406982, "step": 1134} +{"train_info/time_between_train_steps": 0.003118753433227539, "step": 1134} +{"info/global_step": 1135, "train_info/time_within_train_step": 2.287034749984741, "step": 1135} +{"train_info/time_between_train_steps": 0.0031058788299560547, "step": 1135} +{"info/global_step": 1136, "train_info/time_within_train_step": 2.2866623401641846, "step": 1136} +{"train_info/time_between_train_steps": 0.00311279296875, "step": 1136} +{"info/global_step": 1137, "train_info/time_within_train_step": 2.2869338989257812, "step": 1137} +{"train_info/time_between_train_steps": 0.0033299922943115234, "step": 1137} +{"info/global_step": 1138, "train_info/time_within_train_step": 2.2876243591308594, "step": 1138} +{"train_info/time_between_train_steps": 0.0033168792724609375, "step": 1138} +{"info/global_step": 1139, "train_info/time_within_train_step": 2.2876205444335938, "step": 1139} +{"train_info/time_between_train_steps": 0.003353595733642578, "step": 1139} +{"info/global_step": 1140, "train_info/time_within_train_step": 2.2872557640075684, "step": 1140} +{"train_info/time_between_train_steps": 0.0034253597259521484, "step": 1140} +{"info/global_step": 1141, "train_info/time_within_train_step": 2.2872025966644287, "step": 1141} +{"train_info/time_between_train_steps": 0.0033807754516601562, "step": 1141} +{"info/global_step": 1142, "train_info/time_within_train_step": 2.288531541824341, "step": 1142} +{"train_info/time_between_train_steps": 0.0034482479095458984, "step": 1142} +{"info/global_step": 1143, "train_info/time_within_train_step": 2.2873501777648926, "step": 1143} +{"train_info/time_between_train_steps": 0.0033922195434570312, "step": 1143} +{"info/global_step": 1144, "train_info/time_within_train_step": 2.2874112129211426, "step": 1144} +{"train_info/time_between_train_steps": 0.0034246444702148438, "step": 1144} +{"info/global_step": 1145, "train_info/time_within_train_step": 2.2878968715667725, "step": 1145} +{"train_info/time_between_train_steps": 0.0034492015838623047, "step": 1145} +{"info/global_step": 1146, "train_info/time_within_train_step": 2.2891175746917725, "step": 1146} +{"train_info/time_between_train_steps": 0.0033783912658691406, "step": 1146} +{"info/global_step": 1147, "train_info/time_within_train_step": 2.287900924682617, "step": 1147} +{"train_info/time_between_train_steps": 0.0033795833587646484, "step": 1147} +{"info/global_step": 1148, "train_info/time_within_train_step": 2.2876169681549072, "step": 1148} +{"train_info/time_between_train_steps": 0.003385305404663086, "step": 1148} +{"info/global_step": 1149, "train_info/time_within_train_step": 2.2879209518432617, "step": 1149} +{"train_info/time_between_train_steps": 0.003416776657104492, "step": 1149} +{"info/global_step": 1150, "train_info/time_within_train_step": 2.2884020805358887, "step": 1150} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746346745, "_runtime": 2842}, "step": 1150} +{"logs": {"train/loss": 3.8468, "train/learning_rate": 0.0004111111111111111, "train/epoch": 1.02, "_timestamp": 1746346745, "_runtime": 2842}, "step": 1150} +{"train_info/time_between_train_steps": 0.0247647762298584, "step": 1150} +{"info/global_step": 1151, "train_info/time_within_train_step": 2.287850856781006, "step": 1151} +{"train_info/time_between_train_steps": 0.0034034252166748047, "step": 1151} +{"info/global_step": 1152, "train_info/time_within_train_step": 2.2876758575439453, "step": 1152} +{"train_info/time_between_train_steps": 0.0033898353576660156, "step": 1152} +{"info/global_step": 1153, "train_info/time_within_train_step": 2.28779673576355, "step": 1153} +{"train_info/time_between_train_steps": 0.0035011768341064453, "step": 1153} +{"info/global_step": 1154, "train_info/time_within_train_step": 2.288548469543457, "step": 1154} +{"train_info/time_between_train_steps": 0.0034134387969970703, "step": 1154} +{"info/global_step": 1155, "train_info/time_within_train_step": 2.453213930130005, "step": 1155} +{"train_info/time_between_train_steps": 0.003591775894165039, "step": 1155} +{"info/global_step": 1156, "train_info/time_within_train_step": 2.2892990112304688, "step": 1156} +{"train_info/time_between_train_steps": 0.003225088119506836, "step": 1156} +{"info/global_step": 1157, "train_info/time_within_train_step": 2.287017345428467, "step": 1157} +{"train_info/time_between_train_steps": 0.003278017044067383, "step": 1157} +{"info/global_step": 1158, "train_info/time_within_train_step": 2.286998987197876, "step": 1158} +{"train_info/time_between_train_steps": 0.003286600112915039, "step": 1158} +{"info/global_step": 1159, "train_info/time_within_train_step": 2.2874999046325684, "step": 1159} +{"train_info/time_between_train_steps": 0.003416299819946289, "step": 1159} +{"info/global_step": 1160, "train_info/time_within_train_step": 2.2869107723236084, "step": 1160} +{"train_info/time_between_train_steps": 0.003208637237548828, "step": 1160} +{"info/global_step": 1161, "train_info/time_within_train_step": 2.2874176502227783, "step": 1161} +{"train_info/time_between_train_steps": 0.003271818161010742, "step": 1161} +{"info/global_step": 1162, "train_info/time_within_train_step": 2.2864625453948975, "step": 1162} +{"train_info/time_between_train_steps": 0.003258228302001953, "step": 1162} +{"info/global_step": 1163, "train_info/time_within_train_step": 2.2866365909576416, "step": 1163} +{"train_info/time_between_train_steps": 0.0032269954681396484, "step": 1163} +{"info/global_step": 1164, "train_info/time_within_train_step": 2.287247896194458, "step": 1164} +{"train_info/time_between_train_steps": 0.0032813549041748047, "step": 1164} +{"info/global_step": 1165, "train_info/time_within_train_step": 2.287381649017334, "step": 1165} +{"train_info/time_between_train_steps": 0.003338336944580078, "step": 1165} +{"info/global_step": 1166, "train_info/time_within_train_step": 2.288233757019043, "step": 1166} +{"train_info/time_between_train_steps": 0.0032775402069091797, "step": 1166} +{"info/global_step": 1167, "train_info/time_within_train_step": 2.287140130996704, "step": 1167} +{"train_info/time_between_train_steps": 0.003269195556640625, "step": 1167} +{"info/global_step": 1168, "train_info/time_within_train_step": 2.287341594696045, "step": 1168} +{"train_info/time_between_train_steps": 0.003258228302001953, "step": 1168} +{"info/global_step": 1169, "train_info/time_within_train_step": 2.2871367931365967, "step": 1169} +{"train_info/time_between_train_steps": 0.0032300949096679688, "step": 1169} +{"info/global_step": 1170, "train_info/time_within_train_step": 2.2867674827575684, "step": 1170} +{"train_info/time_between_train_steps": 0.0032753944396972656, "step": 1170} +{"info/global_step": 1171, "train_info/time_within_train_step": 2.286708354949951, "step": 1171} +{"train_info/time_between_train_steps": 0.003238677978515625, "step": 1171} +{"info/global_step": 1172, "train_info/time_within_train_step": 2.2863008975982666, "step": 1172} +{"train_info/time_between_train_steps": 0.003241300582885742, "step": 1172} +{"info/global_step": 1173, "train_info/time_within_train_step": 2.2868943214416504, "step": 1173} +{"train_info/time_between_train_steps": 0.0032613277435302734, "step": 1173} +{"info/global_step": 1174, "train_info/time_within_train_step": 2.286425828933716, "step": 1174} +{"train_info/time_between_train_steps": 0.0032520294189453125, "step": 1174} +{"info/global_step": 1175, "train_info/time_within_train_step": 2.28664493560791, "step": 1175} +{"train_info/time_between_train_steps": 0.003245830535888672, "step": 1175} +{"info/global_step": 1176, "train_info/time_within_train_step": 2.2868192195892334, "step": 1176} +{"train_info/time_between_train_steps": 0.003181934356689453, "step": 1176} +{"info/global_step": 1177, "train_info/time_within_train_step": 2.2868499755859375, "step": 1177} +{"train_info/time_between_train_steps": 0.003186941146850586, "step": 1177} +{"info/global_step": 1178, "train_info/time_within_train_step": 2.286492347717285, "step": 1178} +{"train_info/time_between_train_steps": 0.0032205581665039062, "step": 1178} +{"info/global_step": 1179, "train_info/time_within_train_step": 2.286860942840576, "step": 1179} +{"train_info/time_between_train_steps": 0.0032558441162109375, "step": 1179} +{"info/global_step": 1180, "train_info/time_within_train_step": 2.287187337875366, "step": 1180} +{"train_info/time_between_train_steps": 0.003155946731567383, "step": 1180} +{"info/global_step": 1181, "train_info/time_within_train_step": 2.2863175868988037, "step": 1181} +{"train_info/time_between_train_steps": 0.0032346248626708984, "step": 1181} +{"info/global_step": 1182, "train_info/time_within_train_step": 2.286821126937866, "step": 1182} +{"train_info/time_between_train_steps": 0.003208637237548828, "step": 1182} +{"info/global_step": 1183, "train_info/time_within_train_step": 2.287071704864502, "step": 1183} +{"train_info/time_between_train_steps": 0.0031921863555908203, "step": 1183} +{"info/global_step": 1184, "train_info/time_within_train_step": 2.2872846126556396, "step": 1184} +{"train_info/time_between_train_steps": 0.0032205581665039062, "step": 1184} +{"info/global_step": 1185, "train_info/time_within_train_step": 2.286797046661377, "step": 1185} +{"train_info/time_between_train_steps": 0.003230571746826172, "step": 1185} +{"info/global_step": 1186, "train_info/time_within_train_step": 2.2873306274414062, "step": 1186} +{"train_info/time_between_train_steps": 0.003215789794921875, "step": 1186} +{"info/global_step": 1187, "train_info/time_within_train_step": 2.287411689758301, "step": 1187} +{"train_info/time_between_train_steps": 0.0031723976135253906, "step": 1187} +{"info/global_step": 1188, "train_info/time_within_train_step": 2.286879539489746, "step": 1188} +{"train_info/time_between_train_steps": 0.003154277801513672, "step": 1188} +{"info/global_step": 1189, "train_info/time_within_train_step": 2.2871429920196533, "step": 1189} +{"train_info/time_between_train_steps": 0.0032281875610351562, "step": 1189} +{"info/global_step": 1190, "train_info/time_within_train_step": 2.287132740020752, "step": 1190} +{"train_info/time_between_train_steps": 0.0032143592834472656, "step": 1190} +{"info/global_step": 1191, "train_info/time_within_train_step": 2.2868003845214844, "step": 1191} +{"train_info/time_between_train_steps": 0.0031592845916748047, "step": 1191} +{"info/global_step": 1192, "train_info/time_within_train_step": 2.286956310272217, "step": 1192} +{"train_info/time_between_train_steps": 0.003192901611328125, "step": 1192} +{"info/global_step": 1193, "train_info/time_within_train_step": 2.285801887512207, "step": 1193} +{"train_info/time_between_train_steps": 0.003176450729370117, "step": 1193} +{"info/global_step": 1194, "train_info/time_within_train_step": 2.2860679626464844, "step": 1194} +{"train_info/time_between_train_steps": 0.0032536983489990234, "step": 1194} +{"info/global_step": 1195, "train_info/time_within_train_step": 2.2870092391967773, "step": 1195} +{"train_info/time_between_train_steps": 0.003239870071411133, "step": 1195} +{"info/global_step": 1196, "train_info/time_within_train_step": 2.286968231201172, "step": 1196} +{"train_info/time_between_train_steps": 0.003275156021118164, "step": 1196} +{"info/global_step": 1197, "train_info/time_within_train_step": 2.286263942718506, "step": 1197} +{"train_info/time_between_train_steps": 0.003454923629760742, "step": 1197} +{"info/global_step": 1198, "train_info/time_within_train_step": 2.286825656890869, "step": 1198} +{"train_info/time_between_train_steps": 0.0033721923828125, "step": 1198} +{"info/global_step": 1199, "train_info/time_within_train_step": 2.286583662033081, "step": 1199} +{"train_info/time_between_train_steps": 0.003419160842895508, "step": 1199} +{"info/global_step": 1200, "train_info/time_within_train_step": 2.2869362831115723, "step": 1200} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746346861, "_runtime": 2958}, "step": 1200} +{"logs": {"train/loss": 3.8235, "train/learning_rate": 0.00039999999999999996, "train/epoch": 1.04, "_timestamp": 1746346861, "_runtime": 2958}, "step": 1200} +{"train_info/time_between_train_steps": 12.581591129302979, "step": 1200} +{"info/global_step": 1201, "train_info/time_within_train_step": 2.4235541820526123, "step": 1201} +{"train_info/time_between_train_steps": 0.003204822540283203, "step": 1201} +{"info/global_step": 1202, "train_info/time_within_train_step": 2.103959321975708, "step": 1202} +{"train_info/time_between_train_steps": 0.003172159194946289, "step": 1202} +{"info/global_step": 1203, "train_info/time_within_train_step": 2.1972641944885254, "step": 1203} +{"train_info/time_between_train_steps": 0.003145933151245117, "step": 1203} +{"info/global_step": 1204, "train_info/time_within_train_step": 2.2847025394439697, "step": 1204} +{"train_info/time_between_train_steps": 0.0031507015228271484, "step": 1204} +{"info/global_step": 1205, "train_info/time_within_train_step": 2.2852890491485596, "step": 1205} +{"train_info/time_between_train_steps": 0.0031664371490478516, "step": 1205} +{"info/global_step": 1206, "train_info/time_within_train_step": 2.285745143890381, "step": 1206} +{"train_info/time_between_train_steps": 0.0031638145446777344, "step": 1206} +{"info/global_step": 1207, "train_info/time_within_train_step": 2.287120819091797, "step": 1207} +{"train_info/time_between_train_steps": 0.003164529800415039, "step": 1207} +{"info/global_step": 1208, "train_info/time_within_train_step": 2.2870657444000244, "step": 1208} +{"train_info/time_between_train_steps": 0.0031871795654296875, "step": 1208} +{"info/global_step": 1209, "train_info/time_within_train_step": 2.2874133586883545, "step": 1209} +{"train_info/time_between_train_steps": 0.003171205520629883, "step": 1209} +{"info/global_step": 1210, "train_info/time_within_train_step": 2.287198066711426, "step": 1210} +{"train_info/time_between_train_steps": 0.0031783580780029297, "step": 1210} +{"info/global_step": 1211, "train_info/time_within_train_step": 2.2866768836975098, "step": 1211} +{"train_info/time_between_train_steps": 0.0031490325927734375, "step": 1211} +{"info/global_step": 1212, "train_info/time_within_train_step": 2.2875447273254395, "step": 1212} +{"train_info/time_between_train_steps": 0.003140687942504883, "step": 1212} +{"info/global_step": 1213, "train_info/time_within_train_step": 2.287400484085083, "step": 1213} +{"train_info/time_between_train_steps": 0.0032134056091308594, "step": 1213} +{"info/global_step": 1214, "train_info/time_within_train_step": 2.287769079208374, "step": 1214} +{"train_info/time_between_train_steps": 0.0031769275665283203, "step": 1214} +{"info/global_step": 1215, "train_info/time_within_train_step": 2.2877488136291504, "step": 1215} +{"train_info/time_between_train_steps": 0.003143787384033203, "step": 1215} +{"info/global_step": 1216, "train_info/time_within_train_step": 2.288174629211426, "step": 1216} +{"train_info/time_between_train_steps": 0.003160238265991211, "step": 1216} +{"info/global_step": 1217, "train_info/time_within_train_step": 2.2876415252685547, "step": 1217} +{"train_info/time_between_train_steps": 0.13883423805236816, "step": 1217} +{"info/global_step": 1218, "train_info/time_within_train_step": 2.2870445251464844, "step": 1218} +{"train_info/time_between_train_steps": 0.003129720687866211, "step": 1218} +{"info/global_step": 1219, "train_info/time_within_train_step": 2.286973237991333, "step": 1219} +{"train_info/time_between_train_steps": 0.0031299591064453125, "step": 1219} +{"info/global_step": 1220, "train_info/time_within_train_step": 2.2878055572509766, "step": 1220} +{"train_info/time_between_train_steps": 0.0031769275665283203, "step": 1220} +{"info/global_step": 1221, "train_info/time_within_train_step": 2.2873237133026123, "step": 1221} +{"train_info/time_between_train_steps": 0.0032036304473876953, "step": 1221} +{"info/global_step": 1222, "train_info/time_within_train_step": 2.286383867263794, "step": 1222} +{"train_info/time_between_train_steps": 0.003173828125, "step": 1222} +{"info/global_step": 1223, "train_info/time_within_train_step": 2.286668062210083, "step": 1223} +{"train_info/time_between_train_steps": 0.003161191940307617, "step": 1223} +{"info/global_step": 1224, "train_info/time_within_train_step": 2.2877089977264404, "step": 1224} +{"train_info/time_between_train_steps": 0.0031502246856689453, "step": 1224} +{"info/global_step": 1225, "train_info/time_within_train_step": 2.2871060371398926, "step": 1225} +{"train_info/time_between_train_steps": 0.0031414031982421875, "step": 1225} +{"info/global_step": 1226, "train_info/time_within_train_step": 2.3293731212615967, "step": 1226} +{"train_info/time_between_train_steps": 0.0031702518463134766, "step": 1226} +{"info/global_step": 1227, "train_info/time_within_train_step": 2.287673234939575, "step": 1227} +{"train_info/time_between_train_steps": 0.003145933151245117, "step": 1227} +{"info/global_step": 1228, "train_info/time_within_train_step": 2.287351131439209, "step": 1228} +{"train_info/time_between_train_steps": 0.0031585693359375, "step": 1228} +{"info/global_step": 1229, "train_info/time_within_train_step": 2.2875800132751465, "step": 1229} +{"train_info/time_between_train_steps": 0.0031957626342773438, "step": 1229} +{"info/global_step": 1230, "train_info/time_within_train_step": 2.2876932621002197, "step": 1230} +{"train_info/time_between_train_steps": 0.003204345703125, "step": 1230} +{"info/global_step": 1231, "train_info/time_within_train_step": 2.2879483699798584, "step": 1231} +{"train_info/time_between_train_steps": 0.003152132034301758, "step": 1231} +{"info/global_step": 1232, "train_info/time_within_train_step": 2.2872402667999268, "step": 1232} +{"train_info/time_between_train_steps": 0.0031816959381103516, "step": 1232} +{"info/global_step": 1233, "train_info/time_within_train_step": 2.2877604961395264, "step": 1233} +{"train_info/time_between_train_steps": 0.0032231807708740234, "step": 1233} +{"info/global_step": 1234, "train_info/time_within_train_step": 2.2878453731536865, "step": 1234} +{"train_info/time_between_train_steps": 0.003176450729370117, "step": 1234} +{"info/global_step": 1235, "train_info/time_within_train_step": 2.2870469093322754, "step": 1235} +{"train_info/time_between_train_steps": 0.003136873245239258, "step": 1235} +{"info/global_step": 1236, "train_info/time_within_train_step": 2.287273406982422, "step": 1236} +{"train_info/time_between_train_steps": 0.0031366348266601562, "step": 1236} +{"info/global_step": 1237, "train_info/time_within_train_step": 2.2868103981018066, "step": 1237} +{"train_info/time_between_train_steps": 0.003144979476928711, "step": 1237} +{"info/global_step": 1238, "train_info/time_within_train_step": 2.287277936935425, "step": 1238} +{"train_info/time_between_train_steps": 0.0031452178955078125, "step": 1238} +{"info/global_step": 1239, "train_info/time_within_train_step": 2.287491798400879, "step": 1239} +{"train_info/time_between_train_steps": 0.0031592845916748047, "step": 1239} +{"info/global_step": 1240, "train_info/time_within_train_step": 2.2867162227630615, "step": 1240} +{"train_info/time_between_train_steps": 0.0031516551971435547, "step": 1240} +{"info/global_step": 1241, "train_info/time_within_train_step": 2.2875659465789795, "step": 1241} +{"train_info/time_between_train_steps": 0.003184795379638672, "step": 1241} +{"info/global_step": 1242, "train_info/time_within_train_step": 2.2871081829071045, "step": 1242} +{"train_info/time_between_train_steps": 0.0031464099884033203, "step": 1242} +{"info/global_step": 1243, "train_info/time_within_train_step": 2.2872536182403564, "step": 1243} +{"train_info/time_between_train_steps": 0.003150463104248047, "step": 1243} +{"info/global_step": 1244, "train_info/time_within_train_step": 2.286616325378418, "step": 1244} +{"train_info/time_between_train_steps": 0.003168821334838867, "step": 1244} +{"info/global_step": 1245, "train_info/time_within_train_step": 2.2867259979248047, "step": 1245} +{"train_info/time_between_train_steps": 0.0033783912658691406, "step": 1245} +{"info/global_step": 1246, "train_info/time_within_train_step": 2.2874059677124023, "step": 1246} +{"train_info/time_between_train_steps": 0.003177642822265625, "step": 1246} +{"info/global_step": 1247, "train_info/time_within_train_step": 2.287708044052124, "step": 1247} +{"train_info/time_between_train_steps": 0.003160238265991211, "step": 1247} +{"info/global_step": 1248, "train_info/time_within_train_step": 2.2875301837921143, "step": 1248} +{"train_info/time_between_train_steps": 0.0031495094299316406, "step": 1248} +{"info/global_step": 1249, "train_info/time_within_train_step": 2.288039207458496, "step": 1249} +{"train_info/time_between_train_steps": 0.0031363964080810547, "step": 1249} +{"info/global_step": 1250, "train_info/time_within_train_step": 2.65439510345459, "step": 1250} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746346990, "_runtime": 3087}, "step": 1250} +{"logs": {"train/loss": 3.7888, "train/learning_rate": 0.00038888888888888887, "train/epoch": 1.05, "_timestamp": 1746346990, "_runtime": 3087}, "step": 1250} +{"train_info/time_between_train_steps": 0.02462148666381836, "step": 1250} +{"info/global_step": 1251, "train_info/time_within_train_step": 2.287383794784546, "step": 1251} +{"train_info/time_between_train_steps": 0.0031671524047851562, "step": 1251} +{"info/global_step": 1252, "train_info/time_within_train_step": 2.2875425815582275, "step": 1252} +{"train_info/time_between_train_steps": 0.0032074451446533203, "step": 1252} +{"info/global_step": 1253, "train_info/time_within_train_step": 2.287757158279419, "step": 1253} +{"train_info/time_between_train_steps": 0.003251314163208008, "step": 1253} +{"info/global_step": 1254, "train_info/time_within_train_step": 2.5051839351654053, "step": 1254} +{"train_info/time_between_train_steps": 0.0031805038452148438, "step": 1254} +{"info/global_step": 1255, "train_info/time_within_train_step": 2.287973642349243, "step": 1255} +{"train_info/time_between_train_steps": 0.0031385421752929688, "step": 1255} +{"info/global_step": 1256, "train_info/time_within_train_step": 2.2880537509918213, "step": 1256} +{"train_info/time_between_train_steps": 0.003149271011352539, "step": 1256} +{"info/global_step": 1257, "train_info/time_within_train_step": 2.28810453414917, "step": 1257} +{"train_info/time_between_train_steps": 0.0031342506408691406, "step": 1257} +{"info/global_step": 1258, "train_info/time_within_train_step": 2.2874562740325928, "step": 1258} +{"train_info/time_between_train_steps": 0.003170013427734375, "step": 1258} +{"info/global_step": 1259, "train_info/time_within_train_step": 2.28733491897583, "step": 1259} +{"train_info/time_between_train_steps": 0.0031507015228271484, "step": 1259} +{"info/global_step": 1260, "train_info/time_within_train_step": 2.287050485610962, "step": 1260} +{"train_info/time_between_train_steps": 0.003201723098754883, "step": 1260} +{"info/global_step": 1261, "train_info/time_within_train_step": 2.2869575023651123, "step": 1261} +{"train_info/time_between_train_steps": 0.0031185150146484375, "step": 1261} +{"info/global_step": 1262, "train_info/time_within_train_step": 2.2874016761779785, "step": 1262} +{"train_info/time_between_train_steps": 0.0031032562255859375, "step": 1262} +{"info/global_step": 1263, "train_info/time_within_train_step": 2.28657603263855, "step": 1263} +{"train_info/time_between_train_steps": 0.0031642913818359375, "step": 1263} +{"info/global_step": 1264, "train_info/time_within_train_step": 2.287304401397705, "step": 1264} +{"train_info/time_between_train_steps": 0.0031366348266601562, "step": 1264} +{"info/global_step": 1265, "train_info/time_within_train_step": 2.287109613418579, "step": 1265} +{"train_info/time_between_train_steps": 0.003149747848510742, "step": 1265} +{"info/global_step": 1266, "train_info/time_within_train_step": 2.287494421005249, "step": 1266} +{"train_info/time_between_train_steps": 0.003162860870361328, "step": 1266} +{"info/global_step": 1267, "train_info/time_within_train_step": 2.2872934341430664, "step": 1267} +{"train_info/time_between_train_steps": 0.0031480789184570312, "step": 1267} +{"info/global_step": 1268, "train_info/time_within_train_step": 2.286773443222046, "step": 1268} +{"train_info/time_between_train_steps": 0.003155231475830078, "step": 1268} +{"info/global_step": 1269, "train_info/time_within_train_step": 2.2870326042175293, "step": 1269} +{"train_info/time_between_train_steps": 0.0031409263610839844, "step": 1269} +{"info/global_step": 1270, "train_info/time_within_train_step": 2.287278652191162, "step": 1270} +{"train_info/time_between_train_steps": 0.003152608871459961, "step": 1270} +{"info/global_step": 1271, "train_info/time_within_train_step": 2.2874860763549805, "step": 1271} +{"train_info/time_between_train_steps": 0.0031151771545410156, "step": 1271} +{"info/global_step": 1272, "train_info/time_within_train_step": 2.287147045135498, "step": 1272} +{"train_info/time_between_train_steps": 0.0031349658966064453, "step": 1272} +{"info/global_step": 1273, "train_info/time_within_train_step": 2.28727388381958, "step": 1273} +{"train_info/time_between_train_steps": 0.0031576156616210938, "step": 1273} +{"info/global_step": 1274, "train_info/time_within_train_step": 2.2871437072753906, "step": 1274} +{"train_info/time_between_train_steps": 0.003103971481323242, "step": 1274} +{"info/global_step": 1275, "train_info/time_within_train_step": 2.2877256870269775, "step": 1275} +{"train_info/time_between_train_steps": 0.0032019615173339844, "step": 1275} +{"info/global_step": 1276, "train_info/time_within_train_step": 2.2880828380584717, "step": 1276} +{"train_info/time_between_train_steps": 0.00316619873046875, "step": 1276} +{"info/global_step": 1277, "train_info/time_within_train_step": 2.287811279296875, "step": 1277} +{"train_info/time_between_train_steps": 0.003183603286743164, "step": 1277} +{"info/global_step": 1278, "train_info/time_within_train_step": 2.2884387969970703, "step": 1278} +{"train_info/time_between_train_steps": 0.0031414031982421875, "step": 1278} +{"info/global_step": 1279, "train_info/time_within_train_step": 2.287642002105713, "step": 1279} +{"train_info/time_between_train_steps": 0.0031099319458007812, "step": 1279} +{"info/global_step": 1280, "train_info/time_within_train_step": 2.4310073852539062, "step": 1280} +{"train_info/time_between_train_steps": 0.003145933151245117, "step": 1280} +{"info/global_step": 1281, "train_info/time_within_train_step": 2.2873356342315674, "step": 1281} +{"train_info/time_between_train_steps": 0.0031387805938720703, "step": 1281} +{"info/global_step": 1282, "train_info/time_within_train_step": 2.2868826389312744, "step": 1282} +{"train_info/time_between_train_steps": 0.003202199935913086, "step": 1282} +{"info/global_step": 1283, "train_info/time_within_train_step": 2.2872354984283447, "step": 1283} +{"train_info/time_between_train_steps": 0.003218412399291992, "step": 1283} +{"info/global_step": 1284, "train_info/time_within_train_step": 2.2874672412872314, "step": 1284} +{"train_info/time_between_train_steps": 0.003194570541381836, "step": 1284} +{"info/global_step": 1285, "train_info/time_within_train_step": 2.2868762016296387, "step": 1285} +{"train_info/time_between_train_steps": 0.003131389617919922, "step": 1285} +{"info/global_step": 1286, "train_info/time_within_train_step": 2.2869129180908203, "step": 1286} +{"train_info/time_between_train_steps": 0.003153085708618164, "step": 1286} +{"info/global_step": 1287, "train_info/time_within_train_step": 2.287186622619629, "step": 1287} +{"train_info/time_between_train_steps": 0.003126859664916992, "step": 1287} +{"info/global_step": 1288, "train_info/time_within_train_step": 2.2865147590637207, "step": 1288} +{"train_info/time_between_train_steps": 0.003173351287841797, "step": 1288} +{"info/global_step": 1289, "train_info/time_within_train_step": 2.2863173484802246, "step": 1289} +{"train_info/time_between_train_steps": 0.0031414031982421875, "step": 1289} +{"info/global_step": 1290, "train_info/time_within_train_step": 2.2861990928649902, "step": 1290} +{"train_info/time_between_train_steps": 0.0031456947326660156, "step": 1290} +{"info/global_step": 1291, "train_info/time_within_train_step": 2.285799026489258, "step": 1291} +{"train_info/time_between_train_steps": 0.0031719207763671875, "step": 1291} +{"info/global_step": 1292, "train_info/time_within_train_step": 2.5014326572418213, "step": 1292} +{"train_info/time_between_train_steps": 0.0032291412353515625, "step": 1292} +{"info/global_step": 1293, "train_info/time_within_train_step": 2.2878928184509277, "step": 1293} +{"train_info/time_between_train_steps": 0.003181934356689453, "step": 1293} +{"info/global_step": 1294, "train_info/time_within_train_step": 2.287355661392212, "step": 1294} +{"train_info/time_between_train_steps": 0.0031392574310302734, "step": 1294} +{"info/global_step": 1295, "train_info/time_within_train_step": 2.2873923778533936, "step": 1295} +{"train_info/time_between_train_steps": 0.0031692981719970703, "step": 1295} +{"info/global_step": 1296, "train_info/time_within_train_step": 2.287053346633911, "step": 1296} +{"train_info/time_between_train_steps": 0.0031402111053466797, "step": 1296} +{"info/global_step": 1297, "train_info/time_within_train_step": 2.2875540256500244, "step": 1297} +{"train_info/time_between_train_steps": 0.0031468868255615234, "step": 1297} +{"info/global_step": 1298, "train_info/time_within_train_step": 2.287118673324585, "step": 1298} +{"train_info/time_between_train_steps": 0.003143310546875, "step": 1298} +{"info/global_step": 1299, "train_info/time_within_train_step": 2.287357807159424, "step": 1299} +{"train_info/time_between_train_steps": 0.0031714439392089844, "step": 1299} +{"info/global_step": 1300, "train_info/time_within_train_step": 2.287626266479492, "step": 1300} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746347106, "_runtime": 3203}, "step": 1300} +{"logs": {"train/loss": 3.7616, "train/learning_rate": 0.00037777777777777777, "train/epoch": 1.07, "_timestamp": 1746347106, "_runtime": 3203}, "step": 1300} +{"train_info/time_between_train_steps": 12.001736402511597, "step": 1300} +{"info/global_step": 1301, "train_info/time_within_train_step": 2.117476463317871, "step": 1301} +{"train_info/time_between_train_steps": 0.003168821334838867, "step": 1301} +{"info/global_step": 1302, "train_info/time_within_train_step": 2.0993454456329346, "step": 1302} +{"train_info/time_between_train_steps": 0.0031371116638183594, "step": 1302} +{"info/global_step": 1303, "train_info/time_within_train_step": 2.2272331714630127, "step": 1303} +{"train_info/time_between_train_steps": 0.0031104087829589844, "step": 1303} +{"info/global_step": 1304, "train_info/time_within_train_step": 2.2829625606536865, "step": 1304} +{"train_info/time_between_train_steps": 0.0031278133392333984, "step": 1304} +{"info/global_step": 1305, "train_info/time_within_train_step": 2.2837555408477783, "step": 1305} +{"train_info/time_between_train_steps": 0.0031163692474365234, "step": 1305} +{"info/global_step": 1306, "train_info/time_within_train_step": 2.2843821048736572, "step": 1306} +{"train_info/time_between_train_steps": 0.003156900405883789, "step": 1306} +{"info/global_step": 1307, "train_info/time_within_train_step": 2.2849206924438477, "step": 1307} +{"train_info/time_between_train_steps": 0.0031070709228515625, "step": 1307} +{"info/global_step": 1308, "train_info/time_within_train_step": 2.2852725982666016, "step": 1308} +{"train_info/time_between_train_steps": 0.003111124038696289, "step": 1308} +{"info/global_step": 1309, "train_info/time_within_train_step": 2.2851977348327637, "step": 1309} +{"train_info/time_between_train_steps": 0.0031571388244628906, "step": 1309} +{"info/global_step": 1310, "train_info/time_within_train_step": 2.2860803604125977, "step": 1310} +{"train_info/time_between_train_steps": 0.0031511783599853516, "step": 1310} +{"info/global_step": 1311, "train_info/time_within_train_step": 2.286010265350342, "step": 1311} +{"train_info/time_between_train_steps": 0.0031425952911376953, "step": 1311} +{"info/global_step": 1312, "train_info/time_within_train_step": 2.2913055419921875, "step": 1312} +{"train_info/time_between_train_steps": 0.003149271011352539, "step": 1312} +{"info/global_step": 1313, "train_info/time_within_train_step": 2.2868423461914062, "step": 1313} +{"train_info/time_between_train_steps": 0.003133535385131836, "step": 1313} +{"info/global_step": 1314, "train_info/time_within_train_step": 2.286702871322632, "step": 1314} +{"train_info/time_between_train_steps": 0.00315093994140625, "step": 1314} +{"info/global_step": 1315, "train_info/time_within_train_step": 2.286851644515991, "step": 1315} +{"train_info/time_between_train_steps": 0.003142833709716797, "step": 1315} +{"info/global_step": 1316, "train_info/time_within_train_step": 2.287160873413086, "step": 1316} +{"train_info/time_between_train_steps": 0.003137350082397461, "step": 1316} +{"info/global_step": 1317, "train_info/time_within_train_step": 2.2872493267059326, "step": 1317} +{"train_info/time_between_train_steps": 0.003170490264892578, "step": 1317} +{"info/global_step": 1318, "train_info/time_within_train_step": 2.286912441253662, "step": 1318} +{"train_info/time_between_train_steps": 0.0031480789184570312, "step": 1318} +{"info/global_step": 1319, "train_info/time_within_train_step": 2.2872023582458496, "step": 1319} +{"train_info/time_between_train_steps": 0.0031304359436035156, "step": 1319} +{"info/global_step": 1320, "train_info/time_within_train_step": 2.2870943546295166, "step": 1320} +{"train_info/time_between_train_steps": 0.0031282901763916016, "step": 1320} +{"info/global_step": 1321, "train_info/time_within_train_step": 2.2863171100616455, "step": 1321} +{"train_info/time_between_train_steps": 0.003117799758911133, "step": 1321} +{"info/global_step": 1322, "train_info/time_within_train_step": 2.2859156131744385, "step": 1322} +{"train_info/time_between_train_steps": 0.003107786178588867, "step": 1322} +{"info/global_step": 1323, "train_info/time_within_train_step": 2.286104917526245, "step": 1323} +{"train_info/time_between_train_steps": 0.003099679946899414, "step": 1323} +{"info/global_step": 1324, "train_info/time_within_train_step": 2.2867448329925537, "step": 1324} +{"train_info/time_between_train_steps": 0.0031325817108154297, "step": 1324} +{"info/global_step": 1325, "train_info/time_within_train_step": 2.285749673843384, "step": 1325} +{"train_info/time_between_train_steps": 0.003216981887817383, "step": 1325} +{"info/global_step": 1326, "train_info/time_within_train_step": 2.2862548828125, "step": 1326} +{"train_info/time_between_train_steps": 0.0031664371490478516, "step": 1326} +{"info/global_step": 1327, "train_info/time_within_train_step": 2.285722255706787, "step": 1327} +{"train_info/time_between_train_steps": 0.003143310546875, "step": 1327} +{"info/global_step": 1328, "train_info/time_within_train_step": 2.2855730056762695, "step": 1328} +{"train_info/time_between_train_steps": 0.0031096935272216797, "step": 1328} +{"info/global_step": 1329, "train_info/time_within_train_step": 2.2860660552978516, "step": 1329} +{"train_info/time_between_train_steps": 0.0036623477935791016, "step": 1329} +{"info/global_step": 1330, "train_info/time_within_train_step": 2.286086082458496, "step": 1330} +{"train_info/time_between_train_steps": 0.003103971481323242, "step": 1330} +{"info/global_step": 1331, "train_info/time_within_train_step": 2.286306619644165, "step": 1331} +{"train_info/time_between_train_steps": 0.0030863285064697266, "step": 1331} +{"info/global_step": 1332, "train_info/time_within_train_step": 2.2864198684692383, "step": 1332} +{"train_info/time_between_train_steps": 0.0032372474670410156, "step": 1332} +{"info/global_step": 1333, "train_info/time_within_train_step": 2.287104606628418, "step": 1333} +{"train_info/time_between_train_steps": 0.0031342506408691406, "step": 1333} +{"info/global_step": 1334, "train_info/time_within_train_step": 2.2872369289398193, "step": 1334} +{"train_info/time_between_train_steps": 0.003113985061645508, "step": 1334} +{"info/global_step": 1335, "train_info/time_within_train_step": 2.2869231700897217, "step": 1335} +{"train_info/time_between_train_steps": 0.003129243850708008, "step": 1335} +{"info/global_step": 1336, "train_info/time_within_train_step": 2.287116765975952, "step": 1336} +{"train_info/time_between_train_steps": 0.003112316131591797, "step": 1336} +{"info/global_step": 1337, "train_info/time_within_train_step": 2.286357879638672, "step": 1337} +{"train_info/time_between_train_steps": 0.0031821727752685547, "step": 1337} +{"info/global_step": 1338, "train_info/time_within_train_step": 2.2924680709838867, "step": 1338} +{"train_info/time_between_train_steps": 0.0031082630157470703, "step": 1338} +{"info/global_step": 1339, "train_info/time_within_train_step": 2.2875781059265137, "step": 1339} +{"train_info/time_between_train_steps": 0.003131389617919922, "step": 1339} +{"info/global_step": 1340, "train_info/time_within_train_step": 2.2871901988983154, "step": 1340} +{"train_info/time_between_train_steps": 0.0031545162200927734, "step": 1340} +{"info/global_step": 1341, "train_info/time_within_train_step": 2.2879433631896973, "step": 1341} +{"train_info/time_between_train_steps": 0.0031189918518066406, "step": 1341} +{"info/global_step": 1342, "train_info/time_within_train_step": 2.285872220993042, "step": 1342} +{"train_info/time_between_train_steps": 0.12274026870727539, "step": 1342} +{"info/global_step": 1343, "train_info/time_within_train_step": 2.2864632606506348, "step": 1343} +{"train_info/time_between_train_steps": 0.003161191940307617, "step": 1343} +{"info/global_step": 1344, "train_info/time_within_train_step": 2.2855191230773926, "step": 1344} +{"train_info/time_between_train_steps": 0.003154277801513672, "step": 1344} +{"info/global_step": 1345, "train_info/time_within_train_step": 2.2850637435913086, "step": 1345} +{"train_info/time_between_train_steps": 0.003159761428833008, "step": 1345} +{"info/global_step": 1346, "train_info/time_within_train_step": 2.2859418392181396, "step": 1346} +{"train_info/time_between_train_steps": 0.003161191940307617, "step": 1346} +{"info/global_step": 1347, "train_info/time_within_train_step": 2.285402297973633, "step": 1347} +{"train_info/time_between_train_steps": 0.003118276596069336, "step": 1347} +{"info/global_step": 1348, "train_info/time_within_train_step": 2.5066635608673096, "step": 1348} +{"train_info/time_between_train_steps": 0.003170013427734375, "step": 1348} +{"info/global_step": 1349, "train_info/time_within_train_step": 2.285863161087036, "step": 1349} +{"train_info/time_between_train_steps": 0.003327608108520508, "step": 1349} +{"info/global_step": 1350, "train_info/time_within_train_step": 2.286709785461426, "step": 1350} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746347233, "_runtime": 3330}, "step": 1350} +{"logs": {"train/loss": 3.7324, "train/learning_rate": 0.00036666666666666667, "train/epoch": 1.09, "_timestamp": 1746347233, "_runtime": 3330}, "step": 1350} +{"train_info/time_between_train_steps": 0.02504277229309082, "step": 1350} +{"info/global_step": 1351, "train_info/time_within_train_step": 2.2875123023986816, "step": 1351} +{"train_info/time_between_train_steps": 0.003152132034301758, "step": 1351} +{"info/global_step": 1352, "train_info/time_within_train_step": 2.287222385406494, "step": 1352} +{"train_info/time_between_train_steps": 0.003152608871459961, "step": 1352} +{"info/global_step": 1353, "train_info/time_within_train_step": 2.287081480026245, "step": 1353} +{"train_info/time_between_train_steps": 0.003203153610229492, "step": 1353} +{"info/global_step": 1354, "train_info/time_within_train_step": 2.286999464035034, "step": 1354} +{"train_info/time_between_train_steps": 0.0031762123107910156, "step": 1354} +{"info/global_step": 1355, "train_info/time_within_train_step": 2.2866735458374023, "step": 1355} +{"train_info/time_between_train_steps": 0.003184080123901367, "step": 1355} +{"info/global_step": 1356, "train_info/time_within_train_step": 2.2873077392578125, "step": 1356} +{"train_info/time_between_train_steps": 0.0032715797424316406, "step": 1356} +{"info/global_step": 1357, "train_info/time_within_train_step": 2.2878401279449463, "step": 1357} +{"train_info/time_between_train_steps": 0.0031876564025878906, "step": 1357} +{"info/global_step": 1358, "train_info/time_within_train_step": 2.2876291275024414, "step": 1358} +{"train_info/time_between_train_steps": 0.0032122135162353516, "step": 1358} +{"info/global_step": 1359, "train_info/time_within_train_step": 2.2866969108581543, "step": 1359} +{"train_info/time_between_train_steps": 0.003158092498779297, "step": 1359} +{"info/global_step": 1360, "train_info/time_within_train_step": 2.2869699001312256, "step": 1360} +{"train_info/time_between_train_steps": 0.00315093994140625, "step": 1360} +{"info/global_step": 1361, "train_info/time_within_train_step": 2.2874255180358887, "step": 1361} +{"train_info/time_between_train_steps": 0.0031747817993164062, "step": 1361} +{"info/global_step": 1362, "train_info/time_within_train_step": 2.2861385345458984, "step": 1362} +{"train_info/time_between_train_steps": 0.0031440258026123047, "step": 1362} +{"info/global_step": 1363, "train_info/time_within_train_step": 2.2866718769073486, "step": 1363} +{"train_info/time_between_train_steps": 0.0031659603118896484, "step": 1363} +{"info/global_step": 1364, "train_info/time_within_train_step": 2.286311388015747, "step": 1364} +{"train_info/time_between_train_steps": 0.003144502639770508, "step": 1364} +{"info/global_step": 1365, "train_info/time_within_train_step": 2.2855050563812256, "step": 1365} +{"train_info/time_between_train_steps": 0.003194093704223633, "step": 1365} +{"info/global_step": 1366, "train_info/time_within_train_step": 2.2856953144073486, "step": 1366} +{"train_info/time_between_train_steps": 0.003154754638671875, "step": 1366} +{"info/global_step": 1367, "train_info/time_within_train_step": 2.285961151123047, "step": 1367} +{"train_info/time_between_train_steps": 0.0031554698944091797, "step": 1367} +{"info/global_step": 1368, "train_info/time_within_train_step": 2.286109685897827, "step": 1368} +{"train_info/time_between_train_steps": 0.0031545162200927734, "step": 1368} +{"info/global_step": 1369, "train_info/time_within_train_step": 2.2863004207611084, "step": 1369} +{"train_info/time_between_train_steps": 0.003142118453979492, "step": 1369} +{"info/global_step": 1370, "train_info/time_within_train_step": 2.2853636741638184, "step": 1370} +{"train_info/time_between_train_steps": 0.0031456947326660156, "step": 1370} +{"info/global_step": 1371, "train_info/time_within_train_step": 2.286006212234497, "step": 1371} +{"train_info/time_between_train_steps": 0.0031576156616210938, "step": 1371} +{"info/global_step": 1372, "train_info/time_within_train_step": 2.286144971847534, "step": 1372} +{"train_info/time_between_train_steps": 0.0031728744506835938, "step": 1372} +{"info/global_step": 1373, "train_info/time_within_train_step": 2.286851167678833, "step": 1373} +{"train_info/time_between_train_steps": 0.00318145751953125, "step": 1373} +{"info/global_step": 1374, "train_info/time_within_train_step": 2.2862889766693115, "step": 1374} +{"train_info/time_between_train_steps": 0.0031723976135253906, "step": 1374} +{"info/global_step": 1375, "train_info/time_within_train_step": 2.286372423171997, "step": 1375} +{"train_info/time_between_train_steps": 0.0031402111053466797, "step": 1375} +{"info/global_step": 1376, "train_info/time_within_train_step": 2.286982774734497, "step": 1376} +{"train_info/time_between_train_steps": 0.003121614456176758, "step": 1376} +{"info/global_step": 1377, "train_info/time_within_train_step": 2.2869770526885986, "step": 1377} +{"train_info/time_between_train_steps": 0.003111124038696289, "step": 1377} +{"info/global_step": 1378, "train_info/time_within_train_step": 2.286550998687744, "step": 1378} +{"train_info/time_between_train_steps": 0.003090381622314453, "step": 1378} +{"info/global_step": 1379, "train_info/time_within_train_step": 2.286406993865967, "step": 1379} +{"train_info/time_between_train_steps": 0.0031418800354003906, "step": 1379} +{"info/global_step": 1380, "train_info/time_within_train_step": 2.2871298789978027, "step": 1380} +{"train_info/time_between_train_steps": 0.003130197525024414, "step": 1380} +{"info/global_step": 1381, "train_info/time_within_train_step": 2.286226272583008, "step": 1381} +{"train_info/time_between_train_steps": 0.0031440258026123047, "step": 1381} +{"info/global_step": 1382, "train_info/time_within_train_step": 2.285865545272827, "step": 1382} +{"train_info/time_between_train_steps": 0.003130197525024414, "step": 1382} +{"info/global_step": 1383, "train_info/time_within_train_step": 2.286245822906494, "step": 1383} +{"train_info/time_between_train_steps": 0.0031266212463378906, "step": 1383} +{"info/global_step": 1384, "train_info/time_within_train_step": 2.2864840030670166, "step": 1384} +{"train_info/time_between_train_steps": 0.0031366348266601562, "step": 1384} +{"info/global_step": 1385, "train_info/time_within_train_step": 2.285543918609619, "step": 1385} +{"train_info/time_between_train_steps": 0.0031118392944335938, "step": 1385} +{"info/global_step": 1386, "train_info/time_within_train_step": 2.2859747409820557, "step": 1386} +{"train_info/time_between_train_steps": 0.0031070709228515625, "step": 1386} +{"info/global_step": 1387, "train_info/time_within_train_step": 2.5092031955718994, "step": 1387} +{"train_info/time_between_train_steps": 0.0031042098999023438, "step": 1387} +{"info/global_step": 1388, "train_info/time_within_train_step": 2.2854013442993164, "step": 1388} +{"train_info/time_between_train_steps": 0.003141164779663086, "step": 1388} +{"info/global_step": 1389, "train_info/time_within_train_step": 2.2849819660186768, "step": 1389} +{"train_info/time_between_train_steps": 0.0031325817108154297, "step": 1389} +{"info/global_step": 1390, "train_info/time_within_train_step": 2.285984754562378, "step": 1390} +{"train_info/time_between_train_steps": 0.0031185150146484375, "step": 1390} +{"info/global_step": 1391, "train_info/time_within_train_step": 2.2857489585876465, "step": 1391} +{"train_info/time_between_train_steps": 0.0031251907348632812, "step": 1391} +{"info/global_step": 1392, "train_info/time_within_train_step": 2.285853147506714, "step": 1392} +{"train_info/time_between_train_steps": 0.0031108856201171875, "step": 1392} +{"info/global_step": 1393, "train_info/time_within_train_step": 2.2857162952423096, "step": 1393} +{"train_info/time_between_train_steps": 0.0031707286834716797, "step": 1393} +{"info/global_step": 1394, "train_info/time_within_train_step": 2.2863047122955322, "step": 1394} +{"train_info/time_between_train_steps": 0.003139495849609375, "step": 1394} +{"info/global_step": 1395, "train_info/time_within_train_step": 2.286418914794922, "step": 1395} +{"train_info/time_between_train_steps": 0.0031065940856933594, "step": 1395} +{"info/global_step": 1396, "train_info/time_within_train_step": 2.2868010997772217, "step": 1396} +{"train_info/time_between_train_steps": 0.0031609535217285156, "step": 1396} +{"info/global_step": 1397, "train_info/time_within_train_step": 2.2865800857543945, "step": 1397} +{"train_info/time_between_train_steps": 0.0031425952911376953, "step": 1397} +{"info/global_step": 1398, "train_info/time_within_train_step": 2.286235809326172, "step": 1398} +{"train_info/time_between_train_steps": 0.0031740665435791016, "step": 1398} +{"info/global_step": 1399, "train_info/time_within_train_step": 2.2864937782287598, "step": 1399} +{"train_info/time_between_train_steps": 0.003117799758911133, "step": 1399} +{"info/global_step": 1400, "train_info/time_within_train_step": 2.285926342010498, "step": 1400} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746347349, "_runtime": 3446}, "step": 1400} +{"logs": {"train/loss": 3.7167, "train/learning_rate": 0.0003555555555555555, "train/epoch": 1.1, "_timestamp": 1746347349, "_runtime": 3446}, "step": 1400} +{"train_info/time_between_train_steps": 11.887185335159302, "step": 1400} +{"info/global_step": 1401, "train_info/time_within_train_step": 2.115710496902466, "step": 1401} +{"train_info/time_between_train_steps": 0.003168821334838867, "step": 1401} +{"info/global_step": 1402, "train_info/time_within_train_step": 2.095954418182373, "step": 1402} +{"train_info/time_between_train_steps": 0.003186941146850586, "step": 1402} +{"info/global_step": 1403, "train_info/time_within_train_step": 2.221346855163574, "step": 1403} +{"train_info/time_between_train_steps": 0.003153085708618164, "step": 1403} +{"info/global_step": 1404, "train_info/time_within_train_step": 2.283172607421875, "step": 1404} +{"train_info/time_between_train_steps": 0.0031380653381347656, "step": 1404} +{"info/global_step": 1405, "train_info/time_within_train_step": 2.4071130752563477, "step": 1405} +{"train_info/time_between_train_steps": 0.003164529800415039, "step": 1405} +{"info/global_step": 1406, "train_info/time_within_train_step": 2.2855000495910645, "step": 1406} +{"train_info/time_between_train_steps": 0.003175020217895508, "step": 1406} +{"info/global_step": 1407, "train_info/time_within_train_step": 2.2853050231933594, "step": 1407} +{"train_info/time_between_train_steps": 0.003131389617919922, "step": 1407} +{"info/global_step": 1408, "train_info/time_within_train_step": 2.2855422496795654, "step": 1408} +{"train_info/time_between_train_steps": 0.0031538009643554688, "step": 1408} +{"info/global_step": 1409, "train_info/time_within_train_step": 2.2857871055603027, "step": 1409} +{"train_info/time_between_train_steps": 0.0031664371490478516, "step": 1409} +{"info/global_step": 1410, "train_info/time_within_train_step": 2.285977602005005, "step": 1410} +{"train_info/time_between_train_steps": 0.003127574920654297, "step": 1410} +{"info/global_step": 1411, "train_info/time_within_train_step": 2.2857978343963623, "step": 1411} +{"train_info/time_between_train_steps": 0.003110170364379883, "step": 1411} +{"info/global_step": 1412, "train_info/time_within_train_step": 2.286410331726074, "step": 1412} +{"train_info/time_between_train_steps": 0.003100156784057617, "step": 1412} +{"info/global_step": 1413, "train_info/time_within_train_step": 2.2865681648254395, "step": 1413} +{"train_info/time_between_train_steps": 0.0031499862670898438, "step": 1413} +{"info/global_step": 1414, "train_info/time_within_train_step": 2.2861998081207275, "step": 1414} +{"train_info/time_between_train_steps": 0.003111600875854492, "step": 1414} +{"info/global_step": 1415, "train_info/time_within_train_step": 2.2859551906585693, "step": 1415} +{"train_info/time_between_train_steps": 0.0031185150146484375, "step": 1415} +{"info/global_step": 1416, "train_info/time_within_train_step": 2.285963773727417, "step": 1416} +{"train_info/time_between_train_steps": 0.003157377243041992, "step": 1416} +{"info/global_step": 1417, "train_info/time_within_train_step": 2.2858972549438477, "step": 1417} +{"train_info/time_between_train_steps": 0.003149747848510742, "step": 1417} +{"info/global_step": 1418, "train_info/time_within_train_step": 2.2863776683807373, "step": 1418} +{"train_info/time_between_train_steps": 0.003147602081298828, "step": 1418} +{"info/global_step": 1419, "train_info/time_within_train_step": 2.2861928939819336, "step": 1419} +{"train_info/time_between_train_steps": 0.0031366348266601562, "step": 1419} +{"info/global_step": 1420, "train_info/time_within_train_step": 2.2863175868988037, "step": 1420} +{"train_info/time_between_train_steps": 0.0031118392944335938, "step": 1420} +{"info/global_step": 1421, "train_info/time_within_train_step": 2.286104917526245, "step": 1421} +{"train_info/time_between_train_steps": 0.003106832504272461, "step": 1421} +{"info/global_step": 1422, "train_info/time_within_train_step": 2.2862541675567627, "step": 1422} +{"train_info/time_between_train_steps": 0.0031099319458007812, "step": 1422} +{"info/global_step": 1423, "train_info/time_within_train_step": 2.286529302597046, "step": 1423} +{"train_info/time_between_train_steps": 0.003118753433227539, "step": 1423} +{"info/global_step": 1424, "train_info/time_within_train_step": 2.2867162227630615, "step": 1424} +{"train_info/time_between_train_steps": 0.003226041793823242, "step": 1424} +{"info/global_step": 1425, "train_info/time_within_train_step": 2.2865850925445557, "step": 1425} +{"train_info/time_between_train_steps": 0.003165006637573242, "step": 1425} +{"info/global_step": 1426, "train_info/time_within_train_step": 2.2867677211761475, "step": 1426} +{"train_info/time_between_train_steps": 0.003201723098754883, "step": 1426} +{"info/global_step": 1427, "train_info/time_within_train_step": 2.286461591720581, "step": 1427} +{"train_info/time_between_train_steps": 0.003161191940307617, "step": 1427} +{"info/global_step": 1428, "train_info/time_within_train_step": 2.286325693130493, "step": 1428} +{"train_info/time_between_train_steps": 0.0031309127807617188, "step": 1428} +{"info/global_step": 1429, "train_info/time_within_train_step": 2.2866077423095703, "step": 1429} +{"train_info/time_between_train_steps": 0.003142833709716797, "step": 1429} +{"info/global_step": 1430, "train_info/time_within_train_step": 2.287733554840088, "step": 1430} +{"train_info/time_between_train_steps": 0.003142118453979492, "step": 1430} +{"info/global_step": 1431, "train_info/time_within_train_step": 2.2863335609436035, "step": 1431} +{"train_info/time_between_train_steps": 0.0031442642211914062, "step": 1431} +{"info/global_step": 1432, "train_info/time_within_train_step": 2.2868659496307373, "step": 1432} +{"train_info/time_between_train_steps": 0.0031991004943847656, "step": 1432} +{"info/global_step": 1433, "train_info/time_within_train_step": 2.286752700805664, "step": 1433} +{"train_info/time_between_train_steps": 0.003171682357788086, "step": 1433} +{"info/global_step": 1434, "train_info/time_within_train_step": 2.286839485168457, "step": 1434} +{"train_info/time_between_train_steps": 0.003167867660522461, "step": 1434} +{"info/global_step": 1435, "train_info/time_within_train_step": 2.2861180305480957, "step": 1435} +{"train_info/time_between_train_steps": 0.003197193145751953, "step": 1435} +{"info/global_step": 1436, "train_info/time_within_train_step": 2.287139654159546, "step": 1436} +{"train_info/time_between_train_steps": 0.00313568115234375, "step": 1436} +{"info/global_step": 1437, "train_info/time_within_train_step": 2.2870142459869385, "step": 1437} +{"train_info/time_between_train_steps": 0.003184795379638672, "step": 1437} +{"info/global_step": 1438, "train_info/time_within_train_step": 2.2860116958618164, "step": 1438} +{"train_info/time_between_train_steps": 0.003127574920654297, "step": 1438} +{"info/global_step": 1439, "train_info/time_within_train_step": 2.2863447666168213, "step": 1439} +{"train_info/time_between_train_steps": 0.0031549930572509766, "step": 1439} +{"info/global_step": 1440, "train_info/time_within_train_step": 2.2860944271087646, "step": 1440} +{"train_info/time_between_train_steps": 0.0031554698944091797, "step": 1440} +{"info/global_step": 1441, "train_info/time_within_train_step": 2.2863240242004395, "step": 1441} +{"train_info/time_between_train_steps": 0.00315093994140625, "step": 1441} +{"info/global_step": 1442, "train_info/time_within_train_step": 2.286100149154663, "step": 1442} +{"train_info/time_between_train_steps": 0.003156900405883789, "step": 1442} +{"info/global_step": 1443, "train_info/time_within_train_step": 2.2864174842834473, "step": 1443} +{"train_info/time_between_train_steps": 0.003134012222290039, "step": 1443} +{"info/global_step": 1444, "train_info/time_within_train_step": 2.286407470703125, "step": 1444} +{"train_info/time_between_train_steps": 0.003108978271484375, "step": 1444} +{"info/global_step": 1445, "train_info/time_within_train_step": 2.516667366027832, "step": 1445} +{"train_info/time_between_train_steps": 0.0031201839447021484, "step": 1445} +{"info/global_step": 1446, "train_info/time_within_train_step": 2.2856204509735107, "step": 1446} +{"train_info/time_between_train_steps": 0.0031261444091796875, "step": 1446} +{"info/global_step": 1447, "train_info/time_within_train_step": 2.28541898727417, "step": 1447} +{"train_info/time_between_train_steps": 0.0031533241271972656, "step": 1447} +{"info/global_step": 1448, "train_info/time_within_train_step": 2.2863242626190186, "step": 1448} +{"train_info/time_between_train_steps": 0.0031735897064208984, "step": 1448} +{"info/global_step": 1449, "train_info/time_within_train_step": 2.2863998413085938, "step": 1449} +{"train_info/time_between_train_steps": 0.003130674362182617, "step": 1449} +{"info/global_step": 1450, "train_info/time_within_train_step": 2.2860772609710693, "step": 1450} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746347476, "_runtime": 3573}, "step": 1450} +{"logs": {"train/loss": 3.686, "train/learning_rate": 0.0003444444444444444, "train/epoch": 1.12, "_timestamp": 1746347476, "_runtime": 3573}, "step": 1450} +{"train_info/time_between_train_steps": 0.024305343627929688, "step": 1450} +{"info/global_step": 1451, "train_info/time_within_train_step": 2.2861075401306152, "step": 1451} +{"train_info/time_between_train_steps": 0.0031137466430664062, "step": 1451} +{"info/global_step": 1452, "train_info/time_within_train_step": 2.327388048171997, "step": 1452} +{"train_info/time_between_train_steps": 0.003114938735961914, "step": 1452} +{"info/global_step": 1453, "train_info/time_within_train_step": 2.286398410797119, "step": 1453} +{"train_info/time_between_train_steps": 0.003188610076904297, "step": 1453} +{"info/global_step": 1454, "train_info/time_within_train_step": 2.286731004714966, "step": 1454} +{"train_info/time_between_train_steps": 0.003142118453979492, "step": 1454} +{"info/global_step": 1455, "train_info/time_within_train_step": 2.2864434719085693, "step": 1455} +{"train_info/time_between_train_steps": 0.0031523704528808594, "step": 1455} +{"info/global_step": 1456, "train_info/time_within_train_step": 2.286378860473633, "step": 1456} +{"train_info/time_between_train_steps": 0.00313568115234375, "step": 1456} +{"info/global_step": 1457, "train_info/time_within_train_step": 2.286280393600464, "step": 1457} +{"train_info/time_between_train_steps": 0.0031578540802001953, "step": 1457} +{"info/global_step": 1458, "train_info/time_within_train_step": 2.2862565517425537, "step": 1458} +{"train_info/time_between_train_steps": 0.0031452178955078125, "step": 1458} +{"info/global_step": 1459, "train_info/time_within_train_step": 2.286942958831787, "step": 1459} +{"train_info/time_between_train_steps": 0.0031697750091552734, "step": 1459} +{"info/global_step": 1460, "train_info/time_within_train_step": 2.286438465118408, "step": 1460} +{"train_info/time_between_train_steps": 0.0031363964080810547, "step": 1460} +{"info/global_step": 1461, "train_info/time_within_train_step": 2.286611795425415, "step": 1461} +{"train_info/time_between_train_steps": 0.003113269805908203, "step": 1461} +{"info/global_step": 1462, "train_info/time_within_train_step": 2.2868881225585938, "step": 1462} +{"train_info/time_between_train_steps": 0.0031740665435791016, "step": 1462} +{"info/global_step": 1463, "train_info/time_within_train_step": 2.286609411239624, "step": 1463} +{"train_info/time_between_train_steps": 0.0031685829162597656, "step": 1463} +{"info/global_step": 1464, "train_info/time_within_train_step": 2.2861130237579346, "step": 1464} +{"train_info/time_between_train_steps": 0.0031490325927734375, "step": 1464} +{"info/global_step": 1465, "train_info/time_within_train_step": 2.286144733428955, "step": 1465} +{"train_info/time_between_train_steps": 0.0031273365020751953, "step": 1465} +{"info/global_step": 1466, "train_info/time_within_train_step": 2.286109209060669, "step": 1466} +{"train_info/time_between_train_steps": 0.0031096935272216797, "step": 1466} +{"info/global_step": 1467, "train_info/time_within_train_step": 2.286125898361206, "step": 1467} +{"train_info/time_between_train_steps": 0.12172698974609375, "step": 1467} +{"info/global_step": 1468, "train_info/time_within_train_step": 2.310176134109497, "step": 1468} +{"train_info/time_between_train_steps": 0.0031435489654541016, "step": 1468} +{"info/global_step": 1469, "train_info/time_within_train_step": 2.286144256591797, "step": 1469} +{"train_info/time_between_train_steps": 0.0031337738037109375, "step": 1469} +{"info/global_step": 1470, "train_info/time_within_train_step": 2.2857859134674072, "step": 1470} +{"train_info/time_between_train_steps": 0.0031538009643554688, "step": 1470} +{"info/global_step": 1471, "train_info/time_within_train_step": 2.2865445613861084, "step": 1471} +{"train_info/time_between_train_steps": 0.003180980682373047, "step": 1471} +{"info/global_step": 1472, "train_info/time_within_train_step": 2.2859370708465576, "step": 1472} +{"train_info/time_between_train_steps": 0.0031588077545166016, "step": 1472} +{"info/global_step": 1473, "train_info/time_within_train_step": 2.286611318588257, "step": 1473} +{"train_info/time_between_train_steps": 0.0031256675720214844, "step": 1473} +{"info/global_step": 1474, "train_info/time_within_train_step": 2.28635835647583, "step": 1474} +{"train_info/time_between_train_steps": 0.0031893253326416016, "step": 1474} +{"info/global_step": 1475, "train_info/time_within_train_step": 2.287182569503784, "step": 1475} +{"train_info/time_between_train_steps": 0.003120899200439453, "step": 1475} +{"info/global_step": 1476, "train_info/time_within_train_step": 2.2862770557403564, "step": 1476} +{"train_info/time_between_train_steps": 0.003110170364379883, "step": 1476} +{"info/global_step": 1477, "train_info/time_within_train_step": 2.2858176231384277, "step": 1477} +{"train_info/time_between_train_steps": 0.0030977725982666016, "step": 1477} +{"info/global_step": 1478, "train_info/time_within_train_step": 2.326780080795288, "step": 1478} +{"train_info/time_between_train_steps": 0.003129720687866211, "step": 1478} +{"info/global_step": 1479, "train_info/time_within_train_step": 2.2856011390686035, "step": 1479} +{"train_info/time_between_train_steps": 0.0031387805938720703, "step": 1479} +{"info/global_step": 1480, "train_info/time_within_train_step": 2.2859532833099365, "step": 1480} +{"train_info/time_between_train_steps": 0.0031371116638183594, "step": 1480} +{"info/global_step": 1481, "train_info/time_within_train_step": 2.2861735820770264, "step": 1481} +{"train_info/time_between_train_steps": 0.003153562545776367, "step": 1481} +{"info/global_step": 1482, "train_info/time_within_train_step": 2.286101818084717, "step": 1482} +{"train_info/time_between_train_steps": 0.003128528594970703, "step": 1482} +{"info/global_step": 1483, "train_info/time_within_train_step": 2.286864995956421, "step": 1483} +{"train_info/time_between_train_steps": 0.003112316131591797, "step": 1483} +{"info/global_step": 1484, "train_info/time_within_train_step": 2.285834312438965, "step": 1484} +{"train_info/time_between_train_steps": 0.0030994415283203125, "step": 1484} +{"info/global_step": 1485, "train_info/time_within_train_step": 2.2867698669433594, "step": 1485} +{"train_info/time_between_train_steps": 0.003140687942504883, "step": 1485} +{"info/global_step": 1486, "train_info/time_within_train_step": 2.286090135574341, "step": 1486} +{"train_info/time_between_train_steps": 0.0031099319458007812, "step": 1486} +{"info/global_step": 1487, "train_info/time_within_train_step": 2.2862648963928223, "step": 1487} +{"train_info/time_between_train_steps": 0.003175973892211914, "step": 1487} +{"info/global_step": 1488, "train_info/time_within_train_step": 2.2866408824920654, "step": 1488} +{"train_info/time_between_train_steps": 0.0031769275665283203, "step": 1488} +{"info/global_step": 1489, "train_info/time_within_train_step": 2.2864885330200195, "step": 1489} +{"train_info/time_between_train_steps": 0.0031456947326660156, "step": 1489} +{"info/global_step": 1490, "train_info/time_within_train_step": 2.2865278720855713, "step": 1490} +{"train_info/time_between_train_steps": 0.003160238265991211, "step": 1490} +{"info/global_step": 1491, "train_info/time_within_train_step": 2.2874057292938232, "step": 1491} +{"train_info/time_between_train_steps": 0.0031359195709228516, "step": 1491} +{"info/global_step": 1492, "train_info/time_within_train_step": 2.2867791652679443, "step": 1492} +{"train_info/time_between_train_steps": 0.0031845569610595703, "step": 1492} +{"info/global_step": 1493, "train_info/time_within_train_step": 2.2864015102386475, "step": 1493} +{"train_info/time_between_train_steps": 0.0031228065490722656, "step": 1493} +{"info/global_step": 1494, "train_info/time_within_train_step": 2.287379741668701, "step": 1494} +{"train_info/time_between_train_steps": 0.003129243850708008, "step": 1494} +{"info/global_step": 1495, "train_info/time_within_train_step": 2.2865114212036133, "step": 1495} +{"train_info/time_between_train_steps": 0.0031919479370117188, "step": 1495} +{"info/global_step": 1496, "train_info/time_within_train_step": 2.2858874797821045, "step": 1496} +{"train_info/time_between_train_steps": 0.0031311511993408203, "step": 1496} +{"info/global_step": 1497, "train_info/time_within_train_step": 2.285851240158081, "step": 1497} +{"train_info/time_between_train_steps": 0.0031442642211914062, "step": 1497} +{"info/global_step": 1498, "train_info/time_within_train_step": 2.286342144012451, "step": 1498} +{"train_info/time_between_train_steps": 0.0031261444091796875, "step": 1498} +{"info/global_step": 1499, "train_info/time_within_train_step": 2.5207064151763916, "step": 1499} +{"train_info/time_between_train_steps": 0.003136873245239258, "step": 1499} +{"info/global_step": 1500, "train_info/time_within_train_step": 2.6426820755004883, "step": 1500} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746347593, "_runtime": 3690}, "step": 1500} +{"logs": {"train/loss": 3.6554, "train/learning_rate": 0.0003333333333333333, "train/epoch": 1.14, "_timestamp": 1746347593, "_runtime": 3690}, "step": 1500} +{"train_info/time_between_train_steps": 16.541712045669556, "step": 1500} +{"info/global_step": 1501, "train_info/time_within_train_step": 2.1102590560913086, "step": 1501} +{"train_info/time_between_train_steps": 0.0032181739807128906, "step": 1501} +{"info/global_step": 1502, "train_info/time_within_train_step": 2.0981979370117188, "step": 1502} +{"train_info/time_between_train_steps": 0.003204822540283203, "step": 1502} +{"info/global_step": 1503, "train_info/time_within_train_step": 2.148127317428589, "step": 1503} +{"train_info/time_between_train_steps": 0.003140687942504883, "step": 1503} +{"info/global_step": 1504, "train_info/time_within_train_step": 2.284256935119629, "step": 1504} +{"train_info/time_between_train_steps": 0.003169536590576172, "step": 1504} +{"info/global_step": 1505, "train_info/time_within_train_step": 2.2857089042663574, "step": 1505} +{"train_info/time_between_train_steps": 0.0031387805938720703, "step": 1505} +{"info/global_step": 1506, "train_info/time_within_train_step": 2.285731554031372, "step": 1506} +{"train_info/time_between_train_steps": 0.0031211376190185547, "step": 1506} +{"info/global_step": 1507, "train_info/time_within_train_step": 2.286432981491089, "step": 1507} +{"train_info/time_between_train_steps": 0.0031280517578125, "step": 1507} +{"info/global_step": 1508, "train_info/time_within_train_step": 2.286862850189209, "step": 1508} +{"train_info/time_between_train_steps": 0.0031058788299560547, "step": 1508} +{"info/global_step": 1509, "train_info/time_within_train_step": 2.2869374752044678, "step": 1509} +{"train_info/time_between_train_steps": 0.003139019012451172, "step": 1509} +{"info/global_step": 1510, "train_info/time_within_train_step": 2.2865395545959473, "step": 1510} +{"train_info/time_between_train_steps": 0.003133058547973633, "step": 1510} +{"info/global_step": 1511, "train_info/time_within_train_step": 2.287485361099243, "step": 1511} +{"train_info/time_between_train_steps": 0.0031828880310058594, "step": 1511} +{"info/global_step": 1512, "train_info/time_within_train_step": 2.2872207164764404, "step": 1512} +{"train_info/time_between_train_steps": 0.0031468868255615234, "step": 1512} +{"info/global_step": 1513, "train_info/time_within_train_step": 2.287306785583496, "step": 1513} +{"train_info/time_between_train_steps": 0.0031790733337402344, "step": 1513} +{"info/global_step": 1514, "train_info/time_within_train_step": 2.2869131565093994, "step": 1514} +{"train_info/time_between_train_steps": 0.003111600875854492, "step": 1514} +{"info/global_step": 1515, "train_info/time_within_train_step": 2.2861156463623047, "step": 1515} +{"train_info/time_between_train_steps": 0.0031082630157470703, "step": 1515} +{"info/global_step": 1516, "train_info/time_within_train_step": 2.2865874767303467, "step": 1516} +{"train_info/time_between_train_steps": 0.00311279296875, "step": 1516} +{"info/global_step": 1517, "train_info/time_within_train_step": 2.286695957183838, "step": 1517} +{"train_info/time_between_train_steps": 0.003122091293334961, "step": 1517} +{"info/global_step": 1518, "train_info/time_within_train_step": 2.2871856689453125, "step": 1518} +{"train_info/time_between_train_steps": 0.0031049251556396484, "step": 1518} +{"info/global_step": 1519, "train_info/time_within_train_step": 2.286773920059204, "step": 1519} +{"train_info/time_between_train_steps": 0.0031664371490478516, "step": 1519} +{"info/global_step": 1520, "train_info/time_within_train_step": 2.2871053218841553, "step": 1520} +{"train_info/time_between_train_steps": 0.0031976699829101562, "step": 1520} +{"info/global_step": 1521, "train_info/time_within_train_step": 2.2864062786102295, "step": 1521} +{"train_info/time_between_train_steps": 0.003121614456176758, "step": 1521} +{"info/global_step": 1522, "train_info/time_within_train_step": 2.2870688438415527, "step": 1522} +{"train_info/time_between_train_steps": 0.0031287670135498047, "step": 1522} +{"info/global_step": 1523, "train_info/time_within_train_step": 2.2872252464294434, "step": 1523} +{"train_info/time_between_train_steps": 0.0031151771545410156, "step": 1523} +{"info/global_step": 1524, "train_info/time_within_train_step": 2.2876806259155273, "step": 1524} +{"train_info/time_between_train_steps": 0.003137350082397461, "step": 1524} +{"info/global_step": 1525, "train_info/time_within_train_step": 2.2872250080108643, "step": 1525} +{"train_info/time_between_train_steps": 0.003103494644165039, "step": 1525} +{"info/global_step": 1526, "train_info/time_within_train_step": 2.2872135639190674, "step": 1526} +{"train_info/time_between_train_steps": 0.003091573715209961, "step": 1526} +{"info/global_step": 1527, "train_info/time_within_train_step": 2.287142515182495, "step": 1527} +{"train_info/time_between_train_steps": 0.0031418800354003906, "step": 1527} +{"info/global_step": 1528, "train_info/time_within_train_step": 2.287367582321167, "step": 1528} +{"train_info/time_between_train_steps": 0.003147602081298828, "step": 1528} +{"info/global_step": 1529, "train_info/time_within_train_step": 2.288179397583008, "step": 1529} +{"train_info/time_between_train_steps": 0.0031480789184570312, "step": 1529} +{"info/global_step": 1530, "train_info/time_within_train_step": 2.410067081451416, "step": 1530} +{"train_info/time_between_train_steps": 0.003160715103149414, "step": 1530} +{"info/global_step": 1531, "train_info/time_within_train_step": 2.2877843379974365, "step": 1531} +{"train_info/time_between_train_steps": 0.0031571388244628906, "step": 1531} +{"info/global_step": 1532, "train_info/time_within_train_step": 2.2882936000823975, "step": 1532} +{"train_info/time_between_train_steps": 0.00316619873046875, "step": 1532} +{"info/global_step": 1533, "train_info/time_within_train_step": 2.2875871658325195, "step": 1533} +{"train_info/time_between_train_steps": 0.0031638145446777344, "step": 1533} +{"info/global_step": 1534, "train_info/time_within_train_step": 2.2874484062194824, "step": 1534} +{"train_info/time_between_train_steps": 0.003190279006958008, "step": 1534} +{"info/global_step": 1535, "train_info/time_within_train_step": 2.2872908115386963, "step": 1535} +{"train_info/time_between_train_steps": 0.003160715103149414, "step": 1535} +{"info/global_step": 1536, "train_info/time_within_train_step": 2.287824869155884, "step": 1536} +{"train_info/time_between_train_steps": 0.003155946731567383, "step": 1536} +{"info/global_step": 1537, "train_info/time_within_train_step": 2.286944627761841, "step": 1537} +{"train_info/time_between_train_steps": 0.003133058547973633, "step": 1537} +{"info/global_step": 1538, "train_info/time_within_train_step": 2.2872791290283203, "step": 1538} +{"train_info/time_between_train_steps": 0.003138303756713867, "step": 1538} +{"info/global_step": 1539, "train_info/time_within_train_step": 2.2874042987823486, "step": 1539} +{"train_info/time_between_train_steps": 0.003137350082397461, "step": 1539} +{"info/global_step": 1540, "train_info/time_within_train_step": 2.2877683639526367, "step": 1540} +{"train_info/time_between_train_steps": 0.0031387805938720703, "step": 1540} +{"info/global_step": 1541, "train_info/time_within_train_step": 2.2868945598602295, "step": 1541} +{"train_info/time_between_train_steps": 0.003121614456176758, "step": 1541} +{"info/global_step": 1542, "train_info/time_within_train_step": 2.2873427867889404, "step": 1542} +{"train_info/time_between_train_steps": 0.0031337738037109375, "step": 1542} +{"info/global_step": 1543, "train_info/time_within_train_step": 2.286804676055908, "step": 1543} +{"train_info/time_between_train_steps": 0.003178834915161133, "step": 1543} +{"info/global_step": 1544, "train_info/time_within_train_step": 2.2869722843170166, "step": 1544} +{"train_info/time_between_train_steps": 0.0031883716583251953, "step": 1544} +{"info/global_step": 1545, "train_info/time_within_train_step": 2.287299156188965, "step": 1545} +{"train_info/time_between_train_steps": 0.003160238265991211, "step": 1545} +{"info/global_step": 1546, "train_info/time_within_train_step": 2.2866761684417725, "step": 1546} +{"train_info/time_between_train_steps": 0.003133535385131836, "step": 1546} +{"info/global_step": 1547, "train_info/time_within_train_step": 2.287165641784668, "step": 1547} +{"train_info/time_between_train_steps": 0.003138303756713867, "step": 1547} +{"info/global_step": 1548, "train_info/time_within_train_step": 2.2875115871429443, "step": 1548} +{"train_info/time_between_train_steps": 0.0031626224517822266, "step": 1548} +{"info/global_step": 1549, "train_info/time_within_train_step": 2.2874679565429688, "step": 1549} +{"train_info/time_between_train_steps": 0.00312042236328125, "step": 1549} +{"info/global_step": 1550, "train_info/time_within_train_step": 2.2871079444885254, "step": 1550} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746347724, "_runtime": 3821}, "step": 1550} +{"logs": {"train/loss": 3.6528, "train/learning_rate": 0.0003222222222222222, "train/epoch": 1.15, "_timestamp": 1746347724, "_runtime": 3821}, "step": 1550} +{"train_info/time_between_train_steps": 0.02443552017211914, "step": 1550} +{"info/global_step": 1551, "train_info/time_within_train_step": 2.2880682945251465, "step": 1551} +{"train_info/time_between_train_steps": 0.0031991004943847656, "step": 1551} +{"info/global_step": 1552, "train_info/time_within_train_step": 2.287910223007202, "step": 1552} +{"train_info/time_between_train_steps": 0.0031871795654296875, "step": 1552} +{"info/global_step": 1553, "train_info/time_within_train_step": 2.287557601928711, "step": 1553} +{"train_info/time_between_train_steps": 0.0032358169555664062, "step": 1553} +{"info/global_step": 1554, "train_info/time_within_train_step": 2.287447452545166, "step": 1554} +{"train_info/time_between_train_steps": 0.003156423568725586, "step": 1554} +{"info/global_step": 1555, "train_info/time_within_train_step": 2.287712335586548, "step": 1555} +{"train_info/time_between_train_steps": 0.0031883716583251953, "step": 1555} +{"info/global_step": 1556, "train_info/time_within_train_step": 2.287862539291382, "step": 1556} +{"train_info/time_between_train_steps": 0.003183603286743164, "step": 1556} +{"info/global_step": 1557, "train_info/time_within_train_step": 2.2878170013427734, "step": 1557} +{"train_info/time_between_train_steps": 0.0033783912658691406, "step": 1557} +{"info/global_step": 1558, "train_info/time_within_train_step": 2.287529468536377, "step": 1558} +{"train_info/time_between_train_steps": 0.003184795379638672, "step": 1558} +{"info/global_step": 1559, "train_info/time_within_train_step": 2.2876994609832764, "step": 1559} +{"train_info/time_between_train_steps": 0.0031986236572265625, "step": 1559} +{"info/global_step": 1560, "train_info/time_within_train_step": 2.2875492572784424, "step": 1560} +{"train_info/time_between_train_steps": 0.003212451934814453, "step": 1560} +{"info/global_step": 1561, "train_info/time_within_train_step": 2.287196397781372, "step": 1561} +{"train_info/time_between_train_steps": 0.0031867027282714844, "step": 1561} +{"info/global_step": 1562, "train_info/time_within_train_step": 2.2873635292053223, "step": 1562} +{"train_info/time_between_train_steps": 0.003191232681274414, "step": 1562} +{"info/global_step": 1563, "train_info/time_within_train_step": 2.287050724029541, "step": 1563} +{"train_info/time_between_train_steps": 0.00318145751953125, "step": 1563} +{"info/global_step": 1564, "train_info/time_within_train_step": 2.2874679565429688, "step": 1564} +{"train_info/time_between_train_steps": 0.003236055374145508, "step": 1564} +{"info/global_step": 1565, "train_info/time_within_train_step": 2.2872848510742188, "step": 1565} +{"train_info/time_between_train_steps": 0.003192424774169922, "step": 1565} +{"info/global_step": 1566, "train_info/time_within_train_step": 2.2872772216796875, "step": 1566} +{"train_info/time_between_train_steps": 0.003190279006958008, "step": 1566} +{"info/global_step": 1567, "train_info/time_within_train_step": 2.2865209579467773, "step": 1567} +{"train_info/time_between_train_steps": 0.0031714439392089844, "step": 1567} +{"info/global_step": 1568, "train_info/time_within_train_step": 2.287511110305786, "step": 1568} +{"train_info/time_between_train_steps": 0.003186464309692383, "step": 1568} +{"info/global_step": 1569, "train_info/time_within_train_step": 2.2871241569519043, "step": 1569} +{"train_info/time_between_train_steps": 0.003171205520629883, "step": 1569} +{"info/global_step": 1570, "train_info/time_within_train_step": 2.2873716354370117, "step": 1570} +{"train_info/time_between_train_steps": 0.003156423568725586, "step": 1570} +{"info/global_step": 1571, "train_info/time_within_train_step": 2.288048267364502, "step": 1571} +{"train_info/time_between_train_steps": 0.003190755844116211, "step": 1571} +{"info/global_step": 1572, "train_info/time_within_train_step": 2.2875068187713623, "step": 1572} +{"train_info/time_between_train_steps": 0.003151416778564453, "step": 1572} +{"info/global_step": 1573, "train_info/time_within_train_step": 2.2874574661254883, "step": 1573} +{"train_info/time_between_train_steps": 0.003146648406982422, "step": 1573} +{"info/global_step": 1574, "train_info/time_within_train_step": 2.2887187004089355, "step": 1574} +{"train_info/time_between_train_steps": 0.0031342506408691406, "step": 1574} +{"info/global_step": 1575, "train_info/time_within_train_step": 2.2882747650146484, "step": 1575} +{"train_info/time_between_train_steps": 0.003228425979614258, "step": 1575} +{"info/global_step": 1576, "train_info/time_within_train_step": 2.287564516067505, "step": 1576} +{"train_info/time_between_train_steps": 0.0031719207763671875, "step": 1576} +{"info/global_step": 1577, "train_info/time_within_train_step": 2.288041353225708, "step": 1577} +{"train_info/time_between_train_steps": 0.0031690597534179688, "step": 1577} +{"info/global_step": 1578, "train_info/time_within_train_step": 2.288151741027832, "step": 1578} +{"train_info/time_between_train_steps": 0.003136157989501953, "step": 1578} +{"info/global_step": 1579, "train_info/time_within_train_step": 2.287642240524292, "step": 1579} +{"train_info/time_between_train_steps": 0.003148317337036133, "step": 1579} +{"info/global_step": 1580, "train_info/time_within_train_step": 2.2873408794403076, "step": 1580} +{"train_info/time_between_train_steps": 0.0031654834747314453, "step": 1580} +{"info/global_step": 1581, "train_info/time_within_train_step": 2.2872354984283447, "step": 1581} +{"train_info/time_between_train_steps": 0.003181934356689453, "step": 1581} +{"info/global_step": 1582, "train_info/time_within_train_step": 2.2868499755859375, "step": 1582} +{"train_info/time_between_train_steps": 0.0031380653381347656, "step": 1582} +{"info/global_step": 1583, "train_info/time_within_train_step": 2.530517101287842, "step": 1583} +{"train_info/time_between_train_steps": 0.003269195556640625, "step": 1583} +{"info/global_step": 1584, "train_info/time_within_train_step": 2.285940170288086, "step": 1584} +{"train_info/time_between_train_steps": 0.0031647682189941406, "step": 1584} +{"info/global_step": 1585, "train_info/time_within_train_step": 2.2858357429504395, "step": 1585} +{"train_info/time_between_train_steps": 0.0031347274780273438, "step": 1585} +{"info/global_step": 1586, "train_info/time_within_train_step": 2.2862751483917236, "step": 1586} +{"train_info/time_between_train_steps": 0.003181934356689453, "step": 1586} +{"info/global_step": 1587, "train_info/time_within_train_step": 2.2859020233154297, "step": 1587} +{"train_info/time_between_train_steps": 0.0031404495239257812, "step": 1587} +{"info/global_step": 1588, "train_info/time_within_train_step": 2.2856314182281494, "step": 1588} +{"train_info/time_between_train_steps": 0.0031156539916992188, "step": 1588} +{"info/global_step": 1589, "train_info/time_within_train_step": 2.286142587661743, "step": 1589} +{"train_info/time_between_train_steps": 0.003100872039794922, "step": 1589} +{"info/global_step": 1590, "train_info/time_within_train_step": 2.286703109741211, "step": 1590} +{"train_info/time_between_train_steps": 0.003204345703125, "step": 1590} +{"info/global_step": 1591, "train_info/time_within_train_step": 2.287060022354126, "step": 1591} +{"train_info/time_between_train_steps": 0.0031642913818359375, "step": 1591} +{"info/global_step": 1592, "train_info/time_within_train_step": 2.2870609760284424, "step": 1592} +{"train_info/time_between_train_steps": 0.12616419792175293, "step": 1592} +{"info/global_step": 1593, "train_info/time_within_train_step": 2.2875356674194336, "step": 1593} +{"train_info/time_between_train_steps": 0.003245115280151367, "step": 1593} +{"info/global_step": 1594, "train_info/time_within_train_step": 2.2879576683044434, "step": 1594} +{"train_info/time_between_train_steps": 0.0031697750091552734, "step": 1594} +{"info/global_step": 1595, "train_info/time_within_train_step": 2.288170337677002, "step": 1595} +{"train_info/time_between_train_steps": 0.003179311752319336, "step": 1595} +{"info/global_step": 1596, "train_info/time_within_train_step": 2.2874233722686768, "step": 1596} +{"train_info/time_between_train_steps": 0.0031173229217529297, "step": 1596} +{"info/global_step": 1597, "train_info/time_within_train_step": 2.2875285148620605, "step": 1597} +{"train_info/time_between_train_steps": 0.0031893253326416016, "step": 1597} +{"info/global_step": 1598, "train_info/time_within_train_step": 2.287086248397827, "step": 1598} +{"train_info/time_between_train_steps": 0.0031442642211914062, "step": 1598} +{"info/global_step": 1599, "train_info/time_within_train_step": 2.2870819568634033, "step": 1599} +{"train_info/time_between_train_steps": 0.0032155513763427734, "step": 1599} +{"info/global_step": 1600, "train_info/time_within_train_step": 2.286939859390259, "step": 1600} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746347840, "_runtime": 3937}, "step": 1600} +{"logs": {"train/loss": 3.6335, "train/learning_rate": 0.00031111111111111107, "train/epoch": 1.17, "_timestamp": 1746347840, "_runtime": 3937}, "step": 1600} +{"train_info/time_between_train_steps": 16.892279624938965, "step": 1600} +{"info/global_step": 1601, "train_info/time_within_train_step": 2.1288328170776367, "step": 1601} +{"train_info/time_between_train_steps": 0.0031440258026123047, "step": 1601} +{"info/global_step": 1602, "train_info/time_within_train_step": 2.0991621017456055, "step": 1602} +{"train_info/time_between_train_steps": 0.003154754638671875, "step": 1602} +{"info/global_step": 1603, "train_info/time_within_train_step": 2.160428285598755, "step": 1603} +{"train_info/time_between_train_steps": 0.0031926631927490234, "step": 1603} +{"info/global_step": 1604, "train_info/time_within_train_step": 2.284291982650757, "step": 1604} +{"train_info/time_between_train_steps": 0.003153085708618164, "step": 1604} +{"info/global_step": 1605, "train_info/time_within_train_step": 2.2839725017547607, "step": 1605} +{"train_info/time_between_train_steps": 0.0031790733337402344, "step": 1605} +{"info/global_step": 1606, "train_info/time_within_train_step": 2.2842421531677246, "step": 1606} +{"train_info/time_between_train_steps": 0.003223896026611328, "step": 1606} +{"info/global_step": 1607, "train_info/time_within_train_step": 2.2861430644989014, "step": 1607} +{"train_info/time_between_train_steps": 0.003181934356689453, "step": 1607} +{"info/global_step": 1608, "train_info/time_within_train_step": 2.2867164611816406, "step": 1608} +{"train_info/time_between_train_steps": 0.003160715103149414, "step": 1608} +{"info/global_step": 1609, "train_info/time_within_train_step": 2.2861204147338867, "step": 1609} +{"train_info/time_between_train_steps": 0.0032525062561035156, "step": 1609} +{"info/global_step": 1610, "train_info/time_within_train_step": 2.2867112159729004, "step": 1610} +{"train_info/time_between_train_steps": 0.003175020217895508, "step": 1610} +{"info/global_step": 1611, "train_info/time_within_train_step": 2.2866883277893066, "step": 1611} +{"train_info/time_between_train_steps": 0.0031757354736328125, "step": 1611} +{"info/global_step": 1612, "train_info/time_within_train_step": 2.2862892150878906, "step": 1612} +{"train_info/time_between_train_steps": 0.003126859664916992, "step": 1612} +{"info/global_step": 1613, "train_info/time_within_train_step": 2.2862679958343506, "step": 1613} +{"train_info/time_between_train_steps": 0.003101825714111328, "step": 1613} +{"info/global_step": 1614, "train_info/time_within_train_step": 2.2867140769958496, "step": 1614} +{"train_info/time_between_train_steps": 0.003204345703125, "step": 1614} +{"info/global_step": 1615, "train_info/time_within_train_step": 2.285696029663086, "step": 1615} +{"train_info/time_between_train_steps": 0.003146648406982422, "step": 1615} +{"info/global_step": 1616, "train_info/time_within_train_step": 2.2873806953430176, "step": 1616} +{"train_info/time_between_train_steps": 0.003176450729370117, "step": 1616} +{"info/global_step": 1617, "train_info/time_within_train_step": 2.286651134490967, "step": 1617} +{"train_info/time_between_train_steps": 0.003129243850708008, "step": 1617} +{"info/global_step": 1618, "train_info/time_within_train_step": 2.286858558654785, "step": 1618} +{"train_info/time_between_train_steps": 0.003114938735961914, "step": 1618} +{"info/global_step": 1619, "train_info/time_within_train_step": 2.2869200706481934, "step": 1619} +{"train_info/time_between_train_steps": 0.0031206607818603516, "step": 1619} +{"info/global_step": 1620, "train_info/time_within_train_step": 2.28745436668396, "step": 1620} +{"train_info/time_between_train_steps": 0.003140687942504883, "step": 1620} +{"info/global_step": 1621, "train_info/time_within_train_step": 2.2874419689178467, "step": 1621} +{"train_info/time_between_train_steps": 0.0031468868255615234, "step": 1621} +{"info/global_step": 1622, "train_info/time_within_train_step": 2.2875614166259766, "step": 1622} +{"train_info/time_between_train_steps": 0.0031461715698242188, "step": 1622} +{"info/global_step": 1623, "train_info/time_within_train_step": 2.287543296813965, "step": 1623} +{"train_info/time_between_train_steps": 0.003139495849609375, "step": 1623} +{"info/global_step": 1624, "train_info/time_within_train_step": 2.2872512340545654, "step": 1624} +{"train_info/time_between_train_steps": 0.0031380653381347656, "step": 1624} +{"info/global_step": 1625, "train_info/time_within_train_step": 2.2871875762939453, "step": 1625} +{"train_info/time_between_train_steps": 0.003149271011352539, "step": 1625} +{"info/global_step": 1626, "train_info/time_within_train_step": 2.2873027324676514, "step": 1626} +{"train_info/time_between_train_steps": 0.003152132034301758, "step": 1626} +{"info/global_step": 1627, "train_info/time_within_train_step": 2.2876319885253906, "step": 1627} +{"train_info/time_between_train_steps": 0.0031425952911376953, "step": 1627} +{"info/global_step": 1628, "train_info/time_within_train_step": 2.287498950958252, "step": 1628} +{"train_info/time_between_train_steps": 0.0031244754791259766, "step": 1628} +{"info/global_step": 1629, "train_info/time_within_train_step": 2.287675380706787, "step": 1629} +{"train_info/time_between_train_steps": 0.0033195018768310547, "step": 1629} +{"info/global_step": 1630, "train_info/time_within_train_step": 2.2873754501342773, "step": 1630} +{"train_info/time_between_train_steps": 0.003192424774169922, "step": 1630} +{"info/global_step": 1631, "train_info/time_within_train_step": 2.2876555919647217, "step": 1631} +{"train_info/time_between_train_steps": 0.003182649612426758, "step": 1631} +{"info/global_step": 1632, "train_info/time_within_train_step": 2.286126136779785, "step": 1632} +{"train_info/time_between_train_steps": 0.003208637237548828, "step": 1632} +{"info/global_step": 1633, "train_info/time_within_train_step": 2.2863845825195312, "step": 1633} +{"train_info/time_between_train_steps": 0.003179311752319336, "step": 1633} +{"info/global_step": 1634, "train_info/time_within_train_step": 2.28637433052063, "step": 1634} +{"train_info/time_between_train_steps": 0.0032024383544921875, "step": 1634} +{"info/global_step": 1635, "train_info/time_within_train_step": 2.2870421409606934, "step": 1635} +{"train_info/time_between_train_steps": 0.003144979476928711, "step": 1635} +{"info/global_step": 1636, "train_info/time_within_train_step": 2.2869646549224854, "step": 1636} +{"train_info/time_between_train_steps": 0.0032150745391845703, "step": 1636} +{"info/global_step": 1637, "train_info/time_within_train_step": 2.2874398231506348, "step": 1637} +{"train_info/time_between_train_steps": 0.003223896026611328, "step": 1637} +{"info/global_step": 1638, "train_info/time_within_train_step": 2.286909818649292, "step": 1638} +{"train_info/time_between_train_steps": 0.003207683563232422, "step": 1638} +{"info/global_step": 1639, "train_info/time_within_train_step": 2.28753662109375, "step": 1639} +{"train_info/time_between_train_steps": 0.0031862258911132812, "step": 1639} +{"info/global_step": 1640, "train_info/time_within_train_step": 2.288167953491211, "step": 1640} +{"train_info/time_between_train_steps": 0.0032281875610351562, "step": 1640} +{"info/global_step": 1641, "train_info/time_within_train_step": 2.287707805633545, "step": 1641} +{"train_info/time_between_train_steps": 0.003177165985107422, "step": 1641} +{"info/global_step": 1642, "train_info/time_within_train_step": 2.287146806716919, "step": 1642} +{"train_info/time_between_train_steps": 0.003164052963256836, "step": 1642} +{"info/global_step": 1643, "train_info/time_within_train_step": 2.2876017093658447, "step": 1643} +{"train_info/time_between_train_steps": 0.003254413604736328, "step": 1643} +{"info/global_step": 1644, "train_info/time_within_train_step": 2.2867071628570557, "step": 1644} +{"train_info/time_between_train_steps": 0.0031592845916748047, "step": 1644} +{"info/global_step": 1645, "train_info/time_within_train_step": 2.286329507827759, "step": 1645} +{"train_info/time_between_train_steps": 0.003109455108642578, "step": 1645} +{"info/global_step": 1646, "train_info/time_within_train_step": 2.2863361835479736, "step": 1646} +{"train_info/time_between_train_steps": 0.0031669139862060547, "step": 1646} +{"info/global_step": 1647, "train_info/time_within_train_step": 2.286494493484497, "step": 1647} +{"train_info/time_between_train_steps": 0.0031762123107910156, "step": 1647} +{"info/global_step": 1648, "train_info/time_within_train_step": 2.2871592044830322, "step": 1648} +{"train_info/time_between_train_steps": 0.0033147335052490234, "step": 1648} +{"info/global_step": 1649, "train_info/time_within_train_step": 2.2861287593841553, "step": 1649} +{"train_info/time_between_train_steps": 0.003163576126098633, "step": 1649} +{"info/global_step": 1650, "train_info/time_within_train_step": 2.2872352600097656, "step": 1650} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746347973, "_runtime": 4070}, "step": 1650} +{"logs": {"train/loss": 3.6159, "train/learning_rate": 0.0003, "train/epoch": 1.19, "_timestamp": 1746347973, "_runtime": 4070}, "step": 1650} +{"train_info/time_between_train_steps": 0.024178504943847656, "step": 1650} +{"info/global_step": 1651, "train_info/time_within_train_step": 2.2861552238464355, "step": 1651} +{"train_info/time_between_train_steps": 0.003143787384033203, "step": 1651} +{"info/global_step": 1652, "train_info/time_within_train_step": 2.2859764099121094, "step": 1652} +{"train_info/time_between_train_steps": 0.003145456314086914, "step": 1652} +{"info/global_step": 1653, "train_info/time_within_train_step": 2.285966157913208, "step": 1653} +{"train_info/time_between_train_steps": 0.003173828125, "step": 1653} +{"info/global_step": 1654, "train_info/time_within_train_step": 2.2860026359558105, "step": 1654} +{"train_info/time_between_train_steps": 0.0031838417053222656, "step": 1654} +{"info/global_step": 1655, "train_info/time_within_train_step": 2.411879777908325, "step": 1655} +{"train_info/time_between_train_steps": 0.0031807422637939453, "step": 1655} +{"info/global_step": 1656, "train_info/time_within_train_step": 2.2858855724334717, "step": 1656} +{"train_info/time_between_train_steps": 0.0031387805938720703, "step": 1656} +{"info/global_step": 1657, "train_info/time_within_train_step": 2.2868480682373047, "step": 1657} +{"train_info/time_between_train_steps": 0.0031309127807617188, "step": 1657} +{"info/global_step": 1658, "train_info/time_within_train_step": 2.530433416366577, "step": 1658} +{"train_info/time_between_train_steps": 0.0031633377075195312, "step": 1658} +{"info/global_step": 1659, "train_info/time_within_train_step": 2.2868151664733887, "step": 1659} +{"train_info/time_between_train_steps": 0.0031197071075439453, "step": 1659} +{"info/global_step": 1660, "train_info/time_within_train_step": 2.2867591381073, "step": 1660} +{"train_info/time_between_train_steps": 0.0031816959381103516, "step": 1660} +{"info/global_step": 1661, "train_info/time_within_train_step": 2.287623882293701, "step": 1661} +{"train_info/time_between_train_steps": 0.0031762123107910156, "step": 1661} +{"info/global_step": 1662, "train_info/time_within_train_step": 2.2927322387695312, "step": 1662} +{"train_info/time_between_train_steps": 0.0032057762145996094, "step": 1662} +{"info/global_step": 1663, "train_info/time_within_train_step": 2.2873587608337402, "step": 1663} +{"train_info/time_between_train_steps": 0.0031833648681640625, "step": 1663} +{"info/global_step": 1664, "train_info/time_within_train_step": 2.286984443664551, "step": 1664} +{"train_info/time_between_train_steps": 0.0031859874725341797, "step": 1664} +{"info/global_step": 1665, "train_info/time_within_train_step": 2.2878124713897705, "step": 1665} +{"train_info/time_between_train_steps": 0.003152608871459961, "step": 1665} +{"info/global_step": 1666, "train_info/time_within_train_step": 2.2867178916931152, "step": 1666} +{"train_info/time_between_train_steps": 0.0031554698944091797, "step": 1666} +{"info/global_step": 1667, "train_info/time_within_train_step": 2.2862613201141357, "step": 1667} +{"train_info/time_between_train_steps": 0.0031495094299316406, "step": 1667} +{"info/global_step": 1668, "train_info/time_within_train_step": 2.286372184753418, "step": 1668} +{"train_info/time_between_train_steps": 0.0032134056091308594, "step": 1668} +{"info/global_step": 1669, "train_info/time_within_train_step": 2.286522626876831, "step": 1669} +{"train_info/time_between_train_steps": 0.003246307373046875, "step": 1669} +{"info/global_step": 1670, "train_info/time_within_train_step": 2.286782741546631, "step": 1670} +{"train_info/time_between_train_steps": 0.0031816959381103516, "step": 1670} +{"info/global_step": 1671, "train_info/time_within_train_step": 2.2866780757904053, "step": 1671} +{"train_info/time_between_train_steps": 0.003178834915161133, "step": 1671} +{"info/global_step": 1672, "train_info/time_within_train_step": 2.2862021923065186, "step": 1672} +{"train_info/time_between_train_steps": 0.003190755844116211, "step": 1672} +{"info/global_step": 1673, "train_info/time_within_train_step": 2.28609299659729, "step": 1673} +{"train_info/time_between_train_steps": 0.003181934356689453, "step": 1673} +{"info/global_step": 1674, "train_info/time_within_train_step": 2.286214828491211, "step": 1674} +{"train_info/time_between_train_steps": 0.0031638145446777344, "step": 1674} +{"info/global_step": 1675, "train_info/time_within_train_step": 2.2858452796936035, "step": 1675} +{"train_info/time_between_train_steps": 0.0031595230102539062, "step": 1675} +{"info/global_step": 1676, "train_info/time_within_train_step": 2.286083459854126, "step": 1676} +{"train_info/time_between_train_steps": 0.003184795379638672, "step": 1676} +{"info/global_step": 1677, "train_info/time_within_train_step": 2.2863378524780273, "step": 1677} +{"train_info/time_between_train_steps": 0.003180980682373047, "step": 1677} +{"info/global_step": 1678, "train_info/time_within_train_step": 2.2867047786712646, "step": 1678} +{"train_info/time_between_train_steps": 0.003139019012451172, "step": 1678} +{"info/global_step": 1679, "train_info/time_within_train_step": 2.286120653152466, "step": 1679} +{"train_info/time_between_train_steps": 0.003120899200439453, "step": 1679} +{"info/global_step": 1680, "train_info/time_within_train_step": 2.2862050533294678, "step": 1680} +{"train_info/time_between_train_steps": 0.003164529800415039, "step": 1680} +{"info/global_step": 1681, "train_info/time_within_train_step": 2.285839080810547, "step": 1681} +{"train_info/time_between_train_steps": 0.0031299591064453125, "step": 1681} +{"info/global_step": 1682, "train_info/time_within_train_step": 2.2860097885131836, "step": 1682} +{"train_info/time_between_train_steps": 0.003198385238647461, "step": 1682} +{"info/global_step": 1683, "train_info/time_within_train_step": 2.2863354682922363, "step": 1683} +{"train_info/time_between_train_steps": 0.0031287670135498047, "step": 1683} +{"info/global_step": 1684, "train_info/time_within_train_step": 2.2860960960388184, "step": 1684} +{"train_info/time_between_train_steps": 0.003217935562133789, "step": 1684} +{"info/global_step": 1685, "train_info/time_within_train_step": 2.286374092102051, "step": 1685} +{"train_info/time_between_train_steps": 0.003230571746826172, "step": 1685} +{"info/global_step": 1686, "train_info/time_within_train_step": 2.2861135005950928, "step": 1686} +{"train_info/time_between_train_steps": 0.003160715103149414, "step": 1686} +{"info/global_step": 1687, "train_info/time_within_train_step": 2.285940170288086, "step": 1687} +{"train_info/time_between_train_steps": 0.003149271011352539, "step": 1687} +{"info/global_step": 1688, "train_info/time_within_train_step": 2.295057535171509, "step": 1688} +{"train_info/time_between_train_steps": 0.003160715103149414, "step": 1688} +{"info/global_step": 1689, "train_info/time_within_train_step": 2.28594708442688, "step": 1689} +{"train_info/time_between_train_steps": 0.0031654834747314453, "step": 1689} +{"info/global_step": 1690, "train_info/time_within_train_step": 2.2853169441223145, "step": 1690} +{"train_info/time_between_train_steps": 0.0031468868255615234, "step": 1690} +{"info/global_step": 1691, "train_info/time_within_train_step": 2.285158157348633, "step": 1691} +{"train_info/time_between_train_steps": 0.003149271011352539, "step": 1691} +{"info/global_step": 1692, "train_info/time_within_train_step": 2.2847907543182373, "step": 1692} +{"train_info/time_between_train_steps": 0.00318145751953125, "step": 1692} +{"info/global_step": 1693, "train_info/time_within_train_step": 2.285895586013794, "step": 1693} +{"train_info/time_between_train_steps": 0.0031890869140625, "step": 1693} +{"info/global_step": 1694, "train_info/time_within_train_step": 2.286398410797119, "step": 1694} +{"train_info/time_between_train_steps": 0.0031838417053222656, "step": 1694} +{"info/global_step": 1695, "train_info/time_within_train_step": 2.285520076751709, "step": 1695} +{"train_info/time_between_train_steps": 0.003162384033203125, "step": 1695} +{"info/global_step": 1696, "train_info/time_within_train_step": 2.286846160888672, "step": 1696} +{"train_info/time_between_train_steps": 0.0031747817993164062, "step": 1696} +{"info/global_step": 1697, "train_info/time_within_train_step": 2.286687135696411, "step": 1697} +{"train_info/time_between_train_steps": 0.003207683563232422, "step": 1697} +{"info/global_step": 1698, "train_info/time_within_train_step": 2.2867276668548584, "step": 1698} +{"train_info/time_between_train_steps": 0.003161191940307617, "step": 1698} +{"info/global_step": 1699, "train_info/time_within_train_step": 2.288217067718506, "step": 1699} +{"train_info/time_between_train_steps": 0.0031626224517822266, "step": 1699} +{"info/global_step": 1700, "train_info/time_within_train_step": 2.2868809700012207, "step": 1700} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746348089, "_runtime": 4186}, "step": 1700} +{"logs": {"train/loss": 3.587, "train/learning_rate": 0.0002888888888888888, "train/epoch": 1.2, "_timestamp": 1746348089, "_runtime": 4186}, "step": 1700} +{"train_info/time_between_train_steps": 12.55452036857605, "step": 1700} +{"info/global_step": 1701, "train_info/time_within_train_step": 2.121567487716675, "step": 1701} +{"train_info/time_between_train_steps": 0.0032007694244384766, "step": 1701} +{"info/global_step": 1702, "train_info/time_within_train_step": 2.10587477684021, "step": 1702} +{"train_info/time_between_train_steps": 0.0031585693359375, "step": 1702} +{"info/global_step": 1703, "train_info/time_within_train_step": 2.206407308578491, "step": 1703} +{"train_info/time_between_train_steps": 0.003191709518432617, "step": 1703} +{"info/global_step": 1704, "train_info/time_within_train_step": 2.2826120853424072, "step": 1704} +{"train_info/time_between_train_steps": 0.0031256675720214844, "step": 1704} +{"info/global_step": 1705, "train_info/time_within_train_step": 2.283353090286255, "step": 1705} +{"train_info/time_between_train_steps": 0.003136157989501953, "step": 1705} +{"info/global_step": 1706, "train_info/time_within_train_step": 2.2843146324157715, "step": 1706} +{"train_info/time_between_train_steps": 0.003152132034301758, "step": 1706} +{"info/global_step": 1707, "train_info/time_within_train_step": 2.2849559783935547, "step": 1707} +{"train_info/time_between_train_steps": 0.003135204315185547, "step": 1707} +{"info/global_step": 1708, "train_info/time_within_train_step": 2.284344434738159, "step": 1708} +{"train_info/time_between_train_steps": 0.0031425952911376953, "step": 1708} +{"info/global_step": 1709, "train_info/time_within_train_step": 2.530186176300049, "step": 1709} +{"train_info/time_between_train_steps": 0.0031762123107910156, "step": 1709} +{"info/global_step": 1710, "train_info/time_within_train_step": 2.2849884033203125, "step": 1710} +{"train_info/time_between_train_steps": 0.0033559799194335938, "step": 1710} +{"info/global_step": 1711, "train_info/time_within_train_step": 2.2855842113494873, "step": 1711} +{"train_info/time_between_train_steps": 0.0031952857971191406, "step": 1711} +{"info/global_step": 1712, "train_info/time_within_train_step": 2.285750150680542, "step": 1712} +{"train_info/time_between_train_steps": 0.0031511783599853516, "step": 1712} +{"info/global_step": 1713, "train_info/time_within_train_step": 2.2859489917755127, "step": 1713} +{"train_info/time_between_train_steps": 0.0031447410583496094, "step": 1713} +{"info/global_step": 1714, "train_info/time_within_train_step": 2.2869694232940674, "step": 1714} +{"train_info/time_between_train_steps": 0.0031828880310058594, "step": 1714} +{"info/global_step": 1715, "train_info/time_within_train_step": 2.2865138053894043, "step": 1715} +{"train_info/time_between_train_steps": 0.0031566619873046875, "step": 1715} +{"info/global_step": 1716, "train_info/time_within_train_step": 2.2866971492767334, "step": 1716} +{"train_info/time_between_train_steps": 0.0031898021697998047, "step": 1716} +{"info/global_step": 1717, "train_info/time_within_train_step": 2.291128396987915, "step": 1717} +{"train_info/time_between_train_steps": 0.1308906078338623, "step": 1717} +{"info/global_step": 1718, "train_info/time_within_train_step": 2.2864060401916504, "step": 1718} +{"train_info/time_between_train_steps": 0.0032427310943603516, "step": 1718} +{"info/global_step": 1719, "train_info/time_within_train_step": 2.286836624145508, "step": 1719} +{"train_info/time_between_train_steps": 0.0031807422637939453, "step": 1719} +{"info/global_step": 1720, "train_info/time_within_train_step": 2.2862050533294678, "step": 1720} +{"train_info/time_between_train_steps": 0.003205537796020508, "step": 1720} +{"info/global_step": 1721, "train_info/time_within_train_step": 2.2859606742858887, "step": 1721} +{"train_info/time_between_train_steps": 0.0032243728637695312, "step": 1721} +{"info/global_step": 1722, "train_info/time_within_train_step": 2.2857937812805176, "step": 1722} +{"train_info/time_between_train_steps": 0.003183603286743164, "step": 1722} +{"info/global_step": 1723, "train_info/time_within_train_step": 2.2857472896575928, "step": 1723} +{"train_info/time_between_train_steps": 0.0031402111053466797, "step": 1723} +{"info/global_step": 1724, "train_info/time_within_train_step": 2.285308361053467, "step": 1724} +{"train_info/time_between_train_steps": 0.0031633377075195312, "step": 1724} +{"info/global_step": 1725, "train_info/time_within_train_step": 2.2851202487945557, "step": 1725} +{"train_info/time_between_train_steps": 0.003173351287841797, "step": 1725} +{"info/global_step": 1726, "train_info/time_within_train_step": 2.3278656005859375, "step": 1726} +{"train_info/time_between_train_steps": 0.0031728744506835938, "step": 1726} +{"info/global_step": 1727, "train_info/time_within_train_step": 2.2855701446533203, "step": 1727} +{"train_info/time_between_train_steps": 0.0031664371490478516, "step": 1727} +{"info/global_step": 1728, "train_info/time_within_train_step": 2.2855336666107178, "step": 1728} +{"train_info/time_between_train_steps": 0.003143787384033203, "step": 1728} +{"info/global_step": 1729, "train_info/time_within_train_step": 2.2903542518615723, "step": 1729} +{"train_info/time_between_train_steps": 0.003122568130493164, "step": 1729} +{"info/global_step": 1730, "train_info/time_within_train_step": 2.285665988922119, "step": 1730} +{"train_info/time_between_train_steps": 0.003117799758911133, "step": 1730} +{"info/global_step": 1731, "train_info/time_within_train_step": 2.2862491607666016, "step": 1731} +{"train_info/time_between_train_steps": 0.0031206607818603516, "step": 1731} +{"info/global_step": 1732, "train_info/time_within_train_step": 2.2864110469818115, "step": 1732} +{"train_info/time_between_train_steps": 0.003164052963256836, "step": 1732} +{"info/global_step": 1733, "train_info/time_within_train_step": 2.285792589187622, "step": 1733} +{"train_info/time_between_train_steps": 0.003148317337036133, "step": 1733} +{"info/global_step": 1734, "train_info/time_within_train_step": 2.286376476287842, "step": 1734} +{"train_info/time_between_train_steps": 0.0037441253662109375, "step": 1734} +{"info/global_step": 1735, "train_info/time_within_train_step": 2.286134958267212, "step": 1735} +{"train_info/time_between_train_steps": 0.0031354427337646484, "step": 1735} +{"info/global_step": 1736, "train_info/time_within_train_step": 2.286219596862793, "step": 1736} +{"train_info/time_between_train_steps": 0.003175973892211914, "step": 1736} +{"info/global_step": 1737, "train_info/time_within_train_step": 2.286175012588501, "step": 1737} +{"train_info/time_between_train_steps": 0.0031366348266601562, "step": 1737} +{"info/global_step": 1738, "train_info/time_within_train_step": 2.2861459255218506, "step": 1738} +{"train_info/time_between_train_steps": 0.00318145751953125, "step": 1738} +{"info/global_step": 1739, "train_info/time_within_train_step": 2.2864842414855957, "step": 1739} +{"train_info/time_between_train_steps": 0.0031609535217285156, "step": 1739} +{"info/global_step": 1740, "train_info/time_within_train_step": 2.286712408065796, "step": 1740} +{"train_info/time_between_train_steps": 0.003179311752319336, "step": 1740} +{"info/global_step": 1741, "train_info/time_within_train_step": 2.2864480018615723, "step": 1741} +{"train_info/time_between_train_steps": 0.003194093704223633, "step": 1741} +{"info/global_step": 1742, "train_info/time_within_train_step": 2.2861063480377197, "step": 1742} +{"train_info/time_between_train_steps": 0.0031540393829345703, "step": 1742} +{"info/global_step": 1743, "train_info/time_within_train_step": 2.2923014163970947, "step": 1743} +{"train_info/time_between_train_steps": 0.003133535385131836, "step": 1743} +{"info/global_step": 1744, "train_info/time_within_train_step": 2.286367416381836, "step": 1744} +{"train_info/time_between_train_steps": 0.0031349658966064453, "step": 1744} +{"info/global_step": 1745, "train_info/time_within_train_step": 2.2857401371002197, "step": 1745} +{"train_info/time_between_train_steps": 0.0031630992889404297, "step": 1745} +{"info/global_step": 1746, "train_info/time_within_train_step": 2.286130428314209, "step": 1746} +{"train_info/time_between_train_steps": 0.003111124038696289, "step": 1746} +{"info/global_step": 1747, "train_info/time_within_train_step": 2.2856006622314453, "step": 1747} +{"train_info/time_between_train_steps": 0.003117084503173828, "step": 1747} +{"info/global_step": 1748, "train_info/time_within_train_step": 2.285341262817383, "step": 1748} +{"train_info/time_between_train_steps": 0.0031363964080810547, "step": 1748} +{"info/global_step": 1749, "train_info/time_within_train_step": 2.2855114936828613, "step": 1749} +{"train_info/time_between_train_steps": 0.0032045841217041016, "step": 1749} +{"info/global_step": 1750, "train_info/time_within_train_step": 2.6614773273468018, "step": 1750} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746348217, "_runtime": 4314}, "step": 1750} +{"logs": {"train/loss": 3.5669, "train/learning_rate": 0.0002777777777777778, "train/epoch": 1.22, "_timestamp": 1746348217, "_runtime": 4314}, "step": 1750} +{"train_info/time_between_train_steps": 0.024617671966552734, "step": 1750} +{"info/global_step": 1751, "train_info/time_within_train_step": 2.285679817199707, "step": 1751} +{"train_info/time_between_train_steps": 0.0031435489654541016, "step": 1751} +{"info/global_step": 1752, "train_info/time_within_train_step": 2.2857747077941895, "step": 1752} +{"train_info/time_between_train_steps": 0.003126859664916992, "step": 1752} +{"info/global_step": 1753, "train_info/time_within_train_step": 2.2857937812805176, "step": 1753} +{"train_info/time_between_train_steps": 0.0031387805938720703, "step": 1753} +{"info/global_step": 1754, "train_info/time_within_train_step": 2.2857117652893066, "step": 1754} +{"train_info/time_between_train_steps": 0.0031249523162841797, "step": 1754} +{"info/global_step": 1755, "train_info/time_within_train_step": 2.2856082916259766, "step": 1755} +{"train_info/time_between_train_steps": 0.003128528594970703, "step": 1755} +{"info/global_step": 1756, "train_info/time_within_train_step": 2.2858176231384277, "step": 1756} +{"train_info/time_between_train_steps": 0.003178834915161133, "step": 1756} +{"info/global_step": 1757, "train_info/time_within_train_step": 2.2861101627349854, "step": 1757} +{"train_info/time_between_train_steps": 0.003110647201538086, "step": 1757} +{"info/global_step": 1758, "train_info/time_within_train_step": 2.2856297492980957, "step": 1758} +{"train_info/time_between_train_steps": 0.0031616687774658203, "step": 1758} +{"info/global_step": 1759, "train_info/time_within_train_step": 2.284984588623047, "step": 1759} +{"train_info/time_between_train_steps": 0.0031239986419677734, "step": 1759} +{"info/global_step": 1760, "train_info/time_within_train_step": 2.285031318664551, "step": 1760} +{"train_info/time_between_train_steps": 0.0031566619873046875, "step": 1760} +{"info/global_step": 1761, "train_info/time_within_train_step": 2.285883665084839, "step": 1761} +{"train_info/time_between_train_steps": 0.003120899200439453, "step": 1761} +{"info/global_step": 1762, "train_info/time_within_train_step": 2.285714626312256, "step": 1762} +{"train_info/time_between_train_steps": 0.003134489059448242, "step": 1762} +{"info/global_step": 1763, "train_info/time_within_train_step": 2.2860331535339355, "step": 1763} +{"train_info/time_between_train_steps": 0.0031375885009765625, "step": 1763} +{"info/global_step": 1764, "train_info/time_within_train_step": 2.2859573364257812, "step": 1764} +{"train_info/time_between_train_steps": 0.0034623146057128906, "step": 1764} +{"info/global_step": 1765, "train_info/time_within_train_step": 2.2859363555908203, "step": 1765} +{"train_info/time_between_train_steps": 0.0031595230102539062, "step": 1765} +{"info/global_step": 1766, "train_info/time_within_train_step": 2.2868130207061768, "step": 1766} +{"train_info/time_between_train_steps": 0.003137826919555664, "step": 1766} +{"info/global_step": 1767, "train_info/time_within_train_step": 2.2858803272247314, "step": 1767} +{"train_info/time_between_train_steps": 0.0031430721282958984, "step": 1767} +{"info/global_step": 1768, "train_info/time_within_train_step": 2.286310911178589, "step": 1768} +{"train_info/time_between_train_steps": 0.0031614303588867188, "step": 1768} +{"info/global_step": 1769, "train_info/time_within_train_step": 2.2852110862731934, "step": 1769} +{"train_info/time_between_train_steps": 0.003110647201538086, "step": 1769} +{"info/global_step": 1770, "train_info/time_within_train_step": 2.2858219146728516, "step": 1770} +{"train_info/time_between_train_steps": 0.0031309127807617188, "step": 1770} +{"info/global_step": 1771, "train_info/time_within_train_step": 2.2862026691436768, "step": 1771} +{"train_info/time_between_train_steps": 0.003144502639770508, "step": 1771} +{"info/global_step": 1772, "train_info/time_within_train_step": 2.2860310077667236, "step": 1772} +{"train_info/time_between_train_steps": 0.0031659603118896484, "step": 1772} +{"info/global_step": 1773, "train_info/time_within_train_step": 2.285869836807251, "step": 1773} +{"train_info/time_between_train_steps": 0.0031380653381347656, "step": 1773} +{"info/global_step": 1774, "train_info/time_within_train_step": 2.2858633995056152, "step": 1774} +{"train_info/time_between_train_steps": 0.0031332969665527344, "step": 1774} +{"info/global_step": 1775, "train_info/time_within_train_step": 2.2860589027404785, "step": 1775} +{"train_info/time_between_train_steps": 0.0032453536987304688, "step": 1775} +{"info/global_step": 1776, "train_info/time_within_train_step": 2.2857234477996826, "step": 1776} +{"train_info/time_between_train_steps": 0.003141641616821289, "step": 1776} +{"info/global_step": 1777, "train_info/time_within_train_step": 2.285649061203003, "step": 1777} +{"train_info/time_between_train_steps": 0.003160715103149414, "step": 1777} +{"info/global_step": 1778, "train_info/time_within_train_step": 2.285858631134033, "step": 1778} +{"train_info/time_between_train_steps": 0.0031647682189941406, "step": 1778} +{"info/global_step": 1779, "train_info/time_within_train_step": 2.2857632637023926, "step": 1779} +{"train_info/time_between_train_steps": 0.003141641616821289, "step": 1779} +{"info/global_step": 1780, "train_info/time_within_train_step": 2.4108388423919678, "step": 1780} +{"train_info/time_between_train_steps": 0.003153562545776367, "step": 1780} +{"info/global_step": 1781, "train_info/time_within_train_step": 2.2861263751983643, "step": 1781} +{"train_info/time_between_train_steps": 0.0031740665435791016, "step": 1781} +{"info/global_step": 1782, "train_info/time_within_train_step": 2.2863051891326904, "step": 1782} +{"train_info/time_between_train_steps": 0.003142833709716797, "step": 1782} +{"info/global_step": 1783, "train_info/time_within_train_step": 2.2855091094970703, "step": 1783} +{"train_info/time_between_train_steps": 0.0031461715698242188, "step": 1783} +{"info/global_step": 1784, "train_info/time_within_train_step": 2.286090612411499, "step": 1784} +{"train_info/time_between_train_steps": 0.0031585693359375, "step": 1784} +{"info/global_step": 1785, "train_info/time_within_train_step": 2.2863821983337402, "step": 1785} +{"train_info/time_between_train_steps": 0.003195047378540039, "step": 1785} +{"info/global_step": 1786, "train_info/time_within_train_step": 2.286964178085327, "step": 1786} +{"train_info/time_between_train_steps": 0.003190279006958008, "step": 1786} +{"info/global_step": 1787, "train_info/time_within_train_step": 2.286360263824463, "step": 1787} +{"train_info/time_between_train_steps": 0.003175020217895508, "step": 1787} +{"info/global_step": 1788, "train_info/time_within_train_step": 2.286299467086792, "step": 1788} +{"train_info/time_between_train_steps": 0.0031905174255371094, "step": 1788} +{"info/global_step": 1789, "train_info/time_within_train_step": 2.286013126373291, "step": 1789} +{"train_info/time_between_train_steps": 0.0032203197479248047, "step": 1789} +{"info/global_step": 1790, "train_info/time_within_train_step": 2.2864768505096436, "step": 1790} +{"train_info/time_between_train_steps": 0.003175497055053711, "step": 1790} +{"info/global_step": 1791, "train_info/time_within_train_step": 2.286254644393921, "step": 1791} +{"train_info/time_between_train_steps": 0.003168821334838867, "step": 1791} +{"info/global_step": 1792, "train_info/time_within_train_step": 2.285306453704834, "step": 1792} +{"train_info/time_between_train_steps": 0.0031824111938476562, "step": 1792} +{"info/global_step": 1793, "train_info/time_within_train_step": 2.2859809398651123, "step": 1793} +{"train_info/time_between_train_steps": 0.0032236576080322266, "step": 1793} +{"info/global_step": 1794, "train_info/time_within_train_step": 2.285871982574463, "step": 1794} +{"train_info/time_between_train_steps": 0.003148317337036133, "step": 1794} +{"info/global_step": 1795, "train_info/time_within_train_step": 2.5441060066223145, "step": 1795} +{"train_info/time_between_train_steps": 0.003202199935913086, "step": 1795} +{"info/global_step": 1796, "train_info/time_within_train_step": 2.285578489303589, "step": 1796} +{"train_info/time_between_train_steps": 0.003188610076904297, "step": 1796} +{"info/global_step": 1797, "train_info/time_within_train_step": 2.2860987186431885, "step": 1797} +{"train_info/time_between_train_steps": 0.0032165050506591797, "step": 1797} +{"info/global_step": 1798, "train_info/time_within_train_step": 2.285719156265259, "step": 1798} +{"train_info/time_between_train_steps": 0.0031747817993164062, "step": 1798} +{"info/global_step": 1799, "train_info/time_within_train_step": 2.2859065532684326, "step": 1799} +{"train_info/time_between_train_steps": 0.003163576126098633, "step": 1799} +{"info/global_step": 1800, "train_info/time_within_train_step": 2.2861249446868896, "step": 1800} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746348333, "_runtime": 4430}, "step": 1800} +{"logs": {"train/loss": 3.5486, "train/learning_rate": 0.0002666666666666666, "train/epoch": 1.24, "_timestamp": 1746348333, "_runtime": 4430}, "step": 1800} +{"train_info/time_between_train_steps": 12.57667589187622, "step": 1800} +{"info/global_step": 1801, "train_info/time_within_train_step": 2.110943555831909, "step": 1801} +{"train_info/time_between_train_steps": 0.0031654834747314453, "step": 1801} +{"info/global_step": 1802, "train_info/time_within_train_step": 2.102459192276001, "step": 1802} +{"train_info/time_between_train_steps": 0.003190279006958008, "step": 1802} +{"info/global_step": 1803, "train_info/time_within_train_step": 2.218395471572876, "step": 1803} +{"train_info/time_between_train_steps": 0.003178834915161133, "step": 1803} +{"info/global_step": 1804, "train_info/time_within_train_step": 2.285564661026001, "step": 1804} +{"train_info/time_between_train_steps": 0.0032052993774414062, "step": 1804} +{"info/global_step": 1805, "train_info/time_within_train_step": 2.2854418754577637, "step": 1805} +{"train_info/time_between_train_steps": 0.0032699108123779297, "step": 1805} +{"info/global_step": 1806, "train_info/time_within_train_step": 2.2860372066497803, "step": 1806} +{"train_info/time_between_train_steps": 0.0031609535217285156, "step": 1806} +{"info/global_step": 1807, "train_info/time_within_train_step": 2.2852766513824463, "step": 1807} +{"train_info/time_between_train_steps": 0.0031578540802001953, "step": 1807} +{"info/global_step": 1808, "train_info/time_within_train_step": 2.2863357067108154, "step": 1808} +{"train_info/time_between_train_steps": 0.0031838417053222656, "step": 1808} +{"info/global_step": 1809, "train_info/time_within_train_step": 2.2861011028289795, "step": 1809} +{"train_info/time_between_train_steps": 0.003162860870361328, "step": 1809} +{"info/global_step": 1810, "train_info/time_within_train_step": 2.286353588104248, "step": 1810} +{"train_info/time_between_train_steps": 0.0031807422637939453, "step": 1810} +{"info/global_step": 1811, "train_info/time_within_train_step": 2.2862043380737305, "step": 1811} +{"train_info/time_between_train_steps": 0.0031387805938720703, "step": 1811} +{"info/global_step": 1812, "train_info/time_within_train_step": 2.2860400676727295, "step": 1812} +{"train_info/time_between_train_steps": 0.003187417984008789, "step": 1812} +{"info/global_step": 1813, "train_info/time_within_train_step": 2.2867207527160645, "step": 1813} +{"train_info/time_between_train_steps": 0.0031633377075195312, "step": 1813} +{"info/global_step": 1814, "train_info/time_within_train_step": 2.286668062210083, "step": 1814} +{"train_info/time_between_train_steps": 0.0032286643981933594, "step": 1814} +{"info/global_step": 1815, "train_info/time_within_train_step": 2.2874338626861572, "step": 1815} +{"train_info/time_between_train_steps": 0.003186941146850586, "step": 1815} +{"info/global_step": 1816, "train_info/time_within_train_step": 2.287158966064453, "step": 1816} +{"train_info/time_between_train_steps": 0.0031914710998535156, "step": 1816} +{"info/global_step": 1817, "train_info/time_within_train_step": 2.286785840988159, "step": 1817} +{"train_info/time_between_train_steps": 0.003164052963256836, "step": 1817} +{"info/global_step": 1818, "train_info/time_within_train_step": 2.286515235900879, "step": 1818} +{"train_info/time_between_train_steps": 0.003159046173095703, "step": 1818} +{"info/global_step": 1819, "train_info/time_within_train_step": 2.288698434829712, "step": 1819} +{"train_info/time_between_train_steps": 0.0031511783599853516, "step": 1819} +{"info/global_step": 1820, "train_info/time_within_train_step": 2.2871222496032715, "step": 1820} +{"train_info/time_between_train_steps": 0.003200531005859375, "step": 1820} +{"info/global_step": 1821, "train_info/time_within_train_step": 2.287466526031494, "step": 1821} +{"train_info/time_between_train_steps": 0.003203153610229492, "step": 1821} +{"info/global_step": 1822, "train_info/time_within_train_step": 2.2870559692382812, "step": 1822} +{"train_info/time_between_train_steps": 0.003205537796020508, "step": 1822} +{"info/global_step": 1823, "train_info/time_within_train_step": 2.2878987789154053, "step": 1823} +{"train_info/time_between_train_steps": 0.0032134056091308594, "step": 1823} +{"info/global_step": 1824, "train_info/time_within_train_step": 2.287182092666626, "step": 1824} +{"train_info/time_between_train_steps": 0.00316619873046875, "step": 1824} +{"info/global_step": 1825, "train_info/time_within_train_step": 2.286926031112671, "step": 1825} +{"train_info/time_between_train_steps": 0.003204345703125, "step": 1825} +{"info/global_step": 1826, "train_info/time_within_train_step": 2.2863099575042725, "step": 1826} +{"train_info/time_between_train_steps": 0.0032045841217041016, "step": 1826} +{"info/global_step": 1827, "train_info/time_within_train_step": 2.2870900630950928, "step": 1827} +{"train_info/time_between_train_steps": 0.0031578540802001953, "step": 1827} +{"info/global_step": 1828, "train_info/time_within_train_step": 2.286842107772827, "step": 1828} +{"train_info/time_between_train_steps": 0.0032041072845458984, "step": 1828} +{"info/global_step": 1829, "train_info/time_within_train_step": 2.287384271621704, "step": 1829} +{"train_info/time_between_train_steps": 0.003434896469116211, "step": 1829} +{"info/global_step": 1830, "train_info/time_within_train_step": 2.287235736846924, "step": 1830} +{"train_info/time_between_train_steps": 0.0031676292419433594, "step": 1830} +{"info/global_step": 1831, "train_info/time_within_train_step": 2.287100315093994, "step": 1831} +{"train_info/time_between_train_steps": 0.003175973892211914, "step": 1831} +{"info/global_step": 1832, "train_info/time_within_train_step": 2.286813497543335, "step": 1832} +{"train_info/time_between_train_steps": 0.003154754638671875, "step": 1832} +{"info/global_step": 1833, "train_info/time_within_train_step": 2.2869105339050293, "step": 1833} +{"train_info/time_between_train_steps": 0.0031647682189941406, "step": 1833} +{"info/global_step": 1834, "train_info/time_within_train_step": 2.286738157272339, "step": 1834} +{"train_info/time_between_train_steps": 0.003156423568725586, "step": 1834} +{"info/global_step": 1835, "train_info/time_within_train_step": 2.2869346141815186, "step": 1835} +{"train_info/time_between_train_steps": 0.003134489059448242, "step": 1835} +{"info/global_step": 1836, "train_info/time_within_train_step": 2.545806646347046, "step": 1836} +{"train_info/time_between_train_steps": 0.003192901611328125, "step": 1836} +{"info/global_step": 1837, "train_info/time_within_train_step": 2.287456750869751, "step": 1837} +{"train_info/time_between_train_steps": 0.003177165985107422, "step": 1837} +{"info/global_step": 1838, "train_info/time_within_train_step": 2.287263870239258, "step": 1838} +{"train_info/time_between_train_steps": 0.003185749053955078, "step": 1838} +{"info/global_step": 1839, "train_info/time_within_train_step": 2.2876639366149902, "step": 1839} +{"train_info/time_between_train_steps": 0.0031549930572509766, "step": 1839} +{"info/global_step": 1840, "train_info/time_within_train_step": 2.2872767448425293, "step": 1840} +{"train_info/time_between_train_steps": 0.0031328201293945312, "step": 1840} +{"info/global_step": 1841, "train_info/time_within_train_step": 2.287642002105713, "step": 1841} +{"train_info/time_between_train_steps": 0.003130674362182617, "step": 1841} +{"info/global_step": 1842, "train_info/time_within_train_step": 2.2876760959625244, "step": 1842} +{"train_info/time_between_train_steps": 0.07327747344970703, "step": 1842} +{"info/global_step": 1843, "train_info/time_within_train_step": 2.2876381874084473, "step": 1843} +{"train_info/time_between_train_steps": 0.0032198429107666016, "step": 1843} +{"info/global_step": 1844, "train_info/time_within_train_step": 2.2875537872314453, "step": 1844} +{"train_info/time_between_train_steps": 0.003207683563232422, "step": 1844} +{"info/global_step": 1845, "train_info/time_within_train_step": 2.2881903648376465, "step": 1845} +{"train_info/time_between_train_steps": 0.003208637237548828, "step": 1845} +{"info/global_step": 1846, "train_info/time_within_train_step": 2.287895441055298, "step": 1846} +{"train_info/time_between_train_steps": 0.0031919479370117188, "step": 1846} +{"info/global_step": 1847, "train_info/time_within_train_step": 2.2882227897644043, "step": 1847} +{"train_info/time_between_train_steps": 0.0032083988189697266, "step": 1847} +{"info/global_step": 1848, "train_info/time_within_train_step": 2.2874667644500732, "step": 1848} +{"train_info/time_between_train_steps": 0.003202199935913086, "step": 1848} +{"info/global_step": 1849, "train_info/time_within_train_step": 2.2872073650360107, "step": 1849} +{"train_info/time_between_train_steps": 0.0031404495239257812, "step": 1849} +{"info/global_step": 1850, "train_info/time_within_train_step": 2.2872426509857178, "step": 1850} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746348461, "_runtime": 4558}, "step": 1850} +{"logs": {"train/loss": 3.5352, "train/learning_rate": 0.00025555555555555553, "train/epoch": 1.25, "_timestamp": 1746348461, "_runtime": 4558}, "step": 1850} +{"train_info/time_between_train_steps": 0.025029897689819336, "step": 1850} +{"info/global_step": 1851, "train_info/time_within_train_step": 2.287393093109131, "step": 1851} +{"train_info/time_between_train_steps": 0.0032205581665039062, "step": 1851} +{"info/global_step": 1852, "train_info/time_within_train_step": 2.287203550338745, "step": 1852} +{"train_info/time_between_train_steps": 0.0032041072845458984, "step": 1852} +{"info/global_step": 1853, "train_info/time_within_train_step": 2.286745309829712, "step": 1853} +{"train_info/time_between_train_steps": 0.003326892852783203, "step": 1853} +{"info/global_step": 1854, "train_info/time_within_train_step": 2.2864651679992676, "step": 1854} +{"train_info/time_between_train_steps": 0.003148794174194336, "step": 1854} +{"info/global_step": 1855, "train_info/time_within_train_step": 2.28669810295105, "step": 1855} +{"train_info/time_between_train_steps": 0.0031702518463134766, "step": 1855} +{"info/global_step": 1856, "train_info/time_within_train_step": 2.286719799041748, "step": 1856} +{"train_info/time_between_train_steps": 0.0031425952911376953, "step": 1856} +{"info/global_step": 1857, "train_info/time_within_train_step": 2.287360191345215, "step": 1857} +{"train_info/time_between_train_steps": 0.003151416778564453, "step": 1857} +{"info/global_step": 1858, "train_info/time_within_train_step": 2.286665678024292, "step": 1858} +{"train_info/time_between_train_steps": 0.0031890869140625, "step": 1858} +{"info/global_step": 1859, "train_info/time_within_train_step": 2.2870655059814453, "step": 1859} +{"train_info/time_between_train_steps": 0.0031714439392089844, "step": 1859} +{"info/global_step": 1860, "train_info/time_within_train_step": 2.2871930599212646, "step": 1860} +{"train_info/time_between_train_steps": 0.003214597702026367, "step": 1860} +{"info/global_step": 1861, "train_info/time_within_train_step": 2.2867271900177, "step": 1861} +{"train_info/time_between_train_steps": 0.0031769275665283203, "step": 1861} +{"info/global_step": 1862, "train_info/time_within_train_step": 2.2870872020721436, "step": 1862} +{"train_info/time_between_train_steps": 0.0031828880310058594, "step": 1862} +{"info/global_step": 1863, "train_info/time_within_train_step": 2.28721022605896, "step": 1863} +{"train_info/time_between_train_steps": 0.003126859664916992, "step": 1863} +{"info/global_step": 1864, "train_info/time_within_train_step": 2.287058115005493, "step": 1864} +{"train_info/time_between_train_steps": 0.0034074783325195312, "step": 1864} +{"info/global_step": 1865, "train_info/time_within_train_step": 2.287540912628174, "step": 1865} +{"train_info/time_between_train_steps": 0.0031652450561523438, "step": 1865} +{"info/global_step": 1866, "train_info/time_within_train_step": 2.2878925800323486, "step": 1866} +{"train_info/time_between_train_steps": 0.0031366348266601562, "step": 1866} +{"info/global_step": 1867, "train_info/time_within_train_step": 2.2877564430236816, "step": 1867} +{"train_info/time_between_train_steps": 0.0031805038452148438, "step": 1867} +{"info/global_step": 1868, "train_info/time_within_train_step": 2.2871758937835693, "step": 1868} +{"train_info/time_between_train_steps": 0.003158092498779297, "step": 1868} +{"info/global_step": 1869, "train_info/time_within_train_step": 2.287278413772583, "step": 1869} +{"train_info/time_between_train_steps": 0.003178119659423828, "step": 1869} +{"info/global_step": 1870, "train_info/time_within_train_step": 2.2867202758789062, "step": 1870} +{"train_info/time_between_train_steps": 0.0031647682189941406, "step": 1870} +{"info/global_step": 1871, "train_info/time_within_train_step": 2.286827564239502, "step": 1871} +{"train_info/time_between_train_steps": 0.003183126449584961, "step": 1871} +{"info/global_step": 1872, "train_info/time_within_train_step": 2.3005411624908447, "step": 1872} +{"train_info/time_between_train_steps": 0.0028748512268066406, "step": 1872} +{"info/global_step": 1873, "train_info/time_within_train_step": 2.2857449054718018, "step": 1873} +{"train_info/time_between_train_steps": 0.002844572067260742, "step": 1873} +{"info/global_step": 1874, "train_info/time_within_train_step": 2.2845618724823, "step": 1874} +{"train_info/time_between_train_steps": 0.002864360809326172, "step": 1874} +{"info/global_step": 1875, "train_info/time_within_train_step": 2.2851243019104004, "step": 1875} +{"train_info/time_between_train_steps": 0.0028655529022216797, "step": 1875} +{"info/global_step": 1876, "train_info/time_within_train_step": 2.2850193977355957, "step": 1876} +{"train_info/time_between_train_steps": 0.002866506576538086, "step": 1876} +{"info/global_step": 1877, "train_info/time_within_train_step": 2.2843167781829834, "step": 1877} +{"train_info/time_between_train_steps": 0.002843618392944336, "step": 1877} +{"info/global_step": 1878, "train_info/time_within_train_step": 2.2850606441497803, "step": 1878} +{"train_info/time_between_train_steps": 0.002863645553588867, "step": 1878} +{"info/global_step": 1879, "train_info/time_within_train_step": 2.2850654125213623, "step": 1879} +{"train_info/time_between_train_steps": 0.0028934478759765625, "step": 1879} +{"info/global_step": 1880, "train_info/time_within_train_step": 2.285804033279419, "step": 1880} +{"train_info/time_between_train_steps": 0.0028655529022216797, "step": 1880} +{"info/global_step": 1881, "train_info/time_within_train_step": 2.2861223220825195, "step": 1881} +{"train_info/time_between_train_steps": 0.0028734207153320312, "step": 1881} +{"info/global_step": 1882, "train_info/time_within_train_step": 2.285709857940674, "step": 1882} +{"train_info/time_between_train_steps": 0.0028853416442871094, "step": 1882} +{"info/global_step": 1883, "train_info/time_within_train_step": 2.2859349250793457, "step": 1883} +{"train_info/time_between_train_steps": 0.0028753280639648438, "step": 1883} +{"info/global_step": 1884, "train_info/time_within_train_step": 2.2858927249908447, "step": 1884} +{"train_info/time_between_train_steps": 0.0029494762420654297, "step": 1884} +{"info/global_step": 1885, "train_info/time_within_train_step": 2.286428689956665, "step": 1885} +{"train_info/time_between_train_steps": 0.002857208251953125, "step": 1885} +{"info/global_step": 1886, "train_info/time_within_train_step": 2.2860262393951416, "step": 1886} +{"train_info/time_between_train_steps": 0.00286102294921875, "step": 1886} +{"info/global_step": 1887, "train_info/time_within_train_step": 2.285778045654297, "step": 1887} +{"train_info/time_between_train_steps": 0.0028848648071289062, "step": 1887} +{"info/global_step": 1888, "train_info/time_within_train_step": 2.2856521606445312, "step": 1888} +{"train_info/time_between_train_steps": 0.0028514862060546875, "step": 1888} +{"info/global_step": 1889, "train_info/time_within_train_step": 2.2861287593841553, "step": 1889} +{"train_info/time_between_train_steps": 0.0028824806213378906, "step": 1889} +{"info/global_step": 1890, "train_info/time_within_train_step": 2.2868666648864746, "step": 1890} +{"train_info/time_between_train_steps": 0.002850055694580078, "step": 1890} +{"info/global_step": 1891, "train_info/time_within_train_step": 2.285722255706787, "step": 1891} +{"train_info/time_between_train_steps": 0.0029022693634033203, "step": 1891} +{"info/global_step": 1892, "train_info/time_within_train_step": 2.285879135131836, "step": 1892} +{"train_info/time_between_train_steps": 0.0028655529022216797, "step": 1892} +{"info/global_step": 1893, "train_info/time_within_train_step": 2.286027669906616, "step": 1893} +{"train_info/time_between_train_steps": 0.0029098987579345703, "step": 1893} +{"info/global_step": 1894, "train_info/time_within_train_step": 2.2850990295410156, "step": 1894} +{"train_info/time_between_train_steps": 0.0028781890869140625, "step": 1894} +{"info/global_step": 1895, "train_info/time_within_train_step": 2.2849342823028564, "step": 1895} +{"train_info/time_between_train_steps": 0.0028672218322753906, "step": 1895} +{"info/global_step": 1896, "train_info/time_within_train_step": 2.2846245765686035, "step": 1896} +{"train_info/time_between_train_steps": 0.002836465835571289, "step": 1896} +{"info/global_step": 1897, "train_info/time_within_train_step": 2.285536527633667, "step": 1897} +{"train_info/time_between_train_steps": 0.0028533935546875, "step": 1897} +{"info/global_step": 1898, "train_info/time_within_train_step": 2.28523850440979, "step": 1898} +{"train_info/time_between_train_steps": 0.0028553009033203125, "step": 1898} +{"info/global_step": 1899, "train_info/time_within_train_step": 2.2849109172821045, "step": 1899} +{"train_info/time_between_train_steps": 0.0029211044311523438, "step": 1899} +{"info/global_step": 1900, "train_info/time_within_train_step": 2.2856714725494385, "step": 1900} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746348576, "_runtime": 4673}, "step": 1900} +{"logs": {"train/loss": 3.5145, "train/learning_rate": 0.00024444444444444443, "train/epoch": 1.27, "_timestamp": 1746348576, "_runtime": 4673}, "step": 1900} +{"train_info/time_between_train_steps": 11.309028625488281, "step": 1900} +{"info/global_step": 1901, "train_info/time_within_train_step": 2.118950843811035, "step": 1901} +{"train_info/time_between_train_steps": 0.0028748512268066406, "step": 1901} +{"info/global_step": 1902, "train_info/time_within_train_step": 2.098010540008545, "step": 1902} +{"train_info/time_between_train_steps": 0.0028574466705322266, "step": 1902} +{"info/global_step": 1903, "train_info/time_within_train_step": 2.2368385791778564, "step": 1903} +{"train_info/time_between_train_steps": 0.0028481483459472656, "step": 1903} +{"info/global_step": 1904, "train_info/time_within_train_step": 2.2821693420410156, "step": 1904} +{"train_info/time_between_train_steps": 0.0028655529022216797, "step": 1904} +{"info/global_step": 1905, "train_info/time_within_train_step": 2.2831172943115234, "step": 1905} +{"train_info/time_between_train_steps": 0.002874612808227539, "step": 1905} +{"info/global_step": 1906, "train_info/time_within_train_step": 2.284578800201416, "step": 1906} +{"train_info/time_between_train_steps": 0.002930879592895508, "step": 1906} +{"info/global_step": 1907, "train_info/time_within_train_step": 2.3356378078460693, "step": 1907} +{"train_info/time_between_train_steps": 0.0029053688049316406, "step": 1907} +{"info/global_step": 1908, "train_info/time_within_train_step": 2.284917116165161, "step": 1908} +{"train_info/time_between_train_steps": 0.0028998851776123047, "step": 1908} +{"info/global_step": 1909, "train_info/time_within_train_step": 2.284715175628662, "step": 1909} +{"train_info/time_between_train_steps": 0.002863645553588867, "step": 1909} +{"info/global_step": 1910, "train_info/time_within_train_step": 2.2850258350372314, "step": 1910} +{"train_info/time_between_train_steps": 0.0030677318572998047, "step": 1910} +{"info/global_step": 1911, "train_info/time_within_train_step": 2.2862696647644043, "step": 1911} +{"train_info/time_between_train_steps": 0.002863168716430664, "step": 1911} +{"info/global_step": 1912, "train_info/time_within_train_step": 2.2853591442108154, "step": 1912} +{"train_info/time_between_train_steps": 0.0028617382049560547, "step": 1912} +{"info/global_step": 1913, "train_info/time_within_train_step": 2.286571979522705, "step": 1913} +{"train_info/time_between_train_steps": 0.002904653549194336, "step": 1913} +{"info/global_step": 1914, "train_info/time_within_train_step": 2.2856273651123047, "step": 1914} +{"train_info/time_between_train_steps": 0.00286102294921875, "step": 1914} +{"info/global_step": 1915, "train_info/time_within_train_step": 2.2858104705810547, "step": 1915} +{"train_info/time_between_train_steps": 0.002862691879272461, "step": 1915} +{"info/global_step": 1916, "train_info/time_within_train_step": 2.2858667373657227, "step": 1916} +{"train_info/time_between_train_steps": 0.002843141555786133, "step": 1916} +{"info/global_step": 1917, "train_info/time_within_train_step": 2.2856433391571045, "step": 1917} +{"train_info/time_between_train_steps": 0.0028934478759765625, "step": 1917} +{"info/global_step": 1918, "train_info/time_within_train_step": 2.2855188846588135, "step": 1918} +{"train_info/time_between_train_steps": 0.002852916717529297, "step": 1918} +{"info/global_step": 1919, "train_info/time_within_train_step": 2.2854034900665283, "step": 1919} +{"train_info/time_between_train_steps": 0.002861499786376953, "step": 1919} +{"info/global_step": 1920, "train_info/time_within_train_step": 2.285576105117798, "step": 1920} +{"train_info/time_between_train_steps": 0.002897977828979492, "step": 1920} +{"info/global_step": 1921, "train_info/time_within_train_step": 2.284888744354248, "step": 1921} +{"train_info/time_between_train_steps": 0.0028886795043945312, "step": 1921} +{"info/global_step": 1922, "train_info/time_within_train_step": 2.2849514484405518, "step": 1922} +{"train_info/time_between_train_steps": 0.00286865234375, "step": 1922} +{"info/global_step": 1923, "train_info/time_within_train_step": 2.284687042236328, "step": 1923} +{"train_info/time_between_train_steps": 0.002880096435546875, "step": 1923} +{"info/global_step": 1924, "train_info/time_within_train_step": 2.2852180004119873, "step": 1924} +{"train_info/time_between_train_steps": 0.0028977394104003906, "step": 1924} +{"info/global_step": 1925, "train_info/time_within_train_step": 2.2856552600860596, "step": 1925} +{"train_info/time_between_train_steps": 0.0028536319732666016, "step": 1925} +{"info/global_step": 1926, "train_info/time_within_train_step": 2.2853121757507324, "step": 1926} +{"train_info/time_between_train_steps": 0.0028650760650634766, "step": 1926} +{"info/global_step": 1927, "train_info/time_within_train_step": 2.2858386039733887, "step": 1927} +{"train_info/time_between_train_steps": 0.0029163360595703125, "step": 1927} +{"info/global_step": 1928, "train_info/time_within_train_step": 2.2859108448028564, "step": 1928} +{"train_info/time_between_train_steps": 0.0028810501098632812, "step": 1928} +{"info/global_step": 1929, "train_info/time_within_train_step": 2.285435438156128, "step": 1929} +{"train_info/time_between_train_steps": 0.0028603076934814453, "step": 1929} +{"info/global_step": 1930, "train_info/time_within_train_step": 2.2853634357452393, "step": 1930} +{"train_info/time_between_train_steps": 0.0028896331787109375, "step": 1930} +{"info/global_step": 1931, "train_info/time_within_train_step": 2.4793827533721924, "step": 1931} +{"train_info/time_between_train_steps": 0.002932310104370117, "step": 1931} +{"info/global_step": 1932, "train_info/time_within_train_step": 2.2860183715820312, "step": 1932} +{"train_info/time_between_train_steps": 0.0029087066650390625, "step": 1932} +{"info/global_step": 1933, "train_info/time_within_train_step": 2.336555004119873, "step": 1933} +{"train_info/time_between_train_steps": 0.002847433090209961, "step": 1933} +{"info/global_step": 1934, "train_info/time_within_train_step": 2.284989356994629, "step": 1934} +{"train_info/time_between_train_steps": 0.0028526782989501953, "step": 1934} +{"info/global_step": 1935, "train_info/time_within_train_step": 2.2855825424194336, "step": 1935} +{"train_info/time_between_train_steps": 0.002834796905517578, "step": 1935} +{"info/global_step": 1936, "train_info/time_within_train_step": 2.2851734161376953, "step": 1936} +{"train_info/time_between_train_steps": 0.0028324127197265625, "step": 1936} +{"info/global_step": 1937, "train_info/time_within_train_step": 2.284949779510498, "step": 1937} +{"train_info/time_between_train_steps": 0.0028884410858154297, "step": 1937} +{"info/global_step": 1938, "train_info/time_within_train_step": 2.28542160987854, "step": 1938} +{"train_info/time_between_train_steps": 0.0028820037841796875, "step": 1938} +{"info/global_step": 1939, "train_info/time_within_train_step": 2.284822463989258, "step": 1939} +{"train_info/time_between_train_steps": 0.0028624534606933594, "step": 1939} +{"info/global_step": 1940, "train_info/time_within_train_step": 2.284787654876709, "step": 1940} +{"train_info/time_between_train_steps": 0.0028541088104248047, "step": 1940} +{"info/global_step": 1941, "train_info/time_within_train_step": 2.2851402759552, "step": 1941} +{"train_info/time_between_train_steps": 0.0028693675994873047, "step": 1941} +{"info/global_step": 1942, "train_info/time_within_train_step": 2.2852697372436523, "step": 1942} +{"train_info/time_between_train_steps": 0.002889394760131836, "step": 1942} +{"info/global_step": 1943, "train_info/time_within_train_step": 2.28544282913208, "step": 1943} +{"train_info/time_between_train_steps": 0.002867460250854492, "step": 1943} +{"info/global_step": 1944, "train_info/time_within_train_step": 2.2856717109680176, "step": 1944} +{"train_info/time_between_train_steps": 0.002831697463989258, "step": 1944} +{"info/global_step": 1945, "train_info/time_within_train_step": 2.285475015640259, "step": 1945} +{"train_info/time_between_train_steps": 0.0028612613677978516, "step": 1945} +{"info/global_step": 1946, "train_info/time_within_train_step": 2.2855966091156006, "step": 1946} +{"train_info/time_between_train_steps": 0.002900362014770508, "step": 1946} +{"info/global_step": 1947, "train_info/time_within_train_step": 2.2862439155578613, "step": 1947} +{"train_info/time_between_train_steps": 0.0028295516967773438, "step": 1947} +{"info/global_step": 1948, "train_info/time_within_train_step": 2.2859644889831543, "step": 1948} +{"train_info/time_between_train_steps": 0.0028755664825439453, "step": 1948} +{"info/global_step": 1949, "train_info/time_within_train_step": 2.286590099334717, "step": 1949} +{"train_info/time_between_train_steps": 0.0028569698333740234, "step": 1949} +{"info/global_step": 1950, "train_info/time_within_train_step": 2.2869722843170166, "step": 1950} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746348703, "_runtime": 4800}, "step": 1950} +{"logs": {"train/loss": 3.5096, "train/learning_rate": 0.0002333333333333333, "train/epoch": 1.29, "_timestamp": 1746348703, "_runtime": 4800}, "step": 1950} +{"train_info/time_between_train_steps": 0.02451038360595703, "step": 1950} +{"info/global_step": 1951, "train_info/time_within_train_step": 2.285862922668457, "step": 1951} +{"train_info/time_between_train_steps": 0.002833843231201172, "step": 1951} +{"info/global_step": 1952, "train_info/time_within_train_step": 2.285640001296997, "step": 1952} +{"train_info/time_between_train_steps": 0.0028464794158935547, "step": 1952} +{"info/global_step": 1953, "train_info/time_within_train_step": 2.2907071113586426, "step": 1953} +{"train_info/time_between_train_steps": 0.0028808116912841797, "step": 1953} +{"info/global_step": 1954, "train_info/time_within_train_step": 2.2856574058532715, "step": 1954} +{"train_info/time_between_train_steps": 0.0029036998748779297, "step": 1954} +{"info/global_step": 1955, "train_info/time_within_train_step": 2.2850892543792725, "step": 1955} +{"train_info/time_between_train_steps": 0.0034072399139404297, "step": 1955} +{"info/global_step": 1956, "train_info/time_within_train_step": 2.285409450531006, "step": 1956} +{"train_info/time_between_train_steps": 0.002849578857421875, "step": 1956} +{"info/global_step": 1957, "train_info/time_within_train_step": 2.2848427295684814, "step": 1957} +{"train_info/time_between_train_steps": 0.002853870391845703, "step": 1957} +{"info/global_step": 1958, "train_info/time_within_train_step": 2.2849678993225098, "step": 1958} +{"train_info/time_between_train_steps": 0.0028679370880126953, "step": 1958} +{"info/global_step": 1959, "train_info/time_within_train_step": 2.337003707885742, "step": 1959} +{"train_info/time_between_train_steps": 0.0028471946716308594, "step": 1959} +{"info/global_step": 1960, "train_info/time_within_train_step": 2.285141706466675, "step": 1960} +{"train_info/time_between_train_steps": 0.002855539321899414, "step": 1960} +{"info/global_step": 1961, "train_info/time_within_train_step": 2.2845869064331055, "step": 1961} +{"train_info/time_between_train_steps": 0.0029363632202148438, "step": 1961} +{"info/global_step": 1962, "train_info/time_within_train_step": 2.285371780395508, "step": 1962} +{"train_info/time_between_train_steps": 0.002882242202758789, "step": 1962} +{"info/global_step": 1963, "train_info/time_within_train_step": 2.2850592136383057, "step": 1963} +{"train_info/time_between_train_steps": 0.002882719039916992, "step": 1963} +{"info/global_step": 1964, "train_info/time_within_train_step": 2.2855465412139893, "step": 1964} +{"train_info/time_between_train_steps": 0.0028650760650634766, "step": 1964} +{"info/global_step": 1965, "train_info/time_within_train_step": 2.285158395767212, "step": 1965} +{"train_info/time_between_train_steps": 0.002882719039916992, "step": 1965} +{"info/global_step": 1966, "train_info/time_within_train_step": 2.2856431007385254, "step": 1966} +{"train_info/time_between_train_steps": 0.0028595924377441406, "step": 1966} +{"info/global_step": 1967, "train_info/time_within_train_step": 2.2857813835144043, "step": 1967} +{"train_info/time_between_train_steps": 0.002897977828979492, "step": 1967} +{"info/global_step": 1968, "train_info/time_within_train_step": 2.285853385925293, "step": 1968} +{"train_info/time_between_train_steps": 0.0028629302978515625, "step": 1968} +{"info/global_step": 1969, "train_info/time_within_train_step": 2.285752296447754, "step": 1969} +{"train_info/time_between_train_steps": 0.0029137134552001953, "step": 1969} +{"info/global_step": 1970, "train_info/time_within_train_step": 2.2861547470092773, "step": 1970} +{"train_info/time_between_train_steps": 0.0029120445251464844, "step": 1970} +{"info/global_step": 1971, "train_info/time_within_train_step": 2.2865347862243652, "step": 1971} +{"train_info/time_between_train_steps": 0.002890348434448242, "step": 1971} +{"info/global_step": 1972, "train_info/time_within_train_step": 2.2860379219055176, "step": 1972} +{"train_info/time_between_train_steps": 0.002887248992919922, "step": 1972} +{"info/global_step": 1973, "train_info/time_within_train_step": 2.2847654819488525, "step": 1973} +{"train_info/time_between_train_steps": 0.0028917789459228516, "step": 1973} +{"info/global_step": 1974, "train_info/time_within_train_step": 2.2858660221099854, "step": 1974} +{"train_info/time_between_train_steps": 0.002879619598388672, "step": 1974} +{"info/global_step": 1975, "train_info/time_within_train_step": 2.2860031127929688, "step": 1975} +{"train_info/time_between_train_steps": 0.002869129180908203, "step": 1975} +{"info/global_step": 1976, "train_info/time_within_train_step": 2.2855992317199707, "step": 1976} +{"train_info/time_between_train_steps": 0.0030336380004882812, "step": 1976} +{"info/global_step": 1977, "train_info/time_within_train_step": 2.2850430011749268, "step": 1977} +{"train_info/time_between_train_steps": 0.0028679370880126953, "step": 1977} +{"info/global_step": 1978, "train_info/time_within_train_step": 2.285076379776001, "step": 1978} +{"train_info/time_between_train_steps": 0.0028760433197021484, "step": 1978} +{"info/global_step": 1979, "train_info/time_within_train_step": 2.2897567749023438, "step": 1979} +{"train_info/time_between_train_steps": 0.0029020309448242188, "step": 1979} +{"info/global_step": 1980, "train_info/time_within_train_step": 2.2845473289489746, "step": 1980} +{"train_info/time_between_train_steps": 0.0028905868530273438, "step": 1980} +{"info/global_step": 1981, "train_info/time_within_train_step": 2.285045623779297, "step": 1981} +{"train_info/time_between_train_steps": 0.0034160614013671875, "step": 1981} +{"info/global_step": 1982, "train_info/time_within_train_step": 2.2848923206329346, "step": 1982} +{"train_info/time_between_train_steps": 0.0029113292694091797, "step": 1982} +{"info/global_step": 1983, "train_info/time_within_train_step": 2.2851874828338623, "step": 1983} +{"train_info/time_between_train_steps": 0.0029397010803222656, "step": 1983} +{"info/global_step": 1984, "train_info/time_within_train_step": 2.2852272987365723, "step": 1984} +{"train_info/time_between_train_steps": 0.0028839111328125, "step": 1984} +{"info/global_step": 1985, "train_info/time_within_train_step": 2.3360960483551025, "step": 1985} +{"train_info/time_between_train_steps": 0.0028748512268066406, "step": 1985} +{"info/global_step": 1986, "train_info/time_within_train_step": 2.2855613231658936, "step": 1986} +{"train_info/time_between_train_steps": 0.002870321273803711, "step": 1986} +{"info/global_step": 1987, "train_info/time_within_train_step": 2.2854254245758057, "step": 1987} +{"train_info/time_between_train_steps": 0.0028531551361083984, "step": 1987} +{"info/global_step": 1988, "train_info/time_within_train_step": 2.284818410873413, "step": 1988} +{"train_info/time_between_train_steps": 0.002895832061767578, "step": 1988} +{"info/global_step": 1989, "train_info/time_within_train_step": 2.444438934326172, "step": 1989} +{"train_info/time_between_train_steps": 0.0029592514038085938, "step": 1989} +{"info/global_step": 1990, "train_info/time_within_train_step": 2.284181833267212, "step": 1990} +{"train_info/time_between_train_steps": 0.0028603076934814453, "step": 1990} +{"info/global_step": 1991, "train_info/time_within_train_step": 2.284449577331543, "step": 1991} +{"train_info/time_between_train_steps": 0.002851724624633789, "step": 1991} +{"info/global_step": 1992, "train_info/time_within_train_step": 2.2847561836242676, "step": 1992} +{"train_info/time_between_train_steps": 0.0028793811798095703, "step": 1992} +{"info/global_step": 1993, "train_info/time_within_train_step": 2.2846853733062744, "step": 1993} +{"train_info/time_between_train_steps": 0.0029146671295166016, "step": 1993} +{"info/global_step": 1994, "train_info/time_within_train_step": 2.2854251861572266, "step": 1994} +{"train_info/time_between_train_steps": 0.0028901100158691406, "step": 1994} +{"info/global_step": 1995, "train_info/time_within_train_step": 2.2854220867156982, "step": 1995} +{"train_info/time_between_train_steps": 0.0028951168060302734, "step": 1995} +{"info/global_step": 1996, "train_info/time_within_train_step": 2.285381555557251, "step": 1996} +{"train_info/time_between_train_steps": 0.0028700828552246094, "step": 1996} +{"info/global_step": 1997, "train_info/time_within_train_step": 2.285402297973633, "step": 1997} +{"train_info/time_between_train_steps": 0.002849578857421875, "step": 1997} +{"info/global_step": 1998, "train_info/time_within_train_step": 2.2852628231048584, "step": 1998} +{"train_info/time_between_train_steps": 0.0028705596923828125, "step": 1998} +{"info/global_step": 1999, "train_info/time_within_train_step": 2.2857494354248047, "step": 1999} +{"train_info/time_between_train_steps": 0.002877473831176758, "step": 1999} +{"info/global_step": 2000, "train_info/time_within_train_step": 2.6514341831207275, "step": 2000} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746348819, "_runtime": 4916}, "step": 2000} +{"logs": {"train/loss": 3.4832, "train/learning_rate": 0.00022222222222222218, "train/epoch": 1.3, "_timestamp": 1746348819, "_runtime": 4916}, "step": 2000} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746348825, "_runtime": 4922}, "step": 2000} +{"logs": {"eval/loss": 3.8021483421325684, "eval/runtime": 5.5757, "eval/samples_per_second": 43.761, "eval/steps_per_second": 1.435, "train/epoch": 1.3, "_timestamp": 1746348825, "_runtime": 4922}, "step": 2000} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746348825, "_runtime": 4922}, "step": 2000} +{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 3.8021483421325684, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 44.79732116157541, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.5757, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 43.761, "train/epoch": 1.3, "_timestamp": 1746348825, "_runtime": 4922}, "step": 2000} +{"train_info/time_between_train_steps": 16.974738121032715, "step": 2000} +{"info/global_step": 2001, "train_info/time_within_train_step": 2.102060079574585, "step": 2001} +{"train_info/time_between_train_steps": 0.0028662681579589844, "step": 2001} +{"info/global_step": 2002, "train_info/time_within_train_step": 2.099951982498169, "step": 2002} +{"train_info/time_between_train_steps": 0.002919435501098633, "step": 2002} +{"info/global_step": 2003, "train_info/time_within_train_step": 2.2427866458892822, "step": 2003} +{"train_info/time_between_train_steps": 0.002864837646484375, "step": 2003} +{"info/global_step": 2004, "train_info/time_within_train_step": 2.2841711044311523, "step": 2004} +{"train_info/time_between_train_steps": 0.0028717517852783203, "step": 2004} +{"info/global_step": 2005, "train_info/time_within_train_step": 2.2840566635131836, "step": 2005} +{"train_info/time_between_train_steps": 0.002914905548095703, "step": 2005} +{"info/global_step": 2006, "train_info/time_within_train_step": 2.2849812507629395, "step": 2006} +{"train_info/time_between_train_steps": 0.00289154052734375, "step": 2006} +{"info/global_step": 2007, "train_info/time_within_train_step": 2.284775972366333, "step": 2007} +{"train_info/time_between_train_steps": 0.002920866012573242, "step": 2007} +{"info/global_step": 2008, "train_info/time_within_train_step": 2.2855966091156006, "step": 2008} +{"train_info/time_between_train_steps": 0.002928018569946289, "step": 2008} +{"info/global_step": 2009, "train_info/time_within_train_step": 2.285141706466675, "step": 2009} +{"train_info/time_between_train_steps": 0.002896547317504883, "step": 2009} +{"info/global_step": 2010, "train_info/time_within_train_step": 2.2861008644104004, "step": 2010} +{"train_info/time_between_train_steps": 0.0028638839721679688, "step": 2010} +{"info/global_step": 2011, "train_info/time_within_train_step": 2.286588430404663, "step": 2011} +{"train_info/time_between_train_steps": 0.0028848648071289062, "step": 2011} +{"info/global_step": 2012, "train_info/time_within_train_step": 2.286557674407959, "step": 2012} +{"train_info/time_between_train_steps": 0.002876758575439453, "step": 2012} +{"info/global_step": 2013, "train_info/time_within_train_step": 2.2865729331970215, "step": 2013} +{"train_info/time_between_train_steps": 0.0028884410858154297, "step": 2013} +{"info/global_step": 2014, "train_info/time_within_train_step": 2.2870585918426514, "step": 2014} +{"train_info/time_between_train_steps": 0.0028727054595947266, "step": 2014} +{"info/global_step": 2015, "train_info/time_within_train_step": 2.2875587940216064, "step": 2015} +{"train_info/time_between_train_steps": 0.0029091835021972656, "step": 2015} +{"info/global_step": 2016, "train_info/time_within_train_step": 2.287811040878296, "step": 2016} +{"train_info/time_between_train_steps": 0.002935647964477539, "step": 2016} +{"info/global_step": 2017, "train_info/time_within_train_step": 2.286682605743408, "step": 2017} +{"train_info/time_between_train_steps": 0.0028939247131347656, "step": 2017} +{"info/global_step": 2018, "train_info/time_within_train_step": 2.2860801219940186, "step": 2018} +{"train_info/time_between_train_steps": 0.0029249191284179688, "step": 2018} +{"info/global_step": 2019, "train_info/time_within_train_step": 2.2873780727386475, "step": 2019} +{"train_info/time_between_train_steps": 0.0028791427612304688, "step": 2019} +{"info/global_step": 2020, "train_info/time_within_train_step": 2.28715181350708, "step": 2020} +{"train_info/time_between_train_steps": 0.0029413700103759766, "step": 2020} +{"info/global_step": 2021, "train_info/time_within_train_step": 2.287447452545166, "step": 2021} +{"train_info/time_between_train_steps": 0.00286102294921875, "step": 2021} +{"info/global_step": 2022, "train_info/time_within_train_step": 2.2866249084472656, "step": 2022} +{"train_info/time_between_train_steps": 0.002851247787475586, "step": 2022} +{"info/global_step": 2023, "train_info/time_within_train_step": 2.2859740257263184, "step": 2023} +{"train_info/time_between_train_steps": 0.002877950668334961, "step": 2023} +{"info/global_step": 2024, "train_info/time_within_train_step": 2.2857143878936768, "step": 2024} +{"train_info/time_between_train_steps": 0.002893686294555664, "step": 2024} +{"info/global_step": 2025, "train_info/time_within_train_step": 2.285200357437134, "step": 2025} +{"train_info/time_between_train_steps": 0.0028998851776123047, "step": 2025} +{"info/global_step": 2026, "train_info/time_within_train_step": 2.286196708679199, "step": 2026} +{"train_info/time_between_train_steps": 0.0028929710388183594, "step": 2026} +{"info/global_step": 2027, "train_info/time_within_train_step": 2.2860565185546875, "step": 2027} +{"train_info/time_between_train_steps": 0.002878904342651367, "step": 2027} +{"info/global_step": 2028, "train_info/time_within_train_step": 2.2856125831604004, "step": 2028} +{"train_info/time_between_train_steps": 0.003010272979736328, "step": 2028} +{"info/global_step": 2029, "train_info/time_within_train_step": 2.2855582237243652, "step": 2029} +{"train_info/time_between_train_steps": 0.00284576416015625, "step": 2029} +{"info/global_step": 2030, "train_info/time_within_train_step": 2.2856380939483643, "step": 2030} +{"train_info/time_between_train_steps": 0.002850055694580078, "step": 2030} +{"info/global_step": 2031, "train_info/time_within_train_step": 2.285891056060791, "step": 2031} +{"train_info/time_between_train_steps": 0.0029096603393554688, "step": 2031} +{"info/global_step": 2032, "train_info/time_within_train_step": 2.2856786251068115, "step": 2032} +{"train_info/time_between_train_steps": 0.0028748512268066406, "step": 2032} +{"info/global_step": 2033, "train_info/time_within_train_step": 2.286776304244995, "step": 2033} +{"train_info/time_between_train_steps": 0.0028781890869140625, "step": 2033} +{"info/global_step": 2034, "train_info/time_within_train_step": 2.2863075733184814, "step": 2034} +{"train_info/time_between_train_steps": 0.0028727054595947266, "step": 2034} +{"info/global_step": 2035, "train_info/time_within_train_step": 2.286463499069214, "step": 2035} +{"train_info/time_between_train_steps": 0.0029506683349609375, "step": 2035} +{"info/global_step": 2036, "train_info/time_within_train_step": 2.286792278289795, "step": 2036} +{"train_info/time_between_train_steps": 0.0029070377349853516, "step": 2036} +{"info/global_step": 2037, "train_info/time_within_train_step": 2.418067455291748, "step": 2037} +{"train_info/time_between_train_steps": 0.0028662681579589844, "step": 2037} +{"info/global_step": 2038, "train_info/time_within_train_step": 2.286252737045288, "step": 2038} +{"train_info/time_between_train_steps": 0.0059931278228759766, "step": 2038} +{"info/global_step": 2039, "train_info/time_within_train_step": 2.286128520965576, "step": 2039} +{"train_info/time_between_train_steps": 0.0028829574584960938, "step": 2039} +{"info/global_step": 2040, "train_info/time_within_train_step": 2.286123275756836, "step": 2040} +{"train_info/time_between_train_steps": 0.0028798580169677734, "step": 2040} +{"info/global_step": 2041, "train_info/time_within_train_step": 2.286937952041626, "step": 2041} +{"train_info/time_between_train_steps": 0.0061190128326416016, "step": 2041} +{"info/global_step": 2042, "train_info/time_within_train_step": 2.286193609237671, "step": 2042} +{"train_info/time_between_train_steps": 0.006061553955078125, "step": 2042} +{"info/global_step": 2043, "train_info/time_within_train_step": 2.2858688831329346, "step": 2043} +{"train_info/time_between_train_steps": 0.0060577392578125, "step": 2043} +{"info/global_step": 2044, "train_info/time_within_train_step": 2.2860519886016846, "step": 2044} +{"train_info/time_between_train_steps": 0.0060346126556396484, "step": 2044} +{"info/global_step": 2045, "train_info/time_within_train_step": 2.285921573638916, "step": 2045} +{"train_info/time_between_train_steps": 0.006070852279663086, "step": 2045} +{"info/global_step": 2046, "train_info/time_within_train_step": 2.286224603652954, "step": 2046} +{"train_info/time_between_train_steps": 0.006069183349609375, "step": 2046} +{"info/global_step": 2047, "train_info/time_within_train_step": 2.286623239517212, "step": 2047} +{"train_info/time_between_train_steps": 0.0060825347900390625, "step": 2047} +{"info/global_step": 2048, "train_info/time_within_train_step": 2.28591251373291, "step": 2048} +{"train_info/time_between_train_steps": 0.006052970886230469, "step": 2048} +{"info/global_step": 2049, "train_info/time_within_train_step": 2.2867431640625, "step": 2049} +{"train_info/time_between_train_steps": 0.0060901641845703125, "step": 2049} +{"info/global_step": 2050, "train_info/time_within_train_step": 2.2862048149108887, "step": 2050} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746348951, "_runtime": 5048}, "step": 2050} +{"logs": {"train/loss": 3.4693, "train/learning_rate": 0.0002111111111111111, "train/epoch": 1.32, "_timestamp": 1746348951, "_runtime": 5048}, "step": 2050} +{"train_info/time_between_train_steps": 0.025437355041503906, "step": 2050} +{"info/global_step": 2051, "train_info/time_within_train_step": 2.2864344120025635, "step": 2051} +{"train_info/time_between_train_steps": 0.006589174270629883, "step": 2051} +{"info/global_step": 2052, "train_info/time_within_train_step": 2.2864532470703125, "step": 2052} +{"train_info/time_between_train_steps": 0.006039619445800781, "step": 2052} +{"info/global_step": 2053, "train_info/time_within_train_step": 2.2865684032440186, "step": 2053} +{"train_info/time_between_train_steps": 0.006046772003173828, "step": 2053} +{"info/global_step": 2054, "train_info/time_within_train_step": 2.2871346473693848, "step": 2054} +{"train_info/time_between_train_steps": 0.006024837493896484, "step": 2054} +{"info/global_step": 2055, "train_info/time_within_train_step": 2.286639928817749, "step": 2055} +{"train_info/time_between_train_steps": 0.006084442138671875, "step": 2055} +{"info/global_step": 2056, "train_info/time_within_train_step": 2.2865922451019287, "step": 2056} +{"train_info/time_between_train_steps": 0.006105899810791016, "step": 2056} +{"info/global_step": 2057, "train_info/time_within_train_step": 2.286649227142334, "step": 2057} +{"train_info/time_between_train_steps": 0.00600123405456543, "step": 2057} +{"info/global_step": 2058, "train_info/time_within_train_step": 2.286740303039551, "step": 2058} +{"train_info/time_between_train_steps": 0.0029222965240478516, "step": 2058} +{"info/global_step": 2059, "train_info/time_within_train_step": 2.2863054275512695, "step": 2059} +{"train_info/time_between_train_steps": 0.0029380321502685547, "step": 2059} +{"info/global_step": 2060, "train_info/time_within_train_step": 2.2868492603302, "step": 2060} +{"train_info/time_between_train_steps": 0.0029151439666748047, "step": 2060} +{"info/global_step": 2061, "train_info/time_within_train_step": 2.2867887020111084, "step": 2061} +{"train_info/time_between_train_steps": 0.002929210662841797, "step": 2061} +{"info/global_step": 2062, "train_info/time_within_train_step": 2.286609172821045, "step": 2062} +{"train_info/time_between_train_steps": 0.0028777122497558594, "step": 2062} +{"info/global_step": 2063, "train_info/time_within_train_step": 2.286449909210205, "step": 2063} +{"train_info/time_between_train_steps": 0.002908468246459961, "step": 2063} +{"info/global_step": 2064, "train_info/time_within_train_step": 2.287137031555176, "step": 2064} +{"train_info/time_between_train_steps": 0.0029289722442626953, "step": 2064} +{"info/global_step": 2065, "train_info/time_within_train_step": 2.2863268852233887, "step": 2065} +{"train_info/time_between_train_steps": 0.002917051315307617, "step": 2065} +{"info/global_step": 2066, "train_info/time_within_train_step": 2.2870419025421143, "step": 2066} +{"train_info/time_between_train_steps": 0.0028824806213378906, "step": 2066} +{"info/global_step": 2067, "train_info/time_within_train_step": 2.286175489425659, "step": 2067} +{"train_info/time_between_train_steps": 0.002923727035522461, "step": 2067} +{"info/global_step": 2068, "train_info/time_within_train_step": 2.2867271900177, "step": 2068} +{"train_info/time_between_train_steps": 0.0029370784759521484, "step": 2068} +{"info/global_step": 2069, "train_info/time_within_train_step": 2.2860796451568604, "step": 2069} +{"train_info/time_between_train_steps": 0.002896547317504883, "step": 2069} +{"info/global_step": 2070, "train_info/time_within_train_step": 2.285609006881714, "step": 2070} +{"train_info/time_between_train_steps": 0.0029456615447998047, "step": 2070} +{"info/global_step": 2071, "train_info/time_within_train_step": 2.2862555980682373, "step": 2071} +{"train_info/time_between_train_steps": 0.0029189586639404297, "step": 2071} +{"info/global_step": 2072, "train_info/time_within_train_step": 2.2855494022369385, "step": 2072} +{"train_info/time_between_train_steps": 0.0029115676879882812, "step": 2072} +{"info/global_step": 2073, "train_info/time_within_train_step": 2.2865335941314697, "step": 2073} +{"train_info/time_between_train_steps": 0.0029354095458984375, "step": 2073} +{"info/global_step": 2074, "train_info/time_within_train_step": 2.2859573364257812, "step": 2074} +{"train_info/time_between_train_steps": 0.002902507781982422, "step": 2074} +{"info/global_step": 2075, "train_info/time_within_train_step": 2.286513328552246, "step": 2075} +{"train_info/time_between_train_steps": 0.002875089645385742, "step": 2075} +{"info/global_step": 2076, "train_info/time_within_train_step": 2.393522024154663, "step": 2076} +{"train_info/time_between_train_steps": 0.0029675960540771484, "step": 2076} +{"info/global_step": 2077, "train_info/time_within_train_step": 2.286454439163208, "step": 2077} +{"train_info/time_between_train_steps": 0.0029151439666748047, "step": 2077} +{"info/global_step": 2078, "train_info/time_within_train_step": 2.286796808242798, "step": 2078} +{"train_info/time_between_train_steps": 0.0029070377349853516, "step": 2078} +{"info/global_step": 2079, "train_info/time_within_train_step": 2.2874672412872314, "step": 2079} +{"train_info/time_between_train_steps": 0.002930879592895508, "step": 2079} +{"info/global_step": 2080, "train_info/time_within_train_step": 2.2874622344970703, "step": 2080} +{"train_info/time_between_train_steps": 0.003012418746948242, "step": 2080} +{"info/global_step": 2081, "train_info/time_within_train_step": 2.2872560024261475, "step": 2081} +{"train_info/time_between_train_steps": 0.002949953079223633, "step": 2081} +{"info/global_step": 2082, "train_info/time_within_train_step": 2.2868258953094482, "step": 2082} +{"train_info/time_between_train_steps": 0.002904176712036133, "step": 2082} +{"info/global_step": 2083, "train_info/time_within_train_step": 2.286600112915039, "step": 2083} +{"train_info/time_between_train_steps": 0.0029113292694091797, "step": 2083} +{"info/global_step": 2084, "train_info/time_within_train_step": 2.286161184310913, "step": 2084} +{"train_info/time_between_train_steps": 0.00296783447265625, "step": 2084} +{"info/global_step": 2085, "train_info/time_within_train_step": 2.286965847015381, "step": 2085} +{"train_info/time_between_train_steps": 0.002921581268310547, "step": 2085} +{"info/global_step": 2086, "train_info/time_within_train_step": 2.286201238632202, "step": 2086} +{"train_info/time_between_train_steps": 0.002962350845336914, "step": 2086} +{"info/global_step": 2087, "train_info/time_within_train_step": 2.28566837310791, "step": 2087} +{"train_info/time_between_train_steps": 0.00295257568359375, "step": 2087} +{"info/global_step": 2088, "train_info/time_within_train_step": 2.2868049144744873, "step": 2088} +{"train_info/time_between_train_steps": 0.0029320716857910156, "step": 2088} +{"info/global_step": 2089, "train_info/time_within_train_step": 2.286404609680176, "step": 2089} +{"train_info/time_between_train_steps": 0.002925395965576172, "step": 2089} +{"info/global_step": 2090, "train_info/time_within_train_step": 2.2863008975982666, "step": 2090} +{"train_info/time_between_train_steps": 0.002933979034423828, "step": 2090} +{"info/global_step": 2091, "train_info/time_within_train_step": 2.286323308944702, "step": 2091} +{"train_info/time_between_train_steps": 0.0029184818267822266, "step": 2091} +{"info/global_step": 2092, "train_info/time_within_train_step": 2.2857208251953125, "step": 2092} +{"train_info/time_between_train_steps": 0.0029549598693847656, "step": 2092} +{"info/global_step": 2093, "train_info/time_within_train_step": 2.2860946655273438, "step": 2093} +{"train_info/time_between_train_steps": 0.0029001235961914062, "step": 2093} +{"info/global_step": 2094, "train_info/time_within_train_step": 2.2865755558013916, "step": 2094} +{"train_info/time_between_train_steps": 0.0029506683349609375, "step": 2094} +{"info/global_step": 2095, "train_info/time_within_train_step": 2.2871129512786865, "step": 2095} +{"train_info/time_between_train_steps": 0.002955913543701172, "step": 2095} +{"info/global_step": 2096, "train_info/time_within_train_step": 2.2862391471862793, "step": 2096} +{"train_info/time_between_train_steps": 0.0029282569885253906, "step": 2096} +{"info/global_step": 2097, "train_info/time_within_train_step": 2.287121295928955, "step": 2097} +{"train_info/time_between_train_steps": 0.002935171127319336, "step": 2097} +{"info/global_step": 2098, "train_info/time_within_train_step": 2.286942481994629, "step": 2098} +{"train_info/time_between_train_steps": 0.002910614013671875, "step": 2098} +{"info/global_step": 2099, "train_info/time_within_train_step": 2.2877719402313232, "step": 2099} +{"train_info/time_between_train_steps": 0.0029184818267822266, "step": 2099} +{"info/global_step": 2100, "train_info/time_within_train_step": 2.2872557640075684, "step": 2100} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746349067, "_runtime": 5164}, "step": 2100} +{"logs": {"train/loss": 3.4518, "train/learning_rate": 0.00019999999999999998, "train/epoch": 1.34, "_timestamp": 1746349067, "_runtime": 5164}, "step": 2100} +{"train_info/time_between_train_steps": 10.470855951309204, "step": 2100} +{"info/global_step": 2101, "train_info/time_within_train_step": 2.104010820388794, "step": 2101} +{"train_info/time_between_train_steps": 0.006066799163818359, "step": 2101} +{"info/global_step": 2102, "train_info/time_within_train_step": 2.1017563343048096, "step": 2102} +{"train_info/time_between_train_steps": 0.006023406982421875, "step": 2102} +{"info/global_step": 2103, "train_info/time_within_train_step": 2.258152484893799, "step": 2103} +{"train_info/time_between_train_steps": 0.006005525588989258, "step": 2103} +{"info/global_step": 2104, "train_info/time_within_train_step": 2.284721851348877, "step": 2104} +{"train_info/time_between_train_steps": 0.006025552749633789, "step": 2104} +{"info/global_step": 2105, "train_info/time_within_train_step": 2.284780740737915, "step": 2105} +{"train_info/time_between_train_steps": 0.006148576736450195, "step": 2105} +{"info/global_step": 2106, "train_info/time_within_train_step": 2.285459280014038, "step": 2106} +{"train_info/time_between_train_steps": 0.006090402603149414, "step": 2106} +{"info/global_step": 2107, "train_info/time_within_train_step": 2.2860097885131836, "step": 2107} +{"train_info/time_between_train_steps": 0.006098270416259766, "step": 2107} +{"info/global_step": 2108, "train_info/time_within_train_step": 2.2862112522125244, "step": 2108} +{"train_info/time_between_train_steps": 0.006011486053466797, "step": 2108} +{"info/global_step": 2109, "train_info/time_within_train_step": 2.286325216293335, "step": 2109} +{"train_info/time_between_train_steps": 0.00601959228515625, "step": 2109} +{"info/global_step": 2110, "train_info/time_within_train_step": 2.2858529090881348, "step": 2110} +{"train_info/time_between_train_steps": 0.006080150604248047, "step": 2110} +{"info/global_step": 2111, "train_info/time_within_train_step": 2.286357879638672, "step": 2111} +{"train_info/time_between_train_steps": 0.006033658981323242, "step": 2111} +{"info/global_step": 2112, "train_info/time_within_train_step": 2.286154270172119, "step": 2112} +{"train_info/time_between_train_steps": 0.006074666976928711, "step": 2112} +{"info/global_step": 2113, "train_info/time_within_train_step": 2.2859139442443848, "step": 2113} +{"train_info/time_between_train_steps": 0.006045818328857422, "step": 2113} +{"info/global_step": 2114, "train_info/time_within_train_step": 2.286524534225464, "step": 2114} +{"train_info/time_between_train_steps": 0.006047248840332031, "step": 2114} +{"info/global_step": 2115, "train_info/time_within_train_step": 2.2859079837799072, "step": 2115} +{"train_info/time_between_train_steps": 0.00603485107421875, "step": 2115} +{"info/global_step": 2116, "train_info/time_within_train_step": 2.285921335220337, "step": 2116} +{"train_info/time_between_train_steps": 0.006106138229370117, "step": 2116} +{"info/global_step": 2117, "train_info/time_within_train_step": 2.2863211631774902, "step": 2117} +{"train_info/time_between_train_steps": 0.005997180938720703, "step": 2117} +{"info/global_step": 2118, "train_info/time_within_train_step": 2.286407232284546, "step": 2118} +{"train_info/time_between_train_steps": 0.006073713302612305, "step": 2118} +{"info/global_step": 2119, "train_info/time_within_train_step": 2.2858400344848633, "step": 2119} +{"train_info/time_between_train_steps": 0.006052732467651367, "step": 2119} +{"info/global_step": 2120, "train_info/time_within_train_step": 2.2863738536834717, "step": 2120} +{"train_info/time_between_train_steps": 0.006127595901489258, "step": 2120} +{"info/global_step": 2121, "train_info/time_within_train_step": 2.2870423793792725, "step": 2121} +{"train_info/time_between_train_steps": 0.006098031997680664, "step": 2121} +{"info/global_step": 2122, "train_info/time_within_train_step": 2.2870724201202393, "step": 2122} +{"train_info/time_between_train_steps": 0.00603795051574707, "step": 2122} +{"info/global_step": 2123, "train_info/time_within_train_step": 2.287001132965088, "step": 2123} +{"train_info/time_between_train_steps": 0.006136178970336914, "step": 2123} +{"info/global_step": 2124, "train_info/time_within_train_step": 2.287092685699463, "step": 2124} +{"train_info/time_between_train_steps": 0.006034135818481445, "step": 2124} +{"info/global_step": 2125, "train_info/time_within_train_step": 2.2866032123565674, "step": 2125} +{"train_info/time_between_train_steps": 0.006028890609741211, "step": 2125} +{"info/global_step": 2126, "train_info/time_within_train_step": 2.2868027687072754, "step": 2126} +{"train_info/time_between_train_steps": 0.006100177764892578, "step": 2126} +{"info/global_step": 2127, "train_info/time_within_train_step": 2.286771535873413, "step": 2127} +{"train_info/time_between_train_steps": 0.006093502044677734, "step": 2127} +{"info/global_step": 2128, "train_info/time_within_train_step": 2.3659868240356445, "step": 2128} +{"train_info/time_between_train_steps": 0.006635189056396484, "step": 2128} +{"info/global_step": 2129, "train_info/time_within_train_step": 2.286635637283325, "step": 2129} +{"train_info/time_between_train_steps": 0.0030617713928222656, "step": 2129} +{"info/global_step": 2130, "train_info/time_within_train_step": 2.2868001461029053, "step": 2130} +{"train_info/time_between_train_steps": 0.006022453308105469, "step": 2130} +{"info/global_step": 2131, "train_info/time_within_train_step": 2.287393093109131, "step": 2131} +{"train_info/time_between_train_steps": 0.006067514419555664, "step": 2131} +{"info/global_step": 2132, "train_info/time_within_train_step": 2.2865257263183594, "step": 2132} +{"train_info/time_between_train_steps": 0.005993843078613281, "step": 2132} +{"info/global_step": 2133, "train_info/time_within_train_step": 2.2867350578308105, "step": 2133} +{"train_info/time_between_train_steps": 0.0060770511627197266, "step": 2133} +{"info/global_step": 2134, "train_info/time_within_train_step": 2.2863271236419678, "step": 2134} +{"train_info/time_between_train_steps": 0.006005048751831055, "step": 2134} +{"info/global_step": 2135, "train_info/time_within_train_step": 2.2860445976257324, "step": 2135} +{"train_info/time_between_train_steps": 0.006061553955078125, "step": 2135} +{"info/global_step": 2136, "train_info/time_within_train_step": 2.286137342453003, "step": 2136} +{"train_info/time_between_train_steps": 0.0061244964599609375, "step": 2136} +{"info/global_step": 2137, "train_info/time_within_train_step": 2.2860300540924072, "step": 2137} +{"train_info/time_between_train_steps": 0.006063938140869141, "step": 2137} +{"info/global_step": 2138, "train_info/time_within_train_step": 2.2862470149993896, "step": 2138} +{"train_info/time_between_train_steps": 0.006060123443603516, "step": 2138} +{"info/global_step": 2139, "train_info/time_within_train_step": 2.285446882247925, "step": 2139} +{"train_info/time_between_train_steps": 0.0060329437255859375, "step": 2139} +{"info/global_step": 2140, "train_info/time_within_train_step": 2.2861382961273193, "step": 2140} +{"train_info/time_between_train_steps": 0.006064176559448242, "step": 2140} +{"info/global_step": 2141, "train_info/time_within_train_step": 2.286153554916382, "step": 2141} +{"train_info/time_between_train_steps": 0.006084918975830078, "step": 2141} +{"info/global_step": 2142, "train_info/time_within_train_step": 2.2864177227020264, "step": 2142} +{"train_info/time_between_train_steps": 0.00611114501953125, "step": 2142} +{"info/global_step": 2143, "train_info/time_within_train_step": 2.286353826522827, "step": 2143} +{"train_info/time_between_train_steps": 0.0060236454010009766, "step": 2143} +{"info/global_step": 2144, "train_info/time_within_train_step": 2.2866034507751465, "step": 2144} +{"train_info/time_between_train_steps": 0.005991935729980469, "step": 2144} +{"info/global_step": 2145, "train_info/time_within_train_step": 2.2856385707855225, "step": 2145} +{"train_info/time_between_train_steps": 0.006127119064331055, "step": 2145} +{"info/global_step": 2146, "train_info/time_within_train_step": 2.2867650985717773, "step": 2146} +{"train_info/time_between_train_steps": 0.006085395812988281, "step": 2146} +{"info/global_step": 2147, "train_info/time_within_train_step": 2.2866740226745605, "step": 2147} +{"train_info/time_between_train_steps": 0.006045341491699219, "step": 2147} +{"info/global_step": 2148, "train_info/time_within_train_step": 2.286344051361084, "step": 2148} +{"train_info/time_between_train_steps": 0.006020784378051758, "step": 2148} +{"info/global_step": 2149, "train_info/time_within_train_step": 2.286741256713867, "step": 2149} +{"train_info/time_between_train_steps": 0.006016254425048828, "step": 2149} +{"info/global_step": 2150, "train_info/time_within_train_step": 2.286409378051758, "step": 2150} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746349193, "_runtime": 5290}, "step": 2150} +{"logs": {"train/loss": 3.4373, "train/learning_rate": 0.00018888888888888888, "train/epoch": 1.35, "_timestamp": 1746349193, "_runtime": 5290}, "step": 2150} +{"train_info/time_between_train_steps": 0.025820016860961914, "step": 2150} +{"info/global_step": 2151, "train_info/time_within_train_step": 2.2864816188812256, "step": 2151} +{"train_info/time_between_train_steps": 0.006021022796630859, "step": 2151} +{"info/global_step": 2152, "train_info/time_within_train_step": 2.2865278720855713, "step": 2152} +{"train_info/time_between_train_steps": 0.006093025207519531, "step": 2152} +{"info/global_step": 2153, "train_info/time_within_train_step": 2.2866039276123047, "step": 2153} +{"train_info/time_between_train_steps": 0.002996683120727539, "step": 2153} +{"info/global_step": 2154, "train_info/time_within_train_step": 2.2869179248809814, "step": 2154} +{"train_info/time_between_train_steps": 0.002897024154663086, "step": 2154} +{"info/global_step": 2155, "train_info/time_within_train_step": 2.286482334136963, "step": 2155} +{"train_info/time_between_train_steps": 0.0029363632202148438, "step": 2155} +{"info/global_step": 2156, "train_info/time_within_train_step": 2.2867724895477295, "step": 2156} +{"train_info/time_between_train_steps": 0.0029206275939941406, "step": 2156} +{"info/global_step": 2157, "train_info/time_within_train_step": 2.286926746368408, "step": 2157} +{"train_info/time_between_train_steps": 0.002882719039916992, "step": 2157} +{"info/global_step": 2158, "train_info/time_within_train_step": 2.286717653274536, "step": 2158} +{"train_info/time_between_train_steps": 0.002956867218017578, "step": 2158} +{"info/global_step": 2159, "train_info/time_within_train_step": 2.2864668369293213, "step": 2159} +{"train_info/time_between_train_steps": 0.003065824508666992, "step": 2159} +{"info/global_step": 2160, "train_info/time_within_train_step": 2.286587953567505, "step": 2160} +{"train_info/time_between_train_steps": 0.002962350845336914, "step": 2160} +{"info/global_step": 2161, "train_info/time_within_train_step": 2.2871179580688477, "step": 2161} +{"train_info/time_between_train_steps": 0.0030117034912109375, "step": 2161} +{"info/global_step": 2162, "train_info/time_within_train_step": 2.286886692047119, "step": 2162} +{"train_info/time_between_train_steps": 0.0029838085174560547, "step": 2162} +{"info/global_step": 2163, "train_info/time_within_train_step": 2.2864699363708496, "step": 2163} +{"train_info/time_between_train_steps": 0.0030977725982666016, "step": 2163} +{"info/global_step": 2164, "train_info/time_within_train_step": 2.2869112491607666, "step": 2164} +{"train_info/time_between_train_steps": 0.003083467483520508, "step": 2164} +{"info/global_step": 2165, "train_info/time_within_train_step": 2.2880594730377197, "step": 2165} +{"train_info/time_between_train_steps": 0.003123044967651367, "step": 2165} +{"info/global_step": 2166, "train_info/time_within_train_step": 2.2865149974823, "step": 2166} +{"train_info/time_between_train_steps": 0.003144979476928711, "step": 2166} +{"info/global_step": 2167, "train_info/time_within_train_step": 2.28837513923645, "step": 2167} +{"train_info/time_between_train_steps": 0.003077983856201172, "step": 2167} +{"info/global_step": 2168, "train_info/time_within_train_step": 2.287357807159424, "step": 2168} +{"train_info/time_between_train_steps": 0.0030641555786132812, "step": 2168} +{"info/global_step": 2169, "train_info/time_within_train_step": 2.2880241870880127, "step": 2169} +{"train_info/time_between_train_steps": 0.0032682418823242188, "step": 2169} +{"info/global_step": 2170, "train_info/time_within_train_step": 2.2877964973449707, "step": 2170} +{"train_info/time_between_train_steps": 0.0030596256256103516, "step": 2170} +{"info/global_step": 2171, "train_info/time_within_train_step": 2.2872750759124756, "step": 2171} +{"train_info/time_between_train_steps": 0.003144979476928711, "step": 2171} +{"info/global_step": 2172, "train_info/time_within_train_step": 2.2873709201812744, "step": 2172} +{"train_info/time_between_train_steps": 0.003233194351196289, "step": 2172} +{"info/global_step": 2173, "train_info/time_within_train_step": 2.2871696949005127, "step": 2173} +{"train_info/time_between_train_steps": 0.003306150436401367, "step": 2173} +{"info/global_step": 2174, "train_info/time_within_train_step": 2.287518262863159, "step": 2174} +{"train_info/time_between_train_steps": 0.0032210350036621094, "step": 2174} +{"info/global_step": 2175, "train_info/time_within_train_step": 2.287515878677368, "step": 2175} +{"train_info/time_between_train_steps": 0.0033674240112304688, "step": 2175} +{"info/global_step": 2176, "train_info/time_within_train_step": 2.2874093055725098, "step": 2176} +{"train_info/time_between_train_steps": 0.003453493118286133, "step": 2176} +{"info/global_step": 2177, "train_info/time_within_train_step": 2.2879555225372314, "step": 2177} +{"train_info/time_between_train_steps": 0.0033121109008789062, "step": 2177} +{"info/global_step": 2178, "train_info/time_within_train_step": 2.288445472717285, "step": 2178} +{"train_info/time_between_train_steps": 0.0033311843872070312, "step": 2178} +{"info/global_step": 2179, "train_info/time_within_train_step": 2.289699077606201, "step": 2179} +{"train_info/time_between_train_steps": 0.0035400390625, "step": 2179} +{"info/global_step": 2180, "train_info/time_within_train_step": 2.2893974781036377, "step": 2180} +{"train_info/time_between_train_steps": 0.0036897659301757812, "step": 2180} +{"info/global_step": 2181, "train_info/time_within_train_step": 2.289487600326538, "step": 2181} +{"train_info/time_between_train_steps": 0.004009723663330078, "step": 2181} +{"info/global_step": 2182, "train_info/time_within_train_step": 2.2892003059387207, "step": 2182} +{"train_info/time_between_train_steps": 0.0036928653717041016, "step": 2182} +{"info/global_step": 2183, "train_info/time_within_train_step": 2.2893881797790527, "step": 2183} +{"train_info/time_between_train_steps": 0.003984928131103516, "step": 2183} +{"info/global_step": 2184, "train_info/time_within_train_step": 2.2892720699310303, "step": 2184} +{"train_info/time_between_train_steps": 1.9623668193817139, "step": 2184} +{"info/global_step": 2185, "train_info/time_within_train_step": 2.2825818061828613, "step": 2185} +{"train_info/time_between_train_steps": 0.0031452178955078125, "step": 2185} +{"info/global_step": 2186, "train_info/time_within_train_step": 2.286048650741577, "step": 2186} +{"train_info/time_between_train_steps": 0.0033326148986816406, "step": 2186} +{"info/global_step": 2187, "train_info/time_within_train_step": 2.2858963012695312, "step": 2187} +{"train_info/time_between_train_steps": 0.0031261444091796875, "step": 2187} +{"info/global_step": 2188, "train_info/time_within_train_step": 2.28664493560791, "step": 2188} +{"train_info/time_between_train_steps": 0.0036797523498535156, "step": 2188} +{"info/global_step": 2189, "train_info/time_within_train_step": 2.2860493659973145, "step": 2189} +{"train_info/time_between_train_steps": 0.003106832504272461, "step": 2189} +{"info/global_step": 2190, "train_info/time_within_train_step": 2.2860913276672363, "step": 2190} +{"train_info/time_between_train_steps": 0.003138303756713867, "step": 2190} +{"info/global_step": 2191, "train_info/time_within_train_step": 2.2862117290496826, "step": 2191} +{"train_info/time_between_train_steps": 0.0031011104583740234, "step": 2191} +{"info/global_step": 2192, "train_info/time_within_train_step": 2.2858316898345947, "step": 2192} +{"train_info/time_between_train_steps": 0.003126382827758789, "step": 2192} +{"info/global_step": 2193, "train_info/time_within_train_step": 2.2854487895965576, "step": 2193} +{"train_info/time_between_train_steps": 0.003139019012451172, "step": 2193} +{"info/global_step": 2194, "train_info/time_within_train_step": 2.2857182025909424, "step": 2194} +{"train_info/time_between_train_steps": 0.0031108856201171875, "step": 2194} +{"info/global_step": 2195, "train_info/time_within_train_step": 2.2858800888061523, "step": 2195} +{"train_info/time_between_train_steps": 0.003097057342529297, "step": 2195} +{"info/global_step": 2196, "train_info/time_within_train_step": 2.2854247093200684, "step": 2196} +{"train_info/time_between_train_steps": 0.0030975341796875, "step": 2196} +{"info/global_step": 2197, "train_info/time_within_train_step": 2.2859675884246826, "step": 2197} +{"train_info/time_between_train_steps": 0.003129243850708008, "step": 2197} +{"info/global_step": 2198, "train_info/time_within_train_step": 2.286190986633301, "step": 2198} +{"train_info/time_between_train_steps": 0.003142833709716797, "step": 2198} +{"info/global_step": 2199, "train_info/time_within_train_step": 2.2856943607330322, "step": 2199} +{"train_info/time_between_train_steps": 0.0031197071075439453, "step": 2199} +{"info/global_step": 2200, "train_info/time_within_train_step": 2.285907506942749, "step": 2200} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746349310, "_runtime": 5407}, "step": 2200} +{"logs": {"train/loss": 3.4238, "train/learning_rate": 0.00017777777777777776, "train/epoch": 2.01, "_timestamp": 1746349310, "_runtime": 5407}, "step": 2200} +{"train_info/time_between_train_steps": 11.557120084762573, "step": 2200} +{"info/global_step": 2201, "train_info/time_within_train_step": 2.1206254959106445, "step": 2201} +{"train_info/time_between_train_steps": 0.003141641616821289, "step": 2201} +{"info/global_step": 2202, "train_info/time_within_train_step": 2.0961897373199463, "step": 2202} +{"train_info/time_between_train_steps": 0.006384611129760742, "step": 2202} +{"info/global_step": 2203, "train_info/time_within_train_step": 2.2244317531585693, "step": 2203} +{"train_info/time_between_train_steps": 0.0031366348266601562, "step": 2203} +{"info/global_step": 2204, "train_info/time_within_train_step": 2.283940315246582, "step": 2204} +{"train_info/time_between_train_steps": 0.0031578540802001953, "step": 2204} +{"info/global_step": 2205, "train_info/time_within_train_step": 2.284064531326294, "step": 2205} +{"train_info/time_between_train_steps": 0.0031595230102539062, "step": 2205} +{"info/global_step": 2206, "train_info/time_within_train_step": 2.2860453128814697, "step": 2206} +{"train_info/time_between_train_steps": 0.0031900405883789062, "step": 2206} +{"info/global_step": 2207, "train_info/time_within_train_step": 2.2855443954467773, "step": 2207} +{"train_info/time_between_train_steps": 0.003150463104248047, "step": 2207} +{"info/global_step": 2208, "train_info/time_within_train_step": 2.2860829830169678, "step": 2208} +{"train_info/time_between_train_steps": 0.0031032562255859375, "step": 2208} +{"info/global_step": 2209, "train_info/time_within_train_step": 2.2857933044433594, "step": 2209} +{"train_info/time_between_train_steps": 0.00312042236328125, "step": 2209} +{"info/global_step": 2210, "train_info/time_within_train_step": 2.286555528640747, "step": 2210} +{"train_info/time_between_train_steps": 0.0031270980834960938, "step": 2210} +{"info/global_step": 2211, "train_info/time_within_train_step": 2.286104679107666, "step": 2211} +{"train_info/time_between_train_steps": 0.0031311511993408203, "step": 2211} +{"info/global_step": 2212, "train_info/time_within_train_step": 2.2865328788757324, "step": 2212} +{"train_info/time_between_train_steps": 0.003163576126098633, "step": 2212} +{"info/global_step": 2213, "train_info/time_within_train_step": 2.2867088317871094, "step": 2213} +{"train_info/time_between_train_steps": 0.003163576126098633, "step": 2213} +{"info/global_step": 2214, "train_info/time_within_train_step": 2.286648750305176, "step": 2214} +{"train_info/time_between_train_steps": 0.003181934356689453, "step": 2214} +{"info/global_step": 2215, "train_info/time_within_train_step": 2.2869858741760254, "step": 2215} +{"train_info/time_between_train_steps": 0.00311279296875, "step": 2215} +{"info/global_step": 2216, "train_info/time_within_train_step": 2.286778688430786, "step": 2216} +{"train_info/time_between_train_steps": 0.003142833709716797, "step": 2216} +{"info/global_step": 2217, "train_info/time_within_train_step": 2.285897970199585, "step": 2217} +{"train_info/time_between_train_steps": 0.003638744354248047, "step": 2217} +{"info/global_step": 2218, "train_info/time_within_train_step": 2.286255359649658, "step": 2218} +{"train_info/time_between_train_steps": 0.003157377243041992, "step": 2218} +{"info/global_step": 2219, "train_info/time_within_train_step": 2.2870028018951416, "step": 2219} +{"train_info/time_between_train_steps": 0.003145933151245117, "step": 2219} +{"info/global_step": 2220, "train_info/time_within_train_step": 2.286961793899536, "step": 2220} +{"train_info/time_between_train_steps": 0.0031380653381347656, "step": 2220} +{"info/global_step": 2221, "train_info/time_within_train_step": 2.2866268157958984, "step": 2221} +{"train_info/time_between_train_steps": 0.0031669139862060547, "step": 2221} +{"info/global_step": 2222, "train_info/time_within_train_step": 2.2861440181732178, "step": 2222} +{"train_info/time_between_train_steps": 0.003190755844116211, "step": 2222} +{"info/global_step": 2223, "train_info/time_within_train_step": 2.287022590637207, "step": 2223} +{"train_info/time_between_train_steps": 0.0031311511993408203, "step": 2223} +{"info/global_step": 2224, "train_info/time_within_train_step": 2.2864630222320557, "step": 2224} +{"train_info/time_between_train_steps": 0.0031480789184570312, "step": 2224} +{"info/global_step": 2225, "train_info/time_within_train_step": 2.28731632232666, "step": 2225} +{"train_info/time_between_train_steps": 0.003144979476928711, "step": 2225} +{"info/global_step": 2226, "train_info/time_within_train_step": 2.2870402336120605, "step": 2226} +{"train_info/time_between_train_steps": 0.0030853748321533203, "step": 2226} +{"info/global_step": 2227, "train_info/time_within_train_step": 2.5003483295440674, "step": 2227} +{"train_info/time_between_train_steps": 0.0031516551971435547, "step": 2227} +{"info/global_step": 2228, "train_info/time_within_train_step": 2.2862954139709473, "step": 2228} +{"train_info/time_between_train_steps": 0.003129720687866211, "step": 2228} +{"info/global_step": 2229, "train_info/time_within_train_step": 2.2861764430999756, "step": 2229} +{"train_info/time_between_train_steps": 0.003141164779663086, "step": 2229} +{"info/global_step": 2230, "train_info/time_within_train_step": 2.2867701053619385, "step": 2230} +{"train_info/time_between_train_steps": 0.006374835968017578, "step": 2230} +{"info/global_step": 2231, "train_info/time_within_train_step": 2.286646842956543, "step": 2231} +{"train_info/time_between_train_steps": 0.006342649459838867, "step": 2231} +{"info/global_step": 2232, "train_info/time_within_train_step": 2.2865500450134277, "step": 2232} +{"train_info/time_between_train_steps": 0.00637507438659668, "step": 2232} +{"info/global_step": 2233, "train_info/time_within_train_step": 2.286051034927368, "step": 2233} +{"train_info/time_between_train_steps": 0.006378173828125, "step": 2233} +{"info/global_step": 2234, "train_info/time_within_train_step": 2.2867016792297363, "step": 2234} +{"train_info/time_between_train_steps": 0.006333351135253906, "step": 2234} +{"info/global_step": 2235, "train_info/time_within_train_step": 2.2864696979522705, "step": 2235} +{"train_info/time_between_train_steps": 0.006345987319946289, "step": 2235} +{"info/global_step": 2236, "train_info/time_within_train_step": 2.286280393600464, "step": 2236} +{"train_info/time_between_train_steps": 0.006437540054321289, "step": 2236} +{"info/global_step": 2237, "train_info/time_within_train_step": 2.285689115524292, "step": 2237} +{"train_info/time_between_train_steps": 0.0031130313873291016, "step": 2237} +{"info/global_step": 2238, "train_info/time_within_train_step": 2.2860922813415527, "step": 2238} +{"train_info/time_between_train_steps": 0.003148794174194336, "step": 2238} +{"info/global_step": 2239, "train_info/time_within_train_step": 2.285717248916626, "step": 2239} +{"train_info/time_between_train_steps": 0.003080129623413086, "step": 2239} +{"info/global_step": 2240, "train_info/time_within_train_step": 2.2858033180236816, "step": 2240} +{"train_info/time_between_train_steps": 0.0031065940856933594, "step": 2240} +{"info/global_step": 2241, "train_info/time_within_train_step": 2.285795211791992, "step": 2241} +{"train_info/time_between_train_steps": 0.003100156784057617, "step": 2241} +{"info/global_step": 2242, "train_info/time_within_train_step": 2.28587007522583, "step": 2242} +{"train_info/time_between_train_steps": 0.0032918453216552734, "step": 2242} +{"info/global_step": 2243, "train_info/time_within_train_step": 2.2853286266326904, "step": 2243} +{"train_info/time_between_train_steps": 0.006390571594238281, "step": 2243} +{"info/global_step": 2244, "train_info/time_within_train_step": 2.286223888397217, "step": 2244} +{"train_info/time_between_train_steps": 0.006922245025634766, "step": 2244} +{"info/global_step": 2245, "train_info/time_within_train_step": 2.28635835647583, "step": 2245} +{"train_info/time_between_train_steps": 0.006385087966918945, "step": 2245} +{"info/global_step": 2246, "train_info/time_within_train_step": 2.286576509475708, "step": 2246} +{"train_info/time_between_train_steps": 0.006407260894775391, "step": 2246} +{"info/global_step": 2247, "train_info/time_within_train_step": 2.4068219661712646, "step": 2247} +{"train_info/time_between_train_steps": 0.003161907196044922, "step": 2247} +{"info/global_step": 2248, "train_info/time_within_train_step": 2.286959409713745, "step": 2248} +{"train_info/time_between_train_steps": 0.0031082630157470703, "step": 2248} +{"info/global_step": 2249, "train_info/time_within_train_step": 2.2870073318481445, "step": 2249} +{"train_info/time_between_train_steps": 0.003132343292236328, "step": 2249} +{"info/global_step": 2250, "train_info/time_within_train_step": 2.663414239883423, "step": 2250} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746349438, "_runtime": 5535}, "step": 2250} +{"logs": {"train/loss": 3.4115, "train/learning_rate": 0.00016666666666666666, "train/epoch": 2.02, "_timestamp": 1746349438, "_runtime": 5535}, "step": 2250} +{"train_info/time_between_train_steps": 0.02476191520690918, "step": 2250} +{"info/global_step": 2251, "train_info/time_within_train_step": 2.287482738494873, "step": 2251} +{"train_info/time_between_train_steps": 0.003187894821166992, "step": 2251} +{"info/global_step": 2252, "train_info/time_within_train_step": 2.3291139602661133, "step": 2252} +{"train_info/time_between_train_steps": 0.0031507015228271484, "step": 2252} +{"info/global_step": 2253, "train_info/time_within_train_step": 2.2879464626312256, "step": 2253} +{"train_info/time_between_train_steps": 0.0031325817108154297, "step": 2253} +{"info/global_step": 2254, "train_info/time_within_train_step": 2.2869837284088135, "step": 2254} +{"train_info/time_between_train_steps": 0.003135204315185547, "step": 2254} +{"info/global_step": 2255, "train_info/time_within_train_step": 2.2874515056610107, "step": 2255} +{"train_info/time_between_train_steps": 0.0033609867095947266, "step": 2255} +{"info/global_step": 2256, "train_info/time_within_train_step": 2.286881446838379, "step": 2256} +{"train_info/time_between_train_steps": 0.0031168460845947266, "step": 2256} +{"info/global_step": 2257, "train_info/time_within_train_step": 2.287533760070801, "step": 2257} +{"train_info/time_between_train_steps": 0.0031538009643554688, "step": 2257} +{"info/global_step": 2258, "train_info/time_within_train_step": 2.286818742752075, "step": 2258} +{"train_info/time_between_train_steps": 0.003144502639770508, "step": 2258} +{"info/global_step": 2259, "train_info/time_within_train_step": 2.286835193634033, "step": 2259} +{"train_info/time_between_train_steps": 0.003153562545776367, "step": 2259} +{"info/global_step": 2260, "train_info/time_within_train_step": 2.2863314151763916, "step": 2260} +{"train_info/time_between_train_steps": 0.003155946731567383, "step": 2260} +{"info/global_step": 2261, "train_info/time_within_train_step": 2.2869014739990234, "step": 2261} +{"train_info/time_between_train_steps": 0.0031387805938720703, "step": 2261} +{"info/global_step": 2262, "train_info/time_within_train_step": 2.2865638732910156, "step": 2262} +{"train_info/time_between_train_steps": 0.0031309127807617188, "step": 2262} +{"info/global_step": 2263, "train_info/time_within_train_step": 2.2865214347839355, "step": 2263} +{"train_info/time_between_train_steps": 0.0031168460845947266, "step": 2263} +{"info/global_step": 2264, "train_info/time_within_train_step": 2.2861857414245605, "step": 2264} +{"train_info/time_between_train_steps": 0.0031151771545410156, "step": 2264} +{"info/global_step": 2265, "train_info/time_within_train_step": 2.285675048828125, "step": 2265} +{"train_info/time_between_train_steps": 0.0031099319458007812, "step": 2265} +{"info/global_step": 2266, "train_info/time_within_train_step": 2.2868733406066895, "step": 2266} +{"train_info/time_between_train_steps": 0.0031735897064208984, "step": 2266} +{"info/global_step": 2267, "train_info/time_within_train_step": 2.286726951599121, "step": 2267} +{"train_info/time_between_train_steps": 0.0031485557556152344, "step": 2267} +{"info/global_step": 2268, "train_info/time_within_train_step": 2.286868095397949, "step": 2268} +{"train_info/time_between_train_steps": 0.003140687942504883, "step": 2268} +{"info/global_step": 2269, "train_info/time_within_train_step": 2.28645920753479, "step": 2269} +{"train_info/time_between_train_steps": 0.003135204315185547, "step": 2269} +{"info/global_step": 2270, "train_info/time_within_train_step": 2.286548376083374, "step": 2270} +{"train_info/time_between_train_steps": 0.0031359195709228516, "step": 2270} +{"info/global_step": 2271, "train_info/time_within_train_step": 2.2866933345794678, "step": 2271} +{"train_info/time_between_train_steps": 0.0031363964080810547, "step": 2271} +{"info/global_step": 2272, "train_info/time_within_train_step": 2.286717653274536, "step": 2272} +{"train_info/time_between_train_steps": 0.003123044967651367, "step": 2272} +{"info/global_step": 2273, "train_info/time_within_train_step": 2.286991596221924, "step": 2273} +{"train_info/time_between_train_steps": 0.0031561851501464844, "step": 2273} +{"info/global_step": 2274, "train_info/time_within_train_step": 2.286696195602417, "step": 2274} +{"train_info/time_between_train_steps": 0.003133058547973633, "step": 2274} +{"info/global_step": 2275, "train_info/time_within_train_step": 2.286677598953247, "step": 2275} +{"train_info/time_between_train_steps": 0.003192424774169922, "step": 2275} +{"info/global_step": 2276, "train_info/time_within_train_step": 2.2868974208831787, "step": 2276} +{"train_info/time_between_train_steps": 0.0031647682189941406, "step": 2276} +{"info/global_step": 2277, "train_info/time_within_train_step": 2.2874844074249268, "step": 2277} +{"train_info/time_between_train_steps": 0.0031557083129882812, "step": 2277} +{"info/global_step": 2278, "train_info/time_within_train_step": 2.3286521434783936, "step": 2278} +{"train_info/time_between_train_steps": 0.003132343292236328, "step": 2278} +{"info/global_step": 2279, "train_info/time_within_train_step": 2.286334753036499, "step": 2279} +{"train_info/time_between_train_steps": 0.003119230270385742, "step": 2279} +{"info/global_step": 2280, "train_info/time_within_train_step": 2.2860159873962402, "step": 2280} +{"train_info/time_between_train_steps": 0.0031328201293945312, "step": 2280} +{"info/global_step": 2281, "train_info/time_within_train_step": 2.2861692905426025, "step": 2281} +{"train_info/time_between_train_steps": 0.0032868385314941406, "step": 2281} +{"info/global_step": 2282, "train_info/time_within_train_step": 2.285909652709961, "step": 2282} +{"train_info/time_between_train_steps": 0.0031309127807617188, "step": 2282} +{"info/global_step": 2283, "train_info/time_within_train_step": 2.2869277000427246, "step": 2283} +{"train_info/time_between_train_steps": 0.003145456314086914, "step": 2283} +{"info/global_step": 2284, "train_info/time_within_train_step": 2.2857918739318848, "step": 2284} +{"train_info/time_between_train_steps": 0.003185272216796875, "step": 2284} +{"info/global_step": 2285, "train_info/time_within_train_step": 2.285783529281616, "step": 2285} +{"train_info/time_between_train_steps": 0.0031003952026367188, "step": 2285} +{"info/global_step": 2286, "train_info/time_within_train_step": 2.2859013080596924, "step": 2286} +{"train_info/time_between_train_steps": 0.0031576156616210938, "step": 2286} +{"info/global_step": 2287, "train_info/time_within_train_step": 2.286024570465088, "step": 2287} +{"train_info/time_between_train_steps": 0.003115415573120117, "step": 2287} +{"info/global_step": 2288, "train_info/time_within_train_step": 2.2866709232330322, "step": 2288} +{"train_info/time_between_train_steps": 0.0031099319458007812, "step": 2288} +{"info/global_step": 2289, "train_info/time_within_train_step": 2.286757469177246, "step": 2289} +{"train_info/time_between_train_steps": 0.0031180381774902344, "step": 2289} +{"info/global_step": 2290, "train_info/time_within_train_step": 2.2862019538879395, "step": 2290} +{"train_info/time_between_train_steps": 0.003161907196044922, "step": 2290} +{"info/global_step": 2291, "train_info/time_within_train_step": 2.286341667175293, "step": 2291} +{"train_info/time_between_train_steps": 0.003145456314086914, "step": 2291} +{"info/global_step": 2292, "train_info/time_within_train_step": 2.2869861125946045, "step": 2292} +{"train_info/time_between_train_steps": 0.006395101547241211, "step": 2292} +{"info/global_step": 2293, "train_info/time_within_train_step": 2.286496877670288, "step": 2293} +{"train_info/time_between_train_steps": 0.006445884704589844, "step": 2293} +{"info/global_step": 2294, "train_info/time_within_train_step": 2.286675214767456, "step": 2294} +{"train_info/time_between_train_steps": 0.0031316280364990234, "step": 2294} +{"info/global_step": 2295, "train_info/time_within_train_step": 2.2870213985443115, "step": 2295} +{"train_info/time_between_train_steps": 0.003180980682373047, "step": 2295} +{"info/global_step": 2296, "train_info/time_within_train_step": 2.2875585556030273, "step": 2296} +{"train_info/time_between_train_steps": 0.00312042236328125, "step": 2296} +{"info/global_step": 2297, "train_info/time_within_train_step": 2.2861316204071045, "step": 2297} +{"train_info/time_between_train_steps": 0.0031299591064453125, "step": 2297} +{"info/global_step": 2298, "train_info/time_within_train_step": 2.2862324714660645, "step": 2298} +{"train_info/time_between_train_steps": 0.0031096935272216797, "step": 2298} +{"info/global_step": 2299, "train_info/time_within_train_step": 2.286095142364502, "step": 2299} +{"train_info/time_between_train_steps": 0.0031549930572509766, "step": 2299} +{"info/global_step": 2300, "train_info/time_within_train_step": 2.286264181137085, "step": 2300} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746349553, "_runtime": 5650}, "step": 2300} +{"logs": {"train/loss": 3.403, "train/learning_rate": 0.00015555555555555554, "train/epoch": 2.04, "_timestamp": 1746349553, "_runtime": 5650}, "step": 2300} +{"train_info/time_between_train_steps": 18.106094360351562, "step": 2300} +{"info/global_step": 2301, "train_info/time_within_train_step": 2.1241812705993652, "step": 2301} +{"train_info/time_between_train_steps": 0.00626826286315918, "step": 2301} +{"info/global_step": 2302, "train_info/time_within_train_step": 2.092365026473999, "step": 2302} +{"train_info/time_between_train_steps": 0.00638890266418457, "step": 2302} +{"info/global_step": 2303, "train_info/time_within_train_step": 2.1498031616210938, "step": 2303} +{"train_info/time_between_train_steps": 0.006413936614990234, "step": 2303} +{"info/global_step": 2304, "train_info/time_within_train_step": 2.284369707107544, "step": 2304} +{"train_info/time_between_train_steps": 0.006403446197509766, "step": 2304} +{"info/global_step": 2305, "train_info/time_within_train_step": 2.28485107421875, "step": 2305} +{"train_info/time_between_train_steps": 0.006403923034667969, "step": 2305} +{"info/global_step": 2306, "train_info/time_within_train_step": 2.29003643989563, "step": 2306} +{"train_info/time_between_train_steps": 0.006363630294799805, "step": 2306} +{"info/global_step": 2307, "train_info/time_within_train_step": 2.285208225250244, "step": 2307} +{"train_info/time_between_train_steps": 0.0063648223876953125, "step": 2307} +{"info/global_step": 2308, "train_info/time_within_train_step": 2.2851521968841553, "step": 2308} +{"train_info/time_between_train_steps": 0.006421566009521484, "step": 2308} +{"info/global_step": 2309, "train_info/time_within_train_step": 2.2853469848632812, "step": 2309} +{"train_info/time_between_train_steps": 0.1261453628540039, "step": 2309} +{"info/global_step": 2310, "train_info/time_within_train_step": 2.2856314182281494, "step": 2310} +{"train_info/time_between_train_steps": 0.006445407867431641, "step": 2310} +{"info/global_step": 2311, "train_info/time_within_train_step": 2.285505533218384, "step": 2311} +{"train_info/time_between_train_steps": 0.0064356327056884766, "step": 2311} +{"info/global_step": 2312, "train_info/time_within_train_step": 2.2863423824310303, "step": 2312} +{"train_info/time_between_train_steps": 0.006407499313354492, "step": 2312} +{"info/global_step": 2313, "train_info/time_within_train_step": 2.286076545715332, "step": 2313} +{"train_info/time_between_train_steps": 0.006426572799682617, "step": 2313} +{"info/global_step": 2314, "train_info/time_within_train_step": 2.5002527236938477, "step": 2314} +{"train_info/time_between_train_steps": 0.0064928531646728516, "step": 2314} +{"info/global_step": 2315, "train_info/time_within_train_step": 2.2856605052948, "step": 2315} +{"train_info/time_between_train_steps": 0.006421089172363281, "step": 2315} +{"info/global_step": 2316, "train_info/time_within_train_step": 2.285743236541748, "step": 2316} +{"train_info/time_between_train_steps": 0.006437063217163086, "step": 2316} +{"info/global_step": 2317, "train_info/time_within_train_step": 2.285942316055298, "step": 2317} +{"train_info/time_between_train_steps": 0.007001161575317383, "step": 2317} +{"info/global_step": 2318, "train_info/time_within_train_step": 2.2864248752593994, "step": 2318} +{"train_info/time_between_train_steps": 0.006417274475097656, "step": 2318} +{"info/global_step": 2319, "train_info/time_within_train_step": 2.286594867706299, "step": 2319} +{"train_info/time_between_train_steps": 0.0064122676849365234, "step": 2319} +{"info/global_step": 2320, "train_info/time_within_train_step": 2.28716778755188, "step": 2320} +{"train_info/time_between_train_steps": 0.0064580440521240234, "step": 2320} +{"info/global_step": 2321, "train_info/time_within_train_step": 2.287064790725708, "step": 2321} +{"train_info/time_between_train_steps": 0.006413459777832031, "step": 2321} +{"info/global_step": 2322, "train_info/time_within_train_step": 2.2871084213256836, "step": 2322} +{"train_info/time_between_train_steps": 0.006440162658691406, "step": 2322} +{"info/global_step": 2323, "train_info/time_within_train_step": 2.286999464035034, "step": 2323} +{"train_info/time_between_train_steps": 0.00644230842590332, "step": 2323} +{"info/global_step": 2324, "train_info/time_within_train_step": 2.286653995513916, "step": 2324} +{"train_info/time_between_train_steps": 0.006400346755981445, "step": 2324} +{"info/global_step": 2325, "train_info/time_within_train_step": 2.2868642807006836, "step": 2325} +{"train_info/time_between_train_steps": 0.006410837173461914, "step": 2325} +{"info/global_step": 2326, "train_info/time_within_train_step": 2.3783907890319824, "step": 2326} +{"train_info/time_between_train_steps": 0.0064432621002197266, "step": 2326} +{"info/global_step": 2327, "train_info/time_within_train_step": 2.286637544631958, "step": 2327} +{"train_info/time_between_train_steps": 0.005591154098510742, "step": 2327} +{"info/global_step": 2328, "train_info/time_within_train_step": 2.2866053581237793, "step": 2328} +{"train_info/time_between_train_steps": 0.006478309631347656, "step": 2328} +{"info/global_step": 2329, "train_info/time_within_train_step": 2.2863452434539795, "step": 2329} +{"train_info/time_between_train_steps": 0.0064697265625, "step": 2329} +{"info/global_step": 2330, "train_info/time_within_train_step": 2.2857415676116943, "step": 2330} +{"train_info/time_between_train_steps": 0.006397724151611328, "step": 2330} +{"info/global_step": 2331, "train_info/time_within_train_step": 2.285736083984375, "step": 2331} +{"train_info/time_between_train_steps": 0.0064313411712646484, "step": 2331} +{"info/global_step": 2332, "train_info/time_within_train_step": 2.2869434356689453, "step": 2332} +{"train_info/time_between_train_steps": 0.0064623355865478516, "step": 2332} +{"info/global_step": 2333, "train_info/time_within_train_step": 2.2863800525665283, "step": 2333} +{"train_info/time_between_train_steps": 0.0064432621002197266, "step": 2333} +{"info/global_step": 2334, "train_info/time_within_train_step": 2.2857933044433594, "step": 2334} +{"train_info/time_between_train_steps": 0.006418943405151367, "step": 2334} +{"info/global_step": 2335, "train_info/time_within_train_step": 2.286616086959839, "step": 2335} +{"train_info/time_between_train_steps": 0.006442070007324219, "step": 2335} +{"info/global_step": 2336, "train_info/time_within_train_step": 2.286181688308716, "step": 2336} +{"train_info/time_between_train_steps": 0.006404876708984375, "step": 2336} +{"info/global_step": 2337, "train_info/time_within_train_step": 2.287400007247925, "step": 2337} +{"train_info/time_between_train_steps": 0.006411314010620117, "step": 2337} +{"info/global_step": 2338, "train_info/time_within_train_step": 2.286665916442871, "step": 2338} +{"train_info/time_between_train_steps": 0.006407976150512695, "step": 2338} +{"info/global_step": 2339, "train_info/time_within_train_step": 2.2870426177978516, "step": 2339} +{"train_info/time_between_train_steps": 0.006412029266357422, "step": 2339} +{"info/global_step": 2340, "train_info/time_within_train_step": 2.286820888519287, "step": 2340} +{"train_info/time_between_train_steps": 0.006395101547241211, "step": 2340} +{"info/global_step": 2341, "train_info/time_within_train_step": 2.287219524383545, "step": 2341} +{"train_info/time_between_train_steps": 0.006411314010620117, "step": 2341} +{"info/global_step": 2342, "train_info/time_within_train_step": 2.2868988513946533, "step": 2342} +{"train_info/time_between_train_steps": 0.0064847469329833984, "step": 2342} +{"info/global_step": 2343, "train_info/time_within_train_step": 2.286771774291992, "step": 2343} +{"train_info/time_between_train_steps": 0.006422758102416992, "step": 2343} +{"info/global_step": 2344, "train_info/time_within_train_step": 2.286816358566284, "step": 2344} +{"train_info/time_between_train_steps": 0.0064013004302978516, "step": 2344} +{"info/global_step": 2345, "train_info/time_within_train_step": 2.286269426345825, "step": 2345} +{"train_info/time_between_train_steps": 0.0031747817993164062, "step": 2345} +{"info/global_step": 2346, "train_info/time_within_train_step": 2.2865757942199707, "step": 2346} +{"train_info/time_between_train_steps": 0.003143787384033203, "step": 2346} +{"info/global_step": 2347, "train_info/time_within_train_step": 2.286252975463867, "step": 2347} +{"train_info/time_between_train_steps": 0.0031256675720214844, "step": 2347} +{"info/global_step": 2348, "train_info/time_within_train_step": 2.2866718769073486, "step": 2348} +{"train_info/time_between_train_steps": 0.0031359195709228516, "step": 2348} +{"info/global_step": 2349, "train_info/time_within_train_step": 2.286357879638672, "step": 2349} +{"train_info/time_between_train_steps": 0.003179311752319336, "step": 2349} +{"info/global_step": 2350, "train_info/time_within_train_step": 2.286329984664917, "step": 2350} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746349687, "_runtime": 5784}, "step": 2350} +{"logs": {"train/loss": 3.3814, "train/learning_rate": 0.0001444444444444444, "train/epoch": 2.06, "_timestamp": 1746349687, "_runtime": 5784}, "step": 2350} +{"train_info/time_between_train_steps": 0.02422046661376953, "step": 2350} +{"info/global_step": 2351, "train_info/time_within_train_step": 2.2866599559783936, "step": 2351} +{"train_info/time_between_train_steps": 0.006404876708984375, "step": 2351} +{"info/global_step": 2352, "train_info/time_within_train_step": 2.3777718544006348, "step": 2352} +{"train_info/time_between_train_steps": 0.0064394474029541016, "step": 2352} +{"info/global_step": 2353, "train_info/time_within_train_step": 2.2865703105926514, "step": 2353} +{"train_info/time_between_train_steps": 0.003170490264892578, "step": 2353} +{"info/global_step": 2354, "train_info/time_within_train_step": 2.2868881225585938, "step": 2354} +{"train_info/time_between_train_steps": 0.0031280517578125, "step": 2354} +{"info/global_step": 2355, "train_info/time_within_train_step": 2.286059856414795, "step": 2355} +{"train_info/time_between_train_steps": 0.003122091293334961, "step": 2355} +{"info/global_step": 2356, "train_info/time_within_train_step": 2.286350727081299, "step": 2356} +{"train_info/time_between_train_steps": 0.003161907196044922, "step": 2356} +{"info/global_step": 2357, "train_info/time_within_train_step": 2.2865214347839355, "step": 2357} +{"train_info/time_between_train_steps": 0.0032198429107666016, "step": 2357} +{"info/global_step": 2358, "train_info/time_within_train_step": 2.2868449687957764, "step": 2358} +{"train_info/time_between_train_steps": 0.003155946731567383, "step": 2358} +{"info/global_step": 2359, "train_info/time_within_train_step": 2.2867159843444824, "step": 2359} +{"train_info/time_between_train_steps": 0.003133535385131836, "step": 2359} +{"info/global_step": 2360, "train_info/time_within_train_step": 2.2872138023376465, "step": 2360} +{"train_info/time_between_train_steps": 0.0031499862670898438, "step": 2360} +{"info/global_step": 2361, "train_info/time_within_train_step": 2.2869112491607666, "step": 2361} +{"train_info/time_between_train_steps": 0.0031790733337402344, "step": 2361} +{"info/global_step": 2362, "train_info/time_within_train_step": 2.286827564239502, "step": 2362} +{"train_info/time_between_train_steps": 0.003146648406982422, "step": 2362} +{"info/global_step": 2363, "train_info/time_within_train_step": 2.2861785888671875, "step": 2363} +{"train_info/time_between_train_steps": 0.0031201839447021484, "step": 2363} +{"info/global_step": 2364, "train_info/time_within_train_step": 2.286869764328003, "step": 2364} +{"train_info/time_between_train_steps": 0.0031447410583496094, "step": 2364} +{"info/global_step": 2365, "train_info/time_within_train_step": 2.286421775817871, "step": 2365} +{"train_info/time_between_train_steps": 0.006333827972412109, "step": 2365} +{"info/global_step": 2366, "train_info/time_within_train_step": 2.28550124168396, "step": 2366} +{"train_info/time_between_train_steps": 0.006454944610595703, "step": 2366} +{"info/global_step": 2367, "train_info/time_within_train_step": 2.2860076427459717, "step": 2367} +{"train_info/time_between_train_steps": 0.006337881088256836, "step": 2367} +{"info/global_step": 2368, "train_info/time_within_train_step": 2.5065102577209473, "step": 2368} +{"train_info/time_between_train_steps": 0.006427288055419922, "step": 2368} +{"info/global_step": 2369, "train_info/time_within_train_step": 2.2866299152374268, "step": 2369} +{"train_info/time_between_train_steps": 0.006368875503540039, "step": 2369} +{"info/global_step": 2370, "train_info/time_within_train_step": 2.2862470149993896, "step": 2370} +{"train_info/time_between_train_steps": 0.006450176239013672, "step": 2370} +{"info/global_step": 2371, "train_info/time_within_train_step": 2.2860050201416016, "step": 2371} +{"train_info/time_between_train_steps": 0.006531238555908203, "step": 2371} +{"info/global_step": 2372, "train_info/time_within_train_step": 2.4072983264923096, "step": 2372} +{"train_info/time_between_train_steps": 0.006471395492553711, "step": 2372} +{"info/global_step": 2373, "train_info/time_within_train_step": 2.286320924758911, "step": 2373} +{"train_info/time_between_train_steps": 0.0065097808837890625, "step": 2373} +{"info/global_step": 2374, "train_info/time_within_train_step": 2.285871982574463, "step": 2374} +{"train_info/time_between_train_steps": 0.006402015686035156, "step": 2374} +{"info/global_step": 2375, "train_info/time_within_train_step": 2.285815715789795, "step": 2375} +{"train_info/time_between_train_steps": 0.006407737731933594, "step": 2375} +{"info/global_step": 2376, "train_info/time_within_train_step": 2.2858128547668457, "step": 2376} +{"train_info/time_between_train_steps": 0.00639033317565918, "step": 2376} +{"info/global_step": 2377, "train_info/time_within_train_step": 2.2860538959503174, "step": 2377} +{"train_info/time_between_train_steps": 0.006481647491455078, "step": 2377} +{"info/global_step": 2378, "train_info/time_within_train_step": 2.2865793704986572, "step": 2378} +{"train_info/time_between_train_steps": 0.0031461715698242188, "step": 2378} +{"info/global_step": 2379, "train_info/time_within_train_step": 2.28631591796875, "step": 2379} +{"train_info/time_between_train_steps": 0.0032050609588623047, "step": 2379} +{"info/global_step": 2380, "train_info/time_within_train_step": 2.2870752811431885, "step": 2380} +{"train_info/time_between_train_steps": 0.0031671524047851562, "step": 2380} +{"info/global_step": 2381, "train_info/time_within_train_step": 2.286355495452881, "step": 2381} +{"train_info/time_between_train_steps": 0.0032165050506591797, "step": 2381} +{"info/global_step": 2382, "train_info/time_within_train_step": 2.2862532138824463, "step": 2382} +{"train_info/time_between_train_steps": 0.0031888484954833984, "step": 2382} +{"info/global_step": 2383, "train_info/time_within_train_step": 2.28646183013916, "step": 2383} +{"train_info/time_between_train_steps": 0.0031685829162597656, "step": 2383} +{"info/global_step": 2384, "train_info/time_within_train_step": 2.286252737045288, "step": 2384} +{"train_info/time_between_train_steps": 0.003119945526123047, "step": 2384} +{"info/global_step": 2385, "train_info/time_within_train_step": 2.286071300506592, "step": 2385} +{"train_info/time_between_train_steps": 0.0064089298248291016, "step": 2385} +{"info/global_step": 2386, "train_info/time_within_train_step": 2.285818576812744, "step": 2386} +{"train_info/time_between_train_steps": 0.006402730941772461, "step": 2386} +{"info/global_step": 2387, "train_info/time_within_train_step": 2.286102056503296, "step": 2387} +{"train_info/time_between_train_steps": 0.006423473358154297, "step": 2387} +{"info/global_step": 2388, "train_info/time_within_train_step": 2.285536289215088, "step": 2388} +{"train_info/time_between_train_steps": 0.006463050842285156, "step": 2388} +{"info/global_step": 2389, "train_info/time_within_train_step": 2.2860803604125977, "step": 2389} +{"train_info/time_between_train_steps": 0.00646209716796875, "step": 2389} +{"info/global_step": 2390, "train_info/time_within_train_step": 2.2857956886291504, "step": 2390} +{"train_info/time_between_train_steps": 0.0064907073974609375, "step": 2390} +{"info/global_step": 2391, "train_info/time_within_train_step": 2.2859764099121094, "step": 2391} +{"train_info/time_between_train_steps": 0.0064334869384765625, "step": 2391} +{"info/global_step": 2392, "train_info/time_within_train_step": 2.286344289779663, "step": 2392} +{"train_info/time_between_train_steps": 0.006404876708984375, "step": 2392} +{"info/global_step": 2393, "train_info/time_within_train_step": 2.2858476638793945, "step": 2393} +{"train_info/time_between_train_steps": 0.006438016891479492, "step": 2393} +{"info/global_step": 2394, "train_info/time_within_train_step": 2.286205291748047, "step": 2394} +{"train_info/time_between_train_steps": 0.006373167037963867, "step": 2394} +{"info/global_step": 2395, "train_info/time_within_train_step": 2.2857346534729004, "step": 2395} +{"train_info/time_between_train_steps": 0.006396293640136719, "step": 2395} +{"info/global_step": 2396, "train_info/time_within_train_step": 2.2857251167297363, "step": 2396} +{"train_info/time_between_train_steps": 0.006451129913330078, "step": 2396} +{"info/global_step": 2397, "train_info/time_within_train_step": 2.2856221199035645, "step": 2397} +{"train_info/time_between_train_steps": 0.006438732147216797, "step": 2397} +{"info/global_step": 2398, "train_info/time_within_train_step": 2.285294532775879, "step": 2398} +{"train_info/time_between_train_steps": 0.006422519683837891, "step": 2398} +{"info/global_step": 2399, "train_info/time_within_train_step": 2.2860066890716553, "step": 2399} +{"train_info/time_between_train_steps": 0.006474018096923828, "step": 2399} +{"info/global_step": 2400, "train_info/time_within_train_step": 2.286388397216797, "step": 2400} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746349803, "_runtime": 5900}, "step": 2400} +{"logs": {"train/loss": 3.3715, "train/learning_rate": 0.0001333333333333333, "train/epoch": 2.07, "_timestamp": 1746349803, "_runtime": 5900}, "step": 2400} +{"train_info/time_between_train_steps": 18.15576696395874, "step": 2400} +{"info/global_step": 2401, "train_info/time_within_train_step": 2.120495557785034, "step": 2401} +{"train_info/time_between_train_steps": 0.003140687942504883, "step": 2401} +{"info/global_step": 2402, "train_info/time_within_train_step": 2.0997939109802246, "step": 2402} +{"train_info/time_between_train_steps": 0.0031332969665527344, "step": 2402} +{"info/global_step": 2403, "train_info/time_within_train_step": 2.147710084915161, "step": 2403} +{"train_info/time_between_train_steps": 0.003192901611328125, "step": 2403} +{"info/global_step": 2404, "train_info/time_within_train_step": 2.284353494644165, "step": 2404} +{"train_info/time_between_train_steps": 0.0031211376190185547, "step": 2404} +{"info/global_step": 2405, "train_info/time_within_train_step": 2.2848193645477295, "step": 2405} +{"train_info/time_between_train_steps": 0.0031528472900390625, "step": 2405} +{"info/global_step": 2406, "train_info/time_within_train_step": 2.2845711708068848, "step": 2406} +{"train_info/time_between_train_steps": 0.0031414031982421875, "step": 2406} +{"info/global_step": 2407, "train_info/time_within_train_step": 2.2851481437683105, "step": 2407} +{"train_info/time_between_train_steps": 0.003187894821166992, "step": 2407} +{"info/global_step": 2408, "train_info/time_within_train_step": 2.2858591079711914, "step": 2408} +{"train_info/time_between_train_steps": 0.0031976699829101562, "step": 2408} +{"info/global_step": 2409, "train_info/time_within_train_step": 2.285815477371216, "step": 2409} +{"train_info/time_between_train_steps": 0.003217935562133789, "step": 2409} +{"info/global_step": 2410, "train_info/time_within_train_step": 2.285958766937256, "step": 2410} +{"train_info/time_between_train_steps": 0.0031647682189941406, "step": 2410} +{"info/global_step": 2411, "train_info/time_within_train_step": 2.2864279747009277, "step": 2411} +{"train_info/time_between_train_steps": 0.003203868865966797, "step": 2411} +{"info/global_step": 2412, "train_info/time_within_train_step": 2.2865219116210938, "step": 2412} +{"train_info/time_between_train_steps": 0.0031278133392333984, "step": 2412} +{"info/global_step": 2413, "train_info/time_within_train_step": 2.286187171936035, "step": 2413} +{"train_info/time_between_train_steps": 0.0032117366790771484, "step": 2413} +{"info/global_step": 2414, "train_info/time_within_train_step": 2.2864480018615723, "step": 2414} +{"train_info/time_between_train_steps": 0.0031630992889404297, "step": 2414} +{"info/global_step": 2415, "train_info/time_within_train_step": 2.514194965362549, "step": 2415} +{"train_info/time_between_train_steps": 0.0031893253326416016, "step": 2415} +{"info/global_step": 2416, "train_info/time_within_train_step": 2.2861788272857666, "step": 2416} +{"train_info/time_between_train_steps": 0.003193378448486328, "step": 2416} +{"info/global_step": 2417, "train_info/time_within_train_step": 2.2863755226135254, "step": 2417} +{"train_info/time_between_train_steps": 0.003166675567626953, "step": 2417} +{"info/global_step": 2418, "train_info/time_within_train_step": 2.2864608764648438, "step": 2418} +{"train_info/time_between_train_steps": 0.003126382827758789, "step": 2418} +{"info/global_step": 2419, "train_info/time_within_train_step": 2.2857537269592285, "step": 2419} +{"train_info/time_between_train_steps": 0.003128528594970703, "step": 2419} +{"info/global_step": 2420, "train_info/time_within_train_step": 2.2868576049804688, "step": 2420} +{"train_info/time_between_train_steps": 0.0031414031982421875, "step": 2420} +{"info/global_step": 2421, "train_info/time_within_train_step": 2.2865593433380127, "step": 2421} +{"train_info/time_between_train_steps": 0.003128528594970703, "step": 2421} +{"info/global_step": 2422, "train_info/time_within_train_step": 2.286961078643799, "step": 2422} +{"train_info/time_between_train_steps": 0.003193378448486328, "step": 2422} +{"info/global_step": 2423, "train_info/time_within_train_step": 2.2867166996002197, "step": 2423} +{"train_info/time_between_train_steps": 0.003155231475830078, "step": 2423} +{"info/global_step": 2424, "train_info/time_within_train_step": 2.2869765758514404, "step": 2424} +{"train_info/time_between_train_steps": 0.0032181739807128906, "step": 2424} +{"info/global_step": 2425, "train_info/time_within_train_step": 2.2867655754089355, "step": 2425} +{"train_info/time_between_train_steps": 0.0031604766845703125, "step": 2425} +{"info/global_step": 2426, "train_info/time_within_train_step": 2.287254810333252, "step": 2426} +{"train_info/time_between_train_steps": 0.003175020217895508, "step": 2426} +{"info/global_step": 2427, "train_info/time_within_train_step": 2.286660671234131, "step": 2427} +{"train_info/time_between_train_steps": 0.0031249523162841797, "step": 2427} +{"info/global_step": 2428, "train_info/time_within_train_step": 2.2918925285339355, "step": 2428} +{"train_info/time_between_train_steps": 0.0031142234802246094, "step": 2428} +{"info/global_step": 2429, "train_info/time_within_train_step": 2.2867279052734375, "step": 2429} +{"train_info/time_between_train_steps": 0.003144502639770508, "step": 2429} +{"info/global_step": 2430, "train_info/time_within_train_step": 2.2861328125, "step": 2430} +{"train_info/time_between_train_steps": 0.0031626224517822266, "step": 2430} +{"info/global_step": 2431, "train_info/time_within_train_step": 2.2859504222869873, "step": 2431} +{"train_info/time_between_train_steps": 0.0031490325927734375, "step": 2431} +{"info/global_step": 2432, "train_info/time_within_train_step": 2.2861099243164062, "step": 2432} +{"train_info/time_between_train_steps": 0.0031871795654296875, "step": 2432} +{"info/global_step": 2433, "train_info/time_within_train_step": 2.2858333587646484, "step": 2433} +{"train_info/time_between_train_steps": 0.0032067298889160156, "step": 2433} +{"info/global_step": 2434, "train_info/time_within_train_step": 2.2863869667053223, "step": 2434} +{"train_info/time_between_train_steps": 0.1294257640838623, "step": 2434} +{"info/global_step": 2435, "train_info/time_within_train_step": 2.2854366302490234, "step": 2435} +{"train_info/time_between_train_steps": 0.00318145751953125, "step": 2435} +{"info/global_step": 2436, "train_info/time_within_train_step": 2.2858526706695557, "step": 2436} +{"train_info/time_between_train_steps": 0.003160238265991211, "step": 2436} +{"info/global_step": 2437, "train_info/time_within_train_step": 2.285541296005249, "step": 2437} +{"train_info/time_between_train_steps": 0.003211498260498047, "step": 2437} +{"info/global_step": 2438, "train_info/time_within_train_step": 2.2859904766082764, "step": 2438} +{"train_info/time_between_train_steps": 0.003184080123901367, "step": 2438} +{"info/global_step": 2439, "train_info/time_within_train_step": 2.285459041595459, "step": 2439} +{"train_info/time_between_train_steps": 0.0031838417053222656, "step": 2439} +{"info/global_step": 2440, "train_info/time_within_train_step": 2.2856969833374023, "step": 2440} +{"train_info/time_between_train_steps": 0.0031952857971191406, "step": 2440} +{"info/global_step": 2441, "train_info/time_within_train_step": 2.2856180667877197, "step": 2441} +{"train_info/time_between_train_steps": 0.003169536590576172, "step": 2441} +{"info/global_step": 2442, "train_info/time_within_train_step": 2.2858855724334717, "step": 2442} +{"train_info/time_between_train_steps": 0.0031447410583496094, "step": 2442} +{"info/global_step": 2443, "train_info/time_within_train_step": 2.28597092628479, "step": 2443} +{"train_info/time_between_train_steps": 0.003136873245239258, "step": 2443} +{"info/global_step": 2444, "train_info/time_within_train_step": 2.2855303287506104, "step": 2444} +{"train_info/time_between_train_steps": 0.0031282901763916016, "step": 2444} +{"info/global_step": 2445, "train_info/time_within_train_step": 2.2858846187591553, "step": 2445} +{"train_info/time_between_train_steps": 0.003129243850708008, "step": 2445} +{"info/global_step": 2446, "train_info/time_within_train_step": 2.2864327430725098, "step": 2446} +{"train_info/time_between_train_steps": 0.0031995773315429688, "step": 2446} +{"info/global_step": 2447, "train_info/time_within_train_step": 2.285579204559326, "step": 2447} +{"train_info/time_between_train_steps": 0.0031633377075195312, "step": 2447} +{"info/global_step": 2448, "train_info/time_within_train_step": 2.2864201068878174, "step": 2448} +{"train_info/time_between_train_steps": 0.003162860870361328, "step": 2448} +{"info/global_step": 2449, "train_info/time_within_train_step": 2.2859301567077637, "step": 2449} +{"train_info/time_between_train_steps": 0.003165006637573242, "step": 2449} +{"info/global_step": 2450, "train_info/time_within_train_step": 2.286212682723999, "step": 2450} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746349937, "_runtime": 6034}, "step": 2450} +{"logs": {"train/loss": 3.3577, "train/learning_rate": 0.00012222222222222221, "train/epoch": 2.09, "_timestamp": 1746349937, "_runtime": 6034}, "step": 2450} +{"train_info/time_between_train_steps": 0.024731874465942383, "step": 2450} +{"info/global_step": 2451, "train_info/time_within_train_step": 2.285851240158081, "step": 2451} +{"train_info/time_between_train_steps": 0.003138303756713867, "step": 2451} +{"info/global_step": 2452, "train_info/time_within_train_step": 2.286496162414551, "step": 2452} +{"train_info/time_between_train_steps": 0.0031363964080810547, "step": 2452} +{"info/global_step": 2453, "train_info/time_within_train_step": 2.286233901977539, "step": 2453} +{"train_info/time_between_train_steps": 0.003168344497680664, "step": 2453} +{"info/global_step": 2454, "train_info/time_within_train_step": 2.2910609245300293, "step": 2454} +{"train_info/time_between_train_steps": 0.0031707286834716797, "step": 2454} +{"info/global_step": 2455, "train_info/time_within_train_step": 2.2858853340148926, "step": 2455} +{"train_info/time_between_train_steps": 0.0031638145446777344, "step": 2455} +{"info/global_step": 2456, "train_info/time_within_train_step": 2.2867178916931152, "step": 2456} +{"train_info/time_between_train_steps": 0.0031938552856445312, "step": 2456} +{"info/global_step": 2457, "train_info/time_within_train_step": 2.2858898639678955, "step": 2457} +{"train_info/time_between_train_steps": 0.0031499862670898438, "step": 2457} +{"info/global_step": 2458, "train_info/time_within_train_step": 2.2861154079437256, "step": 2458} +{"train_info/time_between_train_steps": 0.003156423568725586, "step": 2458} +{"info/global_step": 2459, "train_info/time_within_train_step": 2.2861316204071045, "step": 2459} +{"train_info/time_between_train_steps": 0.0031690597534179688, "step": 2459} +{"info/global_step": 2460, "train_info/time_within_train_step": 2.286252021789551, "step": 2460} +{"train_info/time_between_train_steps": 0.0031435489654541016, "step": 2460} +{"info/global_step": 2461, "train_info/time_within_train_step": 2.2855608463287354, "step": 2461} +{"train_info/time_between_train_steps": 0.003180265426635742, "step": 2461} +{"info/global_step": 2462, "train_info/time_within_train_step": 2.2861077785491943, "step": 2462} +{"train_info/time_between_train_steps": 0.0031642913818359375, "step": 2462} +{"info/global_step": 2463, "train_info/time_within_train_step": 2.2854678630828857, "step": 2463} +{"train_info/time_between_train_steps": 0.0031585693359375, "step": 2463} +{"info/global_step": 2464, "train_info/time_within_train_step": 2.2847301959991455, "step": 2464} +{"train_info/time_between_train_steps": 0.0031900405883789062, "step": 2464} +{"info/global_step": 2465, "train_info/time_within_train_step": 2.286093235015869, "step": 2465} +{"train_info/time_between_train_steps": 0.003196239471435547, "step": 2465} +{"info/global_step": 2466, "train_info/time_within_train_step": 2.286058187484741, "step": 2466} +{"train_info/time_between_train_steps": 0.0032274723052978516, "step": 2466} +{"info/global_step": 2467, "train_info/time_within_train_step": 2.285233497619629, "step": 2467} +{"train_info/time_between_train_steps": 0.003132343292236328, "step": 2467} +{"info/global_step": 2468, "train_info/time_within_train_step": 2.285423994064331, "step": 2468} +{"train_info/time_between_train_steps": 0.0031502246856689453, "step": 2468} +{"info/global_step": 2469, "train_info/time_within_train_step": 2.5183353424072266, "step": 2469} +{"train_info/time_between_train_steps": 0.003174304962158203, "step": 2469} +{"info/global_step": 2470, "train_info/time_within_train_step": 2.2864043712615967, "step": 2470} +{"train_info/time_between_train_steps": 0.0031669139862060547, "step": 2470} +{"info/global_step": 2471, "train_info/time_within_train_step": 2.28595232963562, "step": 2471} +{"train_info/time_between_train_steps": 0.003180265426635742, "step": 2471} +{"info/global_step": 2472, "train_info/time_within_train_step": 2.2859652042388916, "step": 2472} +{"train_info/time_between_train_steps": 0.0031800270080566406, "step": 2472} +{"info/global_step": 2473, "train_info/time_within_train_step": 2.2860114574432373, "step": 2473} +{"train_info/time_between_train_steps": 0.0031881332397460938, "step": 2473} +{"info/global_step": 2474, "train_info/time_within_train_step": 2.28574800491333, "step": 2474} +{"train_info/time_between_train_steps": 0.003155946731567383, "step": 2474} +{"info/global_step": 2475, "train_info/time_within_train_step": 2.2851319313049316, "step": 2475} +{"train_info/time_between_train_steps": 0.003141641616821289, "step": 2475} +{"info/global_step": 2476, "train_info/time_within_train_step": 2.2855868339538574, "step": 2476} +{"train_info/time_between_train_steps": 0.0031495094299316406, "step": 2476} +{"info/global_step": 2477, "train_info/time_within_train_step": 2.2856392860412598, "step": 2477} +{"train_info/time_between_train_steps": 0.0031440258026123047, "step": 2477} +{"info/global_step": 2478, "train_info/time_within_train_step": 2.3728525638580322, "step": 2478} +{"train_info/time_between_train_steps": 0.0031795501708984375, "step": 2478} +{"info/global_step": 2479, "train_info/time_within_train_step": 2.2857773303985596, "step": 2479} +{"train_info/time_between_train_steps": 0.0032198429107666016, "step": 2479} +{"info/global_step": 2480, "train_info/time_within_train_step": 2.2852768898010254, "step": 2480} +{"train_info/time_between_train_steps": 0.0031599998474121094, "step": 2480} +{"info/global_step": 2481, "train_info/time_within_train_step": 2.2850990295410156, "step": 2481} +{"train_info/time_between_train_steps": 0.003140687942504883, "step": 2481} +{"info/global_step": 2482, "train_info/time_within_train_step": 2.284597873687744, "step": 2482} +{"train_info/time_between_train_steps": 0.003165721893310547, "step": 2482} +{"info/global_step": 2483, "train_info/time_within_train_step": 2.284484624862671, "step": 2483} +{"train_info/time_between_train_steps": 0.003145933151245117, "step": 2483} +{"info/global_step": 2484, "train_info/time_within_train_step": 2.2844951152801514, "step": 2484} +{"train_info/time_between_train_steps": 0.0031211376190185547, "step": 2484} +{"info/global_step": 2485, "train_info/time_within_train_step": 2.2846291065216064, "step": 2485} +{"train_info/time_between_train_steps": 0.003144979476928711, "step": 2485} +{"info/global_step": 2486, "train_info/time_within_train_step": 2.285188674926758, "step": 2486} +{"train_info/time_between_train_steps": 0.00318145751953125, "step": 2486} +{"info/global_step": 2487, "train_info/time_within_train_step": 2.285494089126587, "step": 2487} +{"train_info/time_between_train_steps": 0.003168821334838867, "step": 2487} +{"info/global_step": 2488, "train_info/time_within_train_step": 2.284977674484253, "step": 2488} +{"train_info/time_between_train_steps": 0.0031828880310058594, "step": 2488} +{"info/global_step": 2489, "train_info/time_within_train_step": 2.2852420806884766, "step": 2489} +{"train_info/time_between_train_steps": 0.003151416778564453, "step": 2489} +{"info/global_step": 2490, "train_info/time_within_train_step": 2.285616159439087, "step": 2490} +{"train_info/time_between_train_steps": 0.0037665367126464844, "step": 2490} +{"info/global_step": 2491, "train_info/time_within_train_step": 2.286154270172119, "step": 2491} +{"train_info/time_between_train_steps": 0.0031452178955078125, "step": 2491} +{"info/global_step": 2492, "train_info/time_within_train_step": 2.2852742671966553, "step": 2492} +{"train_info/time_between_train_steps": 0.0031189918518066406, "step": 2492} +{"info/global_step": 2493, "train_info/time_within_train_step": 2.2911293506622314, "step": 2493} +{"train_info/time_between_train_steps": 0.003141164779663086, "step": 2493} +{"info/global_step": 2494, "train_info/time_within_train_step": 2.286092519760132, "step": 2494} +{"train_info/time_between_train_steps": 0.0031735897064208984, "step": 2494} +{"info/global_step": 2495, "train_info/time_within_train_step": 2.2857565879821777, "step": 2495} +{"train_info/time_between_train_steps": 0.003175020217895508, "step": 2495} +{"info/global_step": 2496, "train_info/time_within_train_step": 2.2869131565093994, "step": 2496} +{"train_info/time_between_train_steps": 0.003161191940307617, "step": 2496} +{"info/global_step": 2497, "train_info/time_within_train_step": 2.4380452632904053, "step": 2497} +{"train_info/time_between_train_steps": 0.003150463104248047, "step": 2497} +{"info/global_step": 2498, "train_info/time_within_train_step": 2.2853353023529053, "step": 2498} +{"train_info/time_between_train_steps": 0.003177642822265625, "step": 2498} +{"info/global_step": 2499, "train_info/time_within_train_step": 2.2856462001800537, "step": 2499} +{"train_info/time_between_train_steps": 0.0031423568725585938, "step": 2499} +{"info/global_step": 2500, "train_info/time_within_train_step": 2.6538243293762207, "step": 2500} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746350053, "_runtime": 6150}, "step": 2500} +{"logs": {"train/loss": 3.349, "train/learning_rate": 0.00011111111111111109, "train/epoch": 2.11, "_timestamp": 1746350053, "_runtime": 6150}, "step": 2500} +{"train_info/time_between_train_steps": 11.507647275924683, "step": 2500} +{"info/global_step": 2501, "train_info/time_within_train_step": 2.1178221702575684, "step": 2501} +{"train_info/time_between_train_steps": 0.0031762123107910156, "step": 2501} +{"info/global_step": 2502, "train_info/time_within_train_step": 2.0970823764801025, "step": 2502} +{"train_info/time_between_train_steps": 0.0031735897064208984, "step": 2502} +{"info/global_step": 2503, "train_info/time_within_train_step": 2.2235143184661865, "step": 2503} +{"train_info/time_between_train_steps": 0.003172636032104492, "step": 2503} +{"info/global_step": 2504, "train_info/time_within_train_step": 2.2848291397094727, "step": 2504} +{"train_info/time_between_train_steps": 0.003152608871459961, "step": 2504} +{"info/global_step": 2505, "train_info/time_within_train_step": 2.2840964794158936, "step": 2505} +{"train_info/time_between_train_steps": 0.0031783580780029297, "step": 2505} +{"info/global_step": 2506, "train_info/time_within_train_step": 2.284724235534668, "step": 2506} +{"train_info/time_between_train_steps": 0.0032134056091308594, "step": 2506} +{"info/global_step": 2507, "train_info/time_within_train_step": 2.2854368686676025, "step": 2507} +{"train_info/time_between_train_steps": 0.00322723388671875, "step": 2507} +{"info/global_step": 2508, "train_info/time_within_train_step": 2.285572052001953, "step": 2508} +{"train_info/time_between_train_steps": 0.0031843185424804688, "step": 2508} +{"info/global_step": 2509, "train_info/time_within_train_step": 2.285508632659912, "step": 2509} +{"train_info/time_between_train_steps": 0.0031464099884033203, "step": 2509} +{"info/global_step": 2510, "train_info/time_within_train_step": 2.285609722137451, "step": 2510} +{"train_info/time_between_train_steps": 0.0031549930572509766, "step": 2510} +{"info/global_step": 2511, "train_info/time_within_train_step": 2.285733938217163, "step": 2511} +{"train_info/time_between_train_steps": 0.0031671524047851562, "step": 2511} +{"info/global_step": 2512, "train_info/time_within_train_step": 2.286522626876831, "step": 2512} +{"train_info/time_between_train_steps": 0.0031397342681884766, "step": 2512} +{"info/global_step": 2513, "train_info/time_within_train_step": 2.2863543033599854, "step": 2513} +{"train_info/time_between_train_steps": 0.003204822540283203, "step": 2513} +{"info/global_step": 2514, "train_info/time_within_train_step": 2.2918667793273926, "step": 2514} +{"train_info/time_between_train_steps": 0.0031774044036865234, "step": 2514} +{"info/global_step": 2515, "train_info/time_within_train_step": 2.2867279052734375, "step": 2515} +{"train_info/time_between_train_steps": 0.0031805038452148438, "step": 2515} +{"info/global_step": 2516, "train_info/time_within_train_step": 2.2871012687683105, "step": 2516} +{"train_info/time_between_train_steps": 0.003183126449584961, "step": 2516} +{"info/global_step": 2517, "train_info/time_within_train_step": 2.524345636367798, "step": 2517} +{"train_info/time_between_train_steps": 0.0031554698944091797, "step": 2517} +{"info/global_step": 2518, "train_info/time_within_train_step": 2.286578893661499, "step": 2518} +{"train_info/time_between_train_steps": 0.0031769275665283203, "step": 2518} +{"info/global_step": 2519, "train_info/time_within_train_step": 2.286583662033081, "step": 2519} +{"train_info/time_between_train_steps": 0.003166675567626953, "step": 2519} +{"info/global_step": 2520, "train_info/time_within_train_step": 2.2870922088623047, "step": 2520} +{"train_info/time_between_train_steps": 0.0031974315643310547, "step": 2520} +{"info/global_step": 2521, "train_info/time_within_train_step": 2.287010431289673, "step": 2521} +{"train_info/time_between_train_steps": 0.003168821334838867, "step": 2521} +{"info/global_step": 2522, "train_info/time_within_train_step": 2.2871501445770264, "step": 2522} +{"train_info/time_between_train_steps": 0.003192901611328125, "step": 2522} +{"info/global_step": 2523, "train_info/time_within_train_step": 2.2874391078948975, "step": 2523} +{"train_info/time_between_train_steps": 0.0031995773315429688, "step": 2523} +{"info/global_step": 2524, "train_info/time_within_train_step": 2.2864298820495605, "step": 2524} +{"train_info/time_between_train_steps": 0.0031595230102539062, "step": 2524} +{"info/global_step": 2525, "train_info/time_within_train_step": 2.2866883277893066, "step": 2525} +{"train_info/time_between_train_steps": 0.0031664371490478516, "step": 2525} +{"info/global_step": 2526, "train_info/time_within_train_step": 2.2867815494537354, "step": 2526} +{"train_info/time_between_train_steps": 0.0031585693359375, "step": 2526} +{"info/global_step": 2527, "train_info/time_within_train_step": 2.286590576171875, "step": 2527} +{"train_info/time_between_train_steps": 0.003171205520629883, "step": 2527} +{"info/global_step": 2528, "train_info/time_within_train_step": 2.287010431289673, "step": 2528} +{"train_info/time_between_train_steps": 0.003197193145751953, "step": 2528} +{"info/global_step": 2529, "train_info/time_within_train_step": 2.2871451377868652, "step": 2529} +{"train_info/time_between_train_steps": 0.003212451934814453, "step": 2529} +{"info/global_step": 2530, "train_info/time_within_train_step": 2.2867066860198975, "step": 2530} +{"train_info/time_between_train_steps": 0.0031876564025878906, "step": 2530} +{"info/global_step": 2531, "train_info/time_within_train_step": 2.2866051197052, "step": 2531} +{"train_info/time_between_train_steps": 0.0032346248626708984, "step": 2531} +{"info/global_step": 2532, "train_info/time_within_train_step": 2.287222146987915, "step": 2532} +{"train_info/time_between_train_steps": 0.0031545162200927734, "step": 2532} +{"info/global_step": 2533, "train_info/time_within_train_step": 2.2869248390197754, "step": 2533} +{"train_info/time_between_train_steps": 0.0034170150756835938, "step": 2533} +{"info/global_step": 2534, "train_info/time_within_train_step": 2.2878873348236084, "step": 2534} +{"train_info/time_between_train_steps": 0.003175020217895508, "step": 2534} +{"info/global_step": 2535, "train_info/time_within_train_step": 2.286815881729126, "step": 2535} +{"train_info/time_between_train_steps": 0.003161191940307617, "step": 2535} +{"info/global_step": 2536, "train_info/time_within_train_step": 2.2876217365264893, "step": 2536} +{"train_info/time_between_train_steps": 0.003188610076904297, "step": 2536} +{"info/global_step": 2537, "train_info/time_within_train_step": 2.2865395545959473, "step": 2537} +{"train_info/time_between_train_steps": 0.003203868865966797, "step": 2537} +{"info/global_step": 2538, "train_info/time_within_train_step": 2.286450147628784, "step": 2538} +{"train_info/time_between_train_steps": 0.00316619873046875, "step": 2538} +{"info/global_step": 2539, "train_info/time_within_train_step": 2.2864999771118164, "step": 2539} +{"train_info/time_between_train_steps": 0.0031402111053466797, "step": 2539} +{"info/global_step": 2540, "train_info/time_within_train_step": 2.2910144329071045, "step": 2540} +{"train_info/time_between_train_steps": 0.0031757354736328125, "step": 2540} +{"info/global_step": 2541, "train_info/time_within_train_step": 2.286266326904297, "step": 2541} +{"train_info/time_between_train_steps": 0.0031294822692871094, "step": 2541} +{"info/global_step": 2542, "train_info/time_within_train_step": 2.28694486618042, "step": 2542} +{"train_info/time_between_train_steps": 0.0032072067260742188, "step": 2542} +{"info/global_step": 2543, "train_info/time_within_train_step": 2.2869982719421387, "step": 2543} +{"train_info/time_between_train_steps": 0.0032646656036376953, "step": 2543} +{"info/global_step": 2544, "train_info/time_within_train_step": 2.2873902320861816, "step": 2544} +{"train_info/time_between_train_steps": 0.0032775402069091797, "step": 2544} +{"info/global_step": 2545, "train_info/time_within_train_step": 2.2869200706481934, "step": 2545} +{"train_info/time_between_train_steps": 0.003281831741333008, "step": 2545} +{"info/global_step": 2546, "train_info/time_within_train_step": 2.2867746353149414, "step": 2546} +{"train_info/time_between_train_steps": 0.0032889842987060547, "step": 2546} +{"info/global_step": 2547, "train_info/time_within_train_step": 2.28650164604187, "step": 2547} +{"train_info/time_between_train_steps": 0.0031969547271728516, "step": 2547} +{"info/global_step": 2548, "train_info/time_within_train_step": 2.286379098892212, "step": 2548} +{"train_info/time_between_train_steps": 0.003218412399291992, "step": 2548} +{"info/global_step": 2549, "train_info/time_within_train_step": 2.286780834197998, "step": 2549} +{"train_info/time_between_train_steps": 0.003200054168701172, "step": 2549} +{"info/global_step": 2550, "train_info/time_within_train_step": 2.2864389419555664, "step": 2550} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746350180, "_runtime": 6277}, "step": 2550} +{"logs": {"train/loss": 3.3314, "train/learning_rate": 9.999999999999999e-05, "train/epoch": 2.12, "_timestamp": 1746350180, "_runtime": 6277}, "step": 2550} +{"train_info/time_between_train_steps": 0.02434086799621582, "step": 2550} +{"info/global_step": 2551, "train_info/time_within_train_step": 2.2865312099456787, "step": 2551} +{"train_info/time_between_train_steps": 0.0031981468200683594, "step": 2551} +{"info/global_step": 2552, "train_info/time_within_train_step": 2.2866618633270264, "step": 2552} +{"train_info/time_between_train_steps": 0.0032775402069091797, "step": 2552} +{"info/global_step": 2553, "train_info/time_within_train_step": 2.2867491245269775, "step": 2553} +{"train_info/time_between_train_steps": 0.0032820701599121094, "step": 2553} +{"info/global_step": 2554, "train_info/time_within_train_step": 2.286390781402588, "step": 2554} +{"train_info/time_between_train_steps": 0.0033071041107177734, "step": 2554} +{"info/global_step": 2555, "train_info/time_within_train_step": 2.2877728939056396, "step": 2555} +{"train_info/time_between_train_steps": 0.0031998157501220703, "step": 2555} +{"info/global_step": 2556, "train_info/time_within_train_step": 2.2868900299072266, "step": 2556} +{"train_info/time_between_train_steps": 0.003185272216796875, "step": 2556} +{"info/global_step": 2557, "train_info/time_within_train_step": 2.286963701248169, "step": 2557} +{"train_info/time_between_train_steps": 0.0032143592834472656, "step": 2557} +{"info/global_step": 2558, "train_info/time_within_train_step": 2.2870051860809326, "step": 2558} +{"train_info/time_between_train_steps": 0.003194570541381836, "step": 2558} +{"info/global_step": 2559, "train_info/time_within_train_step": 2.287353992462158, "step": 2559} +{"train_info/time_between_train_steps": 0.13025665283203125, "step": 2559} +{"info/global_step": 2560, "train_info/time_within_train_step": 2.2871906757354736, "step": 2560} +{"train_info/time_between_train_steps": 0.0031957626342773438, "step": 2560} +{"info/global_step": 2561, "train_info/time_within_train_step": 2.287750482559204, "step": 2561} +{"train_info/time_between_train_steps": 0.003172636032104492, "step": 2561} +{"info/global_step": 2562, "train_info/time_within_train_step": 2.287182569503784, "step": 2562} +{"train_info/time_between_train_steps": 0.0032231807708740234, "step": 2562} +{"info/global_step": 2563, "train_info/time_within_train_step": 2.286212682723999, "step": 2563} +{"train_info/time_between_train_steps": 0.003196239471435547, "step": 2563} +{"info/global_step": 2564, "train_info/time_within_train_step": 2.2864294052124023, "step": 2564} +{"train_info/time_between_train_steps": 0.003236532211303711, "step": 2564} +{"info/global_step": 2565, "train_info/time_within_train_step": 2.287014961242676, "step": 2565} +{"train_info/time_between_train_steps": 0.003186464309692383, "step": 2565} +{"info/global_step": 2566, "train_info/time_within_train_step": 2.2911126613616943, "step": 2566} +{"train_info/time_between_train_steps": 0.003205537796020508, "step": 2566} +{"info/global_step": 2567, "train_info/time_within_train_step": 2.2862884998321533, "step": 2567} +{"train_info/time_between_train_steps": 0.0031392574310302734, "step": 2567} +{"info/global_step": 2568, "train_info/time_within_train_step": 2.2868895530700684, "step": 2568} +{"train_info/time_between_train_steps": 0.003198862075805664, "step": 2568} +{"info/global_step": 2569, "train_info/time_within_train_step": 2.286677122116089, "step": 2569} +{"train_info/time_between_train_steps": 0.003196239471435547, "step": 2569} +{"info/global_step": 2570, "train_info/time_within_train_step": 2.286334753036499, "step": 2570} +{"train_info/time_between_train_steps": 0.003159046173095703, "step": 2570} +{"info/global_step": 2571, "train_info/time_within_train_step": 2.5380868911743164, "step": 2571} +{"train_info/time_between_train_steps": 0.0031976699829101562, "step": 2571} +{"info/global_step": 2572, "train_info/time_within_train_step": 2.287407875061035, "step": 2572} +{"train_info/time_between_train_steps": 0.003142118453979492, "step": 2572} +{"info/global_step": 2573, "train_info/time_within_train_step": 2.2864274978637695, "step": 2573} +{"train_info/time_between_train_steps": 0.0031480789184570312, "step": 2573} +{"info/global_step": 2574, "train_info/time_within_train_step": 2.2864294052124023, "step": 2574} +{"train_info/time_between_train_steps": 0.003142118453979492, "step": 2574} +{"info/global_step": 2575, "train_info/time_within_train_step": 2.286895751953125, "step": 2575} +{"train_info/time_between_train_steps": 0.003236532211303711, "step": 2575} +{"info/global_step": 2576, "train_info/time_within_train_step": 2.287191867828369, "step": 2576} +{"train_info/time_between_train_steps": 0.0032062530517578125, "step": 2576} +{"info/global_step": 2577, "train_info/time_within_train_step": 2.2871360778808594, "step": 2577} +{"train_info/time_between_train_steps": 0.0032062530517578125, "step": 2577} +{"info/global_step": 2578, "train_info/time_within_train_step": 2.373788356781006, "step": 2578} +{"train_info/time_between_train_steps": 0.0032036304473876953, "step": 2578} +{"info/global_step": 2579, "train_info/time_within_train_step": 2.2868878841400146, "step": 2579} +{"train_info/time_between_train_steps": 0.0032186508178710938, "step": 2579} +{"info/global_step": 2580, "train_info/time_within_train_step": 2.287898302078247, "step": 2580} +{"train_info/time_between_train_steps": 0.0033752918243408203, "step": 2580} +{"info/global_step": 2581, "train_info/time_within_train_step": 2.291430711746216, "step": 2581} +{"train_info/time_between_train_steps": 0.003671407699584961, "step": 2581} +{"info/global_step": 2582, "train_info/time_within_train_step": 2.289438009262085, "step": 2582} +{"train_info/time_between_train_steps": 0.003414154052734375, "step": 2582} +{"info/global_step": 2583, "train_info/time_within_train_step": 2.2920165061950684, "step": 2583} +{"train_info/time_between_train_steps": 0.003769397735595703, "step": 2583} +{"info/global_step": 2584, "train_info/time_within_train_step": 2.289781332015991, "step": 2584} +{"train_info/time_between_train_steps": 0.003355741500854492, "step": 2584} +{"info/global_step": 2585, "train_info/time_within_train_step": 2.289088010787964, "step": 2585} +{"train_info/time_between_train_steps": 0.003347158432006836, "step": 2585} +{"info/global_step": 2586, "train_info/time_within_train_step": 2.2897512912750244, "step": 2586} +{"train_info/time_between_train_steps": 0.003293752670288086, "step": 2586} +{"info/global_step": 2587, "train_info/time_within_train_step": 2.2900924682617188, "step": 2587} +{"train_info/time_between_train_steps": 0.0036749839782714844, "step": 2587} +{"info/global_step": 2588, "train_info/time_within_train_step": 2.2884480953216553, "step": 2588} +{"train_info/time_between_train_steps": 0.003202676773071289, "step": 2588} +{"info/global_step": 2589, "train_info/time_within_train_step": 2.2860803604125977, "step": 2589} +{"train_info/time_between_train_steps": 0.003155946731567383, "step": 2589} +{"info/global_step": 2590, "train_info/time_within_train_step": 2.286259412765503, "step": 2590} +{"train_info/time_between_train_steps": 0.003173828125, "step": 2590} +{"info/global_step": 2591, "train_info/time_within_train_step": 2.286470651626587, "step": 2591} +{"train_info/time_between_train_steps": 0.003143310546875, "step": 2591} +{"info/global_step": 2592, "train_info/time_within_train_step": 2.285822868347168, "step": 2592} +{"train_info/time_between_train_steps": 0.003191709518432617, "step": 2592} +{"info/global_step": 2593, "train_info/time_within_train_step": 2.286696434020996, "step": 2593} +{"train_info/time_between_train_steps": 0.003161191940307617, "step": 2593} +{"info/global_step": 2594, "train_info/time_within_train_step": 2.286146879196167, "step": 2594} +{"train_info/time_between_train_steps": 0.0031261444091796875, "step": 2594} +{"info/global_step": 2595, "train_info/time_within_train_step": 2.2858388423919678, "step": 2595} +{"train_info/time_between_train_steps": 0.0031766891479492188, "step": 2595} +{"info/global_step": 2596, "train_info/time_within_train_step": 2.2864489555358887, "step": 2596} +{"train_info/time_between_train_steps": 0.0032188892364501953, "step": 2596} +{"info/global_step": 2597, "train_info/time_within_train_step": 2.2870001792907715, "step": 2597} +{"train_info/time_between_train_steps": 0.0031850337982177734, "step": 2597} +{"info/global_step": 2598, "train_info/time_within_train_step": 2.2874510288238525, "step": 2598} +{"train_info/time_between_train_steps": 0.003246784210205078, "step": 2598} +{"info/global_step": 2599, "train_info/time_within_train_step": 2.287335157394409, "step": 2599} +{"train_info/time_between_train_steps": 0.0031816959381103516, "step": 2599} +{"info/global_step": 2600, "train_info/time_within_train_step": 2.2861649990081787, "step": 2600} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746350297, "_runtime": 6394}, "step": 2600} +{"logs": {"train/loss": 3.311, "train/learning_rate": 8.888888888888888e-05, "train/epoch": 2.14, "_timestamp": 1746350297, "_runtime": 6394}, "step": 2600} +{"train_info/time_between_train_steps": 17.24481725692749, "step": 2600} +{"info/global_step": 2601, "train_info/time_within_train_step": 2.1182680130004883, "step": 2601} +{"train_info/time_between_train_steps": 0.0031728744506835938, "step": 2601} +{"info/global_step": 2602, "train_info/time_within_train_step": 2.10166072845459, "step": 2602} +{"train_info/time_between_train_steps": 0.003337383270263672, "step": 2602} +{"info/global_step": 2603, "train_info/time_within_train_step": 2.1371192932128906, "step": 2603} +{"train_info/time_between_train_steps": 0.005086183547973633, "step": 2603} +{"info/global_step": 2604, "train_info/time_within_train_step": 2.2852933406829834, "step": 2604} +{"train_info/time_between_train_steps": 0.003151416778564453, "step": 2604} +{"info/global_step": 2605, "train_info/time_within_train_step": 2.2846901416778564, "step": 2605} +{"train_info/time_between_train_steps": 0.0031304359436035156, "step": 2605} +{"info/global_step": 2606, "train_info/time_within_train_step": 2.2850871086120605, "step": 2606} +{"train_info/time_between_train_steps": 0.003125905990600586, "step": 2606} +{"info/global_step": 2607, "train_info/time_within_train_step": 2.28590726852417, "step": 2607} +{"train_info/time_between_train_steps": 0.0031197071075439453, "step": 2607} +{"info/global_step": 2608, "train_info/time_within_train_step": 2.2852563858032227, "step": 2608} +{"train_info/time_between_train_steps": 0.0031113624572753906, "step": 2608} +{"info/global_step": 2609, "train_info/time_within_train_step": 2.285635471343994, "step": 2609} +{"train_info/time_between_train_steps": 0.003141641616821289, "step": 2609} +{"info/global_step": 2610, "train_info/time_within_train_step": 2.2859411239624023, "step": 2610} +{"train_info/time_between_train_steps": 0.0031549930572509766, "step": 2610} +{"info/global_step": 2611, "train_info/time_within_train_step": 2.2860400676727295, "step": 2611} +{"train_info/time_between_train_steps": 0.0031495094299316406, "step": 2611} +{"info/global_step": 2612, "train_info/time_within_train_step": 2.2859418392181396, "step": 2612} +{"train_info/time_between_train_steps": 0.0031566619873046875, "step": 2612} +{"info/global_step": 2613, "train_info/time_within_train_step": 2.285914182662964, "step": 2613} +{"train_info/time_between_train_steps": 0.0031316280364990234, "step": 2613} +{"info/global_step": 2614, "train_info/time_within_train_step": 2.285609245300293, "step": 2614} +{"train_info/time_between_train_steps": 0.003115415573120117, "step": 2614} +{"info/global_step": 2615, "train_info/time_within_train_step": 2.285771369934082, "step": 2615} +{"train_info/time_between_train_steps": 0.0031232833862304688, "step": 2615} +{"info/global_step": 2616, "train_info/time_within_train_step": 2.286466598510742, "step": 2616} +{"train_info/time_between_train_steps": 0.003148317337036133, "step": 2616} +{"info/global_step": 2617, "train_info/time_within_train_step": 2.286698341369629, "step": 2617} +{"train_info/time_between_train_steps": 0.0031251907348632812, "step": 2617} +{"info/global_step": 2618, "train_info/time_within_train_step": 2.2864327430725098, "step": 2618} +{"train_info/time_between_train_steps": 0.003168344497680664, "step": 2618} +{"info/global_step": 2619, "train_info/time_within_train_step": 2.287532329559326, "step": 2619} +{"train_info/time_between_train_steps": 0.0031757354736328125, "step": 2619} +{"info/global_step": 2620, "train_info/time_within_train_step": 2.287567377090454, "step": 2620} +{"train_info/time_between_train_steps": 0.003200531005859375, "step": 2620} +{"info/global_step": 2621, "train_info/time_within_train_step": 2.2871205806732178, "step": 2621} +{"train_info/time_between_train_steps": 0.003157377243041992, "step": 2621} +{"info/global_step": 2622, "train_info/time_within_train_step": 2.6537914276123047, "step": 2622} +{"train_info/time_between_train_steps": 0.003141641616821289, "step": 2622} +{"info/global_step": 2623, "train_info/time_within_train_step": 2.28682017326355, "step": 2623} +{"train_info/time_between_train_steps": 0.0031397342681884766, "step": 2623} +{"info/global_step": 2624, "train_info/time_within_train_step": 2.287430763244629, "step": 2624} +{"train_info/time_between_train_steps": 0.0031538009643554688, "step": 2624} +{"info/global_step": 2625, "train_info/time_within_train_step": 2.287440776824951, "step": 2625} +{"train_info/time_between_train_steps": 0.0031828880310058594, "step": 2625} +{"info/global_step": 2626, "train_info/time_within_train_step": 2.3752052783966064, "step": 2626} +{"train_info/time_between_train_steps": 0.0031795501708984375, "step": 2626} +{"info/global_step": 2627, "train_info/time_within_train_step": 2.2874350547790527, "step": 2627} +{"train_info/time_between_train_steps": 0.003125429153442383, "step": 2627} +{"info/global_step": 2628, "train_info/time_within_train_step": 2.286726236343384, "step": 2628} +{"train_info/time_between_train_steps": 0.003163576126098633, "step": 2628} +{"info/global_step": 2629, "train_info/time_within_train_step": 2.287248373031616, "step": 2629} +{"train_info/time_between_train_steps": 0.003117799758911133, "step": 2629} +{"info/global_step": 2630, "train_info/time_within_train_step": 2.286712169647217, "step": 2630} +{"train_info/time_between_train_steps": 0.003118753433227539, "step": 2630} +{"info/global_step": 2631, "train_info/time_within_train_step": 2.2860965728759766, "step": 2631} +{"train_info/time_between_train_steps": 0.0031120777130126953, "step": 2631} +{"info/global_step": 2632, "train_info/time_within_train_step": 2.2870213985443115, "step": 2632} +{"train_info/time_between_train_steps": 0.0031435489654541016, "step": 2632} +{"info/global_step": 2633, "train_info/time_within_train_step": 2.2864248752593994, "step": 2633} +{"train_info/time_between_train_steps": 0.0031867027282714844, "step": 2633} +{"info/global_step": 2634, "train_info/time_within_train_step": 2.2860207557678223, "step": 2634} +{"train_info/time_between_train_steps": 0.003134489059448242, "step": 2634} +{"info/global_step": 2635, "train_info/time_within_train_step": 2.28611421585083, "step": 2635} +{"train_info/time_between_train_steps": 0.003126859664916992, "step": 2635} +{"info/global_step": 2636, "train_info/time_within_train_step": 2.286369562149048, "step": 2636} +{"train_info/time_between_train_steps": 0.0031280517578125, "step": 2636} +{"info/global_step": 2637, "train_info/time_within_train_step": 2.286766290664673, "step": 2637} +{"train_info/time_between_train_steps": 0.0031189918518066406, "step": 2637} +{"info/global_step": 2638, "train_info/time_within_train_step": 2.287968397140503, "step": 2638} +{"train_info/time_between_train_steps": 0.0031719207763671875, "step": 2638} +{"info/global_step": 2639, "train_info/time_within_train_step": 2.287205457687378, "step": 2639} +{"train_info/time_between_train_steps": 0.003146648406982422, "step": 2639} +{"info/global_step": 2640, "train_info/time_within_train_step": 2.2918219566345215, "step": 2640} +{"train_info/time_between_train_steps": 0.003165721893310547, "step": 2640} +{"info/global_step": 2641, "train_info/time_within_train_step": 2.2871170043945312, "step": 2641} +{"train_info/time_between_train_steps": 0.003314971923828125, "step": 2641} +{"info/global_step": 2642, "train_info/time_within_train_step": 2.2871336936950684, "step": 2642} +{"train_info/time_between_train_steps": 0.0031816959381103516, "step": 2642} +{"info/global_step": 2643, "train_info/time_within_train_step": 2.2872841358184814, "step": 2643} +{"train_info/time_between_train_steps": 0.0031099319458007812, "step": 2643} +{"info/global_step": 2644, "train_info/time_within_train_step": 2.287564516067505, "step": 2644} +{"train_info/time_between_train_steps": 0.003186941146850586, "step": 2644} +{"info/global_step": 2645, "train_info/time_within_train_step": 2.288207769393921, "step": 2645} +{"train_info/time_between_train_steps": 0.0031919479370117188, "step": 2645} +{"info/global_step": 2646, "train_info/time_within_train_step": 2.2886104583740234, "step": 2646} +{"train_info/time_between_train_steps": 0.0031197071075439453, "step": 2646} +{"info/global_step": 2647, "train_info/time_within_train_step": 2.291874885559082, "step": 2647} +{"train_info/time_between_train_steps": 0.0065996646881103516, "step": 2647} +{"info/global_step": 2648, "train_info/time_within_train_step": 2.289257764816284, "step": 2648} +{"train_info/time_between_train_steps": 0.003160715103149414, "step": 2648} +{"info/global_step": 2649, "train_info/time_within_train_step": 2.287339925765991, "step": 2649} +{"train_info/time_between_train_steps": 0.0031538009643554688, "step": 2649} +{"info/global_step": 2650, "train_info/time_within_train_step": 2.2866668701171875, "step": 2650} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746350430, "_runtime": 6527}, "step": 2650} +{"logs": {"train/loss": 3.3167, "train/learning_rate": 7.777777777777777e-05, "train/epoch": 2.16, "_timestamp": 1746350430, "_runtime": 6527}, "step": 2650} +{"train_info/time_between_train_steps": 0.024161815643310547, "step": 2650} +{"info/global_step": 2651, "train_info/time_within_train_step": 2.2870523929595947, "step": 2651} +{"train_info/time_between_train_steps": 0.003134012222290039, "step": 2651} +{"info/global_step": 2652, "train_info/time_within_train_step": 2.3752121925354004, "step": 2652} +{"train_info/time_between_train_steps": 0.0031349658966064453, "step": 2652} +{"info/global_step": 2653, "train_info/time_within_train_step": 2.293997049331665, "step": 2653} +{"train_info/time_between_train_steps": 0.0031404495239257812, "step": 2653} +{"info/global_step": 2654, "train_info/time_within_train_step": 2.286038875579834, "step": 2654} +{"train_info/time_between_train_steps": 0.003123044967651367, "step": 2654} +{"info/global_step": 2655, "train_info/time_within_train_step": 2.2860262393951416, "step": 2655} +{"train_info/time_between_train_steps": 0.003149747848510742, "step": 2655} +{"info/global_step": 2656, "train_info/time_within_train_step": 2.2857213020324707, "step": 2656} +{"train_info/time_between_train_steps": 0.0030994415283203125, "step": 2656} +{"info/global_step": 2657, "train_info/time_within_train_step": 2.2862114906311035, "step": 2657} +{"train_info/time_between_train_steps": 0.0031440258026123047, "step": 2657} +{"info/global_step": 2658, "train_info/time_within_train_step": 2.285778760910034, "step": 2658} +{"train_info/time_between_train_steps": 0.003161907196044922, "step": 2658} +{"info/global_step": 2659, "train_info/time_within_train_step": 2.286715269088745, "step": 2659} +{"train_info/time_between_train_steps": 0.003450155258178711, "step": 2659} +{"info/global_step": 2660, "train_info/time_within_train_step": 2.2955172061920166, "step": 2660} +{"train_info/time_between_train_steps": 0.0031232833862304688, "step": 2660} +{"info/global_step": 2661, "train_info/time_within_train_step": 2.2865943908691406, "step": 2661} +{"train_info/time_between_train_steps": 0.0031137466430664062, "step": 2661} +{"info/global_step": 2662, "train_info/time_within_train_step": 2.2860896587371826, "step": 2662} +{"train_info/time_between_train_steps": 0.003106355667114258, "step": 2662} +{"info/global_step": 2663, "train_info/time_within_train_step": 2.2872889041900635, "step": 2663} +{"train_info/time_between_train_steps": 0.003370523452758789, "step": 2663} +{"info/global_step": 2664, "train_info/time_within_train_step": 2.2895214557647705, "step": 2664} +{"train_info/time_between_train_steps": 0.0032193660736083984, "step": 2664} +{"info/global_step": 2665, "train_info/time_within_train_step": 2.288749933242798, "step": 2665} +{"train_info/time_between_train_steps": 0.0032317638397216797, "step": 2665} +{"info/global_step": 2666, "train_info/time_within_train_step": 2.2919704914093018, "step": 2666} +{"train_info/time_between_train_steps": 0.0031778812408447266, "step": 2666} +{"info/global_step": 2667, "train_info/time_within_train_step": 2.287534713745117, "step": 2667} +{"train_info/time_between_train_steps": 0.0031235218048095703, "step": 2667} +{"info/global_step": 2668, "train_info/time_within_train_step": 2.287172317504883, "step": 2668} +{"train_info/time_between_train_steps": 0.0031669139862060547, "step": 2668} +{"info/global_step": 2669, "train_info/time_within_train_step": 2.287607431411743, "step": 2669} +{"train_info/time_between_train_steps": 0.0031266212463378906, "step": 2669} +{"info/global_step": 2670, "train_info/time_within_train_step": 2.2874577045440674, "step": 2670} +{"train_info/time_between_train_steps": 0.003129243850708008, "step": 2670} +{"info/global_step": 2671, "train_info/time_within_train_step": 2.287466526031494, "step": 2671} +{"train_info/time_between_train_steps": 0.003103971481323242, "step": 2671} +{"info/global_step": 2672, "train_info/time_within_train_step": 2.2863967418670654, "step": 2672} +{"train_info/time_between_train_steps": 0.003108978271484375, "step": 2672} +{"info/global_step": 2673, "train_info/time_within_train_step": 2.286158561706543, "step": 2673} +{"train_info/time_between_train_steps": 0.003143787384033203, "step": 2673} +{"info/global_step": 2674, "train_info/time_within_train_step": 2.2864041328430176, "step": 2674} +{"train_info/time_between_train_steps": 0.0031838417053222656, "step": 2674} +{"info/global_step": 2675, "train_info/time_within_train_step": 2.2865920066833496, "step": 2675} +{"train_info/time_between_train_steps": 0.003176450729370117, "step": 2675} +{"info/global_step": 2676, "train_info/time_within_train_step": 2.286715507507324, "step": 2676} +{"train_info/time_between_train_steps": 0.003129720687866211, "step": 2676} +{"info/global_step": 2677, "train_info/time_within_train_step": 2.286574602127075, "step": 2677} +{"train_info/time_between_train_steps": 0.003149271011352539, "step": 2677} +{"info/global_step": 2678, "train_info/time_within_train_step": 2.3734776973724365, "step": 2678} +{"train_info/time_between_train_steps": 0.003129720687866211, "step": 2678} +{"info/global_step": 2679, "train_info/time_within_train_step": 2.286266565322876, "step": 2679} +{"train_info/time_between_train_steps": 0.0031158924102783203, "step": 2679} +{"info/global_step": 2680, "train_info/time_within_train_step": 2.2883079051971436, "step": 2680} +{"train_info/time_between_train_steps": 0.0031328201293945312, "step": 2680} +{"info/global_step": 2681, "train_info/time_within_train_step": 2.2880117893218994, "step": 2681} +{"train_info/time_between_train_steps": 0.003132343292236328, "step": 2681} +{"info/global_step": 2682, "train_info/time_within_train_step": 2.286377429962158, "step": 2682} +{"train_info/time_between_train_steps": 0.003145456314086914, "step": 2682} +{"info/global_step": 2683, "train_info/time_within_train_step": 2.2862937450408936, "step": 2683} +{"train_info/time_between_train_steps": 0.0031409263610839844, "step": 2683} +{"info/global_step": 2684, "train_info/time_within_train_step": 2.286531925201416, "step": 2684} +{"train_info/time_between_train_steps": 0.12539243698120117, "step": 2684} +{"info/global_step": 2685, "train_info/time_within_train_step": 2.2875239849090576, "step": 2685} +{"train_info/time_between_train_steps": 0.003146648406982422, "step": 2685} +{"info/global_step": 2686, "train_info/time_within_train_step": 2.286512851715088, "step": 2686} +{"train_info/time_between_train_steps": 0.0031461715698242188, "step": 2686} +{"info/global_step": 2687, "train_info/time_within_train_step": 2.2867472171783447, "step": 2687} +{"train_info/time_between_train_steps": 0.003103971481323242, "step": 2687} +{"info/global_step": 2688, "train_info/time_within_train_step": 2.286846160888672, "step": 2688} +{"train_info/time_between_train_steps": 0.003140687942504883, "step": 2688} +{"info/global_step": 2689, "train_info/time_within_train_step": 2.2870991230010986, "step": 2689} +{"train_info/time_between_train_steps": 0.0031554698944091797, "step": 2689} +{"info/global_step": 2690, "train_info/time_within_train_step": 2.2866899967193604, "step": 2690} +{"train_info/time_between_train_steps": 0.0031583309173583984, "step": 2690} +{"info/global_step": 2691, "train_info/time_within_train_step": 2.2872610092163086, "step": 2691} +{"train_info/time_between_train_steps": 0.0031728744506835938, "step": 2691} +{"info/global_step": 2692, "train_info/time_within_train_step": 2.2913084030151367, "step": 2692} +{"train_info/time_between_train_steps": 0.0031270980834960938, "step": 2692} +{"info/global_step": 2693, "train_info/time_within_train_step": 2.2871267795562744, "step": 2693} +{"train_info/time_between_train_steps": 0.0031213760375976562, "step": 2693} +{"info/global_step": 2694, "train_info/time_within_train_step": 2.2875518798828125, "step": 2694} +{"train_info/time_between_train_steps": 0.0032024383544921875, "step": 2694} +{"info/global_step": 2695, "train_info/time_within_train_step": 2.28817081451416, "step": 2695} +{"train_info/time_between_train_steps": 0.003251791000366211, "step": 2695} +{"info/global_step": 2696, "train_info/time_within_train_step": 2.288433313369751, "step": 2696} +{"train_info/time_between_train_steps": 0.0034241676330566406, "step": 2696} +{"info/global_step": 2697, "train_info/time_within_train_step": 2.2898504734039307, "step": 2697} +{"train_info/time_between_train_steps": 0.003233194351196289, "step": 2697} +{"info/global_step": 2698, "train_info/time_within_train_step": 2.287672281265259, "step": 2698} +{"train_info/time_between_train_steps": 0.003161907196044922, "step": 2698} +{"info/global_step": 2699, "train_info/time_within_train_step": 2.2877063751220703, "step": 2699} +{"train_info/time_between_train_steps": 0.0031867027282714844, "step": 2699} +{"info/global_step": 2700, "train_info/time_within_train_step": 2.2867424488067627, "step": 2700} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746350546, "_runtime": 6643}, "step": 2700} +{"logs": {"train/loss": 3.3069, "train/learning_rate": 6.666666666666666e-05, "train/epoch": 2.17, "_timestamp": 1746350546, "_runtime": 6643}, "step": 2700} +{"train_info/time_between_train_steps": 16.35616183280945, "step": 2700} +{"info/global_step": 2701, "train_info/time_within_train_step": 2.1139883995056152, "step": 2701} +{"train_info/time_between_train_steps": 0.0031883716583251953, "step": 2701} +{"info/global_step": 2702, "train_info/time_within_train_step": 2.096583366394043, "step": 2702} +{"train_info/time_between_train_steps": 0.003161191940307617, "step": 2702} +{"info/global_step": 2703, "train_info/time_within_train_step": 2.150338888168335, "step": 2703} +{"train_info/time_between_train_steps": 0.0031366348266601562, "step": 2703} +{"info/global_step": 2704, "train_info/time_within_train_step": 2.5395524501800537, "step": 2704} +{"train_info/time_between_train_steps": 0.0032253265380859375, "step": 2704} +{"info/global_step": 2705, "train_info/time_within_train_step": 2.2862703800201416, "step": 2705} +{"train_info/time_between_train_steps": 0.003187894821166992, "step": 2705} +{"info/global_step": 2706, "train_info/time_within_train_step": 2.2870023250579834, "step": 2706} +{"train_info/time_between_train_steps": 0.0031981468200683594, "step": 2706} +{"info/global_step": 2707, "train_info/time_within_train_step": 2.2867095470428467, "step": 2707} +{"train_info/time_between_train_steps": 0.003177642822265625, "step": 2707} +{"info/global_step": 2708, "train_info/time_within_train_step": 2.286740303039551, "step": 2708} +{"train_info/time_between_train_steps": 0.0032732486724853516, "step": 2708} +{"info/global_step": 2709, "train_info/time_within_train_step": 2.2869036197662354, "step": 2709} +{"train_info/time_between_train_steps": 0.0031561851501464844, "step": 2709} +{"info/global_step": 2710, "train_info/time_within_train_step": 2.2864089012145996, "step": 2710} +{"train_info/time_between_train_steps": 0.003137350082397461, "step": 2710} +{"info/global_step": 2711, "train_info/time_within_train_step": 2.291783094406128, "step": 2711} +{"train_info/time_between_train_steps": 0.0031592845916748047, "step": 2711} +{"info/global_step": 2712, "train_info/time_within_train_step": 2.287290573120117, "step": 2712} +{"train_info/time_between_train_steps": 0.0031745433807373047, "step": 2712} +{"info/global_step": 2713, "train_info/time_within_train_step": 2.2867815494537354, "step": 2713} +{"train_info/time_between_train_steps": 0.003130197525024414, "step": 2713} +{"info/global_step": 2714, "train_info/time_within_train_step": 2.2868735790252686, "step": 2714} +{"train_info/time_between_train_steps": 0.0031747817993164062, "step": 2714} +{"info/global_step": 2715, "train_info/time_within_train_step": 2.287132501602173, "step": 2715} +{"train_info/time_between_train_steps": 0.0031752586364746094, "step": 2715} +{"info/global_step": 2716, "train_info/time_within_train_step": 2.2872138023376465, "step": 2716} +{"train_info/time_between_train_steps": 0.003156423568725586, "step": 2716} +{"info/global_step": 2717, "train_info/time_within_train_step": 2.287379741668701, "step": 2717} +{"train_info/time_between_train_steps": 0.003142833709716797, "step": 2717} +{"info/global_step": 2718, "train_info/time_within_train_step": 2.287482738494873, "step": 2718} +{"train_info/time_between_train_steps": 0.0031578540802001953, "step": 2718} +{"info/global_step": 2719, "train_info/time_within_train_step": 2.2876672744750977, "step": 2719} +{"train_info/time_between_train_steps": 0.0031375885009765625, "step": 2719} +{"info/global_step": 2720, "train_info/time_within_train_step": 2.2875239849090576, "step": 2720} +{"train_info/time_between_train_steps": 0.0031061172485351562, "step": 2720} +{"info/global_step": 2721, "train_info/time_within_train_step": 2.2875094413757324, "step": 2721} +{"train_info/time_between_train_steps": 0.003174304962158203, "step": 2721} +{"info/global_step": 2722, "train_info/time_within_train_step": 2.2871007919311523, "step": 2722} +{"train_info/time_between_train_steps": 0.003139495849609375, "step": 2722} +{"info/global_step": 2723, "train_info/time_within_train_step": 2.2885820865631104, "step": 2723} +{"train_info/time_between_train_steps": 0.0031731128692626953, "step": 2723} +{"info/global_step": 2724, "train_info/time_within_train_step": 2.2876808643341064, "step": 2724} +{"train_info/time_between_train_steps": 0.0031859874725341797, "step": 2724} +{"info/global_step": 2725, "train_info/time_within_train_step": 2.287083148956299, "step": 2725} +{"train_info/time_between_train_steps": 0.003155231475830078, "step": 2725} +{"info/global_step": 2726, "train_info/time_within_train_step": 2.2876694202423096, "step": 2726} +{"train_info/time_between_train_steps": 0.003135204315185547, "step": 2726} +{"info/global_step": 2727, "train_info/time_within_train_step": 2.2869725227355957, "step": 2727} +{"train_info/time_between_train_steps": 0.0031251907348632812, "step": 2727} +{"info/global_step": 2728, "train_info/time_within_train_step": 2.2879557609558105, "step": 2728} +{"train_info/time_between_train_steps": 0.0031740665435791016, "step": 2728} +{"info/global_step": 2729, "train_info/time_within_train_step": 2.2875587940216064, "step": 2729} +{"train_info/time_between_train_steps": 0.003124713897705078, "step": 2729} +{"info/global_step": 2730, "train_info/time_within_train_step": 2.2875354290008545, "step": 2730} +{"train_info/time_between_train_steps": 0.003142118453979492, "step": 2730} +{"info/global_step": 2731, "train_info/time_within_train_step": 2.287177324295044, "step": 2731} +{"train_info/time_between_train_steps": 0.0031824111938476562, "step": 2731} +{"info/global_step": 2732, "train_info/time_within_train_step": 2.2873945236206055, "step": 2732} +{"train_info/time_between_train_steps": 0.0031800270080566406, "step": 2732} +{"info/global_step": 2733, "train_info/time_within_train_step": 2.287651538848877, "step": 2733} +{"train_info/time_between_train_steps": 0.003154277801513672, "step": 2733} +{"info/global_step": 2734, "train_info/time_within_train_step": 2.286851644515991, "step": 2734} +{"train_info/time_between_train_steps": 0.0031938552856445312, "step": 2734} +{"info/global_step": 2735, "train_info/time_within_train_step": 2.2874107360839844, "step": 2735} +{"train_info/time_between_train_steps": 0.003141164779663086, "step": 2735} +{"info/global_step": 2736, "train_info/time_within_train_step": 2.2877719402313232, "step": 2736} +{"train_info/time_between_train_steps": 0.0031692981719970703, "step": 2736} +{"info/global_step": 2737, "train_info/time_within_train_step": 2.2915215492248535, "step": 2737} +{"train_info/time_between_train_steps": 0.0031473636627197266, "step": 2737} +{"info/global_step": 2738, "train_info/time_within_train_step": 2.288208484649658, "step": 2738} +{"train_info/time_between_train_steps": 0.003143787384033203, "step": 2738} +{"info/global_step": 2739, "train_info/time_within_train_step": 2.2874948978424072, "step": 2739} +{"train_info/time_between_train_steps": 0.0031523704528808594, "step": 2739} +{"info/global_step": 2740, "train_info/time_within_train_step": 2.2875092029571533, "step": 2740} +{"train_info/time_between_train_steps": 0.0032241344451904297, "step": 2740} +{"info/global_step": 2741, "train_info/time_within_train_step": 2.2871952056884766, "step": 2741} +{"train_info/time_between_train_steps": 0.0031948089599609375, "step": 2741} +{"info/global_step": 2742, "train_info/time_within_train_step": 2.287393093109131, "step": 2742} +{"train_info/time_between_train_steps": 0.0031447410583496094, "step": 2742} +{"info/global_step": 2743, "train_info/time_within_train_step": 2.287210464477539, "step": 2743} +{"train_info/time_between_train_steps": 0.003145933151245117, "step": 2743} +{"info/global_step": 2744, "train_info/time_within_train_step": 2.287106513977051, "step": 2744} +{"train_info/time_between_train_steps": 0.0031638145446777344, "step": 2744} +{"info/global_step": 2745, "train_info/time_within_train_step": 2.287252187728882, "step": 2745} +{"train_info/time_between_train_steps": 0.0031576156616210938, "step": 2745} +{"info/global_step": 2746, "train_info/time_within_train_step": 2.287186622619629, "step": 2746} +{"train_info/time_between_train_steps": 0.0031349658966064453, "step": 2746} +{"info/global_step": 2747, "train_info/time_within_train_step": 2.4108762741088867, "step": 2747} +{"train_info/time_between_train_steps": 0.0032143592834472656, "step": 2747} +{"info/global_step": 2748, "train_info/time_within_train_step": 2.287261724472046, "step": 2748} +{"train_info/time_between_train_steps": 0.0031669139862060547, "step": 2748} +{"info/global_step": 2749, "train_info/time_within_train_step": 2.286983013153076, "step": 2749} +{"train_info/time_between_train_steps": 0.0031681060791015625, "step": 2749} +{"info/global_step": 2750, "train_info/time_within_train_step": 2.6594364643096924, "step": 2750} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746350678, "_runtime": 6775}, "step": 2750} +{"logs": {"train/loss": 3.2964, "train/learning_rate": 5.5555555555555545e-05, "train/epoch": 2.19, "_timestamp": 1746350678, "_runtime": 6775}, "step": 2750} +{"train_info/time_between_train_steps": 0.023748159408569336, "step": 2750} +{"info/global_step": 2751, "train_info/time_within_train_step": 2.2858216762542725, "step": 2751} +{"train_info/time_between_train_steps": 0.0031452178955078125, "step": 2751} +{"info/global_step": 2752, "train_info/time_within_train_step": 2.3738245964050293, "step": 2752} +{"train_info/time_between_train_steps": 0.0031273365020751953, "step": 2752} +{"info/global_step": 2753, "train_info/time_within_train_step": 2.2863821983337402, "step": 2753} +{"train_info/time_between_train_steps": 0.003248453140258789, "step": 2753} +{"info/global_step": 2754, "train_info/time_within_train_step": 2.286227226257324, "step": 2754} +{"train_info/time_between_train_steps": 0.0031697750091552734, "step": 2754} +{"info/global_step": 2755, "train_info/time_within_train_step": 2.2870099544525146, "step": 2755} +{"train_info/time_between_train_steps": 0.0031659603118896484, "step": 2755} +{"info/global_step": 2756, "train_info/time_within_train_step": 2.2863197326660156, "step": 2756} +{"train_info/time_between_train_steps": 0.003151416778564453, "step": 2756} +{"info/global_step": 2757, "train_info/time_within_train_step": 2.286769390106201, "step": 2757} +{"train_info/time_between_train_steps": 0.003153562545776367, "step": 2757} +{"info/global_step": 2758, "train_info/time_within_train_step": 2.28654146194458, "step": 2758} +{"train_info/time_between_train_steps": 0.0031347274780273438, "step": 2758} +{"info/global_step": 2759, "train_info/time_within_train_step": 2.286550283432007, "step": 2759} +{"train_info/time_between_train_steps": 0.0031576156616210938, "step": 2759} +{"info/global_step": 2760, "train_info/time_within_train_step": 2.2867422103881836, "step": 2760} +{"train_info/time_between_train_steps": 0.0031206607818603516, "step": 2760} +{"info/global_step": 2761, "train_info/time_within_train_step": 2.2857584953308105, "step": 2761} +{"train_info/time_between_train_steps": 0.003172159194946289, "step": 2761} +{"info/global_step": 2762, "train_info/time_within_train_step": 2.287368059158325, "step": 2762} +{"train_info/time_between_train_steps": 0.007164955139160156, "step": 2762} +{"info/global_step": 2763, "train_info/time_within_train_step": 2.287315845489502, "step": 2763} +{"train_info/time_between_train_steps": 0.006658077239990234, "step": 2763} +{"info/global_step": 2764, "train_info/time_within_train_step": 2.286945104598999, "step": 2764} +{"train_info/time_between_train_steps": 0.006488323211669922, "step": 2764} +{"info/global_step": 2765, "train_info/time_within_train_step": 2.2866876125335693, "step": 2765} +{"train_info/time_between_train_steps": 0.006502866744995117, "step": 2765} +{"info/global_step": 2766, "train_info/time_within_train_step": 2.2869293689727783, "step": 2766} +{"train_info/time_between_train_steps": 0.0064852237701416016, "step": 2766} +{"info/global_step": 2767, "train_info/time_within_train_step": 2.287400722503662, "step": 2767} +{"train_info/time_between_train_steps": 0.006561279296875, "step": 2767} +{"info/global_step": 2768, "train_info/time_within_train_step": 2.28768253326416, "step": 2768} +{"train_info/time_between_train_steps": 0.0064394474029541016, "step": 2768} +{"info/global_step": 2769, "train_info/time_within_train_step": 2.286592721939087, "step": 2769} +{"train_info/time_between_train_steps": 0.006534099578857422, "step": 2769} +{"info/global_step": 2770, "train_info/time_within_train_step": 2.2870914936065674, "step": 2770} +{"train_info/time_between_train_steps": 0.006522655487060547, "step": 2770} +{"info/global_step": 2771, "train_info/time_within_train_step": 2.2875654697418213, "step": 2771} +{"train_info/time_between_train_steps": 0.0032079219818115234, "step": 2771} +{"info/global_step": 2772, "train_info/time_within_train_step": 2.287050247192383, "step": 2772} +{"train_info/time_between_train_steps": 0.0032396316528320312, "step": 2772} +{"info/global_step": 2773, "train_info/time_within_train_step": 2.287121534347534, "step": 2773} +{"train_info/time_between_train_steps": 0.0032052993774414062, "step": 2773} +{"info/global_step": 2774, "train_info/time_within_train_step": 2.287043333053589, "step": 2774} +{"train_info/time_between_train_steps": 0.00319671630859375, "step": 2774} +{"info/global_step": 2775, "train_info/time_within_train_step": 2.287560224533081, "step": 2775} +{"train_info/time_between_train_steps": 0.0031881332397460938, "step": 2775} +{"info/global_step": 2776, "train_info/time_within_train_step": 2.2868196964263916, "step": 2776} +{"train_info/time_between_train_steps": 0.0031347274780273438, "step": 2776} +{"info/global_step": 2777, "train_info/time_within_train_step": 2.2874808311462402, "step": 2777} +{"train_info/time_between_train_steps": 0.0031981468200683594, "step": 2777} +{"info/global_step": 2778, "train_info/time_within_train_step": 2.373908281326294, "step": 2778} +{"train_info/time_between_train_steps": 0.0031671524047851562, "step": 2778} +{"info/global_step": 2779, "train_info/time_within_train_step": 2.2874066829681396, "step": 2779} +{"train_info/time_between_train_steps": 0.003159761428833008, "step": 2779} +{"info/global_step": 2780, "train_info/time_within_train_step": 2.2868781089782715, "step": 2780} +{"train_info/time_between_train_steps": 0.003147602081298828, "step": 2780} +{"info/global_step": 2781, "train_info/time_within_train_step": 2.287550926208496, "step": 2781} +{"train_info/time_between_train_steps": 0.003185272216796875, "step": 2781} +{"info/global_step": 2782, "train_info/time_within_train_step": 2.2867612838745117, "step": 2782} +{"train_info/time_between_train_steps": 0.003180980682373047, "step": 2782} +{"info/global_step": 2783, "train_info/time_within_train_step": 2.2863855361938477, "step": 2783} +{"train_info/time_between_train_steps": 0.0031461715698242188, "step": 2783} +{"info/global_step": 2784, "train_info/time_within_train_step": 2.286602735519409, "step": 2784} +{"train_info/time_between_train_steps": 0.003131866455078125, "step": 2784} +{"info/global_step": 2785, "train_info/time_within_train_step": 2.2865593433380127, "step": 2785} +{"train_info/time_between_train_steps": 0.0031685829162597656, "step": 2785} +{"info/global_step": 2786, "train_info/time_within_train_step": 2.287330150604248, "step": 2786} +{"train_info/time_between_train_steps": 0.003200054168701172, "step": 2786} +{"info/global_step": 2787, "train_info/time_within_train_step": 2.2865219116210938, "step": 2787} +{"train_info/time_between_train_steps": 0.003150463104248047, "step": 2787} +{"info/global_step": 2788, "train_info/time_within_train_step": 2.2864742279052734, "step": 2788} +{"train_info/time_between_train_steps": 0.003175497055053711, "step": 2788} +{"info/global_step": 2789, "train_info/time_within_train_step": 2.2864017486572266, "step": 2789} +{"train_info/time_between_train_steps": 0.003135204315185547, "step": 2789} +{"info/global_step": 2790, "train_info/time_within_train_step": 2.286632776260376, "step": 2790} +{"train_info/time_between_train_steps": 0.003151416778564453, "step": 2790} +{"info/global_step": 2791, "train_info/time_within_train_step": 2.5426619052886963, "step": 2791} +{"train_info/time_between_train_steps": 0.003178834915161133, "step": 2791} +{"info/global_step": 2792, "train_info/time_within_train_step": 2.286167621612549, "step": 2792} +{"train_info/time_between_train_steps": 0.003195524215698242, "step": 2792} +{"info/global_step": 2793, "train_info/time_within_train_step": 2.2861411571502686, "step": 2793} +{"train_info/time_between_train_steps": 0.003162384033203125, "step": 2793} +{"info/global_step": 2794, "train_info/time_within_train_step": 2.2866737842559814, "step": 2794} +{"train_info/time_between_train_steps": 0.0032088756561279297, "step": 2794} +{"info/global_step": 2795, "train_info/time_within_train_step": 2.286076784133911, "step": 2795} +{"train_info/time_between_train_steps": 0.0031585693359375, "step": 2795} +{"info/global_step": 2796, "train_info/time_within_train_step": 2.2860183715820312, "step": 2796} +{"train_info/time_between_train_steps": 0.0031321048736572266, "step": 2796} +{"info/global_step": 2797, "train_info/time_within_train_step": 2.2859957218170166, "step": 2797} +{"train_info/time_between_train_steps": 0.0031278133392333984, "step": 2797} +{"info/global_step": 2798, "train_info/time_within_train_step": 2.2863311767578125, "step": 2798} +{"train_info/time_between_train_steps": 0.0031638145446777344, "step": 2798} +{"info/global_step": 2799, "train_info/time_within_train_step": 2.286931276321411, "step": 2799} +{"train_info/time_between_train_steps": 0.0032105445861816406, "step": 2799} +{"info/global_step": 2800, "train_info/time_within_train_step": 2.286961793899536, "step": 2800} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746350794, "_runtime": 6891}, "step": 2800} +{"logs": {"train/loss": 3.274, "train/learning_rate": 4.444444444444444e-05, "train/epoch": 2.21, "_timestamp": 1746350794, "_runtime": 6891}, "step": 2800} +{"train_info/time_between_train_steps": 16.24183440208435, "step": 2800} +{"info/global_step": 2801, "train_info/time_within_train_step": 2.119265079498291, "step": 2801} +{"train_info/time_between_train_steps": 0.0032186508178710938, "step": 2801} +{"info/global_step": 2802, "train_info/time_within_train_step": 2.0951409339904785, "step": 2802} +{"train_info/time_between_train_steps": 0.0032112598419189453, "step": 2802} +{"info/global_step": 2803, "train_info/time_within_train_step": 2.1264610290527344, "step": 2803} +{"train_info/time_between_train_steps": 0.003233671188354492, "step": 2803} +{"info/global_step": 2804, "train_info/time_within_train_step": 2.2807230949401855, "step": 2804} +{"train_info/time_between_train_steps": 0.0033779144287109375, "step": 2804} +{"info/global_step": 2805, "train_info/time_within_train_step": 2.285918951034546, "step": 2805} +{"train_info/time_between_train_steps": 0.0033779144287109375, "step": 2805} +{"info/global_step": 2806, "train_info/time_within_train_step": 2.2867767810821533, "step": 2806} +{"train_info/time_between_train_steps": 0.003401517868041992, "step": 2806} +{"info/global_step": 2807, "train_info/time_within_train_step": 2.2872262001037598, "step": 2807} +{"train_info/time_between_train_steps": 0.003357410430908203, "step": 2807} +{"info/global_step": 2808, "train_info/time_within_train_step": 2.2919485569000244, "step": 2808} +{"train_info/time_between_train_steps": 0.003370523452758789, "step": 2808} +{"info/global_step": 2809, "train_info/time_within_train_step": 2.2873730659484863, "step": 2809} +{"train_info/time_between_train_steps": 0.15690279006958008, "step": 2809} +{"info/global_step": 2810, "train_info/time_within_train_step": 2.28867244720459, "step": 2810} +{"train_info/time_between_train_steps": 0.00323486328125, "step": 2810} +{"info/global_step": 2811, "train_info/time_within_train_step": 2.2874457836151123, "step": 2811} +{"train_info/time_between_train_steps": 0.003237485885620117, "step": 2811} +{"info/global_step": 2812, "train_info/time_within_train_step": 2.2871787548065186, "step": 2812} +{"train_info/time_between_train_steps": 0.003246307373046875, "step": 2812} +{"info/global_step": 2813, "train_info/time_within_train_step": 2.2873575687408447, "step": 2813} +{"train_info/time_between_train_steps": 0.003222227096557617, "step": 2813} +{"info/global_step": 2814, "train_info/time_within_train_step": 2.287606716156006, "step": 2814} +{"train_info/time_between_train_steps": 0.003244161605834961, "step": 2814} +{"info/global_step": 2815, "train_info/time_within_train_step": 2.2870426177978516, "step": 2815} +{"train_info/time_between_train_steps": 0.003232240676879883, "step": 2815} +{"info/global_step": 2816, "train_info/time_within_train_step": 2.286921977996826, "step": 2816} +{"train_info/time_between_train_steps": 0.003192901611328125, "step": 2816} +{"info/global_step": 2817, "train_info/time_within_train_step": 2.286616802215576, "step": 2817} +{"train_info/time_between_train_steps": 0.0031714439392089844, "step": 2817} +{"info/global_step": 2818, "train_info/time_within_train_step": 2.286841869354248, "step": 2818} +{"train_info/time_between_train_steps": 0.0033235549926757812, "step": 2818} +{"info/global_step": 2819, "train_info/time_within_train_step": 2.287289619445801, "step": 2819} +{"train_info/time_between_train_steps": 0.003202676773071289, "step": 2819} +{"info/global_step": 2820, "train_info/time_within_train_step": 2.287219285964966, "step": 2820} +{"train_info/time_between_train_steps": 0.0032236576080322266, "step": 2820} +{"info/global_step": 2821, "train_info/time_within_train_step": 2.2878551483154297, "step": 2821} +{"train_info/time_between_train_steps": 0.0032434463500976562, "step": 2821} +{"info/global_step": 2822, "train_info/time_within_train_step": 2.2876667976379395, "step": 2822} +{"train_info/time_between_train_steps": 0.0032515525817871094, "step": 2822} +{"info/global_step": 2823, "train_info/time_within_train_step": 2.287999153137207, "step": 2823} +{"train_info/time_between_train_steps": 0.003235340118408203, "step": 2823} +{"info/global_step": 2824, "train_info/time_within_train_step": 2.2876999378204346, "step": 2824} +{"train_info/time_between_train_steps": 0.0032138824462890625, "step": 2824} +{"info/global_step": 2825, "train_info/time_within_train_step": 2.287485122680664, "step": 2825} +{"train_info/time_between_train_steps": 0.003203153610229492, "step": 2825} +{"info/global_step": 2826, "train_info/time_within_train_step": 2.287367820739746, "step": 2826} +{"train_info/time_between_train_steps": 0.0031986236572265625, "step": 2826} +{"info/global_step": 2827, "train_info/time_within_train_step": 2.2882938385009766, "step": 2827} +{"train_info/time_between_train_steps": 0.0033288002014160156, "step": 2827} +{"info/global_step": 2828, "train_info/time_within_train_step": 2.2884318828582764, "step": 2828} +{"train_info/time_between_train_steps": 0.003266572952270508, "step": 2828} +{"info/global_step": 2829, "train_info/time_within_train_step": 2.287827730178833, "step": 2829} +{"train_info/time_between_train_steps": 0.0032262802124023438, "step": 2829} +{"info/global_step": 2830, "train_info/time_within_train_step": 2.287916898727417, "step": 2830} +{"train_info/time_between_train_steps": 0.0032150745391845703, "step": 2830} +{"info/global_step": 2831, "train_info/time_within_train_step": 2.2875680923461914, "step": 2831} +{"train_info/time_between_train_steps": 0.003239154815673828, "step": 2831} +{"info/global_step": 2832, "train_info/time_within_train_step": 2.288149118423462, "step": 2832} +{"train_info/time_between_train_steps": 0.003249645233154297, "step": 2832} +{"info/global_step": 2833, "train_info/time_within_train_step": 2.5635311603546143, "step": 2833} +{"train_info/time_between_train_steps": 0.0031654834747314453, "step": 2833} +{"info/global_step": 2834, "train_info/time_within_train_step": 2.2882628440856934, "step": 2834} +{"train_info/time_between_train_steps": 0.0031747817993164062, "step": 2834} +{"info/global_step": 2835, "train_info/time_within_train_step": 2.2867870330810547, "step": 2835} +{"train_info/time_between_train_steps": 0.0031855106353759766, "step": 2835} +{"info/global_step": 2836, "train_info/time_within_train_step": 2.2926828861236572, "step": 2836} +{"train_info/time_between_train_steps": 0.0032176971435546875, "step": 2836} +{"info/global_step": 2837, "train_info/time_within_train_step": 2.287125825881958, "step": 2837} +{"train_info/time_between_train_steps": 0.003143787384033203, "step": 2837} +{"info/global_step": 2838, "train_info/time_within_train_step": 2.2874298095703125, "step": 2838} +{"train_info/time_between_train_steps": 0.003192901611328125, "step": 2838} +{"info/global_step": 2839, "train_info/time_within_train_step": 2.28752064704895, "step": 2839} +{"train_info/time_between_train_steps": 0.0031452178955078125, "step": 2839} +{"info/global_step": 2840, "train_info/time_within_train_step": 2.2869391441345215, "step": 2840} +{"train_info/time_between_train_steps": 0.003169536590576172, "step": 2840} +{"info/global_step": 2841, "train_info/time_within_train_step": 2.2878196239471436, "step": 2841} +{"train_info/time_between_train_steps": 0.003164052963256836, "step": 2841} +{"info/global_step": 2842, "train_info/time_within_train_step": 2.287644147872925, "step": 2842} +{"train_info/time_between_train_steps": 0.003197908401489258, "step": 2842} +{"info/global_step": 2843, "train_info/time_within_train_step": 2.286726713180542, "step": 2843} +{"train_info/time_between_train_steps": 0.0031909942626953125, "step": 2843} +{"info/global_step": 2844, "train_info/time_within_train_step": 2.2865076065063477, "step": 2844} +{"train_info/time_between_train_steps": 0.0031745433807373047, "step": 2844} +{"info/global_step": 2845, "train_info/time_within_train_step": 2.2879161834716797, "step": 2845} +{"train_info/time_between_train_steps": 0.0032024383544921875, "step": 2845} +{"info/global_step": 2846, "train_info/time_within_train_step": 2.2873785495758057, "step": 2846} +{"train_info/time_between_train_steps": 0.0031592845916748047, "step": 2846} +{"info/global_step": 2847, "train_info/time_within_train_step": 2.286733865737915, "step": 2847} +{"train_info/time_between_train_steps": 0.003102540969848633, "step": 2847} +{"info/global_step": 2848, "train_info/time_within_train_step": 2.2867050170898438, "step": 2848} +{"train_info/time_between_train_steps": 0.0031304359436035156, "step": 2848} +{"info/global_step": 2849, "train_info/time_within_train_step": 2.2874374389648438, "step": 2849} +{"train_info/time_between_train_steps": 0.0032160282135009766, "step": 2849} +{"info/global_step": 2850, "train_info/time_within_train_step": 2.287264585494995, "step": 2850} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746350925, "_runtime": 7022}, "step": 2850} +{"logs": {"train/loss": 3.2683, "train/learning_rate": 3.333333333333333e-05, "train/epoch": 2.22, "_timestamp": 1746350925, "_runtime": 7022}, "step": 2850} +{"train_info/time_between_train_steps": 0.024062156677246094, "step": 2850} +{"info/global_step": 2851, "train_info/time_within_train_step": 2.2872750759124756, "step": 2851} +{"train_info/time_between_train_steps": 0.0031414031982421875, "step": 2851} +{"info/global_step": 2852, "train_info/time_within_train_step": 2.3740007877349854, "step": 2852} +{"train_info/time_between_train_steps": 0.0031561851501464844, "step": 2852} +{"info/global_step": 2853, "train_info/time_within_train_step": 2.2868988513946533, "step": 2853} +{"train_info/time_between_train_steps": 0.0031316280364990234, "step": 2853} +{"info/global_step": 2854, "train_info/time_within_train_step": 2.2868947982788086, "step": 2854} +{"train_info/time_between_train_steps": 0.0030989646911621094, "step": 2854} +{"info/global_step": 2855, "train_info/time_within_train_step": 2.2870213985443115, "step": 2855} +{"train_info/time_between_train_steps": 0.0031249523162841797, "step": 2855} +{"info/global_step": 2856, "train_info/time_within_train_step": 2.286407470703125, "step": 2856} +{"train_info/time_between_train_steps": 0.0031228065490722656, "step": 2856} +{"info/global_step": 2857, "train_info/time_within_train_step": 2.2864320278167725, "step": 2857} +{"train_info/time_between_train_steps": 0.003106832504272461, "step": 2857} +{"info/global_step": 2858, "train_info/time_within_train_step": 2.287287950515747, "step": 2858} +{"train_info/time_between_train_steps": 0.0031583309173583984, "step": 2858} +{"info/global_step": 2859, "train_info/time_within_train_step": 2.285951614379883, "step": 2859} +{"train_info/time_between_train_steps": 0.0031938552856445312, "step": 2859} +{"info/global_step": 2860, "train_info/time_within_train_step": 2.286252021789551, "step": 2860} +{"train_info/time_between_train_steps": 0.003190755844116211, "step": 2860} +{"info/global_step": 2861, "train_info/time_within_train_step": 2.2862966060638428, "step": 2861} +{"train_info/time_between_train_steps": 0.003141164779663086, "step": 2861} +{"info/global_step": 2862, "train_info/time_within_train_step": 2.2859368324279785, "step": 2862} +{"train_info/time_between_train_steps": 0.003147125244140625, "step": 2862} +{"info/global_step": 2863, "train_info/time_within_train_step": 2.286477565765381, "step": 2863} +{"train_info/time_between_train_steps": 0.0031423568725585938, "step": 2863} +{"info/global_step": 2864, "train_info/time_within_train_step": 2.2855753898620605, "step": 2864} +{"train_info/time_between_train_steps": 0.003137826919555664, "step": 2864} +{"info/global_step": 2865, "train_info/time_within_train_step": 2.286015510559082, "step": 2865} +{"train_info/time_between_train_steps": 0.0031409263610839844, "step": 2865} +{"info/global_step": 2866, "train_info/time_within_train_step": 2.285571575164795, "step": 2866} +{"train_info/time_between_train_steps": 0.0032193660736083984, "step": 2866} +{"info/global_step": 2867, "train_info/time_within_train_step": 2.2869880199432373, "step": 2867} +{"train_info/time_between_train_steps": 0.003185749053955078, "step": 2867} +{"info/global_step": 2868, "train_info/time_within_train_step": 2.2864842414855957, "step": 2868} +{"train_info/time_between_train_steps": 0.0031249523162841797, "step": 2868} +{"info/global_step": 2869, "train_info/time_within_train_step": 2.2876925468444824, "step": 2869} +{"train_info/time_between_train_steps": 0.0031473636627197266, "step": 2869} +{"info/global_step": 2870, "train_info/time_within_train_step": 2.286518096923828, "step": 2870} +{"train_info/time_between_train_steps": 0.0031554698944091797, "step": 2870} +{"info/global_step": 2871, "train_info/time_within_train_step": 2.2866575717926025, "step": 2871} +{"train_info/time_between_train_steps": 0.003365039825439453, "step": 2871} +{"info/global_step": 2872, "train_info/time_within_train_step": 2.4100053310394287, "step": 2872} +{"train_info/time_between_train_steps": 0.0031702518463134766, "step": 2872} +{"info/global_step": 2873, "train_info/time_within_train_step": 2.286761999130249, "step": 2873} +{"train_info/time_between_train_steps": 0.0031647682189941406, "step": 2873} +{"info/global_step": 2874, "train_info/time_within_train_step": 2.286120653152466, "step": 2874} +{"train_info/time_between_train_steps": 0.0031769275665283203, "step": 2874} +{"info/global_step": 2875, "train_info/time_within_train_step": 2.286897659301758, "step": 2875} +{"train_info/time_between_train_steps": 0.003202676773071289, "step": 2875} +{"info/global_step": 2876, "train_info/time_within_train_step": 2.288053274154663, "step": 2876} +{"train_info/time_between_train_steps": 0.003175973892211914, "step": 2876} +{"info/global_step": 2877, "train_info/time_within_train_step": 2.2866904735565186, "step": 2877} +{"train_info/time_between_train_steps": 0.0031774044036865234, "step": 2877} +{"info/global_step": 2878, "train_info/time_within_train_step": 2.374755382537842, "step": 2878} +{"train_info/time_between_train_steps": 0.0031948089599609375, "step": 2878} +{"info/global_step": 2879, "train_info/time_within_train_step": 2.2863051891326904, "step": 2879} +{"train_info/time_between_train_steps": 0.0031838417053222656, "step": 2879} +{"info/global_step": 2880, "train_info/time_within_train_step": 2.286407470703125, "step": 2880} +{"train_info/time_between_train_steps": 0.003294706344604492, "step": 2880} +{"info/global_step": 2881, "train_info/time_within_train_step": 2.286876916885376, "step": 2881} +{"train_info/time_between_train_steps": 0.0031630992889404297, "step": 2881} +{"info/global_step": 2882, "train_info/time_within_train_step": 2.2859485149383545, "step": 2882} +{"train_info/time_between_train_steps": 0.003168821334838867, "step": 2882} +{"info/global_step": 2883, "train_info/time_within_train_step": 2.2870547771453857, "step": 2883} +{"train_info/time_between_train_steps": 0.003175973892211914, "step": 2883} +{"info/global_step": 2884, "train_info/time_within_train_step": 2.2866554260253906, "step": 2884} +{"train_info/time_between_train_steps": 0.0031499862670898438, "step": 2884} +{"info/global_step": 2885, "train_info/time_within_train_step": 2.2871367931365967, "step": 2885} +{"train_info/time_between_train_steps": 0.0031676292419433594, "step": 2885} +{"info/global_step": 2886, "train_info/time_within_train_step": 2.2855968475341797, "step": 2886} +{"train_info/time_between_train_steps": 0.003152132034301758, "step": 2886} +{"info/global_step": 2887, "train_info/time_within_train_step": 2.2861180305480957, "step": 2887} +{"train_info/time_between_train_steps": 0.0031604766845703125, "step": 2887} +{"info/global_step": 2888, "train_info/time_within_train_step": 2.2865495681762695, "step": 2888} +{"train_info/time_between_train_steps": 0.0031893253326416016, "step": 2888} +{"info/global_step": 2889, "train_info/time_within_train_step": 2.2876274585723877, "step": 2889} +{"train_info/time_between_train_steps": 0.0031669139862060547, "step": 2889} +{"info/global_step": 2890, "train_info/time_within_train_step": 2.2864997386932373, "step": 2890} +{"train_info/time_between_train_steps": 0.0032224655151367188, "step": 2890} +{"info/global_step": 2891, "train_info/time_within_train_step": 2.2862937450408936, "step": 2891} +{"train_info/time_between_train_steps": 0.003252744674682617, "step": 2891} +{"info/global_step": 2892, "train_info/time_within_train_step": 2.2877700328826904, "step": 2892} +{"train_info/time_between_train_steps": 0.0031719207763671875, "step": 2892} +{"info/global_step": 2893, "train_info/time_within_train_step": 2.2862863540649414, "step": 2893} +{"train_info/time_between_train_steps": 0.003176450729370117, "step": 2893} +{"info/global_step": 2894, "train_info/time_within_train_step": 2.2878966331481934, "step": 2894} +{"train_info/time_between_train_steps": 0.0031676292419433594, "step": 2894} +{"info/global_step": 2895, "train_info/time_within_train_step": 2.2870054244995117, "step": 2895} +{"train_info/time_between_train_steps": 0.0031495094299316406, "step": 2895} +{"info/global_step": 2896, "train_info/time_within_train_step": 2.2868056297302246, "step": 2896} +{"train_info/time_between_train_steps": 0.003179788589477539, "step": 2896} +{"info/global_step": 2897, "train_info/time_within_train_step": 2.287175178527832, "step": 2897} +{"train_info/time_between_train_steps": 0.0031309127807617188, "step": 2897} +{"info/global_step": 2898, "train_info/time_within_train_step": 2.287163496017456, "step": 2898} +{"train_info/time_between_train_steps": 0.0032148361206054688, "step": 2898} +{"info/global_step": 2899, "train_info/time_within_train_step": 2.2865142822265625, "step": 2899} +{"train_info/time_between_train_steps": 0.0031795501708984375, "step": 2899} +{"info/global_step": 2900, "train_info/time_within_train_step": 2.2870402336120605, "step": 2900} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746351041, "_runtime": 7138}, "step": 2900} +{"logs": {"train/loss": 3.259, "train/learning_rate": 2.222222222222222e-05, "train/epoch": 2.24, "_timestamp": 1746351041, "_runtime": 7138}, "step": 2900} +{"train_info/time_between_train_steps": 18.10087752342224, "step": 2900} +{"info/global_step": 2901, "train_info/time_within_train_step": 2.1304147243499756, "step": 2901} +{"train_info/time_between_train_steps": 0.0031671524047851562, "step": 2901} +{"info/global_step": 2902, "train_info/time_within_train_step": 2.096874713897705, "step": 2902} +{"train_info/time_between_train_steps": 0.003203153610229492, "step": 2902} +{"info/global_step": 2903, "train_info/time_within_train_step": 2.1771273612976074, "step": 2903} +{"train_info/time_between_train_steps": 0.003167390823364258, "step": 2903} +{"info/global_step": 2904, "train_info/time_within_train_step": 2.284081220626831, "step": 2904} +{"train_info/time_between_train_steps": 0.003146648406982422, "step": 2904} +{"info/global_step": 2905, "train_info/time_within_train_step": 2.2841908931732178, "step": 2905} +{"train_info/time_between_train_steps": 0.003123760223388672, "step": 2905} +{"info/global_step": 2906, "train_info/time_within_train_step": 2.2844080924987793, "step": 2906} +{"train_info/time_between_train_steps": 0.003103494644165039, "step": 2906} +{"info/global_step": 2907, "train_info/time_within_train_step": 2.2853190898895264, "step": 2907} +{"train_info/time_between_train_steps": 0.003139019012451172, "step": 2907} +{"info/global_step": 2908, "train_info/time_within_train_step": 2.2850937843322754, "step": 2908} +{"train_info/time_between_train_steps": 0.003110647201538086, "step": 2908} +{"info/global_step": 2909, "train_info/time_within_train_step": 2.2856743335723877, "step": 2909} +{"train_info/time_between_train_steps": 0.003132343292236328, "step": 2909} +{"info/global_step": 2910, "train_info/time_within_train_step": 2.2857565879821777, "step": 2910} +{"train_info/time_between_train_steps": 0.0031659603118896484, "step": 2910} +{"info/global_step": 2911, "train_info/time_within_train_step": 2.2866010665893555, "step": 2911} +{"train_info/time_between_train_steps": 0.0031659603118896484, "step": 2911} +{"info/global_step": 2912, "train_info/time_within_train_step": 2.286547899246216, "step": 2912} +{"train_info/time_between_train_steps": 0.0031614303588867188, "step": 2912} +{"info/global_step": 2913, "train_info/time_within_train_step": 2.529716968536377, "step": 2913} +{"train_info/time_between_train_steps": 0.0031290054321289062, "step": 2913} +{"info/global_step": 2914, "train_info/time_within_train_step": 2.286705493927002, "step": 2914} +{"train_info/time_between_train_steps": 0.003107309341430664, "step": 2914} +{"info/global_step": 2915, "train_info/time_within_train_step": 2.2868258953094482, "step": 2915} +{"train_info/time_between_train_steps": 0.0031249523162841797, "step": 2915} +{"info/global_step": 2916, "train_info/time_within_train_step": 2.2872776985168457, "step": 2916} +{"train_info/time_between_train_steps": 0.0030951499938964844, "step": 2916} +{"info/global_step": 2917, "train_info/time_within_train_step": 2.287137269973755, "step": 2917} +{"train_info/time_between_train_steps": 0.0031557083129882812, "step": 2917} +{"info/global_step": 2918, "train_info/time_within_train_step": 2.286856174468994, "step": 2918} +{"train_info/time_between_train_steps": 0.003144979476928711, "step": 2918} +{"info/global_step": 2919, "train_info/time_within_train_step": 2.287522792816162, "step": 2919} +{"train_info/time_between_train_steps": 0.003112316131591797, "step": 2919} +{"info/global_step": 2920, "train_info/time_within_train_step": 2.2872824668884277, "step": 2920} +{"train_info/time_between_train_steps": 0.0031042098999023438, "step": 2920} +{"info/global_step": 2921, "train_info/time_within_train_step": 2.2867493629455566, "step": 2921} +{"train_info/time_between_train_steps": 0.0031168460845947266, "step": 2921} +{"info/global_step": 2922, "train_info/time_within_train_step": 2.287254571914673, "step": 2922} +{"train_info/time_between_train_steps": 0.003113985061645508, "step": 2922} +{"info/global_step": 2923, "train_info/time_within_train_step": 2.2873198986053467, "step": 2923} +{"train_info/time_between_train_steps": 0.0031485557556152344, "step": 2923} +{"info/global_step": 2924, "train_info/time_within_train_step": 2.286998748779297, "step": 2924} +{"train_info/time_between_train_steps": 0.0031044483184814453, "step": 2924} +{"info/global_step": 2925, "train_info/time_within_train_step": 2.2866828441619873, "step": 2925} +{"train_info/time_between_train_steps": 0.0031735897064208984, "step": 2925} +{"info/global_step": 2926, "train_info/time_within_train_step": 2.2873404026031494, "step": 2926} +{"train_info/time_between_train_steps": 0.003175020217895508, "step": 2926} +{"info/global_step": 2927, "train_info/time_within_train_step": 2.2869787216186523, "step": 2927} +{"train_info/time_between_train_steps": 0.0031194686889648438, "step": 2927} +{"info/global_step": 2928, "train_info/time_within_train_step": 2.286924362182617, "step": 2928} +{"train_info/time_between_train_steps": 0.00315093994140625, "step": 2928} +{"info/global_step": 2929, "train_info/time_within_train_step": 2.285975694656372, "step": 2929} +{"train_info/time_between_train_steps": 0.003110170364379883, "step": 2929} +{"info/global_step": 2930, "train_info/time_within_train_step": 2.286184310913086, "step": 2930} +{"train_info/time_between_train_steps": 0.0031363964080810547, "step": 2930} +{"info/global_step": 2931, "train_info/time_within_train_step": 2.2874245643615723, "step": 2931} +{"train_info/time_between_train_steps": 0.003100156784057617, "step": 2931} +{"info/global_step": 2932, "train_info/time_within_train_step": 2.2862823009490967, "step": 2932} +{"train_info/time_between_train_steps": 0.0031304359436035156, "step": 2932} +{"info/global_step": 2933, "train_info/time_within_train_step": 2.286353588104248, "step": 2933} +{"train_info/time_between_train_steps": 0.0031855106353759766, "step": 2933} +{"info/global_step": 2934, "train_info/time_within_train_step": 2.2857093811035156, "step": 2934} +{"train_info/time_between_train_steps": 0.0726478099822998, "step": 2934} +{"info/global_step": 2935, "train_info/time_within_train_step": 2.2866573333740234, "step": 2935} +{"train_info/time_between_train_steps": 0.003142833709716797, "step": 2935} +{"info/global_step": 2936, "train_info/time_within_train_step": 2.286000967025757, "step": 2936} +{"train_info/time_between_train_steps": 0.003149271011352539, "step": 2936} +{"info/global_step": 2937, "train_info/time_within_train_step": 2.28643798828125, "step": 2937} +{"train_info/time_between_train_steps": 0.0031397342681884766, "step": 2937} +{"info/global_step": 2938, "train_info/time_within_train_step": 2.2870688438415527, "step": 2938} +{"train_info/time_between_train_steps": 0.00313568115234375, "step": 2938} +{"info/global_step": 2939, "train_info/time_within_train_step": 2.2864537239074707, "step": 2939} +{"train_info/time_between_train_steps": 0.003129720687866211, "step": 2939} +{"info/global_step": 2940, "train_info/time_within_train_step": 2.287186622619629, "step": 2940} +{"train_info/time_between_train_steps": 0.0031328201293945312, "step": 2940} +{"info/global_step": 2941, "train_info/time_within_train_step": 2.286480665206909, "step": 2941} +{"train_info/time_between_train_steps": 0.0031540393829345703, "step": 2941} +{"info/global_step": 2942, "train_info/time_within_train_step": 2.2869818210601807, "step": 2942} +{"train_info/time_between_train_steps": 0.003165006637573242, "step": 2942} +{"info/global_step": 2943, "train_info/time_within_train_step": 2.286959409713745, "step": 2943} +{"train_info/time_between_train_steps": 0.0031571388244628906, "step": 2943} +{"info/global_step": 2944, "train_info/time_within_train_step": 2.2866756916046143, "step": 2944} +{"train_info/time_between_train_steps": 0.0031366348266601562, "step": 2944} +{"info/global_step": 2945, "train_info/time_within_train_step": 2.286557912826538, "step": 2945} +{"train_info/time_between_train_steps": 0.003164052963256836, "step": 2945} +{"info/global_step": 2946, "train_info/time_within_train_step": 2.286142587661743, "step": 2946} +{"train_info/time_between_train_steps": 0.0031549930572509766, "step": 2946} +{"info/global_step": 2947, "train_info/time_within_train_step": 2.2861878871917725, "step": 2947} +{"train_info/time_between_train_steps": 0.003107786178588867, "step": 2947} +{"info/global_step": 2948, "train_info/time_within_train_step": 2.286128282546997, "step": 2948} +{"train_info/time_between_train_steps": 0.003130197525024414, "step": 2948} +{"info/global_step": 2949, "train_info/time_within_train_step": 2.286357879638672, "step": 2949} +{"train_info/time_between_train_steps": 0.0031464099884033203, "step": 2949} +{"info/global_step": 2950, "train_info/time_within_train_step": 2.285930633544922, "step": 2950} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746351175, "_runtime": 7272}, "step": 2950} +{"logs": {"train/loss": 3.2556, "train/learning_rate": 1.111111111111111e-05, "train/epoch": 2.26, "_timestamp": 1746351175, "_runtime": 7272}, "step": 2950} +{"train_info/time_between_train_steps": 0.0242156982421875, "step": 2950} +{"info/global_step": 2951, "train_info/time_within_train_step": 2.286161422729492, "step": 2951} +{"train_info/time_between_train_steps": 0.003142118453979492, "step": 2951} +{"info/global_step": 2952, "train_info/time_within_train_step": 2.2858662605285645, "step": 2952} +{"train_info/time_between_train_steps": 0.003138303756713867, "step": 2952} +{"info/global_step": 2953, "train_info/time_within_train_step": 2.286653757095337, "step": 2953} +{"train_info/time_between_train_steps": 0.003129243850708008, "step": 2953} +{"info/global_step": 2954, "train_info/time_within_train_step": 2.286470413208008, "step": 2954} +{"train_info/time_between_train_steps": 0.0031392574310302734, "step": 2954} +{"info/global_step": 2955, "train_info/time_within_train_step": 2.2860052585601807, "step": 2955} +{"train_info/time_between_train_steps": 0.003118753433227539, "step": 2955} +{"info/global_step": 2956, "train_info/time_within_train_step": 2.286181926727295, "step": 2956} +{"train_info/time_between_train_steps": 0.0031456947326660156, "step": 2956} +{"info/global_step": 2957, "train_info/time_within_train_step": 2.2862837314605713, "step": 2957} +{"train_info/time_between_train_steps": 0.0031502246856689453, "step": 2957} +{"info/global_step": 2958, "train_info/time_within_train_step": 2.286691904067993, "step": 2958} +{"train_info/time_between_train_steps": 0.003160715103149414, "step": 2958} +{"info/global_step": 2959, "train_info/time_within_train_step": 2.28629732131958, "step": 2959} +{"train_info/time_between_train_steps": 0.0031392574310302734, "step": 2959} +{"info/global_step": 2960, "train_info/time_within_train_step": 2.2863452434539795, "step": 2960} +{"train_info/time_between_train_steps": 0.003134489059448242, "step": 2960} +{"info/global_step": 2961, "train_info/time_within_train_step": 2.2866129875183105, "step": 2961} +{"train_info/time_between_train_steps": 0.0031168460845947266, "step": 2961} +{"info/global_step": 2962, "train_info/time_within_train_step": 2.2870781421661377, "step": 2962} +{"train_info/time_between_train_steps": 0.003160238265991211, "step": 2962} +{"info/global_step": 2963, "train_info/time_within_train_step": 2.287520170211792, "step": 2963} +{"train_info/time_between_train_steps": 0.0031528472900390625, "step": 2963} +{"info/global_step": 2964, "train_info/time_within_train_step": 2.2994325160980225, "step": 2964} +{"train_info/time_between_train_steps": 0.0028448104858398438, "step": 2964} +{"info/global_step": 2965, "train_info/time_within_train_step": 2.286206007003784, "step": 2965} +{"train_info/time_between_train_steps": 0.0028624534606933594, "step": 2965} +{"info/global_step": 2966, "train_info/time_within_train_step": 2.286688804626465, "step": 2966} +{"train_info/time_between_train_steps": 0.0029032230377197266, "step": 2966} +{"info/global_step": 2967, "train_info/time_within_train_step": 2.2857775688171387, "step": 2967} +{"train_info/time_between_train_steps": 0.0028858184814453125, "step": 2967} +{"info/global_step": 2968, "train_info/time_within_train_step": 2.5009191036224365, "step": 2968} +{"train_info/time_between_train_steps": 0.002882719039916992, "step": 2968} +{"info/global_step": 2969, "train_info/time_within_train_step": 2.2846927642822266, "step": 2969} +{"train_info/time_between_train_steps": 0.002817869186401367, "step": 2969} +{"info/global_step": 2970, "train_info/time_within_train_step": 2.2846667766571045, "step": 2970} +{"train_info/time_between_train_steps": 0.002852916717529297, "step": 2970} +{"info/global_step": 2971, "train_info/time_within_train_step": 2.285167694091797, "step": 2971} +{"train_info/time_between_train_steps": 0.002846956253051758, "step": 2971} +{"info/global_step": 2972, "train_info/time_within_train_step": 2.2845261096954346, "step": 2972} +{"train_info/time_between_train_steps": 0.002864360809326172, "step": 2972} +{"info/global_step": 2973, "train_info/time_within_train_step": 2.2848942279815674, "step": 2973} +{"train_info/time_between_train_steps": 0.0028815269470214844, "step": 2973} +{"info/global_step": 2974, "train_info/time_within_train_step": 2.2852847576141357, "step": 2974} +{"train_info/time_between_train_steps": 0.002855062484741211, "step": 2974} +{"info/global_step": 2975, "train_info/time_within_train_step": 2.2846662998199463, "step": 2975} +{"train_info/time_between_train_steps": 0.0028526782989501953, "step": 2975} +{"info/global_step": 2976, "train_info/time_within_train_step": 2.2854416370391846, "step": 2976} +{"train_info/time_between_train_steps": 0.002836942672729492, "step": 2976} +{"info/global_step": 2977, "train_info/time_within_train_step": 2.2847583293914795, "step": 2977} +{"train_info/time_between_train_steps": 0.002847909927368164, "step": 2977} +{"info/global_step": 2978, "train_info/time_within_train_step": 2.2858901023864746, "step": 2978} +{"train_info/time_between_train_steps": 0.0029027462005615234, "step": 2978} +{"info/global_step": 2979, "train_info/time_within_train_step": 2.2859742641448975, "step": 2979} +{"train_info/time_between_train_steps": 0.0028295516967773438, "step": 2979} +{"info/global_step": 2980, "train_info/time_within_train_step": 2.2856616973876953, "step": 2980} +{"train_info/time_between_train_steps": 0.0028696060180664062, "step": 2980} +{"info/global_step": 2981, "train_info/time_within_train_step": 2.286130428314209, "step": 2981} +{"train_info/time_between_train_steps": 0.0028595924377441406, "step": 2981} +{"info/global_step": 2982, "train_info/time_within_train_step": 2.285121202468872, "step": 2982} +{"train_info/time_between_train_steps": 0.003098726272583008, "step": 2982} +{"info/global_step": 2983, "train_info/time_within_train_step": 2.2863547801971436, "step": 2983} +{"train_info/time_between_train_steps": 0.0028502941131591797, "step": 2983} +{"info/global_step": 2984, "train_info/time_within_train_step": 2.286158561706543, "step": 2984} +{"train_info/time_between_train_steps": 0.0028486251831054688, "step": 2984} +{"info/global_step": 2985, "train_info/time_within_train_step": 2.285648822784424, "step": 2985} +{"train_info/time_between_train_steps": 0.00284576416015625, "step": 2985} +{"info/global_step": 2986, "train_info/time_within_train_step": 2.2853448390960693, "step": 2986} +{"train_info/time_between_train_steps": 0.0028612613677978516, "step": 2986} +{"info/global_step": 2987, "train_info/time_within_train_step": 2.28629207611084, "step": 2987} +{"train_info/time_between_train_steps": 0.002844572067260742, "step": 2987} +{"info/global_step": 2988, "train_info/time_within_train_step": 2.286036968231201, "step": 2988} +{"train_info/time_between_train_steps": 0.002861499786376953, "step": 2988} +{"info/global_step": 2989, "train_info/time_within_train_step": 2.286316156387329, "step": 2989} +{"train_info/time_between_train_steps": 0.002913236618041992, "step": 2989} +{"info/global_step": 2990, "train_info/time_within_train_step": 2.2853219509124756, "step": 2990} +{"train_info/time_between_train_steps": 0.0028769969940185547, "step": 2990} +{"info/global_step": 2991, "train_info/time_within_train_step": 2.2849326133728027, "step": 2991} +{"train_info/time_between_train_steps": 0.0029206275939941406, "step": 2991} +{"info/global_step": 2992, "train_info/time_within_train_step": 2.2851672172546387, "step": 2992} +{"train_info/time_between_train_steps": 0.0028553009033203125, "step": 2992} +{"info/global_step": 2993, "train_info/time_within_train_step": 2.28450345993042, "step": 2993} +{"train_info/time_between_train_steps": 0.002851247787475586, "step": 2993} +{"info/global_step": 2994, "train_info/time_within_train_step": 2.285353183746338, "step": 2994} +{"train_info/time_between_train_steps": 0.0028901100158691406, "step": 2994} +{"info/global_step": 2995, "train_info/time_within_train_step": 2.285226583480835, "step": 2995} +{"train_info/time_between_train_steps": 0.0028557777404785156, "step": 2995} +{"info/global_step": 2996, "train_info/time_within_train_step": 2.285301923751831, "step": 2996} +{"train_info/time_between_train_steps": 0.0028426647186279297, "step": 2996} +{"info/global_step": 2997, "train_info/time_within_train_step": 2.284956932067871, "step": 2997} +{"train_info/time_between_train_steps": 0.0028638839721679688, "step": 2997} +{"info/global_step": 2998, "train_info/time_within_train_step": 2.285371780395508, "step": 2998} +{"train_info/time_between_train_steps": 0.002864837646484375, "step": 2998} +{"info/global_step": 2999, "train_info/time_within_train_step": 2.285520076751709, "step": 2999} +{"train_info/time_between_train_steps": 0.002870321273803711, "step": 2999} +{"info/global_step": 3000, "train_info/time_within_train_step": 2.671865940093994, "step": 3000} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746351291, "_runtime": 7388}, "step": 3000} +{"logs": {"train/loss": 3.2507, "train/learning_rate": 0.0, "train/epoch": 2.27, "_timestamp": 1746351291, "_runtime": 7388}, "step": 3000} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746351296, "_runtime": 7393}, "step": 3000} +{"logs": {"eval/loss": 3.652341604232788, "eval/runtime": 5.5797, "eval/samples_per_second": 43.73, "eval/steps_per_second": 1.434, "train/epoch": 2.27, "_timestamp": 1746351296, "_runtime": 7393}, "step": 3000} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746351296, "_runtime": 7393}, "step": 3000} +{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 3.652341604232788, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 38.56486405270745, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.5797, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 43.73, "train/epoch": 2.27, "_timestamp": 1746351296, "_runtime": 7393}, "step": 3000} +{"train_info": {"train_info/memory_allocated": 1389.1708984375, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746351309, "_runtime": 7406}, "step": 3000} +{"logs": {"train/train_runtime": 7407.689, "train/train_samples_per_second": 25.919, "train/train_steps_per_second": 0.405, "train/total_flos": 2.5084035072e+16, "train/train_loss": 3.955010881106059, "train/epoch": 2.27, "_timestamp": 1746351309, "_runtime": 7406}, "step": 3000} +{"train_info": {"train_info/memory_allocated": 1389.169921875, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746351319, "_runtime": 7416}, "step": 3000} +{"logs": {"eval/loss": 3.652341604232788, "eval/runtime": 5.0621, "eval/samples_per_second": 48.202, "eval/steps_per_second": 1.58, "train/epoch": 2.27, "_timestamp": 1746351319, "_runtime": 7416}, "step": 3000} +{"train_info": {"train_info/memory_allocated": 1389.169921875, "train_info/memory_max_allocated": 4337.82568359375, "train_info/memory_reserved": 5128.0, "train_info/memory_max_reserved": 5128.0, "_timestamp": 1746351319, "_runtime": 7416}, "step": 3000} +{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 3.652341604232788, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 38.56486405270745, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.0621, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 48.202, "train/epoch": 2.27, "_timestamp": 1746351319, "_runtime": 7416}, "step": 3000}