shuffle_even_odd_EN53 / metrics.json
xiulinyang's picture
Adding model checkpoints and config files
47faf24
Invalid JSON: Unexpected non-whitespace character after JSONat line 2, column 1
{"num_parameters": 124439808, "trainable_parameters": 124439808, "step": 0}
{"train_info/time_between_train_steps": 3.5661585330963135, "step": 0}
{"info/global_step": 1, "train_info/time_within_train_step": 28.733912229537964, "step": 1}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 19761.71484375, "train_info/memory_reserved": 22624.0, "train_info/memory_max_reserved": 22624.0, "_timestamp": 1733837501, "_runtime": 35}, "step": 1}
{"logs": {"train/loss": 11.0177, "train/learning_rate": 4.9999999999999996e-06, "train/epoch": 0.0, "_timestamp": 1733837501, "_runtime": 35}, "step": 1}
{"train_info/time_between_train_steps": 0.12664556503295898, "step": 1}
{"info/global_step": 2, "train_info/time_within_train_step": 28.04296088218689, "step": 2}
{"train_info/time_between_train_steps": 0.00669407844543457, "step": 2}
{"info/global_step": 3, "train_info/time_within_train_step": 27.811320304870605, "step": 3}
{"train_info/time_between_train_steps": 0.005866050720214844, "step": 3}
{"info/global_step": 4, "train_info/time_within_train_step": 27.973292350769043, "step": 4}
{"train_info/time_between_train_steps": 0.0055522918701171875, "step": 4}
{"info/global_step": 5, "train_info/time_within_train_step": 27.830296516418457, "step": 5}
{"train_info/time_between_train_steps": 0.005861997604370117, "step": 5}
{"info/global_step": 6, "train_info/time_within_train_step": 27.950855016708374, "step": 6}
{"train_info/time_between_train_steps": 0.005522489547729492, "step": 6}
{"info/global_step": 7, "train_info/time_within_train_step": 27.83670711517334, "step": 7}
{"train_info/time_between_train_steps": 0.0057773590087890625, "step": 7}
{"info/global_step": 8, "train_info/time_within_train_step": 27.97235679626465, "step": 8}
{"train_info/time_between_train_steps": 0.006056547164916992, "step": 8}
{"info/global_step": 9, "train_info/time_within_train_step": 27.8474018573761, "step": 9}
{"train_info/time_between_train_steps": 0.0053937435150146484, "step": 9}
{"info/global_step": 10, "train_info/time_within_train_step": 27.78600311279297, "step": 10}
{"train_info/time_between_train_steps": 0.005706310272216797, "step": 10}
{"info/global_step": 11, "train_info/time_within_train_step": 27.789557218551636, "step": 11}
{"train_info/time_between_train_steps": 0.005579710006713867, "step": 11}
{"info/global_step": 12, "train_info/time_within_train_step": 27.781293392181396, "step": 12}
{"train_info/time_between_train_steps": 0.005411624908447266, "step": 12}
{"info/global_step": 13, "train_info/time_within_train_step": 27.748928785324097, "step": 13}
{"train_info/time_between_train_steps": 0.005354881286621094, "step": 13}
{"info/global_step": 14, "train_info/time_within_train_step": 27.721388578414917, "step": 14}
{"train_info/time_between_train_steps": 0.005423784255981445, "step": 14}
{"info/global_step": 15, "train_info/time_within_train_step": 27.755425214767456, "step": 15}
{"train_info/time_between_train_steps": 0.00530552864074707, "step": 15}
{"info/global_step": 16, "train_info/time_within_train_step": 27.819061994552612, "step": 16}
{"train_info/time_between_train_steps": 0.0052335262298583984, "step": 16}
{"info/global_step": 17, "train_info/time_within_train_step": 27.727974891662598, "step": 17}
{"train_info/time_between_train_steps": 0.005509138107299805, "step": 17}
{"info/global_step": 18, "train_info/time_within_train_step": 27.741708278656006, "step": 18}
{"train_info/time_between_train_steps": 0.010358095169067383, "step": 18}
{"info/global_step": 19, "train_info/time_within_train_step": 27.722426176071167, "step": 19}
{"train_info/time_between_train_steps": 0.010646820068359375, "step": 19}
{"info/global_step": 20, "train_info/time_within_train_step": 27.740498781204224, "step": 20}
{"train_info/time_between_train_steps": 0.005198001861572266, "step": 20}
{"info/global_step": 21, "train_info/time_within_train_step": 27.73815655708313, "step": 21}
{"train_info/time_between_train_steps": 0.00529170036315918, "step": 21}
{"info/global_step": 22, "train_info/time_within_train_step": 27.753146171569824, "step": 22}
{"train_info/time_between_train_steps": 0.006624460220336914, "step": 22}
{"info/global_step": 23, "train_info/time_within_train_step": 27.73341703414917, "step": 23}
{"train_info/time_between_train_steps": 0.0052835941314697266, "step": 23}
{"info/global_step": 24, "train_info/time_within_train_step": 27.746006965637207, "step": 24}
{"train_info/time_between_train_steps": 0.005952596664428711, "step": 24}
{"info/global_step": 25, "train_info/time_within_train_step": 27.75028657913208, "step": 25}
{"train_info/time_between_train_steps": 0.0061953067779541016, "step": 25}
{"info/global_step": 26, "train_info/time_within_train_step": 27.769542932510376, "step": 26}
{"train_info/time_between_train_steps": 0.005715131759643555, "step": 26}
{"info/global_step": 27, "train_info/time_within_train_step": 27.748931169509888, "step": 27}
{"train_info/time_between_train_steps": 0.011360883712768555, "step": 27}
{"train_info/time_between_train_steps": 20.849161624908447, "step": 27}
{"info/global_step": 28, "train_info/time_within_train_step": 27.750688552856445, "step": 28}
{"train_info/time_between_train_steps": 0.005620718002319336, "step": 28}
{"info/global_step": 29, "train_info/time_within_train_step": 27.90155029296875, "step": 29}
{"train_info/time_between_train_steps": 0.0058825016021728516, "step": 29}
{"info/global_step": 30, "train_info/time_within_train_step": 27.7693190574646, "step": 30}
{"train_info/time_between_train_steps": 0.005227327346801758, "step": 30}
{"info/global_step": 31, "train_info/time_within_train_step": 28.006361961364746, "step": 31}
{"train_info/time_between_train_steps": 0.0056836605072021484, "step": 31}
{"info/global_step": 32, "train_info/time_within_train_step": 27.735578298568726, "step": 32}
{"train_info/time_between_train_steps": 0.00552678108215332, "step": 32}
{"info/global_step": 33, "train_info/time_within_train_step": 27.921395540237427, "step": 33}
{"train_info/time_between_train_steps": 0.005297660827636719, "step": 33}
{"info/global_step": 34, "train_info/time_within_train_step": 27.76257634162903, "step": 34}
{"train_info/time_between_train_steps": 0.005494117736816406, "step": 34}
{"info/global_step": 35, "train_info/time_within_train_step": 27.782541513442993, "step": 35}
{"train_info/time_between_train_steps": 0.0051462650299072266, "step": 35}
{"info/global_step": 36, "train_info/time_within_train_step": 27.751847743988037, "step": 36}
{"train_info/time_between_train_steps": 0.005060434341430664, "step": 36}
{"info/global_step": 37, "train_info/time_within_train_step": 27.730563163757324, "step": 37}
{"train_info/time_between_train_steps": 0.0050716400146484375, "step": 37}
{"info/global_step": 38, "train_info/time_within_train_step": 27.72866940498352, "step": 38}
{"train_info/time_between_train_steps": 0.005013465881347656, "step": 38}
{"info/global_step": 39, "train_info/time_within_train_step": 27.742274045944214, "step": 39}
{"train_info/time_between_train_steps": 0.0051953792572021484, "step": 39}
{"info/global_step": 40, "train_info/time_within_train_step": 27.724833965301514, "step": 40}
{"train_info/time_between_train_steps": 0.009978294372558594, "step": 40}
{"info/global_step": 41, "train_info/time_within_train_step": 27.717860460281372, "step": 41}
{"train_info/time_between_train_steps": 0.005153656005859375, "step": 41}
{"info/global_step": 42, "train_info/time_within_train_step": 27.71069598197937, "step": 42}
{"train_info/time_between_train_steps": 0.005235910415649414, "step": 42}
{"info/global_step": 43, "train_info/time_within_train_step": 27.77744770050049, "step": 43}
{"train_info/time_between_train_steps": 0.0050313472747802734, "step": 43}
{"info/global_step": 44, "train_info/time_within_train_step": 27.741045236587524, "step": 44}
{"train_info/time_between_train_steps": 0.0053539276123046875, "step": 44}
{"info/global_step": 45, "train_info/time_within_train_step": 27.76729130744934, "step": 45}
{"train_info/time_between_train_steps": 0.004990339279174805, "step": 45}
{"info/global_step": 46, "train_info/time_within_train_step": 27.724063873291016, "step": 46}
{"train_info/time_between_train_steps": 0.00509953498840332, "step": 46}
{"info/global_step": 47, "train_info/time_within_train_step": 27.860365867614746, "step": 47}
{"train_info/time_between_train_steps": 0.005232095718383789, "step": 47}
{"info/global_step": 48, "train_info/time_within_train_step": 27.712042331695557, "step": 48}
{"train_info/time_between_train_steps": 0.01005411148071289, "step": 48}
{"info/global_step": 49, "train_info/time_within_train_step": 27.722922801971436, "step": 49}
{"train_info/time_between_train_steps": 0.010619163513183594, "step": 49}
{"info/global_step": 50, "train_info/time_within_train_step": 27.71678113937378, "step": 50}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733838884, "_runtime": 1418}, "step": 50}
{"logs": {"train/loss": 8.1405, "train/learning_rate": 0.00025, "train/epoch": 1.02, "_timestamp": 1733838884, "_runtime": 1418}, "step": 50}
{"train_info/time_between_train_steps": 0.013057947158813477, "step": 50}
{"info/global_step": 51, "train_info/time_within_train_step": 27.720324754714966, "step": 51}
{"train_info/time_between_train_steps": 0.01037287712097168, "step": 51}
{"info/global_step": 52, "train_info/time_within_train_step": 27.730428218841553, "step": 52}
{"train_info/time_between_train_steps": 0.010454416275024414, "step": 52}
{"info/global_step": 53, "train_info/time_within_train_step": 27.73339605331421, "step": 53}
{"train_info/time_between_train_steps": 0.005627155303955078, "step": 53}
{"info/global_step": 54, "train_info/time_within_train_step": 27.75397825241089, "step": 54}
{"train_info/time_between_train_steps": 0.005733489990234375, "step": 54}
{"train_info/time_between_train_steps": 20.703773260116577, "step": 54}
{"info/global_step": 55, "train_info/time_within_train_step": 27.737854480743408, "step": 55}
{"train_info/time_between_train_steps": 0.005608081817626953, "step": 55}
{"info/global_step": 56, "train_info/time_within_train_step": 27.897504568099976, "step": 56}
{"train_info/time_between_train_steps": 0.005407571792602539, "step": 56}
{"info/global_step": 57, "train_info/time_within_train_step": 27.743273973464966, "step": 57}
{"train_info/time_between_train_steps": 0.005193233489990234, "step": 57}
{"info/global_step": 58, "train_info/time_within_train_step": 27.895511627197266, "step": 58}
{"train_info/time_between_train_steps": 0.0053484439849853516, "step": 58}
{"info/global_step": 59, "train_info/time_within_train_step": 27.72433114051819, "step": 59}
{"train_info/time_between_train_steps": 0.005383729934692383, "step": 59}
{"info/global_step": 60, "train_info/time_within_train_step": 27.861709356307983, "step": 60}
{"train_info/time_between_train_steps": 0.005393505096435547, "step": 60}
{"info/global_step": 61, "train_info/time_within_train_step": 27.758777618408203, "step": 61}
{"train_info/time_between_train_steps": 0.005669832229614258, "step": 61}
{"info/global_step": 62, "train_info/time_within_train_step": 27.888258695602417, "step": 62}
{"train_info/time_between_train_steps": 0.005342960357666016, "step": 62}
{"info/global_step": 63, "train_info/time_within_train_step": 27.727490425109863, "step": 63}
{"train_info/time_between_train_steps": 0.005553722381591797, "step": 63}
{"info/global_step": 64, "train_info/time_within_train_step": 27.72862982749939, "step": 64}
{"train_info/time_between_train_steps": 0.005176544189453125, "step": 64}
{"info/global_step": 65, "train_info/time_within_train_step": 27.783156633377075, "step": 65}
{"train_info/time_between_train_steps": 0.006574392318725586, "step": 65}
{"info/global_step": 66, "train_info/time_within_train_step": 27.72012233734131, "step": 66}
{"train_info/time_between_train_steps": 0.005198001861572266, "step": 66}
{"info/global_step": 67, "train_info/time_within_train_step": 27.715561151504517, "step": 67}
{"train_info/time_between_train_steps": 0.00501561164855957, "step": 67}
{"info/global_step": 68, "train_info/time_within_train_step": 27.732725381851196, "step": 68}
{"train_info/time_between_train_steps": 0.010250329971313477, "step": 68}
{"info/global_step": 69, "train_info/time_within_train_step": 27.77450132369995, "step": 69}
{"train_info/time_between_train_steps": 0.005239009857177734, "step": 69}
{"info/global_step": 70, "train_info/time_within_train_step": 27.714961767196655, "step": 70}
{"train_info/time_between_train_steps": 0.005712032318115234, "step": 70}
{"info/global_step": 71, "train_info/time_within_train_step": 27.716126441955566, "step": 71}
{"train_info/time_between_train_steps": 0.005340099334716797, "step": 71}
{"info/global_step": 72, "train_info/time_within_train_step": 27.713478803634644, "step": 72}
{"train_info/time_between_train_steps": 0.005127668380737305, "step": 72}
{"info/global_step": 73, "train_info/time_within_train_step": 27.7197163105011, "step": 73}
{"train_info/time_between_train_steps": 0.005273342132568359, "step": 73}
{"info/global_step": 74, "train_info/time_within_train_step": 27.71224570274353, "step": 74}
{"train_info/time_between_train_steps": 0.005260467529296875, "step": 74}
{"info/global_step": 75, "train_info/time_within_train_step": 27.710806131362915, "step": 75}
{"train_info/time_between_train_steps": 0.005199909210205078, "step": 75}
{"info/global_step": 76, "train_info/time_within_train_step": 27.76404118537903, "step": 76}
{"train_info/time_between_train_steps": 0.005358695983886719, "step": 76}
{"info/global_step": 77, "train_info/time_within_train_step": 27.83384609222412, "step": 77}
{"train_info/time_between_train_steps": 0.005067348480224609, "step": 77}
{"info/global_step": 78, "train_info/time_within_train_step": 27.719746351242065, "step": 78}
{"train_info/time_between_train_steps": 0.00547480583190918, "step": 78}
{"info/global_step": 79, "train_info/time_within_train_step": 27.735016107559204, "step": 79}
{"train_info/time_between_train_steps": 0.005327463150024414, "step": 79}
{"info/global_step": 80, "train_info/time_within_train_step": 27.781301021575928, "step": 80}
{"train_info/time_between_train_steps": 0.005623340606689453, "step": 80}
{"info/global_step": 81, "train_info/time_within_train_step": 27.79283881187439, "step": 81}
{"train_info/time_between_train_steps": 0.005867481231689453, "step": 81}
{"train_info/time_between_train_steps": 20.759703874588013, "step": 81}
{"info/global_step": 82, "train_info/time_within_train_step": 27.714932441711426, "step": 82}
{"train_info/time_between_train_steps": 0.005234718322753906, "step": 82}
{"info/global_step": 83, "train_info/time_within_train_step": 27.87445592880249, "step": 83}
{"train_info/time_between_train_steps": 0.005285739898681641, "step": 83}
{"info/global_step": 84, "train_info/time_within_train_step": 27.72213864326477, "step": 84}
{"train_info/time_between_train_steps": 0.0053081512451171875, "step": 84}
{"info/global_step": 85, "train_info/time_within_train_step": 27.886104345321655, "step": 85}
{"train_info/time_between_train_steps": 0.005448579788208008, "step": 85}
{"info/global_step": 86, "train_info/time_within_train_step": 27.73092007637024, "step": 86}
{"train_info/time_between_train_steps": 0.0055501461029052734, "step": 86}
{"info/global_step": 87, "train_info/time_within_train_step": 27.87819194793701, "step": 87}
{"train_info/time_between_train_steps": 0.0052754878997802734, "step": 87}
{"info/global_step": 88, "train_info/time_within_train_step": 27.852813243865967, "step": 88}
{"train_info/time_between_train_steps": 0.005420684814453125, "step": 88}
{"info/global_step": 89, "train_info/time_within_train_step": 27.904248476028442, "step": 89}
{"train_info/time_between_train_steps": 0.007916927337646484, "step": 89}
{"info/global_step": 90, "train_info/time_within_train_step": 27.81662130355835, "step": 90}
{"train_info/time_between_train_steps": 0.00778508186340332, "step": 90}
{"info/global_step": 91, "train_info/time_within_train_step": 27.812597274780273, "step": 91}
{"train_info/time_between_train_steps": 0.0051004886627197266, "step": 91}
{"info/global_step": 92, "train_info/time_within_train_step": 27.8768789768219, "step": 92}
{"train_info/time_between_train_steps": 0.010967731475830078, "step": 92}
{"info/global_step": 93, "train_info/time_within_train_step": 27.784394025802612, "step": 93}
{"train_info/time_between_train_steps": 0.005038738250732422, "step": 93}
{"info/global_step": 94, "train_info/time_within_train_step": 27.756287336349487, "step": 94}
{"train_info/time_between_train_steps": 0.005447864532470703, "step": 94}
{"info/global_step": 95, "train_info/time_within_train_step": 27.782982110977173, "step": 95}
{"train_info/time_between_train_steps": 0.005303621292114258, "step": 95}
{"info/global_step": 96, "train_info/time_within_train_step": 27.80786895751953, "step": 96}
{"train_info/time_between_train_steps": 0.0063669681549072266, "step": 96}
{"info/global_step": 97, "train_info/time_within_train_step": 27.74100947380066, "step": 97}
{"train_info/time_between_train_steps": 0.0051801204681396484, "step": 97}
{"info/global_step": 98, "train_info/time_within_train_step": 27.73648476600647, "step": 98}
{"train_info/time_between_train_steps": 0.005108833312988281, "step": 98}
{"info/global_step": 99, "train_info/time_within_train_step": 27.709775686264038, "step": 99}
{"train_info/time_between_train_steps": 0.005139589309692383, "step": 99}
{"info/global_step": 100, "train_info/time_within_train_step": 27.712428331375122, "step": 100}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733840314, "_runtime": 2848}, "step": 100}
{"logs": {"train/loss": 6.4716, "train/learning_rate": 0.0005, "train/epoch": 3.02, "_timestamp": 1733840314, "_runtime": 2848}, "step": 100}
{"train_info/time_between_train_steps": 2.2050609588623047, "step": 100}
{"info/global_step": 101, "train_info/time_within_train_step": 27.70801305770874, "step": 101}
{"train_info/time_between_train_steps": 0.005063056945800781, "step": 101}
{"info/global_step": 102, "train_info/time_within_train_step": 27.719131231307983, "step": 102}
{"train_info/time_between_train_steps": 0.005234956741333008, "step": 102}
{"info/global_step": 103, "train_info/time_within_train_step": 27.710596323013306, "step": 103}
{"train_info/time_between_train_steps": 0.0051462650299072266, "step": 103}
{"info/global_step": 104, "train_info/time_within_train_step": 27.741906881332397, "step": 104}
{"train_info/time_between_train_steps": 0.005414485931396484, "step": 104}
{"info/global_step": 105, "train_info/time_within_train_step": 27.721107244491577, "step": 105}
{"train_info/time_between_train_steps": 0.0053789615631103516, "step": 105}
{"info/global_step": 106, "train_info/time_within_train_step": 27.74693727493286, "step": 106}
{"train_info/time_between_train_steps": 0.0052356719970703125, "step": 106}
{"info/global_step": 107, "train_info/time_within_train_step": 27.726534605026245, "step": 107}
{"train_info/time_between_train_steps": 0.005602836608886719, "step": 107}
{"info/global_step": 108, "train_info/time_within_train_step": 27.83772373199463, "step": 108}
{"train_info/time_between_train_steps": 0.00569462776184082, "step": 108}
{"train_info/time_between_train_steps": 20.83094072341919, "step": 108}
{"info/global_step": 109, "train_info/time_within_train_step": 27.70792245864868, "step": 109}
{"train_info/time_between_train_steps": 0.0049190521240234375, "step": 109}
{"info/global_step": 110, "train_info/time_within_train_step": 27.84247589111328, "step": 110}
{"train_info/time_between_train_steps": 0.005204677581787109, "step": 110}
{"info/global_step": 111, "train_info/time_within_train_step": 27.730313777923584, "step": 111}
{"train_info/time_between_train_steps": 0.005080223083496094, "step": 111}
{"info/global_step": 112, "train_info/time_within_train_step": 27.850870609283447, "step": 112}
{"train_info/time_between_train_steps": 0.005304574966430664, "step": 112}
{"info/global_step": 113, "train_info/time_within_train_step": 27.71386981010437, "step": 113}
{"train_info/time_between_train_steps": 0.0052378177642822266, "step": 113}
{"info/global_step": 114, "train_info/time_within_train_step": 27.936407566070557, "step": 114}
{"train_info/time_between_train_steps": 0.007483720779418945, "step": 114}
{"info/global_step": 115, "train_info/time_within_train_step": 27.73186993598938, "step": 115}
{"train_info/time_between_train_steps": 0.005778789520263672, "step": 115}
{"info/global_step": 116, "train_info/time_within_train_step": 27.766840934753418, "step": 116}
{"train_info/time_between_train_steps": 0.005391836166381836, "step": 116}
{"info/global_step": 117, "train_info/time_within_train_step": 27.7218337059021, "step": 117}
{"train_info/time_between_train_steps": 0.005150556564331055, "step": 117}
{"info/global_step": 118, "train_info/time_within_train_step": 27.710172653198242, "step": 118}
{"train_info/time_between_train_steps": 0.004906892776489258, "step": 118}
{"info/global_step": 119, "train_info/time_within_train_step": 27.71315026283264, "step": 119}
{"train_info/time_between_train_steps": 0.005022525787353516, "step": 119}
{"info/global_step": 120, "train_info/time_within_train_step": 27.706647396087646, "step": 120}
{"train_info/time_between_train_steps": 0.005079030990600586, "step": 120}
{"info/global_step": 121, "train_info/time_within_train_step": 27.73076343536377, "step": 121}
{"train_info/time_between_train_steps": 0.0051195621490478516, "step": 121}
{"info/global_step": 122, "train_info/time_within_train_step": 27.798895597457886, "step": 122}
{"train_info/time_between_train_steps": 0.005306243896484375, "step": 122}
{"info/global_step": 123, "train_info/time_within_train_step": 27.89584708213806, "step": 123}
{"train_info/time_between_train_steps": 0.005125284194946289, "step": 123}
{"info/global_step": 124, "train_info/time_within_train_step": 27.769075393676758, "step": 124}
{"train_info/time_between_train_steps": 0.010271072387695312, "step": 124}
{"info/global_step": 125, "train_info/time_within_train_step": 27.787164211273193, "step": 125}
{"train_info/time_between_train_steps": 0.005578756332397461, "step": 125}
{"info/global_step": 126, "train_info/time_within_train_step": 27.760987281799316, "step": 126}
{"train_info/time_between_train_steps": 0.005111217498779297, "step": 126}
{"info/global_step": 127, "train_info/time_within_train_step": 27.804280519485474, "step": 127}
{"train_info/time_between_train_steps": 0.0052869319915771484, "step": 127}
{"info/global_step": 128, "train_info/time_within_train_step": 27.858105182647705, "step": 128}
{"train_info/time_between_train_steps": 0.006243467330932617, "step": 128}
{"info/global_step": 129, "train_info/time_within_train_step": 27.782270193099976, "step": 129}
{"train_info/time_between_train_steps": 0.005207061767578125, "step": 129}
{"info/global_step": 130, "train_info/time_within_train_step": 27.78261947631836, "step": 130}
{"train_info/time_between_train_steps": 0.0053021907806396484, "step": 130}
{"info/global_step": 131, "train_info/time_within_train_step": 27.78946304321289, "step": 131}
{"train_info/time_between_train_steps": 0.0052394866943359375, "step": 131}
{"info/global_step": 132, "train_info/time_within_train_step": 27.797452211380005, "step": 132}
{"train_info/time_between_train_steps": 0.005518913269042969, "step": 132}
{"info/global_step": 133, "train_info/time_within_train_step": 27.787040948867798, "step": 133}
{"train_info/time_between_train_steps": 0.0060577392578125, "step": 133}
{"info/global_step": 134, "train_info/time_within_train_step": 27.839051246643066, "step": 134}
{"train_info/time_between_train_steps": 0.005713701248168945, "step": 134}
{"info/global_step": 135, "train_info/time_within_train_step": 27.796879768371582, "step": 135}
{"train_info/time_between_train_steps": 0.005947113037109375, "step": 135}
{"train_info/time_between_train_steps": 20.622538805007935, "step": 135}
{"info/global_step": 136, "train_info/time_within_train_step": 27.759724617004395, "step": 136}
{"train_info/time_between_train_steps": 0.010233879089355469, "step": 136}
{"info/global_step": 137, "train_info/time_within_train_step": 27.94436264038086, "step": 137}
{"train_info/time_between_train_steps": 0.010376453399658203, "step": 137}
{"info/global_step": 138, "train_info/time_within_train_step": 27.8594388961792, "step": 138}
{"train_info/time_between_train_steps": 0.010729312896728516, "step": 138}
{"info/global_step": 139, "train_info/time_within_train_step": 27.90585732460022, "step": 139}
{"train_info/time_between_train_steps": 0.005295753479003906, "step": 139}
{"info/global_step": 140, "train_info/time_within_train_step": 27.78616762161255, "step": 140}
{"train_info/time_between_train_steps": 0.005437612533569336, "step": 140}
{"info/global_step": 141, "train_info/time_within_train_step": 27.947160243988037, "step": 141}
{"train_info/time_between_train_steps": 0.005507707595825195, "step": 141}
{"info/global_step": 142, "train_info/time_within_train_step": 27.807966470718384, "step": 142}
{"train_info/time_between_train_steps": 0.0054378509521484375, "step": 142}
{"info/global_step": 143, "train_info/time_within_train_step": 27.817466259002686, "step": 143}
{"train_info/time_between_train_steps": 0.005610466003417969, "step": 143}
{"info/global_step": 144, "train_info/time_within_train_step": 27.828092098236084, "step": 144}
{"train_info/time_between_train_steps": 0.0052776336669921875, "step": 144}
{"info/global_step": 145, "train_info/time_within_train_step": 27.77499270439148, "step": 145}
{"train_info/time_between_train_steps": 0.005235433578491211, "step": 145}
{"info/global_step": 146, "train_info/time_within_train_step": 27.820592880249023, "step": 146}
{"train_info/time_between_train_steps": 0.005173444747924805, "step": 146}
{"info/global_step": 147, "train_info/time_within_train_step": 27.769060850143433, "step": 147}
{"train_info/time_between_train_steps": 0.005511760711669922, "step": 147}
{"info/global_step": 148, "train_info/time_within_train_step": 27.814704418182373, "step": 148}
{"train_info/time_between_train_steps": 0.005424022674560547, "step": 148}
{"info/global_step": 149, "train_info/time_within_train_step": 27.808425426483154, "step": 149}
{"train_info/time_between_train_steps": 0.005387783050537109, "step": 149}
{"info/global_step": 150, "train_info/time_within_train_step": 27.790331840515137, "step": 150}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733841747, "_runtime": 4281}, "step": 150}
{"logs": {"train/loss": 6.1549, "train/learning_rate": 0.0005833333333333333, "train/epoch": 5.01, "_timestamp": 1733841747, "_runtime": 4281}, "step": 150}
{"train_info/time_between_train_steps": 0.007974386215209961, "step": 150}
{"info/global_step": 151, "train_info/time_within_train_step": 27.77284002304077, "step": 151}
{"train_info/time_between_train_steps": 0.005398988723754883, "step": 151}
{"info/global_step": 152, "train_info/time_within_train_step": 27.778287172317505, "step": 152}
{"train_info/time_between_train_steps": 0.010795116424560547, "step": 152}
{"info/global_step": 153, "train_info/time_within_train_step": 27.807738780975342, "step": 153}
{"train_info/time_between_train_steps": 0.005260944366455078, "step": 153}
{"info/global_step": 154, "train_info/time_within_train_step": 27.84944200515747, "step": 154}
{"train_info/time_between_train_steps": 0.005903720855712891, "step": 154}
{"info/global_step": 155, "train_info/time_within_train_step": 27.783904552459717, "step": 155}
{"train_info/time_between_train_steps": 0.0051898956298828125, "step": 155}
{"info/global_step": 156, "train_info/time_within_train_step": 27.752029418945312, "step": 156}
{"train_info/time_between_train_steps": 0.005116939544677734, "step": 156}
{"info/global_step": 157, "train_info/time_within_train_step": 27.788411617279053, "step": 157}
{"train_info/time_between_train_steps": 0.005337953567504883, "step": 157}
{"info/global_step": 158, "train_info/time_within_train_step": 27.78265690803528, "step": 158}
{"train_info/time_between_train_steps": 0.005337953567504883, "step": 158}
{"info/global_step": 159, "train_info/time_within_train_step": 27.777082920074463, "step": 159}
{"train_info/time_between_train_steps": 0.0054492950439453125, "step": 159}
{"info/global_step": 160, "train_info/time_within_train_step": 27.795780897140503, "step": 160}
{"train_info/time_between_train_steps": 0.005697965621948242, "step": 160}
{"info/global_step": 161, "train_info/time_within_train_step": 27.791589736938477, "step": 161}
{"train_info/time_between_train_steps": 0.0056610107421875, "step": 161}
{"info/global_step": 162, "train_info/time_within_train_step": 27.792977809906006, "step": 162}
{"train_info/time_between_train_steps": 0.005780696868896484, "step": 162}
{"train_info/time_between_train_steps": 20.668280363082886, "step": 162}
{"info/global_step": 163, "train_info/time_within_train_step": 27.783740282058716, "step": 163}
{"train_info/time_between_train_steps": 0.0049037933349609375, "step": 163}
{"info/global_step": 164, "train_info/time_within_train_step": 27.93974494934082, "step": 164}
{"train_info/time_between_train_steps": 0.005199432373046875, "step": 164}
{"info/global_step": 165, "train_info/time_within_train_step": 27.79984140396118, "step": 165}
{"train_info/time_between_train_steps": 0.005215167999267578, "step": 165}
{"info/global_step": 166, "train_info/time_within_train_step": 27.906408548355103, "step": 166}
{"train_info/time_between_train_steps": 0.005331277847290039, "step": 166}
{"info/global_step": 167, "train_info/time_within_train_step": 27.78060269355774, "step": 167}
{"train_info/time_between_train_steps": 0.0055234432220458984, "step": 167}
{"info/global_step": 168, "train_info/time_within_train_step": 27.97565507888794, "step": 168}
{"train_info/time_between_train_steps": 0.005685567855834961, "step": 168}
{"info/global_step": 169, "train_info/time_within_train_step": 27.901318788528442, "step": 169}
{"train_info/time_between_train_steps": 0.005725383758544922, "step": 169}
{"info/global_step": 170, "train_info/time_within_train_step": 27.827449083328247, "step": 170}
{"train_info/time_between_train_steps": 0.005342006683349609, "step": 170}
{"info/global_step": 171, "train_info/time_within_train_step": 27.7829852104187, "step": 171}
{"train_info/time_between_train_steps": 0.0053708553314208984, "step": 171}
{"info/global_step": 172, "train_info/time_within_train_step": 27.87431573867798, "step": 172}
{"train_info/time_between_train_steps": 0.005422830581665039, "step": 172}
{"info/global_step": 173, "train_info/time_within_train_step": 27.784424304962158, "step": 173}
{"train_info/time_between_train_steps": 0.0068705081939697266, "step": 173}
{"info/global_step": 174, "train_info/time_within_train_step": 27.790708780288696, "step": 174}
{"train_info/time_between_train_steps": 0.0053560733795166016, "step": 174}
{"info/global_step": 175, "train_info/time_within_train_step": 27.793811798095703, "step": 175}
{"train_info/time_between_train_steps": 0.005135059356689453, "step": 175}
{"info/global_step": 176, "train_info/time_within_train_step": 27.772608995437622, "step": 176}
{"train_info/time_between_train_steps": 0.005182504653930664, "step": 176}
{"info/global_step": 177, "train_info/time_within_train_step": 27.816760063171387, "step": 177}
{"train_info/time_between_train_steps": 0.005373239517211914, "step": 177}
{"info/global_step": 178, "train_info/time_within_train_step": 27.8133385181427, "step": 178}
{"train_info/time_between_train_steps": 0.005644321441650391, "step": 178}
{"info/global_step": 179, "train_info/time_within_train_step": 27.801661014556885, "step": 179}
{"train_info/time_between_train_steps": 0.005604267120361328, "step": 179}
{"info/global_step": 180, "train_info/time_within_train_step": 27.79430866241455, "step": 180}
{"train_info/time_between_train_steps": 0.005341053009033203, "step": 180}
{"info/global_step": 181, "train_info/time_within_train_step": 27.941084623336792, "step": 181}
{"train_info/time_between_train_steps": 0.009958744049072266, "step": 181}
{"info/global_step": 182, "train_info/time_within_train_step": 27.832467317581177, "step": 182}
{"train_info/time_between_train_steps": 0.01006770133972168, "step": 182}
{"info/global_step": 183, "train_info/time_within_train_step": 27.766769886016846, "step": 183}
{"train_info/time_between_train_steps": 0.00525665283203125, "step": 183}
{"info/global_step": 184, "train_info/time_within_train_step": 27.837531566619873, "step": 184}
{"train_info/time_between_train_steps": 0.005311250686645508, "step": 184}
{"info/global_step": 185, "train_info/time_within_train_step": 27.784476041793823, "step": 185}
{"train_info/time_between_train_steps": 0.005507707595825195, "step": 185}
{"info/global_step": 186, "train_info/time_within_train_step": 27.928765535354614, "step": 186}
{"train_info/time_between_train_steps": 0.006604194641113281, "step": 186}
{"info/global_step": 187, "train_info/time_within_train_step": 27.814002513885498, "step": 187}
{"train_info/time_between_train_steps": 0.005678653717041016, "step": 187}
{"info/global_step": 188, "train_info/time_within_train_step": 27.798136949539185, "step": 188}
{"train_info/time_between_train_steps": 0.005987644195556641, "step": 188}
{"info/global_step": 189, "train_info/time_within_train_step": 27.79625129699707, "step": 189}
{"train_info/time_between_train_steps": 0.006533384323120117, "step": 189}
{"train_info/time_between_train_steps": 20.861188411712646, "step": 189}
{"info/global_step": 190, "train_info/time_within_train_step": 27.771064519882202, "step": 190}
{"train_info/time_between_train_steps": 0.005881786346435547, "step": 190}
{"info/global_step": 191, "train_info/time_within_train_step": 27.95099377632141, "step": 191}
{"train_info/time_between_train_steps": 0.005635261535644531, "step": 191}
{"info/global_step": 192, "train_info/time_within_train_step": 27.777775764465332, "step": 192}
{"train_info/time_between_train_steps": 0.005402088165283203, "step": 192}
{"info/global_step": 193, "train_info/time_within_train_step": 27.995983839035034, "step": 193}
{"train_info/time_between_train_steps": 0.0055005550384521484, "step": 193}
{"info/global_step": 194, "train_info/time_within_train_step": 27.756285905838013, "step": 194}
{"train_info/time_between_train_steps": 0.005264997482299805, "step": 194}
{"info/global_step": 195, "train_info/time_within_train_step": 28.060556411743164, "step": 195}
{"train_info/time_between_train_steps": 0.006955146789550781, "step": 195}
{"info/global_step": 196, "train_info/time_within_train_step": 27.834251880645752, "step": 196}
{"train_info/time_between_train_steps": 0.006435871124267578, "step": 196}
{"info/global_step": 197, "train_info/time_within_train_step": 28.047918558120728, "step": 197}
{"train_info/time_between_train_steps": 0.01115870475769043, "step": 197}
{"info/global_step": 198, "train_info/time_within_train_step": 27.809983491897583, "step": 198}
{"train_info/time_between_train_steps": 0.00640559196472168, "step": 198}
{"info/global_step": 199, "train_info/time_within_train_step": 27.908466339111328, "step": 199}
{"train_info/time_between_train_steps": 0.007135629653930664, "step": 199}
{"info/global_step": 200, "train_info/time_within_train_step": 27.802139282226562, "step": 200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733843181, "_runtime": 5715}, "step": 200}
{"logs": {"train/loss": 5.99, "train/learning_rate": 0.0005555555555555556, "train/epoch": 7.01, "_timestamp": 1733843181, "_runtime": 5715}, "step": 200}
{"train_info/time_between_train_steps": 4.1576526165008545, "step": 200}
{"info/global_step": 201, "train_info/time_within_train_step": 27.797770738601685, "step": 201}
{"train_info/time_between_train_steps": 0.006787300109863281, "step": 201}
{"info/global_step": 202, "train_info/time_within_train_step": 27.789104461669922, "step": 202}
{"train_info/time_between_train_steps": 0.005521059036254883, "step": 202}
{"info/global_step": 203, "train_info/time_within_train_step": 27.774933338165283, "step": 203}
{"train_info/time_between_train_steps": 0.005544185638427734, "step": 203}
{"info/global_step": 204, "train_info/time_within_train_step": 27.78113579750061, "step": 204}
{"train_info/time_between_train_steps": 0.005602836608886719, "step": 204}
{"info/global_step": 205, "train_info/time_within_train_step": 27.774287223815918, "step": 205}
{"train_info/time_between_train_steps": 0.010415077209472656, "step": 205}
{"info/global_step": 206, "train_info/time_within_train_step": 27.780940771102905, "step": 206}
{"train_info/time_between_train_steps": 0.0058629512786865234, "step": 206}
{"info/global_step": 207, "train_info/time_within_train_step": 27.78213381767273, "step": 207}
{"train_info/time_between_train_steps": 0.005545377731323242, "step": 207}
{"info/global_step": 208, "train_info/time_within_train_step": 27.824424982070923, "step": 208}
{"train_info/time_between_train_steps": 0.00556635856628418, "step": 208}
{"info/global_step": 209, "train_info/time_within_train_step": 27.781598567962646, "step": 209}
{"train_info/time_between_train_steps": 0.0054454803466796875, "step": 209}
{"info/global_step": 210, "train_info/time_within_train_step": 27.81200361251831, "step": 210}
{"train_info/time_between_train_steps": 0.00530242919921875, "step": 210}
{"info/global_step": 211, "train_info/time_within_train_step": 27.777809619903564, "step": 211}
{"train_info/time_between_train_steps": 0.005836963653564453, "step": 211}
{"info/global_step": 212, "train_info/time_within_train_step": 27.762998819351196, "step": 212}
{"train_info/time_between_train_steps": 0.005067586898803711, "step": 212}
{"info/global_step": 213, "train_info/time_within_train_step": 27.793835163116455, "step": 213}
{"train_info/time_between_train_steps": 0.0053026676177978516, "step": 213}
{"info/global_step": 214, "train_info/time_within_train_step": 27.769960165023804, "step": 214}
{"train_info/time_between_train_steps": 0.010227203369140625, "step": 214}
{"info/global_step": 215, "train_info/time_within_train_step": 27.870702505111694, "step": 215}
{"train_info/time_between_train_steps": 0.005346775054931641, "step": 215}
{"info/global_step": 216, "train_info/time_within_train_step": 27.80680227279663, "step": 216}
{"train_info/time_between_train_steps": 0.0053675174713134766, "step": 216}
{"train_info/time_between_train_steps": 20.589505672454834, "step": 216}
{"info/global_step": 217, "train_info/time_within_train_step": 27.777304887771606, "step": 217}
{"train_info/time_between_train_steps": 0.006784200668334961, "step": 217}
{"info/global_step": 218, "train_info/time_within_train_step": 27.916396379470825, "step": 218}
{"train_info/time_between_train_steps": 0.005280733108520508, "step": 218}
{"info/global_step": 219, "train_info/time_within_train_step": 27.776479482650757, "step": 219}
{"train_info/time_between_train_steps": 0.005284786224365234, "step": 219}
{"info/global_step": 220, "train_info/time_within_train_step": 27.902915954589844, "step": 220}
{"train_info/time_between_train_steps": 0.0052030086517333984, "step": 220}
{"info/global_step": 221, "train_info/time_within_train_step": 27.78316068649292, "step": 221}
{"train_info/time_between_train_steps": 0.005256175994873047, "step": 221}
{"info/global_step": 222, "train_info/time_within_train_step": 27.978546619415283, "step": 222}
{"train_info/time_between_train_steps": 0.005378246307373047, "step": 222}
{"info/global_step": 223, "train_info/time_within_train_step": 27.84538459777832, "step": 223}
{"train_info/time_between_train_steps": 0.005809783935546875, "step": 223}
{"info/global_step": 224, "train_info/time_within_train_step": 27.818939685821533, "step": 224}
{"train_info/time_between_train_steps": 0.005376338958740234, "step": 224}
{"info/global_step": 225, "train_info/time_within_train_step": 27.84450101852417, "step": 225}
{"train_info/time_between_train_steps": 0.005414009094238281, "step": 225}
{"info/global_step": 226, "train_info/time_within_train_step": 27.78175663948059, "step": 226}
{"train_info/time_between_train_steps": 0.0056304931640625, "step": 226}
{"info/global_step": 227, "train_info/time_within_train_step": 27.774110078811646, "step": 227}
{"train_info/time_between_train_steps": 0.005397796630859375, "step": 227}
{"info/global_step": 228, "train_info/time_within_train_step": 27.80106544494629, "step": 228}
{"train_info/time_between_train_steps": 0.004994869232177734, "step": 228}
{"info/global_step": 229, "train_info/time_within_train_step": 27.770222425460815, "step": 229}
{"train_info/time_between_train_steps": 0.005409717559814453, "step": 229}
{"info/global_step": 230, "train_info/time_within_train_step": 27.866915702819824, "step": 230}
{"train_info/time_between_train_steps": 0.005426645278930664, "step": 230}
{"info/global_step": 231, "train_info/time_within_train_step": 27.77304744720459, "step": 231}
{"train_info/time_between_train_steps": 0.0050220489501953125, "step": 231}
{"info/global_step": 232, "train_info/time_within_train_step": 27.74883484840393, "step": 232}
{"train_info/time_between_train_steps": 0.005315065383911133, "step": 232}
{"info/global_step": 233, "train_info/time_within_train_step": 27.786521911621094, "step": 233}
{"train_info/time_between_train_steps": 0.00563812255859375, "step": 233}
{"info/global_step": 234, "train_info/time_within_train_step": 27.932568788528442, "step": 234}
{"train_info/time_between_train_steps": 0.005163669586181641, "step": 234}
{"info/global_step": 235, "train_info/time_within_train_step": 27.838732481002808, "step": 235}
{"train_info/time_between_train_steps": 0.005042552947998047, "step": 235}
{"info/global_step": 236, "train_info/time_within_train_step": 27.78341579437256, "step": 236}
{"train_info/time_between_train_steps": 0.005057096481323242, "step": 236}
{"info/global_step": 237, "train_info/time_within_train_step": 27.76950454711914, "step": 237}
{"train_info/time_between_train_steps": 0.00567936897277832, "step": 237}
{"info/global_step": 238, "train_info/time_within_train_step": 27.780670642852783, "step": 238}
{"train_info/time_between_train_steps": 0.005253314971923828, "step": 238}
{"info/global_step": 239, "train_info/time_within_train_step": 27.77419424057007, "step": 239}
{"train_info/time_between_train_steps": 0.005175113677978516, "step": 239}
{"info/global_step": 240, "train_info/time_within_train_step": 27.77387523651123, "step": 240}
{"train_info/time_between_train_steps": 0.005021095275878906, "step": 240}
{"info/global_step": 241, "train_info/time_within_train_step": 27.797873735427856, "step": 241}
{"train_info/time_between_train_steps": 0.005230426788330078, "step": 241}
{"info/global_step": 242, "train_info/time_within_train_step": 27.80621910095215, "step": 242}
{"train_info/time_between_train_steps": 0.010744094848632812, "step": 242}
{"info/global_step": 243, "train_info/time_within_train_step": 27.84630274772644, "step": 243}
{"train_info/time_between_train_steps": 0.00556182861328125, "step": 243}
{"train_info/time_between_train_steps": 20.942267656326294, "step": 243}
{"info/global_step": 244, "train_info/time_within_train_step": 27.76746106147766, "step": 244}
{"train_info/time_between_train_steps": 0.010721445083618164, "step": 244}
{"info/global_step": 245, "train_info/time_within_train_step": 28.068228006362915, "step": 245}
{"train_info/time_between_train_steps": 0.005939483642578125, "step": 245}
{"info/global_step": 246, "train_info/time_within_train_step": 27.797964096069336, "step": 246}
{"train_info/time_between_train_steps": 0.0054416656494140625, "step": 246}
{"info/global_step": 247, "train_info/time_within_train_step": 28.004786014556885, "step": 247}
{"train_info/time_between_train_steps": 0.005405902862548828, "step": 247}
{"info/global_step": 248, "train_info/time_within_train_step": 27.780683755874634, "step": 248}
{"train_info/time_between_train_steps": 0.011178970336914062, "step": 248}
{"info/global_step": 249, "train_info/time_within_train_step": 27.900601625442505, "step": 249}
{"train_info/time_between_train_steps": 0.00521540641784668, "step": 249}
{"info/global_step": 250, "train_info/time_within_train_step": 27.759706258773804, "step": 250}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733844618, "_runtime": 7152}, "step": 250}
{"logs": {"train/loss": 5.8497, "train/learning_rate": 0.0005277777777777777, "train/epoch": 9.01, "_timestamp": 1733844618, "_runtime": 7152}, "step": 250}
{"train_info/time_between_train_steps": 0.013261079788208008, "step": 250}
{"info/global_step": 251, "train_info/time_within_train_step": 27.861596822738647, "step": 251}
{"train_info/time_between_train_steps": 0.005546092987060547, "step": 251}
{"info/global_step": 252, "train_info/time_within_train_step": 27.78571653366089, "step": 252}
{"train_info/time_between_train_steps": 0.005548954010009766, "step": 252}
{"info/global_step": 253, "train_info/time_within_train_step": 27.754745721817017, "step": 253}
{"train_info/time_between_train_steps": 0.005223512649536133, "step": 253}
{"info/global_step": 254, "train_info/time_within_train_step": 27.76583766937256, "step": 254}
{"train_info/time_between_train_steps": 0.005166530609130859, "step": 254}
{"info/global_step": 255, "train_info/time_within_train_step": 27.78714919090271, "step": 255}
{"train_info/time_between_train_steps": 0.00504755973815918, "step": 255}
{"info/global_step": 256, "train_info/time_within_train_step": 27.781872987747192, "step": 256}
{"train_info/time_between_train_steps": 0.005993366241455078, "step": 256}
{"info/global_step": 257, "train_info/time_within_train_step": 27.781855583190918, "step": 257}
{"train_info/time_between_train_steps": 0.005723237991333008, "step": 257}
{"info/global_step": 258, "train_info/time_within_train_step": 27.76736569404602, "step": 258}
{"train_info/time_between_train_steps": 0.005758523941040039, "step": 258}
{"info/global_step": 259, "train_info/time_within_train_step": 27.7641863822937, "step": 259}
{"train_info/time_between_train_steps": 0.010204315185546875, "step": 259}
{"info/global_step": 260, "train_info/time_within_train_step": 27.846733570098877, "step": 260}
{"train_info/time_between_train_steps": 0.010477542877197266, "step": 260}
{"info/global_step": 261, "train_info/time_within_train_step": 27.76079559326172, "step": 261}
{"train_info/time_between_train_steps": 0.005419015884399414, "step": 261}
{"info/global_step": 262, "train_info/time_within_train_step": 27.760104179382324, "step": 262}
{"train_info/time_between_train_steps": 0.005988597869873047, "step": 262}
{"info/global_step": 263, "train_info/time_within_train_step": 27.778953313827515, "step": 263}
{"train_info/time_between_train_steps": 0.005586385726928711, "step": 263}
{"info/global_step": 264, "train_info/time_within_train_step": 27.762701272964478, "step": 264}
{"train_info/time_between_train_steps": 0.0054280757904052734, "step": 264}
{"info/global_step": 265, "train_info/time_within_train_step": 27.819160223007202, "step": 265}
{"train_info/time_between_train_steps": 0.010360240936279297, "step": 265}
{"info/global_step": 266, "train_info/time_within_train_step": 27.787659883499146, "step": 266}
{"train_info/time_between_train_steps": 0.010061264038085938, "step": 266}
{"info/global_step": 267, "train_info/time_within_train_step": 27.7621648311615, "step": 267}
{"train_info/time_between_train_steps": 0.0057294368743896484, "step": 267}
{"info/global_step": 268, "train_info/time_within_train_step": 27.772554874420166, "step": 268}
{"train_info/time_between_train_steps": 0.005652904510498047, "step": 268}
{"info/global_step": 269, "train_info/time_within_train_step": 27.778602361679077, "step": 269}
{"train_info/time_between_train_steps": 0.006760835647583008, "step": 269}
{"info/global_step": 270, "train_info/time_within_train_step": 27.800073623657227, "step": 270}
{"train_info/time_between_train_steps": 0.005889892578125, "step": 270}
{"train_info/time_between_train_steps": 21.023128747940063, "step": 270}
{"info/global_step": 271, "train_info/time_within_train_step": 27.825814485549927, "step": 271}
{"train_info/time_between_train_steps": 0.011151313781738281, "step": 271}
{"info/global_step": 272, "train_info/time_within_train_step": 28.070935487747192, "step": 272}
{"train_info/time_between_train_steps": 0.0054666996002197266, "step": 272}
{"info/global_step": 273, "train_info/time_within_train_step": 27.793835878372192, "step": 273}
{"train_info/time_between_train_steps": 0.00546717643737793, "step": 273}
{"info/global_step": 274, "train_info/time_within_train_step": 27.972053289413452, "step": 274}
{"train_info/time_between_train_steps": 0.005799531936645508, "step": 274}
{"info/global_step": 275, "train_info/time_within_train_step": 27.938775777816772, "step": 275}
{"train_info/time_between_train_steps": 0.00563359260559082, "step": 275}
{"info/global_step": 276, "train_info/time_within_train_step": 28.00203013420105, "step": 276}
{"train_info/time_between_train_steps": 0.0056629180908203125, "step": 276}
{"info/global_step": 277, "train_info/time_within_train_step": 27.768211126327515, "step": 277}
{"train_info/time_between_train_steps": 0.013026714324951172, "step": 277}
{"info/global_step": 278, "train_info/time_within_train_step": 27.832865476608276, "step": 278}
{"train_info/time_between_train_steps": 0.005602359771728516, "step": 278}
{"info/global_step": 279, "train_info/time_within_train_step": 27.76181435585022, "step": 279}
{"train_info/time_between_train_steps": 0.010231256484985352, "step": 279}
{"info/global_step": 280, "train_info/time_within_train_step": 27.734403133392334, "step": 280}
{"train_info/time_between_train_steps": 0.004944324493408203, "step": 280}
{"info/global_step": 281, "train_info/time_within_train_step": 27.795332431793213, "step": 281}
{"train_info/time_between_train_steps": 0.005214214324951172, "step": 281}
{"info/global_step": 282, "train_info/time_within_train_step": 27.741026878356934, "step": 282}
{"train_info/time_between_train_steps": 0.005294084548950195, "step": 282}
{"info/global_step": 283, "train_info/time_within_train_step": 27.740252256393433, "step": 283}
{"train_info/time_between_train_steps": 0.005507946014404297, "step": 283}
{"info/global_step": 284, "train_info/time_within_train_step": 27.73820471763611, "step": 284}
{"train_info/time_between_train_steps": 0.005347490310668945, "step": 284}
{"info/global_step": 285, "train_info/time_within_train_step": 27.765541553497314, "step": 285}
{"train_info/time_between_train_steps": 0.005200862884521484, "step": 285}
{"info/global_step": 286, "train_info/time_within_train_step": 27.74992561340332, "step": 286}
{"train_info/time_between_train_steps": 0.005232810974121094, "step": 286}
{"info/global_step": 287, "train_info/time_within_train_step": 27.757882833480835, "step": 287}
{"train_info/time_between_train_steps": 0.01061868667602539, "step": 287}
{"info/global_step": 288, "train_info/time_within_train_step": 27.75575852394104, "step": 288}
{"train_info/time_between_train_steps": 0.005313873291015625, "step": 288}
{"info/global_step": 289, "train_info/time_within_train_step": 27.759763479232788, "step": 289}
{"train_info/time_between_train_steps": 0.005257129669189453, "step": 289}
{"info/global_step": 290, "train_info/time_within_train_step": 27.749056816101074, "step": 290}
{"train_info/time_between_train_steps": 0.005181312561035156, "step": 290}
{"info/global_step": 291, "train_info/time_within_train_step": 27.8547420501709, "step": 291}
{"train_info/time_between_train_steps": 0.0068743228912353516, "step": 291}
{"info/global_step": 292, "train_info/time_within_train_step": 27.74655842781067, "step": 292}
{"train_info/time_between_train_steps": 0.005380868911743164, "step": 292}
{"info/global_step": 293, "train_info/time_within_train_step": 27.734779119491577, "step": 293}
{"train_info/time_between_train_steps": 0.005224704742431641, "step": 293}
{"info/global_step": 294, "train_info/time_within_train_step": 27.73393225669861, "step": 294}
{"train_info/time_between_train_steps": 0.005283832550048828, "step": 294}
{"info/global_step": 295, "train_info/time_within_train_step": 27.734158754348755, "step": 295}
{"train_info/time_between_train_steps": 0.005605459213256836, "step": 295}
{"info/global_step": 296, "train_info/time_within_train_step": 27.745798110961914, "step": 296}
{"train_info/time_between_train_steps": 0.005578756332397461, "step": 296}
{"info/global_step": 297, "train_info/time_within_train_step": 27.769197702407837, "step": 297}
{"train_info/time_between_train_steps": 0.01742100715637207, "step": 297}
{"train_info/time_between_train_steps": 20.423726797103882, "step": 297}
{"info/global_step": 298, "train_info/time_within_train_step": 27.716364860534668, "step": 298}
{"train_info/time_between_train_steps": 0.0048770904541015625, "step": 298}
{"info/global_step": 299, "train_info/time_within_train_step": 27.822099447250366, "step": 299}
{"train_info/time_between_train_steps": 0.0049359798431396484, "step": 299}
{"info/global_step": 300, "train_info/time_within_train_step": 27.729496002197266, "step": 300}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733846049, "_runtime": 8583}, "step": 300}
{"logs": {"train/loss": 5.6576, "train/learning_rate": 0.0005, "train/epoch": 11.0, "_timestamp": 1733846049, "_runtime": 8583}, "step": 300}
{"train_info/time_between_train_steps": 2.7539329528808594, "step": 300}
{"info/global_step": 301, "train_info/time_within_train_step": 27.880887746810913, "step": 301}
{"train_info/time_between_train_steps": 0.008655786514282227, "step": 301}
{"info/global_step": 302, "train_info/time_within_train_step": 27.886101245880127, "step": 302}
{"train_info/time_between_train_steps": 0.005267143249511719, "step": 302}
{"info/global_step": 303, "train_info/time_within_train_step": 27.895750045776367, "step": 303}
{"train_info/time_between_train_steps": 0.005275726318359375, "step": 303}
{"info/global_step": 304, "train_info/time_within_train_step": 27.73401379585266, "step": 304}
{"train_info/time_between_train_steps": 0.005382537841796875, "step": 304}
{"info/global_step": 305, "train_info/time_within_train_step": 27.826446533203125, "step": 305}
{"train_info/time_between_train_steps": 0.005269050598144531, "step": 305}
{"info/global_step": 306, "train_info/time_within_train_step": 27.84080982208252, "step": 306}
{"train_info/time_between_train_steps": 0.005003929138183594, "step": 306}
{"info/global_step": 307, "train_info/time_within_train_step": 27.721405029296875, "step": 307}
{"train_info/time_between_train_steps": 0.007535696029663086, "step": 307}
{"info/global_step": 308, "train_info/time_within_train_step": 27.743082284927368, "step": 308}
{"train_info/time_between_train_steps": 0.0051839351654052734, "step": 308}
{"info/global_step": 309, "train_info/time_within_train_step": 27.722338676452637, "step": 309}
{"train_info/time_between_train_steps": 0.0051746368408203125, "step": 309}
{"info/global_step": 310, "train_info/time_within_train_step": 27.720990896224976, "step": 310}
{"train_info/time_between_train_steps": 0.005125522613525391, "step": 310}
{"info/global_step": 311, "train_info/time_within_train_step": 27.73161220550537, "step": 311}
{"train_info/time_between_train_steps": 0.005139589309692383, "step": 311}
{"info/global_step": 312, "train_info/time_within_train_step": 27.743971586227417, "step": 312}
{"train_info/time_between_train_steps": 0.005072116851806641, "step": 312}
{"info/global_step": 313, "train_info/time_within_train_step": 27.73596215248108, "step": 313}
{"train_info/time_between_train_steps": 0.005125284194946289, "step": 313}
{"info/global_step": 314, "train_info/time_within_train_step": 27.7408447265625, "step": 314}
{"train_info/time_between_train_steps": 0.010077953338623047, "step": 314}
{"info/global_step": 315, "train_info/time_within_train_step": 27.7279212474823, "step": 315}
{"train_info/time_between_train_steps": 0.01007533073425293, "step": 315}
{"info/global_step": 316, "train_info/time_within_train_step": 27.74484419822693, "step": 316}
{"train_info/time_between_train_steps": 0.0050694942474365234, "step": 316}
{"info/global_step": 317, "train_info/time_within_train_step": 27.717705011367798, "step": 317}
{"train_info/time_between_train_steps": 0.0052433013916015625, "step": 317}
{"info/global_step": 318, "train_info/time_within_train_step": 27.732136249542236, "step": 318}
{"train_info/time_between_train_steps": 0.010149955749511719, "step": 318}
{"info/global_step": 319, "train_info/time_within_train_step": 27.719392776489258, "step": 319}
{"train_info/time_between_train_steps": 0.00507044792175293, "step": 319}
{"info/global_step": 320, "train_info/time_within_train_step": 27.721543550491333, "step": 320}
{"train_info/time_between_train_steps": 0.004971504211425781, "step": 320}
{"info/global_step": 321, "train_info/time_within_train_step": 27.728548049926758, "step": 321}
{"train_info/time_between_train_steps": 0.005342960357666016, "step": 321}
{"info/global_step": 322, "train_info/time_within_train_step": 27.818559169769287, "step": 322}
{"train_info/time_between_train_steps": 0.0052068233489990234, "step": 322}
{"info/global_step": 323, "train_info/time_within_train_step": 27.7599778175354, "step": 323}
{"train_info/time_between_train_steps": 0.01067495346069336, "step": 323}
{"info/global_step": 324, "train_info/time_within_train_step": 27.79781723022461, "step": 324}
{"train_info/time_between_train_steps": 0.005524396896362305, "step": 324}
{"train_info/time_between_train_steps": 20.52922534942627, "step": 324}
{"info/global_step": 325, "train_info/time_within_train_step": 27.734939575195312, "step": 325}
{"train_info/time_between_train_steps": 0.00511622428894043, "step": 325}
{"info/global_step": 326, "train_info/time_within_train_step": 27.846824169158936, "step": 326}
{"train_info/time_between_train_steps": 0.004900693893432617, "step": 326}
{"info/global_step": 327, "train_info/time_within_train_step": 27.722298622131348, "step": 327}
{"train_info/time_between_train_steps": 0.004973888397216797, "step": 327}
{"info/global_step": 328, "train_info/time_within_train_step": 27.8894681930542, "step": 328}
{"train_info/time_between_train_steps": 0.00516200065612793, "step": 328}
{"info/global_step": 329, "train_info/time_within_train_step": 27.731228351593018, "step": 329}
{"train_info/time_between_train_steps": 0.0051920413970947266, "step": 329}
{"info/global_step": 330, "train_info/time_within_train_step": 27.886327981948853, "step": 330}
{"train_info/time_between_train_steps": 0.005409955978393555, "step": 330}
{"info/global_step": 331, "train_info/time_within_train_step": 28.14689016342163, "step": 331}
{"train_info/time_between_train_steps": 0.009638547897338867, "step": 331}
{"info/global_step": 332, "train_info/time_within_train_step": 27.803853511810303, "step": 332}
{"train_info/time_between_train_steps": 0.005159854888916016, "step": 332}
{"info/global_step": 333, "train_info/time_within_train_step": 27.752869844436646, "step": 333}
{"train_info/time_between_train_steps": 0.004914045333862305, "step": 333}
{"info/global_step": 334, "train_info/time_within_train_step": 27.85798478126526, "step": 334}
{"train_info/time_between_train_steps": 0.00507807731628418, "step": 334}
{"info/global_step": 335, "train_info/time_within_train_step": 27.94043755531311, "step": 335}
{"train_info/time_between_train_steps": 0.0061109066009521484, "step": 335}
{"info/global_step": 336, "train_info/time_within_train_step": 27.75639510154724, "step": 336}
{"train_info/time_between_train_steps": 0.005135297775268555, "step": 336}
{"info/global_step": 337, "train_info/time_within_train_step": 27.916022539138794, "step": 337}
{"train_info/time_between_train_steps": 0.005925178527832031, "step": 337}
{"info/global_step": 338, "train_info/time_within_train_step": 27.831701278686523, "step": 338}
{"train_info/time_between_train_steps": 0.005036592483520508, "step": 338}
{"info/global_step": 339, "train_info/time_within_train_step": 27.73387098312378, "step": 339}
{"train_info/time_between_train_steps": 0.005012035369873047, "step": 339}
{"info/global_step": 340, "train_info/time_within_train_step": 27.826111555099487, "step": 340}
{"train_info/time_between_train_steps": 0.01022648811340332, "step": 340}
{"info/global_step": 341, "train_info/time_within_train_step": 27.731702089309692, "step": 341}
{"train_info/time_between_train_steps": 0.005140781402587891, "step": 341}
{"info/global_step": 342, "train_info/time_within_train_step": 27.72467064857483, "step": 342}
{"train_info/time_between_train_steps": 0.0051801204681396484, "step": 342}
{"info/global_step": 343, "train_info/time_within_train_step": 27.744710445404053, "step": 343}
{"train_info/time_between_train_steps": 0.004996776580810547, "step": 343}
{"info/global_step": 344, "train_info/time_within_train_step": 27.74058699607849, "step": 344}
{"train_info/time_between_train_steps": 0.005035877227783203, "step": 344}
{"info/global_step": 345, "train_info/time_within_train_step": 27.812019109725952, "step": 345}
{"train_info/time_between_train_steps": 0.006716251373291016, "step": 345}
{"info/global_step": 346, "train_info/time_within_train_step": 27.883836030960083, "step": 346}
{"train_info/time_between_train_steps": 0.005408048629760742, "step": 346}
{"info/global_step": 347, "train_info/time_within_train_step": 27.864848613739014, "step": 347}
{"train_info/time_between_train_steps": 0.005125284194946289, "step": 347}
{"info/global_step": 348, "train_info/time_within_train_step": 27.7562997341156, "step": 348}
{"train_info/time_between_train_steps": 0.005705118179321289, "step": 348}
{"info/global_step": 349, "train_info/time_within_train_step": 27.809571504592896, "step": 349}
{"train_info/time_between_train_steps": 0.00543212890625, "step": 349}
{"info/global_step": 350, "train_info/time_within_train_step": 27.89029026031494, "step": 350}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733847463, "_runtime": 9997}, "step": 350}
{"logs": {"train/loss": 5.3915, "train/learning_rate": 0.00047222222222222224, "train/epoch": 12.02, "_timestamp": 1733847462, "_runtime": 9996}, "step": 350}
{"train_info/time_between_train_steps": 0.013315439224243164, "step": 350}
{"info/global_step": 351, "train_info/time_within_train_step": 28.034992456436157, "step": 351}
{"train_info/time_between_train_steps": 0.012298822402954102, "step": 351}
{"train_info/time_between_train_steps": 20.835104942321777, "step": 351}
{"info/global_step": 352, "train_info/time_within_train_step": 27.838627099990845, "step": 352}
{"train_info/time_between_train_steps": 0.004965305328369141, "step": 352}
{"info/global_step": 353, "train_info/time_within_train_step": 27.86530876159668, "step": 353}
{"train_info/time_between_train_steps": 0.005539417266845703, "step": 353}
{"info/global_step": 354, "train_info/time_within_train_step": 27.86088514328003, "step": 354}
{"train_info/time_between_train_steps": 0.005331754684448242, "step": 354}
{"info/global_step": 355, "train_info/time_within_train_step": 27.932851552963257, "step": 355}
{"train_info/time_between_train_steps": 0.005402565002441406, "step": 355}
{"info/global_step": 356, "train_info/time_within_train_step": 27.763731718063354, "step": 356}
{"train_info/time_between_train_steps": 0.005354166030883789, "step": 356}
{"info/global_step": 357, "train_info/time_within_train_step": 28.083488702774048, "step": 357}
{"train_info/time_between_train_steps": 0.010519027709960938, "step": 357}
{"info/global_step": 358, "train_info/time_within_train_step": 27.785070419311523, "step": 358}
{"train_info/time_between_train_steps": 0.005342006683349609, "step": 358}
{"info/global_step": 359, "train_info/time_within_train_step": 27.898256063461304, "step": 359}
{"train_info/time_between_train_steps": 0.010256290435791016, "step": 359}
{"info/global_step": 360, "train_info/time_within_train_step": 27.761725425720215, "step": 360}
{"train_info/time_between_train_steps": 0.00529170036315918, "step": 360}
{"info/global_step": 361, "train_info/time_within_train_step": 27.79618191719055, "step": 361}
{"train_info/time_between_train_steps": 0.00996851921081543, "step": 361}
{"info/global_step": 362, "train_info/time_within_train_step": 27.965372800827026, "step": 362}
{"train_info/time_between_train_steps": 0.009181022644042969, "step": 362}
{"info/global_step": 363, "train_info/time_within_train_step": 27.749699115753174, "step": 363}
{"train_info/time_between_train_steps": 0.005236625671386719, "step": 363}
{"info/global_step": 364, "train_info/time_within_train_step": 27.748154401779175, "step": 364}
{"train_info/time_between_train_steps": 0.005272626876831055, "step": 364}
{"info/global_step": 365, "train_info/time_within_train_step": 27.742531538009644, "step": 365}
{"train_info/time_between_train_steps": 0.005281925201416016, "step": 365}
{"info/global_step": 366, "train_info/time_within_train_step": 27.740730047225952, "step": 366}
{"train_info/time_between_train_steps": 0.005228996276855469, "step": 366}
{"info/global_step": 367, "train_info/time_within_train_step": 27.970027685165405, "step": 367}
{"train_info/time_between_train_steps": 0.009281635284423828, "step": 367}
{"info/global_step": 368, "train_info/time_within_train_step": 27.757256984710693, "step": 368}
{"train_info/time_between_train_steps": 0.005117654800415039, "step": 368}
{"info/global_step": 369, "train_info/time_within_train_step": 27.748980283737183, "step": 369}
{"train_info/time_between_train_steps": 0.005200624465942383, "step": 369}
{"info/global_step": 370, "train_info/time_within_train_step": 27.765353441238403, "step": 370}
{"train_info/time_between_train_steps": 0.005095005035400391, "step": 370}
{"info/global_step": 371, "train_info/time_within_train_step": 27.73067331314087, "step": 371}
{"train_info/time_between_train_steps": 0.005021810531616211, "step": 371}
{"info/global_step": 372, "train_info/time_within_train_step": 27.72425079345703, "step": 372}
{"train_info/time_between_train_steps": 0.005029439926147461, "step": 372}
{"info/global_step": 373, "train_info/time_within_train_step": 27.752453804016113, "step": 373}
{"train_info/time_between_train_steps": 0.005039691925048828, "step": 373}
{"info/global_step": 374, "train_info/time_within_train_step": 27.799493551254272, "step": 374}
{"train_info/time_between_train_steps": 0.010115861892700195, "step": 374}
{"info/global_step": 375, "train_info/time_within_train_step": 27.857868194580078, "step": 375}
{"train_info/time_between_train_steps": 0.012094259262084961, "step": 375}
{"info/global_step": 376, "train_info/time_within_train_step": 27.82172393798828, "step": 376}
{"train_info/time_between_train_steps": 0.005137443542480469, "step": 376}
{"info/global_step": 377, "train_info/time_within_train_step": 27.779067754745483, "step": 377}
{"train_info/time_between_train_steps": 0.009011268615722656, "step": 377}
{"info/global_step": 378, "train_info/time_within_train_step": 27.904896020889282, "step": 378}
{"train_info/time_between_train_steps": 0.005731821060180664, "step": 378}
{"train_info/time_between_train_steps": 20.576889038085938, "step": 378}
{"info/global_step": 379, "train_info/time_within_train_step": 27.994921445846558, "step": 379}
{"train_info/time_between_train_steps": 0.009894609451293945, "step": 379}
{"info/global_step": 380, "train_info/time_within_train_step": 27.895705938339233, "step": 380}
{"train_info/time_between_train_steps": 0.004934072494506836, "step": 380}
{"info/global_step": 381, "train_info/time_within_train_step": 27.753315687179565, "step": 381}
{"train_info/time_between_train_steps": 0.00986170768737793, "step": 381}
{"info/global_step": 382, "train_info/time_within_train_step": 28.091212511062622, "step": 382}
{"train_info/time_between_train_steps": 0.005196809768676758, "step": 382}
{"info/global_step": 383, "train_info/time_within_train_step": 27.878876209259033, "step": 383}
{"train_info/time_between_train_steps": 0.010180234909057617, "step": 383}
{"info/global_step": 384, "train_info/time_within_train_step": 27.96492576599121, "step": 384}
{"train_info/time_between_train_steps": 0.00519251823425293, "step": 384}
{"info/global_step": 385, "train_info/time_within_train_step": 27.899820804595947, "step": 385}
{"train_info/time_between_train_steps": 0.006366729736328125, "step": 385}
{"info/global_step": 386, "train_info/time_within_train_step": 27.786014556884766, "step": 386}
{"train_info/time_between_train_steps": 0.005334377288818359, "step": 386}
{"info/global_step": 387, "train_info/time_within_train_step": 27.8052339553833, "step": 387}
{"train_info/time_between_train_steps": 0.004858493804931641, "step": 387}
{"info/global_step": 388, "train_info/time_within_train_step": 27.762908458709717, "step": 388}
{"train_info/time_between_train_steps": 0.005022287368774414, "step": 388}
{"info/global_step": 389, "train_info/time_within_train_step": 27.865958213806152, "step": 389}
{"train_info/time_between_train_steps": 0.011814355850219727, "step": 389}
{"info/global_step": 390, "train_info/time_within_train_step": 27.805355072021484, "step": 390}
{"train_info/time_between_train_steps": 0.005197286605834961, "step": 390}
{"info/global_step": 391, "train_info/time_within_train_step": 27.729746341705322, "step": 391}
{"train_info/time_between_train_steps": 0.005089998245239258, "step": 391}
{"info/global_step": 392, "train_info/time_within_train_step": 27.747085094451904, "step": 392}
{"train_info/time_between_train_steps": 0.005151033401489258, "step": 392}
{"info/global_step": 393, "train_info/time_within_train_step": 27.73450779914856, "step": 393}
{"train_info/time_between_train_steps": 0.005227327346801758, "step": 393}
{"info/global_step": 394, "train_info/time_within_train_step": 27.737751483917236, "step": 394}
{"train_info/time_between_train_steps": 0.005028963088989258, "step": 394}
{"info/global_step": 395, "train_info/time_within_train_step": 27.813656091690063, "step": 395}
{"train_info/time_between_train_steps": 0.0050811767578125, "step": 395}
{"info/global_step": 396, "train_info/time_within_train_step": 27.73879098892212, "step": 396}
{"train_info/time_between_train_steps": 0.010061979293823242, "step": 396}
{"info/global_step": 397, "train_info/time_within_train_step": 27.756526231765747, "step": 397}
{"train_info/time_between_train_steps": 0.005067348480224609, "step": 397}
{"info/global_step": 398, "train_info/time_within_train_step": 27.85475730895996, "step": 398}
{"train_info/time_between_train_steps": 0.009316682815551758, "step": 398}
{"info/global_step": 399, "train_info/time_within_train_step": 27.949864387512207, "step": 399}
{"train_info/time_between_train_steps": 0.014608144760131836, "step": 399}
{"info/global_step": 400, "train_info/time_within_train_step": 27.76034903526306, "step": 400}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733848896, "_runtime": 11430}, "step": 400}
{"logs": {"train/loss": 5.2919, "train/learning_rate": 0.00044444444444444436, "train/epoch": 14.02, "_timestamp": 1733848896, "_runtime": 11430}, "step": 400}
{"train_info/time_between_train_steps": 2.3271186351776123, "step": 400}
{"info/global_step": 401, "train_info/time_within_train_step": 27.758819103240967, "step": 401}
{"train_info/time_between_train_steps": 0.005136728286743164, "step": 401}
{"info/global_step": 402, "train_info/time_within_train_step": 28.02059054374695, "step": 402}
{"train_info/time_between_train_steps": 0.005312681198120117, "step": 402}
{"info/global_step": 403, "train_info/time_within_train_step": 27.729578495025635, "step": 403}
{"train_info/time_between_train_steps": 0.005157947540283203, "step": 403}
{"info/global_step": 404, "train_info/time_within_train_step": 27.74694323539734, "step": 404}
{"train_info/time_between_train_steps": 0.0054662227630615234, "step": 404}
{"info/global_step": 405, "train_info/time_within_train_step": 27.754746913909912, "step": 405}
{"train_info/time_between_train_steps": 0.005640745162963867, "step": 405}
{"train_info/time_between_train_steps": 20.535749673843384, "step": 405}
{"info/global_step": 406, "train_info/time_within_train_step": 27.781424283981323, "step": 406}
{"train_info/time_between_train_steps": 0.0050220489501953125, "step": 406}
{"info/global_step": 407, "train_info/time_within_train_step": 28.14889168739319, "step": 407}
{"train_info/time_between_train_steps": 0.009765625, "step": 407}
{"info/global_step": 408, "train_info/time_within_train_step": 27.714982986450195, "step": 408}
{"train_info/time_between_train_steps": 0.004858970642089844, "step": 408}
{"info/global_step": 409, "train_info/time_within_train_step": 27.897136449813843, "step": 409}
{"train_info/time_between_train_steps": 0.006959676742553711, "step": 409}
{"info/global_step": 410, "train_info/time_within_train_step": 27.790531635284424, "step": 410}
{"train_info/time_between_train_steps": 0.0054111480712890625, "step": 410}
{"info/global_step": 411, "train_info/time_within_train_step": 27.89456081390381, "step": 411}
{"train_info/time_between_train_steps": 0.005204200744628906, "step": 411}
{"info/global_step": 412, "train_info/time_within_train_step": 27.77201247215271, "step": 412}
{"train_info/time_between_train_steps": 0.014965057373046875, "step": 412}
{"info/global_step": 413, "train_info/time_within_train_step": 27.926236152648926, "step": 413}
{"train_info/time_between_train_steps": 0.0052411556243896484, "step": 413}
{"info/global_step": 414, "train_info/time_within_train_step": 27.75125026702881, "step": 414}
{"train_info/time_between_train_steps": 0.014559745788574219, "step": 414}
{"info/global_step": 415, "train_info/time_within_train_step": 27.768598079681396, "step": 415}
{"train_info/time_between_train_steps": 0.00505375862121582, "step": 415}
{"info/global_step": 416, "train_info/time_within_train_step": 27.741361141204834, "step": 416}
{"train_info/time_between_train_steps": 0.005194425582885742, "step": 416}
{"info/global_step": 417, "train_info/time_within_train_step": 27.783833265304565, "step": 417}
{"train_info/time_between_train_steps": 0.005002737045288086, "step": 417}
{"info/global_step": 418, "train_info/time_within_train_step": 27.794346570968628, "step": 418}
{"train_info/time_between_train_steps": 0.005013465881347656, "step": 418}
{"info/global_step": 419, "train_info/time_within_train_step": 27.74139094352722, "step": 419}
{"train_info/time_between_train_steps": 0.010063886642456055, "step": 419}
{"info/global_step": 420, "train_info/time_within_train_step": 27.776925802230835, "step": 420}
{"train_info/time_between_train_steps": 0.005097389221191406, "step": 420}
{"info/global_step": 421, "train_info/time_within_train_step": 27.738834857940674, "step": 421}
{"train_info/time_between_train_steps": 0.005158185958862305, "step": 421}
{"info/global_step": 422, "train_info/time_within_train_step": 27.874447345733643, "step": 422}
{"train_info/time_between_train_steps": 0.005089998245239258, "step": 422}
{"info/global_step": 423, "train_info/time_within_train_step": 27.769465923309326, "step": 423}
{"train_info/time_between_train_steps": 0.014439582824707031, "step": 423}
{"info/global_step": 424, "train_info/time_within_train_step": 27.728301525115967, "step": 424}
{"train_info/time_between_train_steps": 0.005005836486816406, "step": 424}
{"info/global_step": 425, "train_info/time_within_train_step": 27.73901915550232, "step": 425}
{"train_info/time_between_train_steps": 0.005102634429931641, "step": 425}
{"info/global_step": 426, "train_info/time_within_train_step": 27.823200225830078, "step": 426}
{"train_info/time_between_train_steps": 0.0053026676177978516, "step": 426}
{"info/global_step": 427, "train_info/time_within_train_step": 27.9656662940979, "step": 427}
{"train_info/time_between_train_steps": 0.005090236663818359, "step": 427}
{"info/global_step": 428, "train_info/time_within_train_step": 27.85083532333374, "step": 428}
{"train_info/time_between_train_steps": 0.005076169967651367, "step": 428}
{"info/global_step": 429, "train_info/time_within_train_step": 27.908479928970337, "step": 429}
{"train_info/time_between_train_steps": 0.0103607177734375, "step": 429}
{"info/global_step": 430, "train_info/time_within_train_step": 27.79194188117981, "step": 430}
{"train_info/time_between_train_steps": 0.0052759647369384766, "step": 430}
{"info/global_step": 431, "train_info/time_within_train_step": 27.76353645324707, "step": 431}
{"train_info/time_between_train_steps": 0.005711555480957031, "step": 431}
{"info/global_step": 432, "train_info/time_within_train_step": 27.782108545303345, "step": 432}
{"train_info/time_between_train_steps": 0.00569462776184082, "step": 432}
{"train_info/time_between_train_steps": 20.67615556716919, "step": 432}
{"info/global_step": 433, "train_info/time_within_train_step": 27.832301139831543, "step": 433}
{"train_info/time_between_train_steps": 0.0103759765625, "step": 433}
{"info/global_step": 434, "train_info/time_within_train_step": 28.029566049575806, "step": 434}
{"train_info/time_between_train_steps": 0.00540471076965332, "step": 434}
{"info/global_step": 435, "train_info/time_within_train_step": 27.74751043319702, "step": 435}
{"train_info/time_between_train_steps": 0.0051555633544921875, "step": 435}
{"info/global_step": 436, "train_info/time_within_train_step": 27.851636171340942, "step": 436}
{"train_info/time_between_train_steps": 0.005338430404663086, "step": 436}
{"info/global_step": 437, "train_info/time_within_train_step": 27.767147064208984, "step": 437}
{"train_info/time_between_train_steps": 0.005290031433105469, "step": 437}
{"info/global_step": 438, "train_info/time_within_train_step": 27.87998342514038, "step": 438}
{"train_info/time_between_train_steps": 0.005120277404785156, "step": 438}
{"info/global_step": 439, "train_info/time_within_train_step": 27.802748441696167, "step": 439}
{"train_info/time_between_train_steps": 0.005309581756591797, "step": 439}
{"info/global_step": 440, "train_info/time_within_train_step": 27.831783056259155, "step": 440}
{"train_info/time_between_train_steps": 0.005369901657104492, "step": 440}
{"info/global_step": 441, "train_info/time_within_train_step": 27.780241012573242, "step": 441}
{"train_info/time_between_train_steps": 0.005509853363037109, "step": 441}
{"info/global_step": 442, "train_info/time_within_train_step": 27.742167711257935, "step": 442}
{"train_info/time_between_train_steps": 0.0050201416015625, "step": 442}
{"info/global_step": 443, "train_info/time_within_train_step": 27.831027030944824, "step": 443}
{"train_info/time_between_train_steps": 0.007970809936523438, "step": 443}
{"info/global_step": 444, "train_info/time_within_train_step": 27.87764573097229, "step": 444}
{"train_info/time_between_train_steps": 0.0050313472747802734, "step": 444}
{"info/global_step": 445, "train_info/time_within_train_step": 27.865816354751587, "step": 445}
{"train_info/time_between_train_steps": 0.005097866058349609, "step": 445}
{"info/global_step": 446, "train_info/time_within_train_step": 27.738517999649048, "step": 446}
{"train_info/time_between_train_steps": 0.005026578903198242, "step": 446}
{"info/global_step": 447, "train_info/time_within_train_step": 27.760932445526123, "step": 447}
{"train_info/time_between_train_steps": 0.016861915588378906, "step": 447}
{"info/global_step": 448, "train_info/time_within_train_step": 27.75521969795227, "step": 448}
{"train_info/time_between_train_steps": 0.005162239074707031, "step": 448}
{"info/global_step": 449, "train_info/time_within_train_step": 27.789053201675415, "step": 449}
{"train_info/time_between_train_steps": 0.006273984909057617, "step": 449}
{"info/global_step": 450, "train_info/time_within_train_step": 27.748817920684814, "step": 450}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733850330, "_runtime": 12864}, "step": 450}
{"logs": {"train/loss": 5.1374, "train/learning_rate": 0.00041666666666666664, "train/epoch": 16.02, "_timestamp": 1733850330, "_runtime": 12864}, "step": 450}
{"train_info/time_between_train_steps": 0.007113933563232422, "step": 450}
{"info/global_step": 451, "train_info/time_within_train_step": 27.76095676422119, "step": 451}
{"train_info/time_between_train_steps": 0.0050601959228515625, "step": 451}
{"info/global_step": 452, "train_info/time_within_train_step": 27.741503477096558, "step": 452}
{"train_info/time_between_train_steps": 0.005109071731567383, "step": 452}
{"info/global_step": 453, "train_info/time_within_train_step": 27.747575759887695, "step": 453}
{"train_info/time_between_train_steps": 0.005141496658325195, "step": 453}
{"info/global_step": 454, "train_info/time_within_train_step": 27.742950201034546, "step": 454}
{"train_info/time_between_train_steps": 0.00497126579284668, "step": 454}
{"info/global_step": 455, "train_info/time_within_train_step": 27.76782202720642, "step": 455}
{"train_info/time_between_train_steps": 0.005158185958862305, "step": 455}
{"info/global_step": 456, "train_info/time_within_train_step": 27.741227865219116, "step": 456}
{"train_info/time_between_train_steps": 0.005218982696533203, "step": 456}
{"info/global_step": 457, "train_info/time_within_train_step": 27.757461071014404, "step": 457}
{"train_info/time_between_train_steps": 0.005216360092163086, "step": 457}
{"info/global_step": 458, "train_info/time_within_train_step": 27.783867835998535, "step": 458}
{"train_info/time_between_train_steps": 0.005308866500854492, "step": 458}
{"info/global_step": 459, "train_info/time_within_train_step": 27.874332666397095, "step": 459}
{"train_info/time_between_train_steps": 0.005657196044921875, "step": 459}
{"train_info/time_between_train_steps": 20.79917860031128, "step": 459}
{"info/global_step": 460, "train_info/time_within_train_step": 27.73839545249939, "step": 460}
{"train_info/time_between_train_steps": 0.0053555965423583984, "step": 460}
{"info/global_step": 461, "train_info/time_within_train_step": 27.904632329940796, "step": 461}
{"train_info/time_between_train_steps": 0.005204677581787109, "step": 461}
{"info/global_step": 462, "train_info/time_within_train_step": 27.821991682052612, "step": 462}
{"train_info/time_between_train_steps": 0.010267972946166992, "step": 462}
{"info/global_step": 463, "train_info/time_within_train_step": 27.918384075164795, "step": 463}
{"train_info/time_between_train_steps": 0.010690927505493164, "step": 463}
{"info/global_step": 464, "train_info/time_within_train_step": 27.79801321029663, "step": 464}
{"train_info/time_between_train_steps": 0.005879402160644531, "step": 464}
{"info/global_step": 465, "train_info/time_within_train_step": 27.92726230621338, "step": 465}
{"train_info/time_between_train_steps": 0.005147457122802734, "step": 465}
{"info/global_step": 466, "train_info/time_within_train_step": 27.72624969482422, "step": 466}
{"train_info/time_between_train_steps": 0.005268096923828125, "step": 466}
{"info/global_step": 467, "train_info/time_within_train_step": 27.760415077209473, "step": 467}
{"train_info/time_between_train_steps": 0.0052258968353271484, "step": 467}
{"info/global_step": 468, "train_info/time_within_train_step": 27.737510204315186, "step": 468}
{"train_info/time_between_train_steps": 0.005028247833251953, "step": 468}
{"info/global_step": 469, "train_info/time_within_train_step": 27.729257106781006, "step": 469}
{"train_info/time_between_train_steps": 0.00995635986328125, "step": 469}
{"info/global_step": 470, "train_info/time_within_train_step": 27.726659297943115, "step": 470}
{"train_info/time_between_train_steps": 0.004998445510864258, "step": 470}
{"info/global_step": 471, "train_info/time_within_train_step": 27.745108127593994, "step": 471}
{"train_info/time_between_train_steps": 0.0049915313720703125, "step": 471}
{"info/global_step": 472, "train_info/time_within_train_step": 27.737191915512085, "step": 472}
{"train_info/time_between_train_steps": 0.009885072708129883, "step": 472}
{"info/global_step": 473, "train_info/time_within_train_step": 27.740577459335327, "step": 473}
{"train_info/time_between_train_steps": 0.010278940200805664, "step": 473}
{"info/global_step": 474, "train_info/time_within_train_step": 27.881752252578735, "step": 474}
{"train_info/time_between_train_steps": 0.005083322525024414, "step": 474}
{"info/global_step": 475, "train_info/time_within_train_step": 27.787505865097046, "step": 475}
{"train_info/time_between_train_steps": 0.015291929244995117, "step": 475}
{"info/global_step": 476, "train_info/time_within_train_step": 27.734116554260254, "step": 476}
{"train_info/time_between_train_steps": 0.005072116851806641, "step": 476}
{"info/global_step": 477, "train_info/time_within_train_step": 27.730920791625977, "step": 477}
{"train_info/time_between_train_steps": 0.005055665969848633, "step": 477}
{"info/global_step": 478, "train_info/time_within_train_step": 27.74897527694702, "step": 478}
{"train_info/time_between_train_steps": 0.005132198333740234, "step": 478}
{"info/global_step": 479, "train_info/time_within_train_step": 27.741734743118286, "step": 479}
{"train_info/time_between_train_steps": 0.005113363265991211, "step": 479}
{"info/global_step": 480, "train_info/time_within_train_step": 27.81471061706543, "step": 480}
{"train_info/time_between_train_steps": 0.005048513412475586, "step": 480}
{"info/global_step": 481, "train_info/time_within_train_step": 27.923840761184692, "step": 481}
{"train_info/time_between_train_steps": 0.0050411224365234375, "step": 481}
{"info/global_step": 482, "train_info/time_within_train_step": 27.73684859275818, "step": 482}
{"train_info/time_between_train_steps": 0.005318880081176758, "step": 482}
{"info/global_step": 483, "train_info/time_within_train_step": 27.833930253982544, "step": 483}
{"train_info/time_between_train_steps": 0.00538182258605957, "step": 483}
{"info/global_step": 484, "train_info/time_within_train_step": 27.74021625518799, "step": 484}
{"train_info/time_between_train_steps": 0.005328178405761719, "step": 484}
{"info/global_step": 485, "train_info/time_within_train_step": 27.7747962474823, "step": 485}
{"train_info/time_between_train_steps": 0.005568265914916992, "step": 485}
{"info/global_step": 486, "train_info/time_within_train_step": 27.81424903869629, "step": 486}
{"train_info/time_between_train_steps": 0.005482196807861328, "step": 486}
{"train_info/time_between_train_steps": 20.35525870323181, "step": 486}
{"info/global_step": 487, "train_info/time_within_train_step": 27.727092504501343, "step": 487}
{"train_info/time_between_train_steps": 0.005250453948974609, "step": 487}
{"info/global_step": 488, "train_info/time_within_train_step": 27.956749439239502, "step": 488}
{"train_info/time_between_train_steps": 0.0053293704986572266, "step": 488}
{"info/global_step": 489, "train_info/time_within_train_step": 27.89732027053833, "step": 489}
{"train_info/time_between_train_steps": 0.009800195693969727, "step": 489}
{"info/global_step": 490, "train_info/time_within_train_step": 27.875550746917725, "step": 490}
{"train_info/time_between_train_steps": 0.005266666412353516, "step": 490}
{"info/global_step": 491, "train_info/time_within_train_step": 27.753535985946655, "step": 491}
{"train_info/time_between_train_steps": 0.005110740661621094, "step": 491}
{"info/global_step": 492, "train_info/time_within_train_step": 27.867799997329712, "step": 492}
{"train_info/time_between_train_steps": 0.005168437957763672, "step": 492}
{"info/global_step": 493, "train_info/time_within_train_step": 27.747122764587402, "step": 493}
{"train_info/time_between_train_steps": 0.015269994735717773, "step": 493}
{"info/global_step": 494, "train_info/time_within_train_step": 27.812132596969604, "step": 494}
{"train_info/time_between_train_steps": 0.0053958892822265625, "step": 494}
{"info/global_step": 495, "train_info/time_within_train_step": 27.844094038009644, "step": 495}
{"train_info/time_between_train_steps": 0.005109071731567383, "step": 495}
{"info/global_step": 496, "train_info/time_within_train_step": 27.720019817352295, "step": 496}
{"train_info/time_between_train_steps": 0.005018472671508789, "step": 496}
{"info/global_step": 497, "train_info/time_within_train_step": 27.766876459121704, "step": 497}
{"train_info/time_between_train_steps": 0.004979133605957031, "step": 497}
{"info/global_step": 498, "train_info/time_within_train_step": 27.724001169204712, "step": 498}
{"train_info/time_between_train_steps": 0.004948616027832031, "step": 498}
{"info/global_step": 499, "train_info/time_within_train_step": 27.74709129333496, "step": 499}
{"train_info/time_between_train_steps": 0.005049705505371094, "step": 499}
{"info/global_step": 500, "train_info/time_within_train_step": 27.77884078025818, "step": 500}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733851761, "_runtime": 14295}, "step": 500}
{"logs": {"train/loss": 4.9743, "train/learning_rate": 0.00038888888888888887, "train/epoch": 18.01, "_timestamp": 1733851761, "_runtime": 14295}, "step": 500}
{"train_info/time_between_train_steps": 2.479358673095703, "step": 500}
{"info/global_step": 501, "train_info/time_within_train_step": 27.734944105148315, "step": 501}
{"train_info/time_between_train_steps": 0.00496363639831543, "step": 501}
{"info/global_step": 502, "train_info/time_within_train_step": 27.773504495620728, "step": 502}
{"train_info/time_between_train_steps": 0.005080461502075195, "step": 502}
{"info/global_step": 503, "train_info/time_within_train_step": 27.79955554008484, "step": 503}
{"train_info/time_between_train_steps": 0.00993037223815918, "step": 503}
{"info/global_step": 504, "train_info/time_within_train_step": 27.82411766052246, "step": 504}
{"train_info/time_between_train_steps": 0.0051076412200927734, "step": 504}
{"info/global_step": 505, "train_info/time_within_train_step": 27.89469337463379, "step": 505}
{"train_info/time_between_train_steps": 0.00510859489440918, "step": 505}
{"info/global_step": 506, "train_info/time_within_train_step": 27.750964403152466, "step": 506}
{"train_info/time_between_train_steps": 0.004985332489013672, "step": 506}
{"info/global_step": 507, "train_info/time_within_train_step": 27.875659227371216, "step": 507}
{"train_info/time_between_train_steps": 0.0051250457763671875, "step": 507}
{"info/global_step": 508, "train_info/time_within_train_step": 27.738070011138916, "step": 508}
{"train_info/time_between_train_steps": 0.005110263824462891, "step": 508}
{"info/global_step": 509, "train_info/time_within_train_step": 27.785931825637817, "step": 509}
{"train_info/time_between_train_steps": 0.005138874053955078, "step": 509}
{"info/global_step": 510, "train_info/time_within_train_step": 27.80075216293335, "step": 510}
{"train_info/time_between_train_steps": 0.005467653274536133, "step": 510}
{"info/global_step": 511, "train_info/time_within_train_step": 27.786115169525146, "step": 511}
{"train_info/time_between_train_steps": 0.005323648452758789, "step": 511}
{"info/global_step": 512, "train_info/time_within_train_step": 27.807491540908813, "step": 512}
{"train_info/time_between_train_steps": 0.00561976432800293, "step": 512}
{"info/global_step": 513, "train_info/time_within_train_step": 27.961431980133057, "step": 513}
{"train_info/time_between_train_steps": 0.011227130889892578, "step": 513}
{"train_info/time_between_train_steps": 20.697267055511475, "step": 513}
{"info/global_step": 514, "train_info/time_within_train_step": 27.78836750984192, "step": 514}
{"train_info/time_between_train_steps": 0.005481243133544922, "step": 514}
{"info/global_step": 515, "train_info/time_within_train_step": 27.982995748519897, "step": 515}
{"train_info/time_between_train_steps": 0.005597114562988281, "step": 515}
{"info/global_step": 516, "train_info/time_within_train_step": 27.811208248138428, "step": 516}
{"train_info/time_between_train_steps": 0.005969047546386719, "step": 516}
{"info/global_step": 517, "train_info/time_within_train_step": 27.959312915802002, "step": 517}
{"train_info/time_between_train_steps": 0.010221719741821289, "step": 517}
{"info/global_step": 518, "train_info/time_within_train_step": 27.843581199645996, "step": 518}
{"train_info/time_between_train_steps": 0.0051839351654052734, "step": 518}
{"info/global_step": 519, "train_info/time_within_train_step": 27.959177494049072, "step": 519}
{"train_info/time_between_train_steps": 0.010284900665283203, "step": 519}
{"info/global_step": 520, "train_info/time_within_train_step": 27.892686128616333, "step": 520}
{"train_info/time_between_train_steps": 0.00549006462097168, "step": 520}
{"info/global_step": 521, "train_info/time_within_train_step": 27.88175630569458, "step": 521}
{"train_info/time_between_train_steps": 0.005183219909667969, "step": 521}
{"info/global_step": 522, "train_info/time_within_train_step": 27.8208429813385, "step": 522}
{"train_info/time_between_train_steps": 0.0050733089447021484, "step": 522}
{"info/global_step": 523, "train_info/time_within_train_step": 27.725430727005005, "step": 523}
{"train_info/time_between_train_steps": 0.00497889518737793, "step": 523}
{"info/global_step": 524, "train_info/time_within_train_step": 27.91330909729004, "step": 524}
{"train_info/time_between_train_steps": 0.00508880615234375, "step": 524}
{"info/global_step": 525, "train_info/time_within_train_step": 27.74242663383484, "step": 525}
{"train_info/time_between_train_steps": 0.004965066909790039, "step": 525}
{"info/global_step": 526, "train_info/time_within_train_step": 27.79505228996277, "step": 526}
{"train_info/time_between_train_steps": 0.009979248046875, "step": 526}
{"info/global_step": 527, "train_info/time_within_train_step": 27.770639419555664, "step": 527}
{"train_info/time_between_train_steps": 0.005091190338134766, "step": 527}
{"info/global_step": 528, "train_info/time_within_train_step": 27.788414239883423, "step": 528}
{"train_info/time_between_train_steps": 0.005141735076904297, "step": 528}
{"info/global_step": 529, "train_info/time_within_train_step": 27.76095986366272, "step": 529}
{"train_info/time_between_train_steps": 0.005112886428833008, "step": 529}
{"info/global_step": 530, "train_info/time_within_train_step": 27.741177320480347, "step": 530}
{"train_info/time_between_train_steps": 0.010050773620605469, "step": 530}
{"info/global_step": 531, "train_info/time_within_train_step": 27.79655432701111, "step": 531}
{"train_info/time_between_train_steps": 0.016010284423828125, "step": 531}
{"info/global_step": 532, "train_info/time_within_train_step": 27.969181299209595, "step": 532}
{"train_info/time_between_train_steps": 0.004994630813598633, "step": 532}
{"info/global_step": 533, "train_info/time_within_train_step": 27.751714944839478, "step": 533}
{"train_info/time_between_train_steps": 0.016512393951416016, "step": 533}
{"info/global_step": 534, "train_info/time_within_train_step": 27.77729034423828, "step": 534}
{"train_info/time_between_train_steps": 0.005259037017822266, "step": 534}
{"info/global_step": 535, "train_info/time_within_train_step": 27.86000657081604, "step": 535}
{"train_info/time_between_train_steps": 0.004935264587402344, "step": 535}
{"info/global_step": 536, "train_info/time_within_train_step": 27.732414484024048, "step": 536}
{"train_info/time_between_train_steps": 0.0049686431884765625, "step": 536}
{"info/global_step": 537, "train_info/time_within_train_step": 27.77794051170349, "step": 537}
{"train_info/time_between_train_steps": 0.005300760269165039, "step": 537}
{"info/global_step": 538, "train_info/time_within_train_step": 27.796300411224365, "step": 538}
{"train_info/time_between_train_steps": 0.005274295806884766, "step": 538}
{"info/global_step": 539, "train_info/time_within_train_step": 27.76822304725647, "step": 539}
{"train_info/time_between_train_steps": 0.0054738521575927734, "step": 539}
{"info/global_step": 540, "train_info/time_within_train_step": 27.80933666229248, "step": 540}
{"train_info/time_between_train_steps": 0.016819000244140625, "step": 540}
{"train_info/time_between_train_steps": 20.781395435333252, "step": 540}
{"info/global_step": 541, "train_info/time_within_train_step": 27.753413677215576, "step": 541}
{"train_info/time_between_train_steps": 0.005414485931396484, "step": 541}
{"info/global_step": 542, "train_info/time_within_train_step": 27.952946186065674, "step": 542}
{"train_info/time_between_train_steps": 0.005220890045166016, "step": 542}
{"info/global_step": 543, "train_info/time_within_train_step": 27.78562092781067, "step": 543}
{"train_info/time_between_train_steps": 0.01018667221069336, "step": 543}
{"info/global_step": 544, "train_info/time_within_train_step": 27.893250703811646, "step": 544}
{"train_info/time_between_train_steps": 0.005184650421142578, "step": 544}
{"info/global_step": 545, "train_info/time_within_train_step": 27.763105869293213, "step": 545}
{"train_info/time_between_train_steps": 0.005633354187011719, "step": 545}
{"info/global_step": 546, "train_info/time_within_train_step": 27.971553087234497, "step": 546}
{"train_info/time_between_train_steps": 0.005116462707519531, "step": 546}
{"info/global_step": 547, "train_info/time_within_train_step": 27.748326063156128, "step": 547}
{"train_info/time_between_train_steps": 0.00529170036315918, "step": 547}
{"info/global_step": 548, "train_info/time_within_train_step": 27.87013339996338, "step": 548}
{"train_info/time_between_train_steps": 0.005911588668823242, "step": 548}
{"info/global_step": 549, "train_info/time_within_train_step": 27.76372528076172, "step": 549}
{"train_info/time_between_train_steps": 0.005123138427734375, "step": 549}
{"info/global_step": 550, "train_info/time_within_train_step": 27.890082359313965, "step": 550}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733853197, "_runtime": 15731}, "step": 550}
{"logs": {"train/loss": 4.8204, "train/learning_rate": 0.0003611111111111111, "train/epoch": 20.01, "_timestamp": 1733853197, "_runtime": 15731}, "step": 550}
{"train_info/time_between_train_steps": 0.006836891174316406, "step": 550}
{"info/global_step": 551, "train_info/time_within_train_step": 27.737542867660522, "step": 551}
{"train_info/time_between_train_steps": 0.005034923553466797, "step": 551}
{"info/global_step": 552, "train_info/time_within_train_step": 27.793015718460083, "step": 552}
{"train_info/time_between_train_steps": 0.00500035285949707, "step": 552}
{"info/global_step": 553, "train_info/time_within_train_step": 27.7851824760437, "step": 553}
{"train_info/time_between_train_steps": 0.0050983428955078125, "step": 553}
{"info/global_step": 554, "train_info/time_within_train_step": 27.748215198516846, "step": 554}
{"train_info/time_between_train_steps": 0.010146379470825195, "step": 554}
{"info/global_step": 555, "train_info/time_within_train_step": 27.84894347190857, "step": 555}
{"train_info/time_between_train_steps": 0.0056836605072021484, "step": 555}
{"info/global_step": 556, "train_info/time_within_train_step": 27.809518098831177, "step": 556}
{"train_info/time_between_train_steps": 0.0051250457763671875, "step": 556}
{"info/global_step": 557, "train_info/time_within_train_step": 27.782158136367798, "step": 557}
{"train_info/time_between_train_steps": 0.005117177963256836, "step": 557}
{"info/global_step": 558, "train_info/time_within_train_step": 28.08929443359375, "step": 558}
{"train_info/time_between_train_steps": 0.010344505310058594, "step": 558}
{"info/global_step": 559, "train_info/time_within_train_step": 27.902549743652344, "step": 559}
{"train_info/time_between_train_steps": 0.005010843276977539, "step": 559}
{"info/global_step": 560, "train_info/time_within_train_step": 27.98092794418335, "step": 560}
{"train_info/time_between_train_steps": 0.004990100860595703, "step": 560}
{"info/global_step": 561, "train_info/time_within_train_step": 27.810869693756104, "step": 561}
{"train_info/time_between_train_steps": 0.005236387252807617, "step": 561}
{"info/global_step": 562, "train_info/time_within_train_step": 27.89516568183899, "step": 562}
{"train_info/time_between_train_steps": 0.005097150802612305, "step": 562}
{"info/global_step": 563, "train_info/time_within_train_step": 27.850146293640137, "step": 563}
{"train_info/time_between_train_steps": 0.005034923553466797, "step": 563}
{"info/global_step": 564, "train_info/time_within_train_step": 27.890215396881104, "step": 564}
{"train_info/time_between_train_steps": 0.005169391632080078, "step": 564}
{"info/global_step": 565, "train_info/time_within_train_step": 27.79915952682495, "step": 565}
{"train_info/time_between_train_steps": 0.0050771236419677734, "step": 565}
{"info/global_step": 566, "train_info/time_within_train_step": 27.971616983413696, "step": 566}
{"train_info/time_between_train_steps": 0.00548100471496582, "step": 566}
{"info/global_step": 567, "train_info/time_within_train_step": 27.77874779701233, "step": 567}
{"train_info/time_between_train_steps": 0.005533456802368164, "step": 567}
{"train_info/time_between_train_steps": 21.089324474334717, "step": 567}
{"info/global_step": 568, "train_info/time_within_train_step": 27.94830822944641, "step": 568}
{"train_info/time_between_train_steps": 0.004976987838745117, "step": 568}
{"info/global_step": 569, "train_info/time_within_train_step": 27.893412828445435, "step": 569}
{"train_info/time_between_train_steps": 0.005021333694458008, "step": 569}
{"info/global_step": 570, "train_info/time_within_train_step": 27.83604121208191, "step": 570}
{"train_info/time_between_train_steps": 0.005027294158935547, "step": 570}
{"info/global_step": 571, "train_info/time_within_train_step": 28.024390697479248, "step": 571}
{"train_info/time_between_train_steps": 0.005679607391357422, "step": 571}
{"info/global_step": 572, "train_info/time_within_train_step": 27.806896209716797, "step": 572}
{"train_info/time_between_train_steps": 0.010991811752319336, "step": 572}
{"info/global_step": 573, "train_info/time_within_train_step": 28.050896167755127, "step": 573}
{"train_info/time_between_train_steps": 0.005946636199951172, "step": 573}
{"info/global_step": 574, "train_info/time_within_train_step": 27.76360297203064, "step": 574}
{"train_info/time_between_train_steps": 0.010476350784301758, "step": 574}
{"info/global_step": 575, "train_info/time_within_train_step": 27.931800603866577, "step": 575}
{"train_info/time_between_train_steps": 0.006583213806152344, "step": 575}
{"info/global_step": 576, "train_info/time_within_train_step": 28.099846124649048, "step": 576}
{"train_info/time_between_train_steps": 0.0054438114166259766, "step": 576}
{"info/global_step": 577, "train_info/time_within_train_step": 27.764897108078003, "step": 577}
{"train_info/time_between_train_steps": 0.005318403244018555, "step": 577}
{"info/global_step": 578, "train_info/time_within_train_step": 27.77156710624695, "step": 578}
{"train_info/time_between_train_steps": 0.005410909652709961, "step": 578}
{"info/global_step": 579, "train_info/time_within_train_step": 28.02047061920166, "step": 579}
{"train_info/time_between_train_steps": 0.010875463485717773, "step": 579}
{"info/global_step": 580, "train_info/time_within_train_step": 28.140138626098633, "step": 580}
{"train_info/time_between_train_steps": 0.010795354843139648, "step": 580}
{"info/global_step": 581, "train_info/time_within_train_step": 28.02069592475891, "step": 581}
{"train_info/time_between_train_steps": 0.01094675064086914, "step": 581}
{"info/global_step": 582, "train_info/time_within_train_step": 27.90436029434204, "step": 582}
{"train_info/time_between_train_steps": 0.010825395584106445, "step": 582}
{"info/global_step": 583, "train_info/time_within_train_step": 27.884374141693115, "step": 583}
{"train_info/time_between_train_steps": 0.005451202392578125, "step": 583}
{"info/global_step": 584, "train_info/time_within_train_step": 27.852046728134155, "step": 584}
{"train_info/time_between_train_steps": 0.01002359390258789, "step": 584}
{"info/global_step": 585, "train_info/time_within_train_step": 27.939176321029663, "step": 585}
{"train_info/time_between_train_steps": 0.010056018829345703, "step": 585}
{"info/global_step": 586, "train_info/time_within_train_step": 27.872305393218994, "step": 586}
{"train_info/time_between_train_steps": 0.005373954772949219, "step": 586}
{"info/global_step": 587, "train_info/time_within_train_step": 27.820082902908325, "step": 587}
{"train_info/time_between_train_steps": 0.01133871078491211, "step": 587}
{"info/global_step": 588, "train_info/time_within_train_step": 27.78410005569458, "step": 588}
{"train_info/time_between_train_steps": 0.006173372268676758, "step": 588}
{"info/global_step": 589, "train_info/time_within_train_step": 27.80401372909546, "step": 589}
{"train_info/time_between_train_steps": 0.005357980728149414, "step": 589}
{"info/global_step": 590, "train_info/time_within_train_step": 27.766045570373535, "step": 590}
{"train_info/time_between_train_steps": 0.010436773300170898, "step": 590}
{"info/global_step": 591, "train_info/time_within_train_step": 27.903330087661743, "step": 591}
{"train_info/time_between_train_steps": 0.006276369094848633, "step": 591}
{"info/global_step": 592, "train_info/time_within_train_step": 27.965572357177734, "step": 592}
{"train_info/time_between_train_steps": 0.005601644515991211, "step": 592}
{"info/global_step": 593, "train_info/time_within_train_step": 28.019894123077393, "step": 593}
{"train_info/time_between_train_steps": 0.006953716278076172, "step": 593}
{"info/global_step": 594, "train_info/time_within_train_step": 27.94039273262024, "step": 594}
{"train_info/time_between_train_steps": 0.006424427032470703, "step": 594}
{"train_info/time_between_train_steps": 21.216071367263794, "step": 594}
{"info/global_step": 595, "train_info/time_within_train_step": 27.911230087280273, "step": 595}
{"train_info/time_between_train_steps": 0.00578761100769043, "step": 595}
{"info/global_step": 596, "train_info/time_within_train_step": 28.320131540298462, "step": 596}
{"train_info/time_between_train_steps": 0.0055348873138427734, "step": 596}
{"info/global_step": 597, "train_info/time_within_train_step": 27.95195722579956, "step": 597}
{"train_info/time_between_train_steps": 0.00564265251159668, "step": 597}
{"info/global_step": 598, "train_info/time_within_train_step": 28.25046157836914, "step": 598}
{"train_info/time_between_train_steps": 0.011124372482299805, "step": 598}
{"info/global_step": 599, "train_info/time_within_train_step": 27.953253269195557, "step": 599}
{"train_info/time_between_train_steps": 0.006514310836791992, "step": 599}
{"info/global_step": 600, "train_info/time_within_train_step": 28.18518567085266, "step": 600}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733854635, "_runtime": 17169}, "step": 600}
{"logs": {"train/loss": 4.6671, "train/learning_rate": 0.0003333333333333333, "train/epoch": 22.0, "_timestamp": 1733854635, "_runtime": 17169}, "step": 600}
{"train_info/time_between_train_steps": 2.793304681777954, "step": 600}
{"info/global_step": 601, "train_info/time_within_train_step": 27.958436965942383, "step": 601}
{"train_info/time_between_train_steps": 0.0058782100677490234, "step": 601}
{"info/global_step": 602, "train_info/time_within_train_step": 27.934520959854126, "step": 602}
{"train_info/time_between_train_steps": 0.005429983139038086, "step": 602}
{"info/global_step": 603, "train_info/time_within_train_step": 27.96462869644165, "step": 603}
{"train_info/time_between_train_steps": 0.010719060897827148, "step": 603}
{"info/global_step": 604, "train_info/time_within_train_step": 28.014018774032593, "step": 604}
{"train_info/time_between_train_steps": 0.010432243347167969, "step": 604}
{"info/global_step": 605, "train_info/time_within_train_step": 27.922189235687256, "step": 605}
{"train_info/time_between_train_steps": 0.01070094108581543, "step": 605}
{"info/global_step": 606, "train_info/time_within_train_step": 27.97312903404236, "step": 606}
{"train_info/time_between_train_steps": 0.006020307540893555, "step": 606}
{"info/global_step": 607, "train_info/time_within_train_step": 27.905691862106323, "step": 607}
{"train_info/time_between_train_steps": 0.01076960563659668, "step": 607}
{"info/global_step": 608, "train_info/time_within_train_step": 27.870823860168457, "step": 608}
{"train_info/time_between_train_steps": 0.01103353500366211, "step": 608}
{"info/global_step": 609, "train_info/time_within_train_step": 28.073745250701904, "step": 609}
{"train_info/time_between_train_steps": 0.011206388473510742, "step": 609}
{"info/global_step": 610, "train_info/time_within_train_step": 27.931486129760742, "step": 610}
{"train_info/time_between_train_steps": 0.010334968566894531, "step": 610}
{"info/global_step": 611, "train_info/time_within_train_step": 27.875121593475342, "step": 611}
{"train_info/time_between_train_steps": 0.005469083786010742, "step": 611}
{"info/global_step": 612, "train_info/time_within_train_step": 27.954004764556885, "step": 612}
{"train_info/time_between_train_steps": 0.005389213562011719, "step": 612}
{"info/global_step": 613, "train_info/time_within_train_step": 27.987138032913208, "step": 613}
{"train_info/time_between_train_steps": 0.005554914474487305, "step": 613}
{"info/global_step": 614, "train_info/time_within_train_step": 27.90639901161194, "step": 614}
{"train_info/time_between_train_steps": 0.005526304244995117, "step": 614}
{"info/global_step": 615, "train_info/time_within_train_step": 27.82663869857788, "step": 615}
{"train_info/time_between_train_steps": 0.006463050842285156, "step": 615}
{"info/global_step": 616, "train_info/time_within_train_step": 27.948970079421997, "step": 616}
{"train_info/time_between_train_steps": 0.0053348541259765625, "step": 616}
{"info/global_step": 617, "train_info/time_within_train_step": 27.84089946746826, "step": 617}
{"train_info/time_between_train_steps": 0.005352497100830078, "step": 617}
{"info/global_step": 618, "train_info/time_within_train_step": 27.86152672767639, "step": 618}
{"train_info/time_between_train_steps": 0.0062482357025146484, "step": 618}
{"info/global_step": 619, "train_info/time_within_train_step": 27.827874183654785, "step": 619}
{"train_info/time_between_train_steps": 0.0054552555084228516, "step": 619}
{"info/global_step": 620, "train_info/time_within_train_step": 27.91460680961609, "step": 620}
{"train_info/time_between_train_steps": 0.006365060806274414, "step": 620}
{"info/global_step": 621, "train_info/time_within_train_step": 27.85257339477539, "step": 621}
{"train_info/time_between_train_steps": 0.010889053344726562, "step": 621}
{"train_info/time_between_train_steps": 21.206992626190186, "step": 621}
{"info/global_step": 622, "train_info/time_within_train_step": 27.855181455612183, "step": 622}
{"train_info/time_between_train_steps": 0.007985591888427734, "step": 622}
{"info/global_step": 623, "train_info/time_within_train_step": 28.127175092697144, "step": 623}
{"train_info/time_between_train_steps": 0.005510807037353516, "step": 623}
{"info/global_step": 624, "train_info/time_within_train_step": 28.1604106426239, "step": 624}
{"train_info/time_between_train_steps": 0.014424562454223633, "step": 624}
{"info/global_step": 625, "train_info/time_within_train_step": 27.905579328536987, "step": 625}
{"train_info/time_between_train_steps": 0.005525112152099609, "step": 625}
{"info/global_step": 626, "train_info/time_within_train_step": 27.845949172973633, "step": 626}
{"train_info/time_between_train_steps": 0.0055599212646484375, "step": 626}
{"info/global_step": 627, "train_info/time_within_train_step": 28.161969423294067, "step": 627}
{"train_info/time_between_train_steps": 0.0063626766204833984, "step": 627}
{"info/global_step": 628, "train_info/time_within_train_step": 27.801751136779785, "step": 628}
{"train_info/time_between_train_steps": 0.005354166030883789, "step": 628}
{"info/global_step": 629, "train_info/time_within_train_step": 27.82379460334778, "step": 629}
{"train_info/time_between_train_steps": 0.010513782501220703, "step": 629}
{"info/global_step": 630, "train_info/time_within_train_step": 27.834096431732178, "step": 630}
{"train_info/time_between_train_steps": 0.005209207534790039, "step": 630}
{"info/global_step": 631, "train_info/time_within_train_step": 27.804591178894043, "step": 631}
{"train_info/time_between_train_steps": 0.005049705505371094, "step": 631}
{"info/global_step": 632, "train_info/time_within_train_step": 27.79986262321472, "step": 632}
{"train_info/time_between_train_steps": 0.005098104476928711, "step": 632}
{"info/global_step": 633, "train_info/time_within_train_step": 27.828861474990845, "step": 633}
{"train_info/time_between_train_steps": 0.010622262954711914, "step": 633}
{"info/global_step": 634, "train_info/time_within_train_step": 27.831250190734863, "step": 634}
{"train_info/time_between_train_steps": 0.0053806304931640625, "step": 634}
{"info/global_step": 635, "train_info/time_within_train_step": 27.876962423324585, "step": 635}
{"train_info/time_between_train_steps": 0.009634971618652344, "step": 635}
{"info/global_step": 636, "train_info/time_within_train_step": 27.798203945159912, "step": 636}
{"train_info/time_between_train_steps": 0.005879878997802734, "step": 636}
{"info/global_step": 637, "train_info/time_within_train_step": 27.75410270690918, "step": 637}
{"train_info/time_between_train_steps": 0.0051615238189697266, "step": 637}
{"info/global_step": 638, "train_info/time_within_train_step": 27.778909921646118, "step": 638}
{"train_info/time_between_train_steps": 0.01660919189453125, "step": 638}
{"info/global_step": 639, "train_info/time_within_train_step": 27.793434143066406, "step": 639}
{"train_info/time_between_train_steps": 0.005910634994506836, "step": 639}
{"info/global_step": 640, "train_info/time_within_train_step": 27.771116495132446, "step": 640}
{"train_info/time_between_train_steps": 0.0052869319915771484, "step": 640}
{"info/global_step": 641, "train_info/time_within_train_step": 27.80940842628479, "step": 641}
{"train_info/time_between_train_steps": 0.010343074798583984, "step": 641}
{"info/global_step": 642, "train_info/time_within_train_step": 27.980544567108154, "step": 642}
{"train_info/time_between_train_steps": 0.0054056644439697266, "step": 642}
{"info/global_step": 643, "train_info/time_within_train_step": 27.79040217399597, "step": 643}
{"train_info/time_between_train_steps": 0.005262851715087891, "step": 643}
{"info/global_step": 644, "train_info/time_within_train_step": 27.79410672187805, "step": 644}
{"train_info/time_between_train_steps": 0.0052225589752197266, "step": 644}
{"info/global_step": 645, "train_info/time_within_train_step": 27.90350866317749, "step": 645}
{"train_info/time_between_train_steps": 0.005544185638427734, "step": 645}
{"info/global_step": 646, "train_info/time_within_train_step": 27.799930572509766, "step": 646}
{"train_info/time_between_train_steps": 0.005366802215576172, "step": 646}
{"info/global_step": 647, "train_info/time_within_train_step": 27.776558876037598, "step": 647}
{"train_info/time_between_train_steps": 0.005445003509521484, "step": 647}
{"info/global_step": 648, "train_info/time_within_train_step": 27.789154529571533, "step": 648}
{"train_info/time_between_train_steps": 0.0062406063079833984, "step": 648}
{"train_info/time_between_train_steps": 20.70108723640442, "step": 648}
{"info/global_step": 649, "train_info/time_within_train_step": 27.75318932533264, "step": 649}
{"train_info/time_between_train_steps": 0.005107879638671875, "step": 649}
{"info/global_step": 650, "train_info/time_within_train_step": 27.91938042640686, "step": 650}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733856074, "_runtime": 18608}, "step": 650}
{"logs": {"train/loss": 4.5276, "train/learning_rate": 0.00030555555555555555, "train/epoch": 24.0, "_timestamp": 1733856074, "_runtime": 18608}, "step": 650}
{"train_info/time_between_train_steps": 0.012094259262084961, "step": 650}
{"info/global_step": 651, "train_info/time_within_train_step": 27.762935876846313, "step": 651}
{"train_info/time_between_train_steps": 0.005298137664794922, "step": 651}
{"info/global_step": 652, "train_info/time_within_train_step": 27.879934787750244, "step": 652}
{"train_info/time_between_train_steps": 0.006113529205322266, "step": 652}
{"info/global_step": 653, "train_info/time_within_train_step": 27.754592418670654, "step": 653}
{"train_info/time_between_train_steps": 0.005719661712646484, "step": 653}
{"info/global_step": 654, "train_info/time_within_train_step": 27.97938299179077, "step": 654}
{"train_info/time_between_train_steps": 0.008781671524047852, "step": 654}
{"info/global_step": 655, "train_info/time_within_train_step": 27.841780185699463, "step": 655}
{"train_info/time_between_train_steps": 0.010985374450683594, "step": 655}
{"info/global_step": 656, "train_info/time_within_train_step": 27.869123220443726, "step": 656}
{"train_info/time_between_train_steps": 0.0059947967529296875, "step": 656}
{"info/global_step": 657, "train_info/time_within_train_step": 27.899354696273804, "step": 657}
{"train_info/time_between_train_steps": 0.005312204360961914, "step": 657}
{"info/global_step": 658, "train_info/time_within_train_step": 27.835631847381592, "step": 658}
{"train_info/time_between_train_steps": 0.00571131706237793, "step": 658}
{"info/global_step": 659, "train_info/time_within_train_step": 27.951767444610596, "step": 659}
{"train_info/time_between_train_steps": 0.010261774063110352, "step": 659}
{"info/global_step": 660, "train_info/time_within_train_step": 27.916048765182495, "step": 660}
{"train_info/time_between_train_steps": 0.006877899169921875, "step": 660}
{"info/global_step": 661, "train_info/time_within_train_step": 27.829536199569702, "step": 661}
{"train_info/time_between_train_steps": 0.005832672119140625, "step": 661}
{"info/global_step": 662, "train_info/time_within_train_step": 28.04342484474182, "step": 662}
{"train_info/time_between_train_steps": 0.005547761917114258, "step": 662}
{"info/global_step": 663, "train_info/time_within_train_step": 27.753429889678955, "step": 663}
{"train_info/time_between_train_steps": 0.005468845367431641, "step": 663}
{"info/global_step": 664, "train_info/time_within_train_step": 27.743741750717163, "step": 664}
{"train_info/time_between_train_steps": 0.005133152008056641, "step": 664}
{"info/global_step": 665, "train_info/time_within_train_step": 27.742017030715942, "step": 665}
{"train_info/time_between_train_steps": 0.005177736282348633, "step": 665}
{"info/global_step": 666, "train_info/time_within_train_step": 27.798463821411133, "step": 666}
{"train_info/time_between_train_steps": 0.005221843719482422, "step": 666}
{"info/global_step": 667, "train_info/time_within_train_step": 27.76040816307068, "step": 667}
{"train_info/time_between_train_steps": 0.005212306976318359, "step": 667}
{"info/global_step": 668, "train_info/time_within_train_step": 27.853240251541138, "step": 668}
{"train_info/time_between_train_steps": 0.010475635528564453, "step": 668}
{"info/global_step": 669, "train_info/time_within_train_step": 28.01011872291565, "step": 669}
{"train_info/time_between_train_steps": 0.005549430847167969, "step": 669}
{"info/global_step": 670, "train_info/time_within_train_step": 27.762644052505493, "step": 670}
{"train_info/time_between_train_steps": 0.00513911247253418, "step": 670}
{"info/global_step": 671, "train_info/time_within_train_step": 27.742703199386597, "step": 671}
{"train_info/time_between_train_steps": 0.005187273025512695, "step": 671}
{"info/global_step": 672, "train_info/time_within_train_step": 27.802873849868774, "step": 672}
{"train_info/time_between_train_steps": 0.006439685821533203, "step": 672}
{"info/global_step": 673, "train_info/time_within_train_step": 27.90689444541931, "step": 673}
{"train_info/time_between_train_steps": 0.0069065093994140625, "step": 673}
{"info/global_step": 674, "train_info/time_within_train_step": 27.96521759033203, "step": 674}
{"train_info/time_between_train_steps": 0.005828142166137695, "step": 674}
{"info/global_step": 675, "train_info/time_within_train_step": 27.881195783615112, "step": 675}
{"train_info/time_between_train_steps": 0.01193857192993164, "step": 675}
{"train_info/time_between_train_steps": 20.820451736450195, "step": 675}
{"info/global_step": 676, "train_info/time_within_train_step": 28.032230615615845, "step": 676}
{"train_info/time_between_train_steps": 0.005008220672607422, "step": 676}
{"info/global_step": 677, "train_info/time_within_train_step": 28.159091472625732, "step": 677}
{"train_info/time_between_train_steps": 0.009872913360595703, "step": 677}
{"info/global_step": 678, "train_info/time_within_train_step": 27.859030961990356, "step": 678}
{"train_info/time_between_train_steps": 0.01078033447265625, "step": 678}
{"info/global_step": 679, "train_info/time_within_train_step": 28.02574610710144, "step": 679}
{"train_info/time_between_train_steps": 0.01183938980102539, "step": 679}
{"info/global_step": 680, "train_info/time_within_train_step": 27.762159824371338, "step": 680}
{"train_info/time_between_train_steps": 0.010845422744750977, "step": 680}
{"info/global_step": 681, "train_info/time_within_train_step": 28.08094549179077, "step": 681}
{"train_info/time_between_train_steps": 0.007648468017578125, "step": 681}
{"info/global_step": 682, "train_info/time_within_train_step": 27.857422351837158, "step": 682}
{"train_info/time_between_train_steps": 0.005667448043823242, "step": 682}
{"info/global_step": 683, "train_info/time_within_train_step": 27.80535864830017, "step": 683}
{"train_info/time_between_train_steps": 0.005268573760986328, "step": 683}
{"info/global_step": 684, "train_info/time_within_train_step": 27.78654432296753, "step": 684}
{"train_info/time_between_train_steps": 0.005522251129150391, "step": 684}
{"info/global_step": 685, "train_info/time_within_train_step": 27.73254132270813, "step": 685}
{"train_info/time_between_train_steps": 0.005078792572021484, "step": 685}
{"info/global_step": 686, "train_info/time_within_train_step": 27.759995698928833, "step": 686}
{"train_info/time_between_train_steps": 0.005072832107543945, "step": 686}
{"info/global_step": 687, "train_info/time_within_train_step": 27.766327619552612, "step": 687}
{"train_info/time_between_train_steps": 0.004964351654052734, "step": 687}
{"info/global_step": 688, "train_info/time_within_train_step": 27.882941246032715, "step": 688}
{"train_info/time_between_train_steps": 0.005217313766479492, "step": 688}
{"info/global_step": 689, "train_info/time_within_train_step": 27.73148226737976, "step": 689}
{"train_info/time_between_train_steps": 0.005072832107543945, "step": 689}
{"info/global_step": 690, "train_info/time_within_train_step": 27.731948375701904, "step": 690}
{"train_info/time_between_train_steps": 0.005117654800415039, "step": 690}
{"info/global_step": 691, "train_info/time_within_train_step": 27.75292181968689, "step": 691}
{"train_info/time_between_train_steps": 0.005227088928222656, "step": 691}
{"info/global_step": 692, "train_info/time_within_train_step": 27.768151998519897, "step": 692}
{"train_info/time_between_train_steps": 0.010084152221679688, "step": 692}
{"info/global_step": 693, "train_info/time_within_train_step": 27.7857506275177, "step": 693}
{"train_info/time_between_train_steps": 0.005054950714111328, "step": 693}
{"info/global_step": 694, "train_info/time_within_train_step": 27.774452447891235, "step": 694}
{"train_info/time_between_train_steps": 0.005279064178466797, "step": 694}
{"info/global_step": 695, "train_info/time_within_train_step": 27.760937690734863, "step": 695}
{"train_info/time_between_train_steps": 0.005057573318481445, "step": 695}
{"info/global_step": 696, "train_info/time_within_train_step": 27.75197458267212, "step": 696}
{"train_info/time_between_train_steps": 0.016013383865356445, "step": 696}
{"info/global_step": 697, "train_info/time_within_train_step": 27.78341794013977, "step": 697}
{"train_info/time_between_train_steps": 0.010151147842407227, "step": 697}
{"info/global_step": 698, "train_info/time_within_train_step": 27.787412643432617, "step": 698}
{"train_info/time_between_train_steps": 0.005017280578613281, "step": 698}
{"info/global_step": 699, "train_info/time_within_train_step": 27.791131258010864, "step": 699}
{"train_info/time_between_train_steps": 0.005463123321533203, "step": 699}
{"info/global_step": 700, "train_info/time_within_train_step": 27.7733793258667, "step": 700}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733857488, "_runtime": 20022}, "step": 700}
{"logs": {"train/loss": 4.3451, "train/learning_rate": 0.0002777777777777778, "train/epoch": 25.02, "_timestamp": 1733857488, "_runtime": 20022}, "step": 700}
{"train_info/time_between_train_steps": 2.9054064750671387, "step": 700}
{"info/global_step": 701, "train_info/time_within_train_step": 27.75606608390808, "step": 701}
{"train_info/time_between_train_steps": 0.0056610107421875, "step": 701}
{"info/global_step": 702, "train_info/time_within_train_step": 27.995950937271118, "step": 702}
{"train_info/time_between_train_steps": 0.010704517364501953, "step": 702}
{"train_info/time_between_train_steps": 21.024512767791748, "step": 702}
{"info/global_step": 703, "train_info/time_within_train_step": 28.20804214477539, "step": 703}
{"train_info/time_between_train_steps": 0.005292654037475586, "step": 703}
{"info/global_step": 704, "train_info/time_within_train_step": 28.001627445220947, "step": 704}
{"train_info/time_between_train_steps": 0.0054285526275634766, "step": 704}
{"info/global_step": 705, "train_info/time_within_train_step": 27.77179217338562, "step": 705}
{"train_info/time_between_train_steps": 0.0055387020111083984, "step": 705}
{"info/global_step": 706, "train_info/time_within_train_step": 27.9720458984375, "step": 706}
{"train_info/time_between_train_steps": 0.005349397659301758, "step": 706}
{"info/global_step": 707, "train_info/time_within_train_step": 27.748349905014038, "step": 707}
{"train_info/time_between_train_steps": 0.005260944366455078, "step": 707}
{"info/global_step": 708, "train_info/time_within_train_step": 27.913304567337036, "step": 708}
{"train_info/time_between_train_steps": 0.005385875701904297, "step": 708}
{"info/global_step": 709, "train_info/time_within_train_step": 27.769442319869995, "step": 709}
{"train_info/time_between_train_steps": 0.005429983139038086, "step": 709}
{"info/global_step": 710, "train_info/time_within_train_step": 27.78275442123413, "step": 710}
{"train_info/time_between_train_steps": 0.005241870880126953, "step": 710}
{"info/global_step": 711, "train_info/time_within_train_step": 27.74041223526001, "step": 711}
{"train_info/time_between_train_steps": 0.005082607269287109, "step": 711}
{"info/global_step": 712, "train_info/time_within_train_step": 27.74175524711609, "step": 712}
{"train_info/time_between_train_steps": 0.009997844696044922, "step": 712}
{"info/global_step": 713, "train_info/time_within_train_step": 27.730478525161743, "step": 713}
{"train_info/time_between_train_steps": 0.0050051212310791016, "step": 713}
{"info/global_step": 714, "train_info/time_within_train_step": 27.732248783111572, "step": 714}
{"train_info/time_between_train_steps": 0.005173683166503906, "step": 714}
{"info/global_step": 715, "train_info/time_within_train_step": 27.733840465545654, "step": 715}
{"train_info/time_between_train_steps": 0.00989079475402832, "step": 715}
{"info/global_step": 716, "train_info/time_within_train_step": 27.769760131835938, "step": 716}
{"train_info/time_between_train_steps": 0.005110979080200195, "step": 716}
{"info/global_step": 717, "train_info/time_within_train_step": 27.753504037857056, "step": 717}
{"train_info/time_between_train_steps": 0.009802103042602539, "step": 717}
{"info/global_step": 718, "train_info/time_within_train_step": 27.78731894493103, "step": 718}
{"train_info/time_between_train_steps": 0.0050754547119140625, "step": 718}
{"info/global_step": 719, "train_info/time_within_train_step": 27.849456787109375, "step": 719}
{"train_info/time_between_train_steps": 0.005118370056152344, "step": 719}
{"info/global_step": 720, "train_info/time_within_train_step": 27.81949543952942, "step": 720}
{"train_info/time_between_train_steps": 0.005130290985107422, "step": 720}
{"info/global_step": 721, "train_info/time_within_train_step": 27.747304677963257, "step": 721}
{"train_info/time_between_train_steps": 0.005051851272583008, "step": 721}
{"info/global_step": 722, "train_info/time_within_train_step": 27.876521825790405, "step": 722}
{"train_info/time_between_train_steps": 0.00499725341796875, "step": 722}
{"info/global_step": 723, "train_info/time_within_train_step": 27.7373948097229, "step": 723}
{"train_info/time_between_train_steps": 0.005211353302001953, "step": 723}
{"info/global_step": 724, "train_info/time_within_train_step": 27.75586462020874, "step": 724}
{"train_info/time_between_train_steps": 0.009953498840332031, "step": 724}
{"info/global_step": 725, "train_info/time_within_train_step": 27.91322159767151, "step": 725}
{"train_info/time_between_train_steps": 0.005059480667114258, "step": 725}
{"info/global_step": 726, "train_info/time_within_train_step": 27.787941455841064, "step": 726}
{"train_info/time_between_train_steps": 0.010191917419433594, "step": 726}
{"info/global_step": 727, "train_info/time_within_train_step": 27.768125534057617, "step": 727}
{"train_info/time_between_train_steps": 0.005154609680175781, "step": 727}
{"info/global_step": 728, "train_info/time_within_train_step": 27.959896087646484, "step": 728}
{"train_info/time_between_train_steps": 0.005789279937744141, "step": 728}
{"info/global_step": 729, "train_info/time_within_train_step": 27.848345041275024, "step": 729}
{"train_info/time_between_train_steps": 0.006972789764404297, "step": 729}
{"train_info/time_between_train_steps": 20.82680892944336, "step": 729}
{"info/global_step": 730, "train_info/time_within_train_step": 27.81589913368225, "step": 730}
{"train_info/time_between_train_steps": 0.00615692138671875, "step": 730}
{"info/global_step": 731, "train_info/time_within_train_step": 28.002861976623535, "step": 731}
{"train_info/time_between_train_steps": 0.005352973937988281, "step": 731}
{"info/global_step": 732, "train_info/time_within_train_step": 27.771703481674194, "step": 732}
{"train_info/time_between_train_steps": 0.0070950984954833984, "step": 732}
{"info/global_step": 733, "train_info/time_within_train_step": 27.865707635879517, "step": 733}
{"train_info/time_between_train_steps": 0.005634784698486328, "step": 733}
{"info/global_step": 734, "train_info/time_within_train_step": 27.954219102859497, "step": 734}
{"train_info/time_between_train_steps": 0.005891323089599609, "step": 734}
{"info/global_step": 735, "train_info/time_within_train_step": 27.964405298233032, "step": 735}
{"train_info/time_between_train_steps": 0.00542759895324707, "step": 735}
{"info/global_step": 736, "train_info/time_within_train_step": 27.777755737304688, "step": 736}
{"train_info/time_between_train_steps": 0.005480527877807617, "step": 736}
{"info/global_step": 737, "train_info/time_within_train_step": 27.829132795333862, "step": 737}
{"train_info/time_between_train_steps": 0.005699634552001953, "step": 737}
{"info/global_step": 738, "train_info/time_within_train_step": 27.764833450317383, "step": 738}
{"train_info/time_between_train_steps": 0.00535893440246582, "step": 738}
{"info/global_step": 739, "train_info/time_within_train_step": 27.746598958969116, "step": 739}
{"train_info/time_between_train_steps": 0.009990215301513672, "step": 739}
{"info/global_step": 740, "train_info/time_within_train_step": 27.739686250686646, "step": 740}
{"train_info/time_between_train_steps": 0.0052106380462646484, "step": 740}
{"info/global_step": 741, "train_info/time_within_train_step": 27.74333143234253, "step": 741}
{"train_info/time_between_train_steps": 0.005127429962158203, "step": 741}
{"info/global_step": 742, "train_info/time_within_train_step": 27.74279284477234, "step": 742}
{"train_info/time_between_train_steps": 0.005280017852783203, "step": 742}
{"info/global_step": 743, "train_info/time_within_train_step": 27.769591569900513, "step": 743}
{"train_info/time_between_train_steps": 0.005243062973022461, "step": 743}
{"info/global_step": 744, "train_info/time_within_train_step": 27.76388645172119, "step": 744}
{"train_info/time_between_train_steps": 0.005299091339111328, "step": 744}
{"info/global_step": 745, "train_info/time_within_train_step": 27.73931312561035, "step": 745}
{"train_info/time_between_train_steps": 0.005203962326049805, "step": 745}
{"info/global_step": 746, "train_info/time_within_train_step": 27.785672903060913, "step": 746}
{"train_info/time_between_train_steps": 0.005850553512573242, "step": 746}
{"info/global_step": 747, "train_info/time_within_train_step": 27.7842538356781, "step": 747}
{"train_info/time_between_train_steps": 0.005190134048461914, "step": 747}
{"info/global_step": 748, "train_info/time_within_train_step": 27.759260892868042, "step": 748}
{"train_info/time_between_train_steps": 0.00532221794128418, "step": 748}
{"info/global_step": 749, "train_info/time_within_train_step": 27.901291131973267, "step": 749}
{"train_info/time_between_train_steps": 0.0052373409271240234, "step": 749}
{"info/global_step": 750, "train_info/time_within_train_step": 27.742299556732178, "step": 750}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733858924, "_runtime": 21458}, "step": 750}
{"logs": {"train/loss": 4.2866, "train/learning_rate": 0.00025, "train/epoch": 27.02, "_timestamp": 1733858924, "_runtime": 21458}, "step": 750}
{"train_info/time_between_train_steps": 0.007154703140258789, "step": 750}
{"info/global_step": 751, "train_info/time_within_train_step": 27.750572204589844, "step": 751}
{"train_info/time_between_train_steps": 0.005186557769775391, "step": 751}
{"info/global_step": 752, "train_info/time_within_train_step": 27.74537706375122, "step": 752}
{"train_info/time_between_train_steps": 0.005104780197143555, "step": 752}
{"info/global_step": 753, "train_info/time_within_train_step": 27.750664472579956, "step": 753}
{"train_info/time_between_train_steps": 0.00545191764831543, "step": 753}
{"info/global_step": 754, "train_info/time_within_train_step": 27.888830423355103, "step": 754}
{"train_info/time_between_train_steps": 0.010643720626831055, "step": 754}
{"info/global_step": 755, "train_info/time_within_train_step": 27.782248973846436, "step": 755}
{"train_info/time_between_train_steps": 0.01036691665649414, "step": 755}
{"info/global_step": 756, "train_info/time_within_train_step": 27.8254292011261, "step": 756}
{"train_info/time_between_train_steps": 0.011447668075561523, "step": 756}
{"train_info/time_between_train_steps": 20.784735441207886, "step": 756}
{"info/global_step": 757, "train_info/time_within_train_step": 27.96948218345642, "step": 757}
{"train_info/time_between_train_steps": 0.010297298431396484, "step": 757}
{"info/global_step": 758, "train_info/time_within_train_step": 28.23109483718872, "step": 758}
{"train_info/time_between_train_steps": 0.005286693572998047, "step": 758}
{"info/global_step": 759, "train_info/time_within_train_step": 27.765300989151, "step": 759}
{"train_info/time_between_train_steps": 0.005259275436401367, "step": 759}
{"info/global_step": 760, "train_info/time_within_train_step": 28.00747776031494, "step": 760}
{"train_info/time_between_train_steps": 0.010720968246459961, "step": 760}
{"info/global_step": 761, "train_info/time_within_train_step": 27.955004692077637, "step": 761}
{"train_info/time_between_train_steps": 0.006685018539428711, "step": 761}
{"info/global_step": 762, "train_info/time_within_train_step": 27.948418617248535, "step": 762}
{"train_info/time_between_train_steps": 0.005742073059082031, "step": 762}
{"info/global_step": 763, "train_info/time_within_train_step": 27.799349308013916, "step": 763}
{"train_info/time_between_train_steps": 0.0103912353515625, "step": 763}
{"info/global_step": 764, "train_info/time_within_train_step": 27.93612837791443, "step": 764}
{"train_info/time_between_train_steps": 0.005117654800415039, "step": 764}
{"info/global_step": 765, "train_info/time_within_train_step": 27.779027462005615, "step": 765}
{"train_info/time_between_train_steps": 0.00981450080871582, "step": 765}
{"info/global_step": 766, "train_info/time_within_train_step": 27.763695240020752, "step": 766}
{"train_info/time_between_train_steps": 0.00514531135559082, "step": 766}
{"info/global_step": 767, "train_info/time_within_train_step": 27.756420373916626, "step": 767}
{"train_info/time_between_train_steps": 0.004957914352416992, "step": 767}
{"info/global_step": 768, "train_info/time_within_train_step": 27.769798040390015, "step": 768}
{"train_info/time_between_train_steps": 0.005002260208129883, "step": 768}
{"info/global_step": 769, "train_info/time_within_train_step": 27.74608874320984, "step": 769}
{"train_info/time_between_train_steps": 0.005125761032104492, "step": 769}
{"info/global_step": 770, "train_info/time_within_train_step": 27.79612374305725, "step": 770}
{"train_info/time_between_train_steps": 0.010365486145019531, "step": 770}
{"info/global_step": 771, "train_info/time_within_train_step": 28.126373767852783, "step": 771}
{"train_info/time_between_train_steps": 0.010439634323120117, "step": 771}
{"info/global_step": 772, "train_info/time_within_train_step": 27.766002893447876, "step": 772}
{"train_info/time_between_train_steps": 0.005137920379638672, "step": 772}
{"info/global_step": 773, "train_info/time_within_train_step": 27.856428623199463, "step": 773}
{"train_info/time_between_train_steps": 0.010401725769042969, "step": 773}
{"info/global_step": 774, "train_info/time_within_train_step": 27.99237370491028, "step": 774}
{"train_info/time_between_train_steps": 0.005056142807006836, "step": 774}
{"info/global_step": 775, "train_info/time_within_train_step": 27.796188354492188, "step": 775}
{"train_info/time_between_train_steps": 0.010869264602661133, "step": 775}
{"info/global_step": 776, "train_info/time_within_train_step": 27.91520094871521, "step": 776}
{"train_info/time_between_train_steps": 0.005068778991699219, "step": 776}
{"info/global_step": 777, "train_info/time_within_train_step": 27.932671546936035, "step": 777}
{"train_info/time_between_train_steps": 0.01170969009399414, "step": 777}
{"info/global_step": 778, "train_info/time_within_train_step": 27.892632961273193, "step": 778}
{"train_info/time_between_train_steps": 0.013838529586791992, "step": 778}
{"info/global_step": 779, "train_info/time_within_train_step": 27.759634971618652, "step": 779}
{"train_info/time_between_train_steps": 0.009881019592285156, "step": 779}
{"info/global_step": 780, "train_info/time_within_train_step": 27.88732933998108, "step": 780}
{"train_info/time_between_train_steps": 0.0055561065673828125, "step": 780}
{"info/global_step": 781, "train_info/time_within_train_step": 27.819807291030884, "step": 781}
{"train_info/time_between_train_steps": 0.005361080169677734, "step": 781}
{"info/global_step": 782, "train_info/time_within_train_step": 27.791014432907104, "step": 782}
{"train_info/time_between_train_steps": 0.01651620864868164, "step": 782}
{"info/global_step": 783, "train_info/time_within_train_step": 27.865684032440186, "step": 783}
{"train_info/time_between_train_steps": 0.010695457458496094, "step": 783}
{"train_info/time_between_train_steps": 20.653300046920776, "step": 783}
{"info/global_step": 784, "train_info/time_within_train_step": 27.775646209716797, "step": 784}
{"train_info/time_between_train_steps": 0.010829448699951172, "step": 784}
{"info/global_step": 785, "train_info/time_within_train_step": 27.990938663482666, "step": 785}
{"train_info/time_between_train_steps": 0.005357265472412109, "step": 785}
{"info/global_step": 786, "train_info/time_within_train_step": 27.761942148208618, "step": 786}
{"train_info/time_between_train_steps": 0.0050961971282958984, "step": 786}
{"info/global_step": 787, "train_info/time_within_train_step": 27.94463324546814, "step": 787}
{"train_info/time_between_train_steps": 0.005518674850463867, "step": 787}
{"info/global_step": 788, "train_info/time_within_train_step": 27.814650535583496, "step": 788}
{"train_info/time_between_train_steps": 0.0052602291107177734, "step": 788}
{"info/global_step": 789, "train_info/time_within_train_step": 27.961944103240967, "step": 789}
{"train_info/time_between_train_steps": 0.005331516265869141, "step": 789}
{"info/global_step": 790, "train_info/time_within_train_step": 27.756439447402954, "step": 790}
{"train_info/time_between_train_steps": 0.005766391754150391, "step": 790}
{"info/global_step": 791, "train_info/time_within_train_step": 27.804078817367554, "step": 791}
{"train_info/time_between_train_steps": 0.005232095718383789, "step": 791}
{"info/global_step": 792, "train_info/time_within_train_step": 27.782673120498657, "step": 792}
{"train_info/time_between_train_steps": 0.005108356475830078, "step": 792}
{"info/global_step": 793, "train_info/time_within_train_step": 27.74203634262085, "step": 793}
{"train_info/time_between_train_steps": 0.004982948303222656, "step": 793}
{"info/global_step": 794, "train_info/time_within_train_step": 27.73490333557129, "step": 794}
{"train_info/time_between_train_steps": 0.004984140396118164, "step": 794}
{"info/global_step": 795, "train_info/time_within_train_step": 27.954015254974365, "step": 795}
{"train_info/time_between_train_steps": 0.00531458854675293, "step": 795}
{"info/global_step": 796, "train_info/time_within_train_step": 27.836215257644653, "step": 796}
{"train_info/time_between_train_steps": 0.01409149169921875, "step": 796}
{"info/global_step": 797, "train_info/time_within_train_step": 28.0342378616333, "step": 797}
{"train_info/time_between_train_steps": 0.014373064041137695, "step": 797}
{"info/global_step": 798, "train_info/time_within_train_step": 28.02618098258972, "step": 798}
{"train_info/time_between_train_steps": 0.006067514419555664, "step": 798}
{"info/global_step": 799, "train_info/time_within_train_step": 28.14580464363098, "step": 799}
{"train_info/time_between_train_steps": 0.0053408145904541016, "step": 799}
{"info/global_step": 800, "train_info/time_within_train_step": 28.170615434646606, "step": 800}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733860359, "_runtime": 22893}, "step": 800}
{"logs": {"train/loss": 4.1896, "train/learning_rate": 0.00022222222222222218, "train/epoch": 29.01, "_timestamp": 1733860359, "_runtime": 22893}, "step": 800}
{"train_info/time_between_train_steps": 3.7730815410614014, "step": 800}
{"info/global_step": 801, "train_info/time_within_train_step": 28.147759437561035, "step": 801}
{"train_info/time_between_train_steps": 0.01047515869140625, "step": 801}
{"info/global_step": 802, "train_info/time_within_train_step": 28.136391639709473, "step": 802}
{"train_info/time_between_train_steps": 0.010560989379882812, "step": 802}
{"info/global_step": 803, "train_info/time_within_train_step": 28.149136543273926, "step": 803}
{"train_info/time_between_train_steps": 0.010887622833251953, "step": 803}
{"info/global_step": 804, "train_info/time_within_train_step": 28.15393900871277, "step": 804}
{"train_info/time_between_train_steps": 0.01047372817993164, "step": 804}
{"info/global_step": 805, "train_info/time_within_train_step": 28.176430702209473, "step": 805}
{"train_info/time_between_train_steps": 0.009564638137817383, "step": 805}
{"info/global_step": 806, "train_info/time_within_train_step": 28.15347194671631, "step": 806}
{"train_info/time_between_train_steps": 0.010111570358276367, "step": 806}
{"info/global_step": 807, "train_info/time_within_train_step": 28.155084371566772, "step": 807}
{"train_info/time_between_train_steps": 0.010541439056396484, "step": 807}
{"info/global_step": 808, "train_info/time_within_train_step": 28.171049118041992, "step": 808}
{"train_info/time_between_train_steps": 0.014525413513183594, "step": 808}
{"info/global_step": 809, "train_info/time_within_train_step": 28.083993911743164, "step": 809}
{"train_info/time_between_train_steps": 0.009550094604492188, "step": 809}
{"info/global_step": 810, "train_info/time_within_train_step": 28.377387046813965, "step": 810}
{"train_info/time_between_train_steps": 0.010971784591674805, "step": 810}
{"train_info/time_between_train_steps": 20.791377782821655, "step": 810}
{"info/global_step": 811, "train_info/time_within_train_step": 28.154419422149658, "step": 811}
{"train_info/time_between_train_steps": 0.010653018951416016, "step": 811}
{"info/global_step": 812, "train_info/time_within_train_step": 27.992589235305786, "step": 812}
{"train_info/time_between_train_steps": 0.005143404006958008, "step": 812}
{"info/global_step": 813, "train_info/time_within_train_step": 27.90430998802185, "step": 813}
{"train_info/time_between_train_steps": 0.005536079406738281, "step": 813}
{"info/global_step": 814, "train_info/time_within_train_step": 28.371655702590942, "step": 814}
{"train_info/time_between_train_steps": 0.010779380798339844, "step": 814}
{"info/global_step": 815, "train_info/time_within_train_step": 27.98257541656494, "step": 815}
{"train_info/time_between_train_steps": 0.010765790939331055, "step": 815}
{"info/global_step": 816, "train_info/time_within_train_step": 27.93235468864441, "step": 816}
{"train_info/time_between_train_steps": 0.005124092102050781, "step": 816}
{"info/global_step": 817, "train_info/time_within_train_step": 28.079336881637573, "step": 817}
{"train_info/time_between_train_steps": 0.010939836502075195, "step": 817}
{"info/global_step": 818, "train_info/time_within_train_step": 28.14146399497986, "step": 818}
{"train_info/time_between_train_steps": 0.010530948638916016, "step": 818}
{"info/global_step": 819, "train_info/time_within_train_step": 27.826980590820312, "step": 819}
{"train_info/time_between_train_steps": 0.005059003829956055, "step": 819}
{"info/global_step": 820, "train_info/time_within_train_step": 28.063514947891235, "step": 820}
{"train_info/time_between_train_steps": 0.009591341018676758, "step": 820}
{"info/global_step": 821, "train_info/time_within_train_step": 28.08044934272766, "step": 821}
{"train_info/time_between_train_steps": 0.010360479354858398, "step": 821}
{"info/global_step": 822, "train_info/time_within_train_step": 27.933400630950928, "step": 822}
{"train_info/time_between_train_steps": 0.0051691532135009766, "step": 822}
{"info/global_step": 823, "train_info/time_within_train_step": 28.056773900985718, "step": 823}
{"train_info/time_between_train_steps": 0.010706901550292969, "step": 823}
{"info/global_step": 824, "train_info/time_within_train_step": 27.95741033554077, "step": 824}
{"train_info/time_between_train_steps": 0.00530695915222168, "step": 824}
{"info/global_step": 825, "train_info/time_within_train_step": 28.061409950256348, "step": 825}
{"train_info/time_between_train_steps": 0.005333662033081055, "step": 825}
{"info/global_step": 826, "train_info/time_within_train_step": 27.98524785041809, "step": 826}
{"train_info/time_between_train_steps": 0.011123895645141602, "step": 826}
{"info/global_step": 827, "train_info/time_within_train_step": 27.93649125099182, "step": 827}
{"train_info/time_between_train_steps": 0.00530552864074707, "step": 827}
{"info/global_step": 828, "train_info/time_within_train_step": 28.002474308013916, "step": 828}
{"train_info/time_between_train_steps": 0.005227088928222656, "step": 828}
{"info/global_step": 829, "train_info/time_within_train_step": 28.118083000183105, "step": 829}
{"train_info/time_between_train_steps": 0.010158061981201172, "step": 829}
{"info/global_step": 830, "train_info/time_within_train_step": 28.07231378555298, "step": 830}
{"train_info/time_between_train_steps": 0.009129047393798828, "step": 830}
{"info/global_step": 831, "train_info/time_within_train_step": 27.945619106292725, "step": 831}
{"train_info/time_between_train_steps": 0.005425691604614258, "step": 831}
{"info/global_step": 832, "train_info/time_within_train_step": 28.069262266159058, "step": 832}
{"train_info/time_between_train_steps": 0.01051187515258789, "step": 832}
{"info/global_step": 833, "train_info/time_within_train_step": 27.994598388671875, "step": 833}
{"train_info/time_between_train_steps": 0.009095907211303711, "step": 833}
{"info/global_step": 834, "train_info/time_within_train_step": 28.03999161720276, "step": 834}
{"train_info/time_between_train_steps": 0.005808115005493164, "step": 834}
{"info/global_step": 835, "train_info/time_within_train_step": 27.830479621887207, "step": 835}
{"train_info/time_between_train_steps": 0.00530242919921875, "step": 835}
{"info/global_step": 836, "train_info/time_within_train_step": 27.822879552841187, "step": 836}
{"train_info/time_between_train_steps": 0.005937337875366211, "step": 836}
{"info/global_step": 837, "train_info/time_within_train_step": 28.01689600944519, "step": 837}
{"train_info/time_between_train_steps": 0.005647420883178711, "step": 837}
{"train_info/time_between_train_steps": 21.058192491531372, "step": 837}
{"info/global_step": 838, "train_info/time_within_train_step": 27.97298502922058, "step": 838}
{"train_info/time_between_train_steps": 0.010608911514282227, "step": 838}
{"info/global_step": 839, "train_info/time_within_train_step": 28.13266611099243, "step": 839}
{"train_info/time_between_train_steps": 0.0063593387603759766, "step": 839}
{"info/global_step": 840, "train_info/time_within_train_step": 28.150012254714966, "step": 840}
{"train_info/time_between_train_steps": 0.005516529083251953, "step": 840}
{"info/global_step": 841, "train_info/time_within_train_step": 28.140575170516968, "step": 841}
{"train_info/time_between_train_steps": 0.011340618133544922, "step": 841}
{"info/global_step": 842, "train_info/time_within_train_step": 28.053829669952393, "step": 842}
{"train_info/time_between_train_steps": 0.005689382553100586, "step": 842}
{"info/global_step": 843, "train_info/time_within_train_step": 28.505693674087524, "step": 843}
{"train_info/time_between_train_steps": 0.011718988418579102, "step": 843}
{"info/global_step": 844, "train_info/time_within_train_step": 28.081591844558716, "step": 844}
{"train_info/time_between_train_steps": 0.008577823638916016, "step": 844}
{"info/global_step": 845, "train_info/time_within_train_step": 28.335606336593628, "step": 845}
{"train_info/time_between_train_steps": 0.014864206314086914, "step": 845}
{"info/global_step": 846, "train_info/time_within_train_step": 29.273052215576172, "step": 846}
{"train_info/time_between_train_steps": 0.010953903198242188, "step": 846}
{"info/global_step": 847, "train_info/time_within_train_step": 28.266181707382202, "step": 847}
{"train_info/time_between_train_steps": 0.010805368423461914, "step": 847}
{"info/global_step": 848, "train_info/time_within_train_step": 28.52638006210327, "step": 848}
{"train_info/time_between_train_steps": 0.010480880737304688, "step": 848}
{"info/global_step": 849, "train_info/time_within_train_step": 28.177536010742188, "step": 849}
{"train_info/time_between_train_steps": 0.010652780532836914, "step": 849}
{"info/global_step": 850, "train_info/time_within_train_step": 28.25381064414978, "step": 850}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733861811, "_runtime": 24345}, "step": 850}
{"logs": {"train/loss": 4.0998, "train/learning_rate": 0.00019444444444444443, "train/epoch": 31.01, "_timestamp": 1733861811, "_runtime": 24345}, "step": 850}
{"train_info/time_between_train_steps": 0.014621496200561523, "step": 850}
{"info/global_step": 851, "train_info/time_within_train_step": 28.135321855545044, "step": 851}
{"train_info/time_between_train_steps": 0.011039018630981445, "step": 851}
{"info/global_step": 852, "train_info/time_within_train_step": 28.195711135864258, "step": 852}
{"train_info/time_between_train_steps": 0.011078834533691406, "step": 852}
{"info/global_step": 853, "train_info/time_within_train_step": 28.218517780303955, "step": 853}
{"train_info/time_between_train_steps": 0.010957717895507812, "step": 853}
{"info/global_step": 854, "train_info/time_within_train_step": 28.119282007217407, "step": 854}
{"train_info/time_between_train_steps": 0.010884523391723633, "step": 854}
{"info/global_step": 855, "train_info/time_within_train_step": 28.066579341888428, "step": 855}
{"train_info/time_between_train_steps": 0.010861396789550781, "step": 855}
{"info/global_step": 856, "train_info/time_within_train_step": 28.320006847381592, "step": 856}
{"train_info/time_between_train_steps": 0.011310577392578125, "step": 856}
{"info/global_step": 857, "train_info/time_within_train_step": 28.200040817260742, "step": 857}
{"train_info/time_between_train_steps": 0.011404752731323242, "step": 857}
{"info/global_step": 858, "train_info/time_within_train_step": 28.030030965805054, "step": 858}
{"train_info/time_between_train_steps": 0.010941267013549805, "step": 858}
{"info/global_step": 859, "train_info/time_within_train_step": 28.192368507385254, "step": 859}
{"train_info/time_between_train_steps": 0.012374401092529297, "step": 859}
{"info/global_step": 860, "train_info/time_within_train_step": 28.134522438049316, "step": 860}
{"train_info/time_between_train_steps": 0.010798931121826172, "step": 860}
{"info/global_step": 861, "train_info/time_within_train_step": 28.182603120803833, "step": 861}
{"train_info/time_between_train_steps": 0.011863470077514648, "step": 861}
{"info/global_step": 862, "train_info/time_within_train_step": 28.207134008407593, "step": 862}
{"train_info/time_between_train_steps": 0.011107683181762695, "step": 862}
{"info/global_step": 863, "train_info/time_within_train_step": 28.210939645767212, "step": 863}
{"train_info/time_between_train_steps": 0.013712644577026367, "step": 863}
{"info/global_step": 864, "train_info/time_within_train_step": 28.240939140319824, "step": 864}
{"train_info/time_between_train_steps": 0.014113903045654297, "step": 864}
{"train_info/time_between_train_steps": 22.24693012237549, "step": 864}
{"info/global_step": 865, "train_info/time_within_train_step": 28.15004062652588, "step": 865}
{"train_info/time_between_train_steps": 0.010506153106689453, "step": 865}
{"info/global_step": 866, "train_info/time_within_train_step": 28.44516897201538, "step": 866}
{"train_info/time_between_train_steps": 0.010295867919921875, "step": 866}
{"info/global_step": 867, "train_info/time_within_train_step": 28.046899557113647, "step": 867}
{"train_info/time_between_train_steps": 0.0055811405181884766, "step": 867}
{"info/global_step": 868, "train_info/time_within_train_step": 28.379171133041382, "step": 868}
{"train_info/time_between_train_steps": 0.011019229888916016, "step": 868}
{"info/global_step": 869, "train_info/time_within_train_step": 28.19662594795227, "step": 869}
{"train_info/time_between_train_steps": 0.01193547248840332, "step": 869}
{"info/global_step": 870, "train_info/time_within_train_step": 28.452964305877686, "step": 870}
{"train_info/time_between_train_steps": 0.011024951934814453, "step": 870}
{"info/global_step": 871, "train_info/time_within_train_step": 28.30947232246399, "step": 871}
{"train_info/time_between_train_steps": 0.01121377944946289, "step": 871}
{"info/global_step": 872, "train_info/time_within_train_step": 28.23776149749756, "step": 872}
{"train_info/time_between_train_steps": 0.010845422744750977, "step": 872}
{"info/global_step": 873, "train_info/time_within_train_step": 28.14577007293701, "step": 873}
{"train_info/time_between_train_steps": 0.013403177261352539, "step": 873}
{"info/global_step": 874, "train_info/time_within_train_step": 28.164746284484863, "step": 874}
{"train_info/time_between_train_steps": 0.010682344436645508, "step": 874}
{"info/global_step": 875, "train_info/time_within_train_step": 28.1235830783844, "step": 875}
{"train_info/time_between_train_steps": 0.011402368545532227, "step": 875}
{"info/global_step": 876, "train_info/time_within_train_step": 28.193041801452637, "step": 876}
{"train_info/time_between_train_steps": 0.012187719345092773, "step": 876}
{"info/global_step": 877, "train_info/time_within_train_step": 28.205087661743164, "step": 877}
{"train_info/time_between_train_steps": 0.010223865509033203, "step": 877}
{"info/global_step": 878, "train_info/time_within_train_step": 28.17852807044983, "step": 878}
{"train_info/time_between_train_steps": 0.011054754257202148, "step": 878}
{"info/global_step": 879, "train_info/time_within_train_step": 28.120259523391724, "step": 879}
{"train_info/time_between_train_steps": 0.010991096496582031, "step": 879}
{"info/global_step": 880, "train_info/time_within_train_step": 28.109877109527588, "step": 880}
{"train_info/time_between_train_steps": 0.00993490219116211, "step": 880}
{"info/global_step": 881, "train_info/time_within_train_step": 28.172051668167114, "step": 881}
{"train_info/time_between_train_steps": 0.005293607711791992, "step": 881}
{"info/global_step": 882, "train_info/time_within_train_step": 27.98906707763672, "step": 882}
{"train_info/time_between_train_steps": 0.005388021469116211, "step": 882}
{"info/global_step": 883, "train_info/time_within_train_step": 28.556209564208984, "step": 883}
{"train_info/time_between_train_steps": 0.012005805969238281, "step": 883}
{"info/global_step": 884, "train_info/time_within_train_step": 28.085872411727905, "step": 884}
{"train_info/time_between_train_steps": 0.009110212326049805, "step": 884}
{"info/global_step": 885, "train_info/time_within_train_step": 28.486947774887085, "step": 885}
{"train_info/time_between_train_steps": 0.010506868362426758, "step": 885}
{"info/global_step": 886, "train_info/time_within_train_step": 28.14364004135132, "step": 886}
{"train_info/time_between_train_steps": 0.010560750961303711, "step": 886}
{"info/global_step": 887, "train_info/time_within_train_step": 28.510090827941895, "step": 887}
{"train_info/time_between_train_steps": 0.011277914047241211, "step": 887}
{"info/global_step": 888, "train_info/time_within_train_step": 28.185128211975098, "step": 888}
{"train_info/time_between_train_steps": 0.010780096054077148, "step": 888}
{"info/global_step": 889, "train_info/time_within_train_step": 28.244864463806152, "step": 889}
{"train_info/time_between_train_steps": 0.007537126541137695, "step": 889}
{"info/global_step": 890, "train_info/time_within_train_step": 28.154435873031616, "step": 890}
{"train_info/time_between_train_steps": 0.010852575302124023, "step": 890}
{"info/global_step": 891, "train_info/time_within_train_step": 28.214789628982544, "step": 891}
{"train_info/time_between_train_steps": 0.011254549026489258, "step": 891}
{"train_info/time_between_train_steps": 22.41699194908142, "step": 891}
{"info/global_step": 892, "train_info/time_within_train_step": 28.170485019683838, "step": 892}
{"train_info/time_between_train_steps": 0.011173009872436523, "step": 892}
{"info/global_step": 893, "train_info/time_within_train_step": 28.948068380355835, "step": 893}
{"train_info/time_between_train_steps": 0.009618759155273438, "step": 893}
{"info/global_step": 894, "train_info/time_within_train_step": 28.318596363067627, "step": 894}
{"train_info/time_between_train_steps": 0.010677814483642578, "step": 894}
{"info/global_step": 895, "train_info/time_within_train_step": 28.23550820350647, "step": 895}
{"train_info/time_between_train_steps": 0.008219718933105469, "step": 895}
{"info/global_step": 896, "train_info/time_within_train_step": 28.128715991973877, "step": 896}
{"train_info/time_between_train_steps": 0.00996708869934082, "step": 896}
{"info/global_step": 897, "train_info/time_within_train_step": 28.29961347579956, "step": 897}
{"train_info/time_between_train_steps": 0.011058330535888672, "step": 897}
{"info/global_step": 898, "train_info/time_within_train_step": 28.06834077835083, "step": 898}
{"train_info/time_between_train_steps": 0.011873722076416016, "step": 898}
{"info/global_step": 899, "train_info/time_within_train_step": 28.295522689819336, "step": 899}
{"train_info/time_between_train_steps": 0.011369466781616211, "step": 899}
{"info/global_step": 900, "train_info/time_within_train_step": 28.28398084640503, "step": 900}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733863268, "_runtime": 25802}, "step": 900}
{"logs": {"train/loss": 4.0267, "train/learning_rate": 0.00016666666666666666, "train/epoch": 33.01, "_timestamp": 1733863268, "_runtime": 25802}, "step": 900}
{"train_info/time_between_train_steps": 2.83976149559021, "step": 900}
{"info/global_step": 901, "train_info/time_within_train_step": 28.04024338722229, "step": 901}
{"train_info/time_between_train_steps": 0.014393329620361328, "step": 901}
{"info/global_step": 902, "train_info/time_within_train_step": 28.275495290756226, "step": 902}
{"train_info/time_between_train_steps": 0.010705709457397461, "step": 902}
{"info/global_step": 903, "train_info/time_within_train_step": 28.050211429595947, "step": 903}
{"train_info/time_between_train_steps": 0.005448579788208008, "step": 903}
{"info/global_step": 904, "train_info/time_within_train_step": 27.84912133216858, "step": 904}
{"train_info/time_between_train_steps": 0.005206108093261719, "step": 904}
{"info/global_step": 905, "train_info/time_within_train_step": 28.09527897834778, "step": 905}
{"train_info/time_between_train_steps": 0.0052509307861328125, "step": 905}
{"info/global_step": 906, "train_info/time_within_train_step": 27.874746799468994, "step": 906}
{"train_info/time_between_train_steps": 0.005127668380737305, "step": 906}
{"info/global_step": 907, "train_info/time_within_train_step": 27.763564109802246, "step": 907}
{"train_info/time_between_train_steps": 0.005248069763183594, "step": 907}
{"info/global_step": 908, "train_info/time_within_train_step": 27.937874794006348, "step": 908}
{"train_info/time_between_train_steps": 0.010716676712036133, "step": 908}
{"info/global_step": 909, "train_info/time_within_train_step": 28.13379693031311, "step": 909}
{"train_info/time_between_train_steps": 0.005438566207885742, "step": 909}
{"info/global_step": 910, "train_info/time_within_train_step": 28.094092845916748, "step": 910}
{"train_info/time_between_train_steps": 0.005223274230957031, "step": 910}
{"info/global_step": 911, "train_info/time_within_train_step": 27.909799098968506, "step": 911}
{"train_info/time_between_train_steps": 0.0054492950439453125, "step": 911}
{"info/global_step": 912, "train_info/time_within_train_step": 28.057018041610718, "step": 912}
{"train_info/time_between_train_steps": 0.010752677917480469, "step": 912}
{"info/global_step": 913, "train_info/time_within_train_step": 27.967777013778687, "step": 913}
{"train_info/time_between_train_steps": 0.010538101196289062, "step": 913}
{"info/global_step": 914, "train_info/time_within_train_step": 27.86587119102478, "step": 914}
{"train_info/time_between_train_steps": 0.010206460952758789, "step": 914}
{"info/global_step": 915, "train_info/time_within_train_step": 27.920061111450195, "step": 915}
{"train_info/time_between_train_steps": 0.010545730590820312, "step": 915}
{"info/global_step": 916, "train_info/time_within_train_step": 28.037233114242554, "step": 916}
{"train_info/time_between_train_steps": 0.010946512222290039, "step": 916}
{"info/global_step": 917, "train_info/time_within_train_step": 28.080792903900146, "step": 917}
{"train_info/time_between_train_steps": 0.01099848747253418, "step": 917}
{"info/global_step": 918, "train_info/time_within_train_step": 27.990916967391968, "step": 918}
{"train_info/time_between_train_steps": 0.005858182907104492, "step": 918}
{"train_info/time_between_train_steps": 20.657811880111694, "step": 918}
{"info/global_step": 919, "train_info/time_within_train_step": 27.981245517730713, "step": 919}
{"train_info/time_between_train_steps": 0.011313915252685547, "step": 919}
{"info/global_step": 920, "train_info/time_within_train_step": 28.33268141746521, "step": 920}
{"train_info/time_between_train_steps": 0.010809183120727539, "step": 920}
{"info/global_step": 921, "train_info/time_within_train_step": 27.942462682724, "step": 921}
{"train_info/time_between_train_steps": 0.005697488784790039, "step": 921}
{"info/global_step": 922, "train_info/time_within_train_step": 28.455002069473267, "step": 922}
{"train_info/time_between_train_steps": 0.01425313949584961, "step": 922}
{"info/global_step": 923, "train_info/time_within_train_step": 28.118034839630127, "step": 923}
{"train_info/time_between_train_steps": 0.011277914047241211, "step": 923}
{"info/global_step": 924, "train_info/time_within_train_step": 28.24912142753601, "step": 924}
{"train_info/time_between_train_steps": 0.010217666625976562, "step": 924}
{"info/global_step": 925, "train_info/time_within_train_step": 27.864712953567505, "step": 925}
{"train_info/time_between_train_steps": 0.005709648132324219, "step": 925}
{"info/global_step": 926, "train_info/time_within_train_step": 28.0736882686615, "step": 926}
{"train_info/time_between_train_steps": 0.005369424819946289, "step": 926}
{"info/global_step": 927, "train_info/time_within_train_step": 28.243131160736084, "step": 927}
{"train_info/time_between_train_steps": 0.010622501373291016, "step": 927}
{"info/global_step": 928, "train_info/time_within_train_step": 27.935855865478516, "step": 928}
{"train_info/time_between_train_steps": 0.010234832763671875, "step": 928}
{"info/global_step": 929, "train_info/time_within_train_step": 27.938555002212524, "step": 929}
{"train_info/time_between_train_steps": 0.005017280578613281, "step": 929}
{"info/global_step": 930, "train_info/time_within_train_step": 27.968082904815674, "step": 930}
{"train_info/time_between_train_steps": 0.00515437126159668, "step": 930}
{"info/global_step": 931, "train_info/time_within_train_step": 28.433637857437134, "step": 931}
{"train_info/time_between_train_steps": 0.01018381118774414, "step": 931}
{"info/global_step": 932, "train_info/time_within_train_step": 27.98762011528015, "step": 932}
{"train_info/time_between_train_steps": 0.01047658920288086, "step": 932}
{"info/global_step": 933, "train_info/time_within_train_step": 27.857944011688232, "step": 933}
{"train_info/time_between_train_steps": 0.005268096923828125, "step": 933}
{"info/global_step": 934, "train_info/time_within_train_step": 27.957361221313477, "step": 934}
{"train_info/time_between_train_steps": 0.005288124084472656, "step": 934}
{"info/global_step": 935, "train_info/time_within_train_step": 28.084186553955078, "step": 935}
{"train_info/time_between_train_steps": 0.009878158569335938, "step": 935}
{"info/global_step": 936, "train_info/time_within_train_step": 27.896156311035156, "step": 936}
{"train_info/time_between_train_steps": 0.005195140838623047, "step": 936}
{"info/global_step": 937, "train_info/time_within_train_step": 27.845463275909424, "step": 937}
{"train_info/time_between_train_steps": 0.005266904830932617, "step": 937}
{"info/global_step": 938, "train_info/time_within_train_step": 27.778114080429077, "step": 938}
{"train_info/time_between_train_steps": 0.009915351867675781, "step": 938}
{"info/global_step": 939, "train_info/time_within_train_step": 27.812703847885132, "step": 939}
{"train_info/time_between_train_steps": 0.005251407623291016, "step": 939}
{"info/global_step": 940, "train_info/time_within_train_step": 27.89936065673828, "step": 940}
{"train_info/time_between_train_steps": 0.0051898956298828125, "step": 940}
{"info/global_step": 941, "train_info/time_within_train_step": 27.88140296936035, "step": 941}
{"train_info/time_between_train_steps": 0.0052297115325927734, "step": 941}
{"info/global_step": 942, "train_info/time_within_train_step": 27.752466678619385, "step": 942}
{"train_info/time_between_train_steps": 0.0053844451904296875, "step": 942}
{"info/global_step": 943, "train_info/time_within_train_step": 27.752554178237915, "step": 943}
{"train_info/time_between_train_steps": 0.005298614501953125, "step": 943}
{"info/global_step": 944, "train_info/time_within_train_step": 27.747405529022217, "step": 944}
{"train_info/time_between_train_steps": 0.005703449249267578, "step": 944}
{"info/global_step": 945, "train_info/time_within_train_step": 27.78584599494934, "step": 945}
{"train_info/time_between_train_steps": 0.0059201717376708984, "step": 945}
{"train_info/time_between_train_steps": 20.614458084106445, "step": 945}
{"info/global_step": 946, "train_info/time_within_train_step": 27.90655517578125, "step": 946}
{"train_info/time_between_train_steps": 0.009958505630493164, "step": 946}
{"info/global_step": 947, "train_info/time_within_train_step": 28.009108066558838, "step": 947}
{"train_info/time_between_train_steps": 0.005433797836303711, "step": 947}
{"info/global_step": 948, "train_info/time_within_train_step": 27.72826647758484, "step": 948}
{"train_info/time_between_train_steps": 0.0051860809326171875, "step": 948}
{"info/global_step": 949, "train_info/time_within_train_step": 27.966679573059082, "step": 949}
{"train_info/time_between_train_steps": 0.0052378177642822266, "step": 949}
{"info/global_step": 950, "train_info/time_within_train_step": 27.73220920562744, "step": 950}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733864711, "_runtime": 27245}, "step": 950}
{"logs": {"train/loss": 3.957, "train/learning_rate": 0.0001388888888888889, "train/epoch": 35.0, "_timestamp": 1733864711, "_runtime": 27245}, "step": 950}
{"train_info/time_between_train_steps": 0.006945133209228516, "step": 950}
{"info/global_step": 951, "train_info/time_within_train_step": 27.86129403114319, "step": 951}
{"train_info/time_between_train_steps": 0.005145072937011719, "step": 951}
{"info/global_step": 952, "train_info/time_within_train_step": 27.767020225524902, "step": 952}
{"train_info/time_between_train_steps": 0.012254476547241211, "step": 952}
{"info/global_step": 953, "train_info/time_within_train_step": 27.850679636001587, "step": 953}
{"train_info/time_between_train_steps": 0.005218029022216797, "step": 953}
{"info/global_step": 954, "train_info/time_within_train_step": 27.717576265335083, "step": 954}
{"train_info/time_between_train_steps": 0.005043506622314453, "step": 954}
{"info/global_step": 955, "train_info/time_within_train_step": 27.70478105545044, "step": 955}
{"train_info/time_between_train_steps": 0.005009651184082031, "step": 955}
{"info/global_step": 956, "train_info/time_within_train_step": 27.758460521697998, "step": 956}
{"train_info/time_between_train_steps": 0.010000944137573242, "step": 956}
{"info/global_step": 957, "train_info/time_within_train_step": 27.71564817428589, "step": 957}
{"train_info/time_between_train_steps": 0.004926919937133789, "step": 957}
{"info/global_step": 958, "train_info/time_within_train_step": 27.71828603744507, "step": 958}
{"train_info/time_between_train_steps": 0.004937887191772461, "step": 958}
{"info/global_step": 959, "train_info/time_within_train_step": 27.71938943862915, "step": 959}
{"train_info/time_between_train_steps": 0.010177850723266602, "step": 959}
{"info/global_step": 960, "train_info/time_within_train_step": 27.72687029838562, "step": 960}
{"train_info/time_between_train_steps": 0.009849786758422852, "step": 960}
{"info/global_step": 961, "train_info/time_within_train_step": 27.71880865097046, "step": 961}
{"train_info/time_between_train_steps": 0.004937887191772461, "step": 961}
{"info/global_step": 962, "train_info/time_within_train_step": 27.71631169319153, "step": 962}
{"train_info/time_between_train_steps": 0.00948786735534668, "step": 962}
{"info/global_step": 963, "train_info/time_within_train_step": 27.858189344406128, "step": 963}
{"train_info/time_between_train_steps": 0.0049321651458740234, "step": 963}
{"info/global_step": 964, "train_info/time_within_train_step": 27.736122846603394, "step": 964}
{"train_info/time_between_train_steps": 0.005084991455078125, "step": 964}
{"info/global_step": 965, "train_info/time_within_train_step": 27.743210554122925, "step": 965}
{"train_info/time_between_train_steps": 0.005071401596069336, "step": 965}
{"info/global_step": 966, "train_info/time_within_train_step": 27.741085052490234, "step": 966}
{"train_info/time_between_train_steps": 0.005237102508544922, "step": 966}
{"info/global_step": 967, "train_info/time_within_train_step": 27.763476848602295, "step": 967}
{"train_info/time_between_train_steps": 0.005197048187255859, "step": 967}
{"info/global_step": 968, "train_info/time_within_train_step": 27.786025524139404, "step": 968}
{"train_info/time_between_train_steps": 0.010113000869750977, "step": 968}
{"info/global_step": 969, "train_info/time_within_train_step": 27.759390830993652, "step": 969}
{"train_info/time_between_train_steps": 0.005503177642822266, "step": 969}
{"info/global_step": 970, "train_info/time_within_train_step": 27.812840461730957, "step": 970}
{"train_info/time_between_train_steps": 0.0056836605072021484, "step": 970}
{"info/global_step": 971, "train_info/time_within_train_step": 27.837220907211304, "step": 971}
{"train_info/time_between_train_steps": 0.005561351776123047, "step": 971}
{"info/global_step": 972, "train_info/time_within_train_step": 27.934996128082275, "step": 972}
{"train_info/time_between_train_steps": 0.0056722164154052734, "step": 972}
{"train_info/time_between_train_steps": 20.787396669387817, "step": 972}
{"info/global_step": 973, "train_info/time_within_train_step": 27.775776863098145, "step": 973}
{"train_info/time_between_train_steps": 0.005589485168457031, "step": 973}
{"info/global_step": 974, "train_info/time_within_train_step": 28.237979412078857, "step": 974}
{"train_info/time_between_train_steps": 0.005322694778442383, "step": 974}
{"info/global_step": 975, "train_info/time_within_train_step": 27.870591640472412, "step": 975}
{"train_info/time_between_train_steps": 0.010855674743652344, "step": 975}
{"info/global_step": 976, "train_info/time_within_train_step": 27.964322566986084, "step": 976}
{"train_info/time_between_train_steps": 0.0052220821380615234, "step": 976}
{"info/global_step": 977, "train_info/time_within_train_step": 27.748222827911377, "step": 977}
{"train_info/time_between_train_steps": 0.005634784698486328, "step": 977}
{"info/global_step": 978, "train_info/time_within_train_step": 28.111653804779053, "step": 978}
{"train_info/time_between_train_steps": 0.010029315948486328, "step": 978}
{"info/global_step": 979, "train_info/time_within_train_step": 28.01500964164734, "step": 979}
{"train_info/time_between_train_steps": 0.01019144058227539, "step": 979}
{"info/global_step": 980, "train_info/time_within_train_step": 27.938659191131592, "step": 980}
{"train_info/time_between_train_steps": 0.014774084091186523, "step": 980}
{"info/global_step": 981, "train_info/time_within_train_step": 27.88243579864502, "step": 981}
{"train_info/time_between_train_steps": 0.0051403045654296875, "step": 981}
{"info/global_step": 982, "train_info/time_within_train_step": 27.953790426254272, "step": 982}
{"train_info/time_between_train_steps": 0.00499272346496582, "step": 982}
{"info/global_step": 983, "train_info/time_within_train_step": 27.761951208114624, "step": 983}
{"train_info/time_between_train_steps": 0.005492687225341797, "step": 983}
{"info/global_step": 984, "train_info/time_within_train_step": 27.755688190460205, "step": 984}
{"train_info/time_between_train_steps": 0.005189418792724609, "step": 984}
{"info/global_step": 985, "train_info/time_within_train_step": 27.748633861541748, "step": 985}
{"train_info/time_between_train_steps": 0.005342006683349609, "step": 985}
{"info/global_step": 986, "train_info/time_within_train_step": 27.838547945022583, "step": 986}
{"train_info/time_between_train_steps": 0.005434274673461914, "step": 986}
{"info/global_step": 987, "train_info/time_within_train_step": 27.77293872833252, "step": 987}
{"train_info/time_between_train_steps": 0.005230903625488281, "step": 987}
{"info/global_step": 988, "train_info/time_within_train_step": 27.898409366607666, "step": 988}
{"train_info/time_between_train_steps": 0.005079984664916992, "step": 988}
{"info/global_step": 989, "train_info/time_within_train_step": 27.816214561462402, "step": 989}
{"train_info/time_between_train_steps": 0.005182981491088867, "step": 989}
{"info/global_step": 990, "train_info/time_within_train_step": 27.92796564102173, "step": 990}
{"train_info/time_between_train_steps": 0.005496978759765625, "step": 990}
{"info/global_step": 991, "train_info/time_within_train_step": 27.8152916431427, "step": 991}
{"train_info/time_between_train_steps": 0.00528407096862793, "step": 991}
{"info/global_step": 992, "train_info/time_within_train_step": 27.863839626312256, "step": 992}
{"train_info/time_between_train_steps": 0.0051419734954833984, "step": 992}
{"info/global_step": 993, "train_info/time_within_train_step": 27.934853553771973, "step": 993}
{"train_info/time_between_train_steps": 0.009746074676513672, "step": 993}
{"info/global_step": 994, "train_info/time_within_train_step": 28.15082049369812, "step": 994}
{"train_info/time_between_train_steps": 0.00535893440246582, "step": 994}
{"info/global_step": 995, "train_info/time_within_train_step": 28.014829397201538, "step": 995}
{"train_info/time_between_train_steps": 0.008744001388549805, "step": 995}
{"info/global_step": 996, "train_info/time_within_train_step": 27.8234646320343, "step": 996}
{"train_info/time_between_train_steps": 0.0068666934967041016, "step": 996}
{"info/global_step": 997, "train_info/time_within_train_step": 27.898988008499146, "step": 997}
{"train_info/time_between_train_steps": 0.0053730010986328125, "step": 997}
{"info/global_step": 998, "train_info/time_within_train_step": 28.1851909160614, "step": 998}
{"train_info/time_between_train_steps": 0.005699872970581055, "step": 998}
{"info/global_step": 999, "train_info/time_within_train_step": 28.376864433288574, "step": 999}
{"train_info/time_between_train_steps": 0.006084442138671875, "step": 999}
{"train_info/time_between_train_steps": 20.906773805618286, "step": 999}
{"info/global_step": 1000, "train_info/time_within_train_step": 27.88956046104431, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733866146, "_runtime": 28680}, "step": 1000}
{"logs": {"train/loss": 3.8983, "train/learning_rate": 0.00011111111111111109, "train/epoch": 37.0, "_timestamp": 1733866146, "_runtime": 28680}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733866148, "_runtime": 28682}, "step": 1000}
{"logs": {"eval/loss": 4.7766218185424805, "eval/runtime": 1.9754, "eval/samples_per_second": 50.622, "eval/steps_per_second": 3.544, "train/epoch": 37.0, "_timestamp": 1733866148, "_runtime": 28682}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733866148, "_runtime": 28682}, "step": 1000}
{"logs": {"eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_loss": 4.7766218185424805, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_ppl": 118.70267278930945, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_runtime": 1.9754, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_samples_per_second": 50.622, "train/epoch": 37.0, "_timestamp": 1733866148, "_runtime": 28682}, "step": 1000}
{"train_info/time_between_train_steps": 4.720615863800049, "step": 1000}
{"info/global_step": 1001, "train_info/time_within_train_step": 28.265764713287354, "step": 1001}
{"train_info/time_between_train_steps": 0.00590825080871582, "step": 1001}
{"info/global_step": 1002, "train_info/time_within_train_step": 27.861116409301758, "step": 1002}
{"train_info/time_between_train_steps": 0.005235433578491211, "step": 1002}
{"info/global_step": 1003, "train_info/time_within_train_step": 28.55913543701172, "step": 1003}
{"train_info/time_between_train_steps": 0.011383056640625, "step": 1003}
{"info/global_step": 1004, "train_info/time_within_train_step": 28.524770498275757, "step": 1004}
{"train_info/time_between_train_steps": 0.005327463150024414, "step": 1004}
{"info/global_step": 1005, "train_info/time_within_train_step": 28.158924341201782, "step": 1005}
{"train_info/time_between_train_steps": 0.008378267288208008, "step": 1005}
{"info/global_step": 1006, "train_info/time_within_train_step": 28.33240270614624, "step": 1006}
{"train_info/time_between_train_steps": 0.0056040287017822266, "step": 1006}
{"info/global_step": 1007, "train_info/time_within_train_step": 28.125815629959106, "step": 1007}
{"train_info/time_between_train_steps": 0.010479211807250977, "step": 1007}
{"info/global_step": 1008, "train_info/time_within_train_step": 27.955246925354004, "step": 1008}
{"train_info/time_between_train_steps": 0.00510096549987793, "step": 1008}
{"info/global_step": 1009, "train_info/time_within_train_step": 27.942725896835327, "step": 1009}
{"train_info/time_between_train_steps": 0.0061795711517333984, "step": 1009}
{"info/global_step": 1010, "train_info/time_within_train_step": 27.821572303771973, "step": 1010}
{"train_info/time_between_train_steps": 0.005227565765380859, "step": 1010}
{"info/global_step": 1011, "train_info/time_within_train_step": 28.046298503875732, "step": 1011}
{"train_info/time_between_train_steps": 0.005272865295410156, "step": 1011}
{"info/global_step": 1012, "train_info/time_within_train_step": 28.035595893859863, "step": 1012}
{"train_info/time_between_train_steps": 0.00516819953918457, "step": 1012}
{"info/global_step": 1013, "train_info/time_within_train_step": 27.86954355239868, "step": 1013}
{"train_info/time_between_train_steps": 0.005432605743408203, "step": 1013}
{"info/global_step": 1014, "train_info/time_within_train_step": 27.93195343017578, "step": 1014}
{"train_info/time_between_train_steps": 0.005390644073486328, "step": 1014}
{"info/global_step": 1015, "train_info/time_within_train_step": 27.897040128707886, "step": 1015}
{"train_info/time_between_train_steps": 0.005240917205810547, "step": 1015}
{"info/global_step": 1016, "train_info/time_within_train_step": 27.84133791923523, "step": 1016}
{"train_info/time_between_train_steps": 0.005277395248413086, "step": 1016}
{"info/global_step": 1017, "train_info/time_within_train_step": 27.76405119895935, "step": 1017}
{"train_info/time_between_train_steps": 0.005158185958862305, "step": 1017}
{"info/global_step": 1018, "train_info/time_within_train_step": 27.74962282180786, "step": 1018}
{"train_info/time_between_train_steps": 0.010697364807128906, "step": 1018}
{"info/global_step": 1019, "train_info/time_within_train_step": 27.831948041915894, "step": 1019}
{"train_info/time_between_train_steps": 0.005045413970947266, "step": 1019}
{"info/global_step": 1020, "train_info/time_within_train_step": 27.75615668296814, "step": 1020}
{"train_info/time_between_train_steps": 0.005220651626586914, "step": 1020}
{"info/global_step": 1021, "train_info/time_within_train_step": 27.822712182998657, "step": 1021}
{"train_info/time_between_train_steps": 0.010125160217285156, "step": 1021}
{"info/global_step": 1022, "train_info/time_within_train_step": 27.766263008117676, "step": 1022}
{"train_info/time_between_train_steps": 0.005115032196044922, "step": 1022}
{"info/global_step": 1023, "train_info/time_within_train_step": 27.743645429611206, "step": 1023}
{"train_info/time_between_train_steps": 0.005446195602416992, "step": 1023}
{"info/global_step": 1024, "train_info/time_within_train_step": 27.96702218055725, "step": 1024}
{"train_info/time_between_train_steps": 0.005258083343505859, "step": 1024}
{"info/global_step": 1025, "train_info/time_within_train_step": 27.935526609420776, "step": 1025}
{"train_info/time_between_train_steps": 0.0058405399322509766, "step": 1025}
{"info/global_step": 1026, "train_info/time_within_train_step": 27.81609535217285, "step": 1026}
{"train_info/time_between_train_steps": 0.005841255187988281, "step": 1026}
{"train_info/time_between_train_steps": 20.68848729133606, "step": 1026}
{"info/global_step": 1027, "train_info/time_within_train_step": 27.754698991775513, "step": 1027}
{"train_info/time_between_train_steps": 0.005594968795776367, "step": 1027}
{"info/global_step": 1028, "train_info/time_within_train_step": 27.980385780334473, "step": 1028}
{"train_info/time_between_train_steps": 0.00527501106262207, "step": 1028}
{"info/global_step": 1029, "train_info/time_within_train_step": 27.724507808685303, "step": 1029}
{"train_info/time_between_train_steps": 0.005131959915161133, "step": 1029}
{"info/global_step": 1030, "train_info/time_within_train_step": 27.91776704788208, "step": 1030}
{"train_info/time_between_train_steps": 0.005296945571899414, "step": 1030}
{"info/global_step": 1031, "train_info/time_within_train_step": 27.758700609207153, "step": 1031}
{"train_info/time_between_train_steps": 0.0051805973052978516, "step": 1031}
{"info/global_step": 1032, "train_info/time_within_train_step": 27.944806814193726, "step": 1032}
{"train_info/time_between_train_steps": 0.015481948852539062, "step": 1032}
{"info/global_step": 1033, "train_info/time_within_train_step": 27.78759741783142, "step": 1033}
{"train_info/time_between_train_steps": 0.0052106380462646484, "step": 1033}
{"info/global_step": 1034, "train_info/time_within_train_step": 27.809213638305664, "step": 1034}
{"train_info/time_between_train_steps": 0.005330324172973633, "step": 1034}
{"info/global_step": 1035, "train_info/time_within_train_step": 27.78104043006897, "step": 1035}
{"train_info/time_between_train_steps": 0.005072116851806641, "step": 1035}
{"info/global_step": 1036, "train_info/time_within_train_step": 27.833741426467896, "step": 1036}
{"train_info/time_between_train_steps": 0.0049283504486083984, "step": 1036}
{"info/global_step": 1037, "train_info/time_within_train_step": 27.76793336868286, "step": 1037}
{"train_info/time_between_train_steps": 0.004954099655151367, "step": 1037}
{"info/global_step": 1038, "train_info/time_within_train_step": 27.731841802597046, "step": 1038}
{"train_info/time_between_train_steps": 0.005087375640869141, "step": 1038}
{"info/global_step": 1039, "train_info/time_within_train_step": 27.93584942817688, "step": 1039}
{"train_info/time_between_train_steps": 0.0049250125885009766, "step": 1039}
{"info/global_step": 1040, "train_info/time_within_train_step": 27.739464282989502, "step": 1040}
{"train_info/time_between_train_steps": 0.010116100311279297, "step": 1040}
{"info/global_step": 1041, "train_info/time_within_train_step": 27.834669589996338, "step": 1041}
{"train_info/time_between_train_steps": 0.012079477310180664, "step": 1041}
{"info/global_step": 1042, "train_info/time_within_train_step": 27.793960332870483, "step": 1042}
{"train_info/time_between_train_steps": 0.004988431930541992, "step": 1042}
{"info/global_step": 1043, "train_info/time_within_train_step": 27.766842365264893, "step": 1043}
{"train_info/time_between_train_steps": 0.009579181671142578, "step": 1043}
{"info/global_step": 1044, "train_info/time_within_train_step": 27.81093192100525, "step": 1044}
{"train_info/time_between_train_steps": 0.01006174087524414, "step": 1044}
{"info/global_step": 1045, "train_info/time_within_train_step": 27.731571435928345, "step": 1045}
{"train_info/time_between_train_steps": 0.004975795745849609, "step": 1045}
{"info/global_step": 1046, "train_info/time_within_train_step": 27.730366230010986, "step": 1046}
{"train_info/time_between_train_steps": 0.010028362274169922, "step": 1046}
{"info/global_step": 1047, "train_info/time_within_train_step": 27.75085735321045, "step": 1047}
{"train_info/time_between_train_steps": 0.009851455688476562, "step": 1047}
{"info/global_step": 1048, "train_info/time_within_train_step": 27.80298089981079, "step": 1048}
{"train_info/time_between_train_steps": 0.005092144012451172, "step": 1048}
{"info/global_step": 1049, "train_info/time_within_train_step": 27.746459245681763, "step": 1049}
{"train_info/time_between_train_steps": 0.005100250244140625, "step": 1049}
{"info/global_step": 1050, "train_info/time_within_train_step": 27.7289297580719, "step": 1050}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733867566, "_runtime": 30100}, "step": 1050}
{"logs": {"train/loss": 3.8001, "train/learning_rate": 8.333333333333333e-05, "train/epoch": 38.02, "_timestamp": 1733867566, "_runtime": 30100}, "step": 1050}
{"train_info/time_between_train_steps": 0.012228250503540039, "step": 1050}
{"info/global_step": 1051, "train_info/time_within_train_step": 27.726914644241333, "step": 1051}
{"train_info/time_between_train_steps": 0.010247230529785156, "step": 1051}
{"info/global_step": 1052, "train_info/time_within_train_step": 27.757915258407593, "step": 1052}
{"train_info/time_between_train_steps": 0.005877256393432617, "step": 1052}
{"info/global_step": 1053, "train_info/time_within_train_step": 27.74388098716736, "step": 1053}
{"train_info/time_between_train_steps": 0.010735034942626953, "step": 1053}
{"train_info/time_between_train_steps": 20.687130212783813, "step": 1053}
{"info/global_step": 1054, "train_info/time_within_train_step": 27.822505235671997, "step": 1054}
{"train_info/time_between_train_steps": 0.010724306106567383, "step": 1054}
{"info/global_step": 1055, "train_info/time_within_train_step": 27.867484092712402, "step": 1055}
{"train_info/time_between_train_steps": 0.005248546600341797, "step": 1055}
{"info/global_step": 1056, "train_info/time_within_train_step": 27.73382306098938, "step": 1056}
{"train_info/time_between_train_steps": 0.005096912384033203, "step": 1056}
{"info/global_step": 1057, "train_info/time_within_train_step": 27.906592845916748, "step": 1057}
{"train_info/time_between_train_steps": 0.00526881217956543, "step": 1057}
{"info/global_step": 1058, "train_info/time_within_train_step": 27.740787029266357, "step": 1058}
{"train_info/time_between_train_steps": 0.006348133087158203, "step": 1058}
{"info/global_step": 1059, "train_info/time_within_train_step": 27.86966872215271, "step": 1059}
{"train_info/time_between_train_steps": 0.005169391632080078, "step": 1059}
{"info/global_step": 1060, "train_info/time_within_train_step": 27.7552707195282, "step": 1060}
{"train_info/time_between_train_steps": 0.00554203987121582, "step": 1060}
{"info/global_step": 1061, "train_info/time_within_train_step": 27.870962142944336, "step": 1061}
{"train_info/time_between_train_steps": 0.005164384841918945, "step": 1061}
{"info/global_step": 1062, "train_info/time_within_train_step": 27.766284465789795, "step": 1062}
{"train_info/time_between_train_steps": 0.004927635192871094, "step": 1062}
{"info/global_step": 1063, "train_info/time_within_train_step": 27.727215051651, "step": 1063}
{"train_info/time_between_train_steps": 0.00499725341796875, "step": 1063}
{"info/global_step": 1064, "train_info/time_within_train_step": 27.797054290771484, "step": 1064}
{"train_info/time_between_train_steps": 0.010082006454467773, "step": 1064}
{"info/global_step": 1065, "train_info/time_within_train_step": 27.717302560806274, "step": 1065}
{"train_info/time_between_train_steps": 0.009834051132202148, "step": 1065}
{"info/global_step": 1066, "train_info/time_within_train_step": 27.722641468048096, "step": 1066}
{"train_info/time_between_train_steps": 0.010152578353881836, "step": 1066}
{"info/global_step": 1067, "train_info/time_within_train_step": 27.750913381576538, "step": 1067}
{"train_info/time_between_train_steps": 0.005160093307495117, "step": 1067}
{"info/global_step": 1068, "train_info/time_within_train_step": 27.721277475357056, "step": 1068}
{"train_info/time_between_train_steps": 0.0051538944244384766, "step": 1068}
{"info/global_step": 1069, "train_info/time_within_train_step": 27.724077463150024, "step": 1069}
{"train_info/time_between_train_steps": 0.005156040191650391, "step": 1069}
{"info/global_step": 1070, "train_info/time_within_train_step": 27.819231748580933, "step": 1070}
{"train_info/time_between_train_steps": 0.005237579345703125, "step": 1070}
{"info/global_step": 1071, "train_info/time_within_train_step": 27.743303775787354, "step": 1071}
{"train_info/time_between_train_steps": 0.005166530609130859, "step": 1071}
{"info/global_step": 1072, "train_info/time_within_train_step": 27.73980712890625, "step": 1072}
{"train_info/time_between_train_steps": 0.005158901214599609, "step": 1072}
{"info/global_step": 1073, "train_info/time_within_train_step": 27.72539210319519, "step": 1073}
{"train_info/time_between_train_steps": 0.005103588104248047, "step": 1073}
{"info/global_step": 1074, "train_info/time_within_train_step": 27.735180139541626, "step": 1074}
{"train_info/time_between_train_steps": 0.005139350891113281, "step": 1074}
{"info/global_step": 1075, "train_info/time_within_train_step": 27.743367910385132, "step": 1075}
{"train_info/time_between_train_steps": 0.005090236663818359, "step": 1075}
{"info/global_step": 1076, "train_info/time_within_train_step": 27.77042841911316, "step": 1076}
{"train_info/time_between_train_steps": 0.005174875259399414, "step": 1076}
{"info/global_step": 1077, "train_info/time_within_train_step": 27.79031538963318, "step": 1077}
{"train_info/time_between_train_steps": 0.005514621734619141, "step": 1077}
{"info/global_step": 1078, "train_info/time_within_train_step": 27.834808111190796, "step": 1078}
{"train_info/time_between_train_steps": 0.005318164825439453, "step": 1078}
{"info/global_step": 1079, "train_info/time_within_train_step": 27.76159906387329, "step": 1079}
{"train_info/time_between_train_steps": 0.010701417922973633, "step": 1079}
{"info/global_step": 1080, "train_info/time_within_train_step": 27.778059720993042, "step": 1080}
{"train_info/time_between_train_steps": 0.0057637691497802734, "step": 1080}
{"train_info/time_between_train_steps": 20.440624952316284, "step": 1080}
{"info/global_step": 1081, "train_info/time_within_train_step": 27.701832056045532, "step": 1081}
{"train_info/time_between_train_steps": 0.0050144195556640625, "step": 1081}
{"info/global_step": 1082, "train_info/time_within_train_step": 27.81026840209961, "step": 1082}
{"train_info/time_between_train_steps": 0.005269527435302734, "step": 1082}
{"info/global_step": 1083, "train_info/time_within_train_step": 27.75364351272583, "step": 1083}
{"train_info/time_between_train_steps": 0.0053272247314453125, "step": 1083}
{"info/global_step": 1084, "train_info/time_within_train_step": 27.889233589172363, "step": 1084}
{"train_info/time_between_train_steps": 0.005154609680175781, "step": 1084}
{"info/global_step": 1085, "train_info/time_within_train_step": 28.030937433242798, "step": 1085}
{"train_info/time_between_train_steps": 0.005173921585083008, "step": 1085}
{"info/global_step": 1086, "train_info/time_within_train_step": 27.86110806465149, "step": 1086}
{"train_info/time_between_train_steps": 0.0051479339599609375, "step": 1086}
{"info/global_step": 1087, "train_info/time_within_train_step": 27.763917684555054, "step": 1087}
{"train_info/time_between_train_steps": 0.005563259124755859, "step": 1087}
{"info/global_step": 1088, "train_info/time_within_train_step": 27.7989239692688, "step": 1088}
{"train_info/time_between_train_steps": 0.010379791259765625, "step": 1088}
{"info/global_step": 1089, "train_info/time_within_train_step": 27.793206691741943, "step": 1089}
{"train_info/time_between_train_steps": 0.009943008422851562, "step": 1089}
{"info/global_step": 1090, "train_info/time_within_train_step": 27.73973298072815, "step": 1090}
{"train_info/time_between_train_steps": 0.005094051361083984, "step": 1090}
{"info/global_step": 1091, "train_info/time_within_train_step": 27.727315664291382, "step": 1091}
{"train_info/time_between_train_steps": 0.01009511947631836, "step": 1091}
{"info/global_step": 1092, "train_info/time_within_train_step": 27.71931219100952, "step": 1092}
{"train_info/time_between_train_steps": 0.004949808120727539, "step": 1092}
{"info/global_step": 1093, "train_info/time_within_train_step": 27.717634439468384, "step": 1093}
{"train_info/time_between_train_steps": 0.01001429557800293, "step": 1093}
{"info/global_step": 1094, "train_info/time_within_train_step": 27.725228786468506, "step": 1094}
{"train_info/time_between_train_steps": 0.0053424835205078125, "step": 1094}
{"info/global_step": 1095, "train_info/time_within_train_step": 27.724708080291748, "step": 1095}
{"train_info/time_between_train_steps": 0.005044221878051758, "step": 1095}
{"info/global_step": 1096, "train_info/time_within_train_step": 27.745607137680054, "step": 1096}
{"train_info/time_between_train_steps": 0.0050466060638427734, "step": 1096}
{"info/global_step": 1097, "train_info/time_within_train_step": 27.747455835342407, "step": 1097}
{"train_info/time_between_train_steps": 0.010095357894897461, "step": 1097}
{"info/global_step": 1098, "train_info/time_within_train_step": 27.719680547714233, "step": 1098}
{"train_info/time_between_train_steps": 0.010018110275268555, "step": 1098}
{"info/global_step": 1099, "train_info/time_within_train_step": 27.732697248458862, "step": 1099}
{"train_info/time_between_train_steps": 0.00516200065612793, "step": 1099}
{"info/global_step": 1100, "train_info/time_within_train_step": 27.85067629814148, "step": 1100}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733868997, "_runtime": 31531}, "step": 1100}
{"logs": {"train/loss": 3.8078, "train/learning_rate": 5.5555555555555545e-05, "train/epoch": 40.02, "_timestamp": 1733868997, "_runtime": 31531}, "step": 1100}
{"train_info/time_between_train_steps": 2.3058581352233887, "step": 1100}
{"info/global_step": 1101, "train_info/time_within_train_step": 27.715275287628174, "step": 1101}
{"train_info/time_between_train_steps": 0.005007266998291016, "step": 1101}
{"info/global_step": 1102, "train_info/time_within_train_step": 27.771273374557495, "step": 1102}
{"train_info/time_between_train_steps": 0.0051670074462890625, "step": 1102}
{"info/global_step": 1103, "train_info/time_within_train_step": 27.742286443710327, "step": 1103}
{"train_info/time_between_train_steps": 0.005227327346801758, "step": 1103}
{"info/global_step": 1104, "train_info/time_within_train_step": 27.745771169662476, "step": 1104}
{"train_info/time_between_train_steps": 0.0052149295806884766, "step": 1104}
{"info/global_step": 1105, "train_info/time_within_train_step": 27.749118328094482, "step": 1105}
{"train_info/time_between_train_steps": 0.0053174495697021484, "step": 1105}
{"info/global_step": 1106, "train_info/time_within_train_step": 27.74170684814453, "step": 1106}
{"train_info/time_between_train_steps": 0.005637168884277344, "step": 1106}
{"info/global_step": 1107, "train_info/time_within_train_step": 27.750822067260742, "step": 1107}
{"train_info/time_between_train_steps": 0.006018400192260742, "step": 1107}
{"train_info/time_between_train_steps": 20.61910343170166, "step": 1107}
{"info/global_step": 1108, "train_info/time_within_train_step": 27.738756895065308, "step": 1108}
{"train_info/time_between_train_steps": 0.0048863887786865234, "step": 1108}
{"info/global_step": 1109, "train_info/time_within_train_step": 27.862391710281372, "step": 1109}
{"train_info/time_between_train_steps": 0.0049245357513427734, "step": 1109}
{"info/global_step": 1110, "train_info/time_within_train_step": 27.719833374023438, "step": 1110}
{"train_info/time_between_train_steps": 0.004994869232177734, "step": 1110}
{"info/global_step": 1111, "train_info/time_within_train_step": 27.899317741394043, "step": 1111}
{"train_info/time_between_train_steps": 0.005224704742431641, "step": 1111}
{"info/global_step": 1112, "train_info/time_within_train_step": 27.760632276535034, "step": 1112}
{"train_info/time_between_train_steps": 0.009696483612060547, "step": 1112}
{"info/global_step": 1113, "train_info/time_within_train_step": 27.880170345306396, "step": 1113}
{"train_info/time_between_train_steps": 0.005091190338134766, "step": 1113}
{"info/global_step": 1114, "train_info/time_within_train_step": 27.74229407310486, "step": 1114}
{"train_info/time_between_train_steps": 0.00536799430847168, "step": 1114}
{"info/global_step": 1115, "train_info/time_within_train_step": 27.89645767211914, "step": 1115}
{"train_info/time_between_train_steps": 0.005255937576293945, "step": 1115}
{"info/global_step": 1116, "train_info/time_within_train_step": 27.780900955200195, "step": 1116}
{"train_info/time_between_train_steps": 0.0053653717041015625, "step": 1116}
{"info/global_step": 1117, "train_info/time_within_train_step": 27.720247268676758, "step": 1117}
{"train_info/time_between_train_steps": 0.00494074821472168, "step": 1117}
{"info/global_step": 1118, "train_info/time_within_train_step": 27.724558115005493, "step": 1118}
{"train_info/time_between_train_steps": 0.0050504207611083984, "step": 1118}
{"info/global_step": 1119, "train_info/time_within_train_step": 27.735576629638672, "step": 1119}
{"train_info/time_between_train_steps": 0.00507664680480957, "step": 1119}
{"info/global_step": 1120, "train_info/time_within_train_step": 27.79386019706726, "step": 1120}
{"train_info/time_between_train_steps": 0.0066301822662353516, "step": 1120}
{"info/global_step": 1121, "train_info/time_within_train_step": 27.73970103263855, "step": 1121}
{"train_info/time_between_train_steps": 0.0050966739654541016, "step": 1121}
{"info/global_step": 1122, "train_info/time_within_train_step": 27.737592220306396, "step": 1122}
{"train_info/time_between_train_steps": 0.005150794982910156, "step": 1122}
{"info/global_step": 1123, "train_info/time_within_train_step": 27.729382514953613, "step": 1123}
{"train_info/time_between_train_steps": 0.005091428756713867, "step": 1123}
{"info/global_step": 1124, "train_info/time_within_train_step": 27.761698722839355, "step": 1124}
{"train_info/time_between_train_steps": 0.005085945129394531, "step": 1124}
{"info/global_step": 1125, "train_info/time_within_train_step": 27.75344467163086, "step": 1125}
{"train_info/time_between_train_steps": 0.005068778991699219, "step": 1125}
{"info/global_step": 1126, "train_info/time_within_train_step": 27.746357679367065, "step": 1126}
{"train_info/time_between_train_steps": 0.005084037780761719, "step": 1126}
{"info/global_step": 1127, "train_info/time_within_train_step": 27.776720762252808, "step": 1127}
{"train_info/time_between_train_steps": 0.0051882266998291016, "step": 1127}
{"info/global_step": 1128, "train_info/time_within_train_step": 27.777824640274048, "step": 1128}
{"train_info/time_between_train_steps": 0.0051996707916259766, "step": 1128}
{"info/global_step": 1129, "train_info/time_within_train_step": 27.76321792602539, "step": 1129}
{"train_info/time_between_train_steps": 0.005087137222290039, "step": 1129}
{"info/global_step": 1130, "train_info/time_within_train_step": 27.769997596740723, "step": 1130}
{"train_info/time_between_train_steps": 0.005041599273681641, "step": 1130}
{"info/global_step": 1131, "train_info/time_within_train_step": 27.875169277191162, "step": 1131}
{"train_info/time_between_train_steps": 0.005273342132568359, "step": 1131}
{"info/global_step": 1132, "train_info/time_within_train_step": 27.762566566467285, "step": 1132}
{"train_info/time_between_train_steps": 0.005089282989501953, "step": 1132}
{"info/global_step": 1133, "train_info/time_within_train_step": 27.743337631225586, "step": 1133}
{"train_info/time_between_train_steps": 0.005768537521362305, "step": 1133}
{"info/global_step": 1134, "train_info/time_within_train_step": 27.920222759246826, "step": 1134}
{"train_info/time_between_train_steps": 0.010230064392089844, "step": 1134}
{"train_info/time_between_train_steps": 20.728115797042847, "step": 1134}
{"info/global_step": 1135, "train_info/time_within_train_step": 27.80004644393921, "step": 1135}
{"train_info/time_between_train_steps": 0.005250692367553711, "step": 1135}
{"info/global_step": 1136, "train_info/time_within_train_step": 27.965604305267334, "step": 1136}
{"train_info/time_between_train_steps": 0.005186319351196289, "step": 1136}
{"info/global_step": 1137, "train_info/time_within_train_step": 27.728875160217285, "step": 1137}
{"train_info/time_between_train_steps": 0.012301445007324219, "step": 1137}
{"info/global_step": 1138, "train_info/time_within_train_step": 27.96345806121826, "step": 1138}
{"train_info/time_between_train_steps": 0.005154609680175781, "step": 1138}
{"info/global_step": 1139, "train_info/time_within_train_step": 27.76114559173584, "step": 1139}
{"train_info/time_between_train_steps": 0.010444879531860352, "step": 1139}
{"info/global_step": 1140, "train_info/time_within_train_step": 27.896573543548584, "step": 1140}
{"train_info/time_between_train_steps": 0.0052487850189208984, "step": 1140}
{"info/global_step": 1141, "train_info/time_within_train_step": 27.783985137939453, "step": 1141}
{"train_info/time_between_train_steps": 0.015265703201293945, "step": 1141}
{"info/global_step": 1142, "train_info/time_within_train_step": 27.851522207260132, "step": 1142}
{"train_info/time_between_train_steps": 0.005298137664794922, "step": 1142}
{"info/global_step": 1143, "train_info/time_within_train_step": 27.75624132156372, "step": 1143}
{"train_info/time_between_train_steps": 0.004983663558959961, "step": 1143}
{"info/global_step": 1144, "train_info/time_within_train_step": 27.759366989135742, "step": 1144}
{"train_info/time_between_train_steps": 0.006188154220581055, "step": 1144}
{"info/global_step": 1145, "train_info/time_within_train_step": 27.764378786087036, "step": 1145}
{"train_info/time_between_train_steps": 0.005104541778564453, "step": 1145}
{"info/global_step": 1146, "train_info/time_within_train_step": 27.849615573883057, "step": 1146}
{"train_info/time_between_train_steps": 0.009947538375854492, "step": 1146}
{"info/global_step": 1147, "train_info/time_within_train_step": 27.75794291496277, "step": 1147}
{"train_info/time_between_train_steps": 0.004974842071533203, "step": 1147}
{"info/global_step": 1148, "train_info/time_within_train_step": 27.756688594818115, "step": 1148}
{"train_info/time_between_train_steps": 0.005208015441894531, "step": 1148}
{"info/global_step": 1149, "train_info/time_within_train_step": 27.718482732772827, "step": 1149}
{"train_info/time_between_train_steps": 0.005035877227783203, "step": 1149}
{"info/global_step": 1150, "train_info/time_within_train_step": 27.78149390220642, "step": 1150}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733870430, "_runtime": 32964}, "step": 1150}
{"logs": {"train/loss": 3.7753, "train/learning_rate": 2.7777777777777772e-05, "train/epoch": 42.01, "_timestamp": 1733870430, "_runtime": 32964}, "step": 1150}
{"train_info/time_between_train_steps": 0.015943288803100586, "step": 1150}
{"info/global_step": 1151, "train_info/time_within_train_step": 27.874078512191772, "step": 1151}
{"train_info/time_between_train_steps": 0.0051708221435546875, "step": 1151}
{"info/global_step": 1152, "train_info/time_within_train_step": 27.767088174819946, "step": 1152}
{"train_info/time_between_train_steps": 0.011645793914794922, "step": 1152}
{"info/global_step": 1153, "train_info/time_within_train_step": 27.91932463645935, "step": 1153}
{"train_info/time_between_train_steps": 0.0050907135009765625, "step": 1153}
{"info/global_step": 1154, "train_info/time_within_train_step": 27.740225553512573, "step": 1154}
{"train_info/time_between_train_steps": 0.005050182342529297, "step": 1154}
{"info/global_step": 1155, "train_info/time_within_train_step": 27.76547861099243, "step": 1155}
{"train_info/time_between_train_steps": 0.010131359100341797, "step": 1155}
{"info/global_step": 1156, "train_info/time_within_train_step": 27.7650728225708, "step": 1156}
{"train_info/time_between_train_steps": 0.005167245864868164, "step": 1156}
{"info/global_step": 1157, "train_info/time_within_train_step": 27.875389099121094, "step": 1157}
{"train_info/time_between_train_steps": 0.005051612854003906, "step": 1157}
{"info/global_step": 1158, "train_info/time_within_train_step": 27.834078550338745, "step": 1158}
{"train_info/time_between_train_steps": 0.012631654739379883, "step": 1158}
{"info/global_step": 1159, "train_info/time_within_train_step": 27.930981636047363, "step": 1159}
{"train_info/time_between_train_steps": 0.01503753662109375, "step": 1159}
{"info/global_step": 1160, "train_info/time_within_train_step": 27.76871967315674, "step": 1160}
{"train_info/time_between_train_steps": 0.005547285079956055, "step": 1160}
{"info/global_step": 1161, "train_info/time_within_train_step": 27.747706413269043, "step": 1161}
{"train_info/time_between_train_steps": 0.0057528018951416016, "step": 1161}
{"train_info/time_between_train_steps": 20.636688709259033, "step": 1161}
{"info/global_step": 1162, "train_info/time_within_train_step": 27.73164653778076, "step": 1162}
{"train_info/time_between_train_steps": 0.004883289337158203, "step": 1162}
{"info/global_step": 1163, "train_info/time_within_train_step": 27.94796657562256, "step": 1163}
{"train_info/time_between_train_steps": 0.005129098892211914, "step": 1163}
{"info/global_step": 1164, "train_info/time_within_train_step": 27.732406854629517, "step": 1164}
{"train_info/time_between_train_steps": 0.0052318572998046875, "step": 1164}
{"info/global_step": 1165, "train_info/time_within_train_step": 27.856664180755615, "step": 1165}
{"train_info/time_between_train_steps": 0.00531315803527832, "step": 1165}
{"info/global_step": 1166, "train_info/time_within_train_step": 27.74107336997986, "step": 1166}
{"train_info/time_between_train_steps": 0.005135774612426758, "step": 1166}
{"info/global_step": 1167, "train_info/time_within_train_step": 27.936355352401733, "step": 1167}
{"train_info/time_between_train_steps": 0.005574703216552734, "step": 1167}
{"info/global_step": 1168, "train_info/time_within_train_step": 27.726258277893066, "step": 1168}
{"train_info/time_between_train_steps": 0.0053403377532958984, "step": 1168}
{"info/global_step": 1169, "train_info/time_within_train_step": 27.76104187965393, "step": 1169}
{"train_info/time_between_train_steps": 0.0051670074462890625, "step": 1169}
{"info/global_step": 1170, "train_info/time_within_train_step": 27.72580313682556, "step": 1170}
{"train_info/time_between_train_steps": 0.01001739501953125, "step": 1170}
{"info/global_step": 1171, "train_info/time_within_train_step": 27.834872722625732, "step": 1171}
{"train_info/time_between_train_steps": 0.007077932357788086, "step": 1171}
{"info/global_step": 1172, "train_info/time_within_train_step": 27.97549796104431, "step": 1172}
{"train_info/time_between_train_steps": 0.005215883255004883, "step": 1172}
{"info/global_step": 1173, "train_info/time_within_train_step": 27.854413747787476, "step": 1173}
{"train_info/time_between_train_steps": 0.005359649658203125, "step": 1173}
{"info/global_step": 1174, "train_info/time_within_train_step": 27.93261170387268, "step": 1174}
{"train_info/time_between_train_steps": 0.005586385726928711, "step": 1174}
{"info/global_step": 1175, "train_info/time_within_train_step": 27.804119348526, "step": 1175}
{"train_info/time_between_train_steps": 0.012202262878417969, "step": 1175}
{"info/global_step": 1176, "train_info/time_within_train_step": 27.921279191970825, "step": 1176}
{"train_info/time_between_train_steps": 0.00593256950378418, "step": 1176}
{"info/global_step": 1177, "train_info/time_within_train_step": 28.147870540618896, "step": 1177}
{"train_info/time_between_train_steps": 0.011621475219726562, "step": 1177}
{"info/global_step": 1178, "train_info/time_within_train_step": 27.96319556236267, "step": 1178}
{"train_info/time_between_train_steps": 0.0054056644439697266, "step": 1178}
{"info/global_step": 1179, "train_info/time_within_train_step": 29.06465721130371, "step": 1179}
{"train_info/time_between_train_steps": 0.012110233306884766, "step": 1179}
{"info/global_step": 1180, "train_info/time_within_train_step": 27.944053888320923, "step": 1180}
{"train_info/time_between_train_steps": 0.006745100021362305, "step": 1180}
{"info/global_step": 1181, "train_info/time_within_train_step": 28.606297492980957, "step": 1181}
{"train_info/time_between_train_steps": 0.00995182991027832, "step": 1181}
{"info/global_step": 1182, "train_info/time_within_train_step": 28.03815746307373, "step": 1182}
{"train_info/time_between_train_steps": 0.0061342716217041016, "step": 1182}
{"info/global_step": 1183, "train_info/time_within_train_step": 28.416154861450195, "step": 1183}
{"train_info/time_between_train_steps": 0.006195545196533203, "step": 1183}
{"info/global_step": 1184, "train_info/time_within_train_step": 27.987674474716187, "step": 1184}
{"train_info/time_between_train_steps": 0.0058269500732421875, "step": 1184}
{"info/global_step": 1185, "train_info/time_within_train_step": 27.80829906463623, "step": 1185}
{"train_info/time_between_train_steps": 0.006519317626953125, "step": 1185}
{"info/global_step": 1186, "train_info/time_within_train_step": 27.964194297790527, "step": 1186}
{"train_info/time_between_train_steps": 0.013529539108276367, "step": 1186}
{"info/global_step": 1187, "train_info/time_within_train_step": 27.87629461288452, "step": 1187}
{"train_info/time_between_train_steps": 0.011346578598022461, "step": 1187}
{"info/global_step": 1188, "train_info/time_within_train_step": 27.999777793884277, "step": 1188}
{"train_info/time_between_train_steps": 0.012089729309082031, "step": 1188}
{"train_info/time_between_train_steps": 21.02147102355957, "step": 1188}
{"info/global_step": 1189, "train_info/time_within_train_step": 27.83963704109192, "step": 1189}
{"train_info/time_between_train_steps": 0.005727529525756836, "step": 1189}
{"info/global_step": 1190, "train_info/time_within_train_step": 27.96070432662964, "step": 1190}
{"train_info/time_between_train_steps": 0.005553722381591797, "step": 1190}
{"info/global_step": 1191, "train_info/time_within_train_step": 27.868375778198242, "step": 1191}
{"train_info/time_between_train_steps": 0.009809732437133789, "step": 1191}
{"info/global_step": 1192, "train_info/time_within_train_step": 28.18784213066101, "step": 1192}
{"train_info/time_between_train_steps": 0.005536079406738281, "step": 1192}
{"info/global_step": 1193, "train_info/time_within_train_step": 27.863304376602173, "step": 1193}
{"train_info/time_between_train_steps": 0.005702018737792969, "step": 1193}
{"info/global_step": 1194, "train_info/time_within_train_step": 27.881144762039185, "step": 1194}
{"train_info/time_between_train_steps": 0.0051763057708740234, "step": 1194}
{"info/global_step": 1195, "train_info/time_within_train_step": 27.770480394363403, "step": 1195}
{"train_info/time_between_train_steps": 0.005539655685424805, "step": 1195}
{"info/global_step": 1196, "train_info/time_within_train_step": 27.86095905303955, "step": 1196}
{"train_info/time_between_train_steps": 0.005375385284423828, "step": 1196}
{"info/global_step": 1197, "train_info/time_within_train_step": 27.857652187347412, "step": 1197}
{"train_info/time_between_train_steps": 0.005436897277832031, "step": 1197}
{"info/global_step": 1198, "train_info/time_within_train_step": 27.789196729660034, "step": 1198}
{"train_info/time_between_train_steps": 0.009607791900634766, "step": 1198}
{"info/global_step": 1199, "train_info/time_within_train_step": 27.777125358581543, "step": 1199}
{"train_info/time_between_train_steps": 0.005398750305175781, "step": 1199}
{"info/global_step": 1200, "train_info/time_within_train_step": 27.802236795425415, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733871868, "_runtime": 34402}, "step": 1200}
{"logs": {"train/loss": 3.7526, "train/learning_rate": 0.0, "train/epoch": 44.01, "_timestamp": 1733871868, "_runtime": 34402}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733871871, "_runtime": 34405}, "step": 1200}
{"logs": {"train/train_runtime": 34405.9147, "train/train_samples_per_second": 17.857, "train/train_steps_per_second": 0.035, "train/total_flos": 3.2843363254272e+17, "train/train_loss": 4.8779505236943566, "train/epoch": 44.01, "_timestamp": 1733871871, "_runtime": 34405}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733871874, "_runtime": 34408}, "step": 1200}
{"logs": {"eval/loss": 4.762734413146973, "eval/runtime": 1.9661, "eval/samples_per_second": 50.862, "eval/steps_per_second": 3.56, "train/epoch": 44.01, "_timestamp": 1733871874, "_runtime": 34408}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733871874, "_runtime": 34408}, "step": 1200}
{"logs": {"eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_loss": 4.762734413146973, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_ppl": 117.06559434724694, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_runtime": 1.9661, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_samples_per_second": 50.862, "train/epoch": 44.01, "_timestamp": 1733871874, "_runtime": 34408}, "step": 1200}