NNDA_EN / metrics.json
xiulinyang's picture
Adding model checkpoints and config files
a70e734
{"num_parameters": 124439808, "trainable_parameters": 124439808, "step": 0}
{"train_info/time_between_train_steps": 3.4724998474121094, "step": 0}
{"info/global_step": 1, "train_info/time_within_train_step": 28.356553077697754, "step": 1}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 19761.71484375, "train_info/memory_reserved": 22624.0, "train_info/memory_max_reserved": 22624.0, "_timestamp": 1740821931, "_runtime": 36}, "step": 1}
{"logs": {"train/loss": 11.021, "train/learning_rate": 4.9999999999999996e-06, "train/epoch": 0.0, "_timestamp": 1740821931, "_runtime": 36}, "step": 1}
{"train_info/time_between_train_steps": 0.012038469314575195, "step": 1}
{"info/global_step": 2, "train_info/time_within_train_step": 28.006027936935425, "step": 2}
{"train_info/time_between_train_steps": 0.0057528018951416016, "step": 2}
{"info/global_step": 3, "train_info/time_within_train_step": 27.819584369659424, "step": 3}
{"train_info/time_between_train_steps": 0.0054590702056884766, "step": 3}
{"info/global_step": 4, "train_info/time_within_train_step": 27.99886393547058, "step": 4}
{"train_info/time_between_train_steps": 0.005727052688598633, "step": 4}
{"info/global_step": 5, "train_info/time_within_train_step": 28.30250859260559, "step": 5}
{"train_info/time_between_train_steps": 0.005971431732177734, "step": 5}
{"info/global_step": 6, "train_info/time_within_train_step": 27.94543480873108, "step": 6}
{"train_info/time_between_train_steps": 0.00553131103515625, "step": 6}
{"info/global_step": 7, "train_info/time_within_train_step": 27.809932231903076, "step": 7}
{"train_info/time_between_train_steps": 0.005543947219848633, "step": 7}
{"info/global_step": 8, "train_info/time_within_train_step": 27.83526921272278, "step": 8}
{"train_info/time_between_train_steps": 0.009299278259277344, "step": 8}
{"info/global_step": 9, "train_info/time_within_train_step": 27.847907543182373, "step": 9}
{"train_info/time_between_train_steps": 0.00568842887878418, "step": 9}
{"info/global_step": 10, "train_info/time_within_train_step": 27.800608158111572, "step": 10}
{"train_info/time_between_train_steps": 0.00514674186706543, "step": 10}
{"info/global_step": 11, "train_info/time_within_train_step": 27.826843738555908, "step": 11}
{"train_info/time_between_train_steps": 0.005217552185058594, "step": 11}
{"info/global_step": 12, "train_info/time_within_train_step": 27.790063619613647, "step": 12}
{"train_info/time_between_train_steps": 0.005198478698730469, "step": 12}
{"info/global_step": 13, "train_info/time_within_train_step": 27.76912498474121, "step": 13}
{"train_info/time_between_train_steps": 0.00516963005065918, "step": 13}
{"info/global_step": 14, "train_info/time_within_train_step": 27.83258318901062, "step": 14}
{"train_info/time_between_train_steps": 0.009354829788208008, "step": 14}
{"info/global_step": 15, "train_info/time_within_train_step": 27.861929893493652, "step": 15}
{"train_info/time_between_train_steps": 0.005177974700927734, "step": 15}
{"info/global_step": 16, "train_info/time_within_train_step": 27.914808750152588, "step": 16}
{"train_info/time_between_train_steps": 0.010395288467407227, "step": 16}
{"info/global_step": 17, "train_info/time_within_train_step": 27.798729181289673, "step": 17}
{"train_info/time_between_train_steps": 0.0067234039306640625, "step": 17}
{"info/global_step": 18, "train_info/time_within_train_step": 27.80428719520569, "step": 18}
{"train_info/time_between_train_steps": 0.0053005218505859375, "step": 18}
{"info/global_step": 19, "train_info/time_within_train_step": 27.843390464782715, "step": 19}
{"train_info/time_between_train_steps": 0.009669303894042969, "step": 19}
{"info/global_step": 20, "train_info/time_within_train_step": 27.80223846435547, "step": 20}
{"train_info/time_between_train_steps": 0.005280494689941406, "step": 20}
{"info/global_step": 21, "train_info/time_within_train_step": 27.862175941467285, "step": 21}
{"train_info/time_between_train_steps": 0.010325193405151367, "step": 21}
{"info/global_step": 22, "train_info/time_within_train_step": 27.799952507019043, "step": 22}
{"train_info/time_between_train_steps": 0.005244731903076172, "step": 22}
{"info/global_step": 23, "train_info/time_within_train_step": 27.772393465042114, "step": 23}
{"train_info/time_between_train_steps": 0.007596254348754883, "step": 23}
{"info/global_step": 24, "train_info/time_within_train_step": 27.846765518188477, "step": 24}
{"train_info/time_between_train_steps": 0.009978771209716797, "step": 24}
{"info/global_step": 25, "train_info/time_within_train_step": 27.83141326904297, "step": 25}
{"train_info/time_between_train_steps": 0.005211591720581055, "step": 25}
{"info/global_step": 26, "train_info/time_within_train_step": 27.791510105133057, "step": 26}
{"train_info/time_between_train_steps": 0.005450248718261719, "step": 26}
{"info/global_step": 27, "train_info/time_within_train_step": 27.86794352531433, "step": 27}
{"train_info/time_between_train_steps": 0.005995512008666992, "step": 27}
{"info/global_step": 28, "train_info/time_within_train_step": 27.893683195114136, "step": 28}
{"train_info/time_between_train_steps": 0.005707263946533203, "step": 28}
{"train_info/time_between_train_steps": 3.6946041584014893, "step": 28}
{"info/global_step": 29, "train_info/time_within_train_step": 27.84069848060608, "step": 29}
{"train_info/time_between_train_steps": 0.005944728851318359, "step": 29}
{"info/global_step": 30, "train_info/time_within_train_step": 27.982110261917114, "step": 30}
{"train_info/time_between_train_steps": 0.005479097366333008, "step": 30}
{"info/global_step": 31, "train_info/time_within_train_step": 27.837183713912964, "step": 31}
{"train_info/time_between_train_steps": 0.005900382995605469, "step": 31}
{"info/global_step": 32, "train_info/time_within_train_step": 28.155944108963013, "step": 32}
{"train_info/time_between_train_steps": 0.006777524948120117, "step": 32}
{"info/global_step": 33, "train_info/time_within_train_step": 27.838008165359497, "step": 33}
{"train_info/time_between_train_steps": 0.005716800689697266, "step": 33}
{"info/global_step": 34, "train_info/time_within_train_step": 27.947983264923096, "step": 34}
{"train_info/time_between_train_steps": 0.005556344985961914, "step": 34}
{"info/global_step": 35, "train_info/time_within_train_step": 27.82180404663086, "step": 35}
{"train_info/time_between_train_steps": 0.005548000335693359, "step": 35}
{"info/global_step": 36, "train_info/time_within_train_step": 27.92001509666443, "step": 36}
{"train_info/time_between_train_steps": 0.009606361389160156, "step": 36}
{"info/global_step": 37, "train_info/time_within_train_step": 27.805169343948364, "step": 37}
{"train_info/time_between_train_steps": 0.0069217681884765625, "step": 37}
{"info/global_step": 38, "train_info/time_within_train_step": 27.78155541419983, "step": 38}
{"train_info/time_between_train_steps": 0.005247592926025391, "step": 38}
{"info/global_step": 39, "train_info/time_within_train_step": 27.783386945724487, "step": 39}
{"train_info/time_between_train_steps": 0.005268096923828125, "step": 39}
{"info/global_step": 40, "train_info/time_within_train_step": 27.766067504882812, "step": 40}
{"train_info/time_between_train_steps": 0.005438566207885742, "step": 40}
{"info/global_step": 41, "train_info/time_within_train_step": 27.797367334365845, "step": 41}
{"train_info/time_between_train_steps": 0.005288124084472656, "step": 41}
{"info/global_step": 42, "train_info/time_within_train_step": 27.78087329864502, "step": 42}
{"train_info/time_between_train_steps": 0.007078647613525391, "step": 42}
{"info/global_step": 43, "train_info/time_within_train_step": 27.824498891830444, "step": 43}
{"train_info/time_between_train_steps": 0.010068655014038086, "step": 43}
{"info/global_step": 44, "train_info/time_within_train_step": 27.802767276763916, "step": 44}
{"train_info/time_between_train_steps": 0.005560159683227539, "step": 44}
{"info/global_step": 45, "train_info/time_within_train_step": 27.809051752090454, "step": 45}
{"train_info/time_between_train_steps": 0.009051322937011719, "step": 45}
{"info/global_step": 46, "train_info/time_within_train_step": 27.772316217422485, "step": 46}
{"train_info/time_between_train_steps": 0.005424022674560547, "step": 46}
{"info/global_step": 47, "train_info/time_within_train_step": 27.937561750411987, "step": 47}
{"train_info/time_between_train_steps": 0.006182670593261719, "step": 47}
{"info/global_step": 48, "train_info/time_within_train_step": 27.839527130126953, "step": 48}
{"train_info/time_between_train_steps": 0.005408048629760742, "step": 48}
{"info/global_step": 49, "train_info/time_within_train_step": 27.787217140197754, "step": 49}
{"train_info/time_between_train_steps": 0.008166074752807617, "step": 49}
{"info/global_step": 50, "train_info/time_within_train_step": 27.799281120300293, "step": 50}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740823301, "_runtime": 1406}, "step": 50}
{"logs": {"train/loss": 7.8725, "train/learning_rate": 0.00025, "train/epoch": 1.02, "_timestamp": 1740823301, "_runtime": 1406}, "step": 50}
{"train_info/time_between_train_steps": 0.009000539779663086, "step": 50}
{"info/global_step": 51, "train_info/time_within_train_step": 27.79505944252014, "step": 51}
{"train_info/time_between_train_steps": 0.005532264709472656, "step": 51}
{"info/global_step": 52, "train_info/time_within_train_step": 27.80429196357727, "step": 52}
{"train_info/time_between_train_steps": 0.005517244338989258, "step": 52}
{"info/global_step": 53, "train_info/time_within_train_step": 27.818836212158203, "step": 53}
{"train_info/time_between_train_steps": 0.005526304244995117, "step": 53}
{"info/global_step": 54, "train_info/time_within_train_step": 27.824252367019653, "step": 54}
{"train_info/time_between_train_steps": 0.010345935821533203, "step": 54}
{"info/global_step": 55, "train_info/time_within_train_step": 27.82606816291809, "step": 55}
{"train_info/time_between_train_steps": 0.006042957305908203, "step": 55}
{"info/global_step": 56, "train_info/time_within_train_step": 27.801787853240967, "step": 56}
{"train_info/time_between_train_steps": 0.005684375762939453, "step": 56}
{"train_info/time_between_train_steps": 3.623784065246582, "step": 56}
{"info/global_step": 57, "train_info/time_within_train_step": 27.787062406539917, "step": 57}
{"train_info/time_between_train_steps": 0.0053212642669677734, "step": 57}
{"info/global_step": 58, "train_info/time_within_train_step": 27.902050018310547, "step": 58}
{"train_info/time_between_train_steps": 0.0074977874755859375, "step": 58}
{"info/global_step": 59, "train_info/time_within_train_step": 27.81241226196289, "step": 59}
{"train_info/time_between_train_steps": 0.005563259124755859, "step": 59}
{"info/global_step": 60, "train_info/time_within_train_step": 27.985328674316406, "step": 60}
{"train_info/time_between_train_steps": 0.005492210388183594, "step": 60}
{"info/global_step": 61, "train_info/time_within_train_step": 27.827990531921387, "step": 61}
{"train_info/time_between_train_steps": 0.005626678466796875, "step": 61}
{"info/global_step": 62, "train_info/time_within_train_step": 27.97930669784546, "step": 62}
{"train_info/time_between_train_steps": 0.005777120590209961, "step": 62}
{"info/global_step": 63, "train_info/time_within_train_step": 27.923497915267944, "step": 63}
{"train_info/time_between_train_steps": 0.0054590702056884766, "step": 63}
{"info/global_step": 64, "train_info/time_within_train_step": 27.897172927856445, "step": 64}
{"train_info/time_between_train_steps": 0.008363485336303711, "step": 64}
{"info/global_step": 65, "train_info/time_within_train_step": 27.83108615875244, "step": 65}
{"train_info/time_between_train_steps": 0.00988626480102539, "step": 65}
{"info/global_step": 66, "train_info/time_within_train_step": 27.806541919708252, "step": 66}
{"train_info/time_between_train_steps": 0.005526304244995117, "step": 66}
{"info/global_step": 67, "train_info/time_within_train_step": 27.818402767181396, "step": 67}
{"train_info/time_between_train_steps": 0.005293846130371094, "step": 67}
{"info/global_step": 68, "train_info/time_within_train_step": 27.777019739151, "step": 68}
{"train_info/time_between_train_steps": 0.005370616912841797, "step": 68}
{"info/global_step": 69, "train_info/time_within_train_step": 27.818470001220703, "step": 69}
{"train_info/time_between_train_steps": 0.005198240280151367, "step": 69}
{"info/global_step": 70, "train_info/time_within_train_step": 27.780710458755493, "step": 70}
{"train_info/time_between_train_steps": 0.005295991897583008, "step": 70}
{"info/global_step": 71, "train_info/time_within_train_step": 27.828418970108032, "step": 71}
{"train_info/time_between_train_steps": 0.009238481521606445, "step": 71}
{"info/global_step": 72, "train_info/time_within_train_step": 27.76832628250122, "step": 72}
{"train_info/time_between_train_steps": 0.005285024642944336, "step": 72}
{"info/global_step": 73, "train_info/time_within_train_step": 27.76000189781189, "step": 73}
{"train_info/time_between_train_steps": 0.005151033401489258, "step": 73}
{"info/global_step": 74, "train_info/time_within_train_step": 27.776265382766724, "step": 74}
{"train_info/time_between_train_steps": 0.005638837814331055, "step": 74}
{"info/global_step": 75, "train_info/time_within_train_step": 27.80670666694641, "step": 75}
{"train_info/time_between_train_steps": 0.007349967956542969, "step": 75}
{"info/global_step": 76, "train_info/time_within_train_step": 27.809953212738037, "step": 76}
{"train_info/time_between_train_steps": 0.0052258968353271484, "step": 76}
{"info/global_step": 77, "train_info/time_within_train_step": 27.81095290184021, "step": 77}
{"train_info/time_between_train_steps": 0.005394697189331055, "step": 77}
{"info/global_step": 78, "train_info/time_within_train_step": 27.748566389083862, "step": 78}
{"train_info/time_between_train_steps": 0.006069183349609375, "step": 78}
{"info/global_step": 79, "train_info/time_within_train_step": 27.91358518600464, "step": 79}
{"train_info/time_between_train_steps": 0.010476350784301758, "step": 79}
{"info/global_step": 80, "train_info/time_within_train_step": 27.796142101287842, "step": 80}
{"train_info/time_between_train_steps": 0.005406379699707031, "step": 80}
{"info/global_step": 81, "train_info/time_within_train_step": 27.844451904296875, "step": 81}
{"train_info/time_between_train_steps": 0.005265712738037109, "step": 81}
{"info/global_step": 82, "train_info/time_within_train_step": 27.82050395011902, "step": 82}
{"train_info/time_between_train_steps": 0.005697727203369141, "step": 82}
{"info/global_step": 83, "train_info/time_within_train_step": 27.813305139541626, "step": 83}
{"train_info/time_between_train_steps": 0.005603790283203125, "step": 83}
{"info/global_step": 84, "train_info/time_within_train_step": 27.856889486312866, "step": 84}
{"train_info/time_between_train_steps": 0.008751153945922852, "step": 84}
{"train_info/time_between_train_steps": 4.014496564865112, "step": 84}
{"info/global_step": 85, "train_info/time_within_train_step": 27.808276414871216, "step": 85}
{"train_info/time_between_train_steps": 0.004974365234375, "step": 85}
{"info/global_step": 86, "train_info/time_within_train_step": 27.95068097114563, "step": 86}
{"train_info/time_between_train_steps": 0.007505178451538086, "step": 86}
{"info/global_step": 87, "train_info/time_within_train_step": 27.848283052444458, "step": 87}
{"train_info/time_between_train_steps": 0.005724430084228516, "step": 87}
{"info/global_step": 88, "train_info/time_within_train_step": 27.93825101852417, "step": 88}
{"train_info/time_between_train_steps": 0.00552821159362793, "step": 88}
{"info/global_step": 89, "train_info/time_within_train_step": 27.83279824256897, "step": 89}
{"train_info/time_between_train_steps": 0.008088827133178711, "step": 89}
{"info/global_step": 90, "train_info/time_within_train_step": 28.00257396697998, "step": 90}
{"train_info/time_between_train_steps": 0.008002519607543945, "step": 90}
{"info/global_step": 91, "train_info/time_within_train_step": 27.77607035636902, "step": 91}
{"train_info/time_between_train_steps": 0.005440711975097656, "step": 91}
{"info/global_step": 92, "train_info/time_within_train_step": 27.910706043243408, "step": 92}
{"train_info/time_between_train_steps": 0.005451202392578125, "step": 92}
{"info/global_step": 93, "train_info/time_within_train_step": 27.82893943786621, "step": 93}
{"train_info/time_between_train_steps": 0.00508570671081543, "step": 93}
{"info/global_step": 94, "train_info/time_within_train_step": 27.892857313156128, "step": 94}
{"train_info/time_between_train_steps": 0.010195255279541016, "step": 94}
{"info/global_step": 95, "train_info/time_within_train_step": 27.80492353439331, "step": 95}
{"train_info/time_between_train_steps": 0.00521087646484375, "step": 95}
{"info/global_step": 96, "train_info/time_within_train_step": 27.787481784820557, "step": 96}
{"train_info/time_between_train_steps": 0.005272865295410156, "step": 96}
{"info/global_step": 97, "train_info/time_within_train_step": 27.831461191177368, "step": 97}
{"train_info/time_between_train_steps": 0.005959033966064453, "step": 97}
{"info/global_step": 98, "train_info/time_within_train_step": 27.794795274734497, "step": 98}
{"train_info/time_between_train_steps": 0.005286216735839844, "step": 98}
{"info/global_step": 99, "train_info/time_within_train_step": 27.786753177642822, "step": 99}
{"train_info/time_between_train_steps": 0.005564451217651367, "step": 99}
{"info/global_step": 100, "train_info/time_within_train_step": 27.80515694618225, "step": 100}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740824701, "_runtime": 2806}, "step": 100}
{"logs": {"train/loss": 5.5983, "train/learning_rate": 0.0005, "train/epoch": 3.01, "_timestamp": 1740824701, "_runtime": 2806}, "step": 100}
{"train_info/time_between_train_steps": 13.536832094192505, "step": 100}
{"info/global_step": 101, "train_info/time_within_train_step": 27.771305561065674, "step": 101}
{"train_info/time_between_train_steps": 0.005130290985107422, "step": 101}
{"info/global_step": 102, "train_info/time_within_train_step": 27.826687335968018, "step": 102}
{"train_info/time_between_train_steps": 0.005797386169433594, "step": 102}
{"info/global_step": 103, "train_info/time_within_train_step": 27.98226499557495, "step": 103}
{"train_info/time_between_train_steps": 0.005266904830932617, "step": 103}
{"info/global_step": 104, "train_info/time_within_train_step": 27.82792901992798, "step": 104}
{"train_info/time_between_train_steps": 0.005323886871337891, "step": 104}
{"info/global_step": 105, "train_info/time_within_train_step": 27.812942504882812, "step": 105}
{"train_info/time_between_train_steps": 0.005154848098754883, "step": 105}
{"info/global_step": 106, "train_info/time_within_train_step": 27.859114170074463, "step": 106}
{"train_info/time_between_train_steps": 0.008170604705810547, "step": 106}
{"info/global_step": 107, "train_info/time_within_train_step": 27.79299306869507, "step": 107}
{"train_info/time_between_train_steps": 0.005409955978393555, "step": 107}
{"info/global_step": 108, "train_info/time_within_train_step": 27.80273723602295, "step": 108}
{"train_info/time_between_train_steps": 0.010274648666381836, "step": 108}
{"info/global_step": 109, "train_info/time_within_train_step": 27.815847396850586, "step": 109}
{"train_info/time_between_train_steps": 0.00519871711730957, "step": 109}
{"info/global_step": 110, "train_info/time_within_train_step": 27.928594827651978, "step": 110}
{"train_info/time_between_train_steps": 0.0054090023040771484, "step": 110}
{"info/global_step": 111, "train_info/time_within_train_step": 27.82640528678894, "step": 111}
{"train_info/time_between_train_steps": 0.0056610107421875, "step": 111}
{"info/global_step": 112, "train_info/time_within_train_step": 27.83763313293457, "step": 112}
{"train_info/time_between_train_steps": 0.005823373794555664, "step": 112}
{"train_info/time_between_train_steps": 3.7082626819610596, "step": 112}
{"info/global_step": 113, "train_info/time_within_train_step": 27.82156205177307, "step": 113}
{"train_info/time_between_train_steps": 0.0054929256439208984, "step": 113}
{"info/global_step": 114, "train_info/time_within_train_step": 27.957148790359497, "step": 114}
{"train_info/time_between_train_steps": 0.0077288150787353516, "step": 114}
{"info/global_step": 115, "train_info/time_within_train_step": 27.854825496673584, "step": 115}
{"train_info/time_between_train_steps": 0.011506080627441406, "step": 115}
{"info/global_step": 116, "train_info/time_within_train_step": 27.937596082687378, "step": 116}
{"train_info/time_between_train_steps": 0.007453203201293945, "step": 116}
{"info/global_step": 117, "train_info/time_within_train_step": 27.805935382843018, "step": 117}
{"train_info/time_between_train_steps": 0.0077898502349853516, "step": 117}
{"info/global_step": 118, "train_info/time_within_train_step": 28.00645399093628, "step": 118}
{"train_info/time_between_train_steps": 0.005555391311645508, "step": 118}
{"info/global_step": 119, "train_info/time_within_train_step": 27.83558487892151, "step": 119}
{"train_info/time_between_train_steps": 0.00532221794128418, "step": 119}
{"info/global_step": 120, "train_info/time_within_train_step": 27.918855667114258, "step": 120}
{"train_info/time_between_train_steps": 0.005616664886474609, "step": 120}
{"info/global_step": 121, "train_info/time_within_train_step": 27.799076557159424, "step": 121}
{"train_info/time_between_train_steps": 0.0065381526947021484, "step": 121}
{"info/global_step": 122, "train_info/time_within_train_step": 27.75593400001526, "step": 122}
{"train_info/time_between_train_steps": 0.009989261627197266, "step": 122}
{"info/global_step": 123, "train_info/time_within_train_step": 27.818716049194336, "step": 123}
{"train_info/time_between_train_steps": 0.00533294677734375, "step": 123}
{"info/global_step": 124, "train_info/time_within_train_step": 27.81406307220459, "step": 124}
{"train_info/time_between_train_steps": 0.010175943374633789, "step": 124}
{"info/global_step": 125, "train_info/time_within_train_step": 27.92747974395752, "step": 125}
{"train_info/time_between_train_steps": 0.0054476261138916016, "step": 125}
{"info/global_step": 126, "train_info/time_within_train_step": 27.82266879081726, "step": 126}
{"train_info/time_between_train_steps": 0.005212068557739258, "step": 126}
{"info/global_step": 127, "train_info/time_within_train_step": 27.764457941055298, "step": 127}
{"train_info/time_between_train_steps": 0.005334615707397461, "step": 127}
{"info/global_step": 128, "train_info/time_within_train_step": 27.832029104232788, "step": 128}
{"train_info/time_between_train_steps": 0.00927424430847168, "step": 128}
{"info/global_step": 129, "train_info/time_within_train_step": 27.787821054458618, "step": 129}
{"train_info/time_between_train_steps": 0.005190849304199219, "step": 129}
{"info/global_step": 130, "train_info/time_within_train_step": 27.81515336036682, "step": 130}
{"train_info/time_between_train_steps": 0.005429983139038086, "step": 130}
{"info/global_step": 131, "train_info/time_within_train_step": 27.834139347076416, "step": 131}
{"train_info/time_between_train_steps": 0.0054166316986083984, "step": 131}
{"info/global_step": 132, "train_info/time_within_train_step": 27.854929447174072, "step": 132}
{"train_info/time_between_train_steps": 0.007562875747680664, "step": 132}
{"info/global_step": 133, "train_info/time_within_train_step": 27.82447123527527, "step": 133}
{"train_info/time_between_train_steps": 0.007594585418701172, "step": 133}
{"info/global_step": 134, "train_info/time_within_train_step": 27.858262062072754, "step": 134}
{"train_info/time_between_train_steps": 0.005301237106323242, "step": 134}
{"info/global_step": 135, "train_info/time_within_train_step": 27.83580255508423, "step": 135}
{"train_info/time_between_train_steps": 0.005358457565307617, "step": 135}
{"info/global_step": 136, "train_info/time_within_train_step": 27.819738149642944, "step": 136}
{"train_info/time_between_train_steps": 0.007197856903076172, "step": 136}
{"info/global_step": 137, "train_info/time_within_train_step": 27.813014030456543, "step": 137}
{"train_info/time_between_train_steps": 0.007719516754150391, "step": 137}
{"info/global_step": 138, "train_info/time_within_train_step": 27.815109968185425, "step": 138}
{"train_info/time_between_train_steps": 0.0054018497467041016, "step": 138}
{"info/global_step": 139, "train_info/time_within_train_step": 27.830943822860718, "step": 139}
{"train_info/time_between_train_steps": 0.010714530944824219, "step": 139}
{"info/global_step": 140, "train_info/time_within_train_step": 27.847147226333618, "step": 140}
{"train_info/time_between_train_steps": 0.010834217071533203, "step": 140}
{"train_info/time_between_train_steps": 3.9085946083068848, "step": 140}
{"info/global_step": 141, "train_info/time_within_train_step": 27.890338897705078, "step": 141}
{"train_info/time_between_train_steps": 0.0054280757904052734, "step": 141}
{"info/global_step": 142, "train_info/time_within_train_step": 27.96570658683777, "step": 142}
{"train_info/time_between_train_steps": 0.005415439605712891, "step": 142}
{"info/global_step": 143, "train_info/time_within_train_step": 27.804539442062378, "step": 143}
{"train_info/time_between_train_steps": 0.010367155075073242, "step": 143}
{"info/global_step": 144, "train_info/time_within_train_step": 27.914630651474, "step": 144}
{"train_info/time_between_train_steps": 0.005303859710693359, "step": 144}
{"info/global_step": 145, "train_info/time_within_train_step": 27.813136100769043, "step": 145}
{"train_info/time_between_train_steps": 0.005410194396972656, "step": 145}
{"info/global_step": 146, "train_info/time_within_train_step": 27.984649896621704, "step": 146}
{"train_info/time_between_train_steps": 0.00923919677734375, "step": 146}
{"info/global_step": 147, "train_info/time_within_train_step": 27.867210865020752, "step": 147}
{"train_info/time_between_train_steps": 0.005538463592529297, "step": 147}
{"info/global_step": 148, "train_info/time_within_train_step": 27.93470287322998, "step": 148}
{"train_info/time_between_train_steps": 0.007696628570556641, "step": 148}
{"info/global_step": 149, "train_info/time_within_train_step": 27.79654097557068, "step": 149}
{"train_info/time_between_train_steps": 0.005255699157714844, "step": 149}
{"info/global_step": 150, "train_info/time_within_train_step": 28.291189193725586, "step": 150}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740826115, "_runtime": 4220}, "step": 150}
{"logs": {"train/loss": 5.0109, "train/learning_rate": 0.0005833333333333333, "train/epoch": 5.01, "_timestamp": 1740826115, "_runtime": 4220}, "step": 150}
{"train_info/time_between_train_steps": 0.009603261947631836, "step": 150}
{"info/global_step": 151, "train_info/time_within_train_step": 27.764455795288086, "step": 151}
{"train_info/time_between_train_steps": 0.0050811767578125, "step": 151}
{"info/global_step": 152, "train_info/time_within_train_step": 27.804359912872314, "step": 152}
{"train_info/time_between_train_steps": 0.007776021957397461, "step": 152}
{"info/global_step": 153, "train_info/time_within_train_step": 27.813221216201782, "step": 153}
{"train_info/time_between_train_steps": 0.005273580551147461, "step": 153}
{"info/global_step": 154, "train_info/time_within_train_step": 27.807286024093628, "step": 154}
{"train_info/time_between_train_steps": 0.0052869319915771484, "step": 154}
{"info/global_step": 155, "train_info/time_within_train_step": 27.833208084106445, "step": 155}
{"train_info/time_between_train_steps": 0.00836491584777832, "step": 155}
{"info/global_step": 156, "train_info/time_within_train_step": 27.82679295539856, "step": 156}
{"train_info/time_between_train_steps": 0.008167505264282227, "step": 156}
{"info/global_step": 157, "train_info/time_within_train_step": 27.94090986251831, "step": 157}
{"train_info/time_between_train_steps": 0.0051746368408203125, "step": 157}
{"info/global_step": 158, "train_info/time_within_train_step": 27.764575004577637, "step": 158}
{"train_info/time_between_train_steps": 0.005167961120605469, "step": 158}
{"info/global_step": 159, "train_info/time_within_train_step": 27.809075355529785, "step": 159}
{"train_info/time_between_train_steps": 0.010025501251220703, "step": 159}
{"info/global_step": 160, "train_info/time_within_train_step": 27.78304934501648, "step": 160}
{"train_info/time_between_train_steps": 0.005292654037475586, "step": 160}
{"info/global_step": 161, "train_info/time_within_train_step": 27.769049644470215, "step": 161}
{"train_info/time_between_train_steps": 0.0050983428955078125, "step": 161}
{"info/global_step": 162, "train_info/time_within_train_step": 27.762680768966675, "step": 162}
{"train_info/time_between_train_steps": 0.005522012710571289, "step": 162}
{"info/global_step": 163, "train_info/time_within_train_step": 27.812731504440308, "step": 163}
{"train_info/time_between_train_steps": 0.005175590515136719, "step": 163}
{"info/global_step": 164, "train_info/time_within_train_step": 27.816518783569336, "step": 164}
{"train_info/time_between_train_steps": 0.009271860122680664, "step": 164}
{"info/global_step": 165, "train_info/time_within_train_step": 27.786248445510864, "step": 165}
{"train_info/time_between_train_steps": 0.005376100540161133, "step": 165}
{"info/global_step": 166, "train_info/time_within_train_step": 27.82313060760498, "step": 166}
{"train_info/time_between_train_steps": 0.008601665496826172, "step": 166}
{"info/global_step": 167, "train_info/time_within_train_step": 27.820623636245728, "step": 167}
{"train_info/time_between_train_steps": 0.0059833526611328125, "step": 167}
{"info/global_step": 168, "train_info/time_within_train_step": 27.851032257080078, "step": 168}
{"train_info/time_between_train_steps": 0.005892038345336914, "step": 168}
{"train_info/time_between_train_steps": 3.943171739578247, "step": 168}
{"info/global_step": 169, "train_info/time_within_train_step": 27.806818962097168, "step": 169}
{"train_info/time_between_train_steps": 0.00845646858215332, "step": 169}
{"info/global_step": 170, "train_info/time_within_train_step": 27.96310305595398, "step": 170}
{"train_info/time_between_train_steps": 0.00762939453125, "step": 170}
{"info/global_step": 171, "train_info/time_within_train_step": 27.827465772628784, "step": 171}
{"train_info/time_between_train_steps": 0.009911537170410156, "step": 171}
{"info/global_step": 172, "train_info/time_within_train_step": 28.114561080932617, "step": 172}
{"train_info/time_between_train_steps": 0.009656906127929688, "step": 172}
{"info/global_step": 173, "train_info/time_within_train_step": 27.844417095184326, "step": 173}
{"train_info/time_between_train_steps": 0.005591630935668945, "step": 173}
{"info/global_step": 174, "train_info/time_within_train_step": 27.984702825546265, "step": 174}
{"train_info/time_between_train_steps": 0.011197090148925781, "step": 174}
{"info/global_step": 175, "train_info/time_within_train_step": 27.868202686309814, "step": 175}
{"train_info/time_between_train_steps": 0.005535125732421875, "step": 175}
{"info/global_step": 176, "train_info/time_within_train_step": 27.892975091934204, "step": 176}
{"train_info/time_between_train_steps": 0.010135650634765625, "step": 176}
{"info/global_step": 177, "train_info/time_within_train_step": 27.79840326309204, "step": 177}
{"train_info/time_between_train_steps": 0.005881071090698242, "step": 177}
{"info/global_step": 178, "train_info/time_within_train_step": 27.82417106628418, "step": 178}
{"train_info/time_between_train_steps": 0.005136728286743164, "step": 178}
{"info/global_step": 179, "train_info/time_within_train_step": 27.848939895629883, "step": 179}
{"train_info/time_between_train_steps": 0.005458831787109375, "step": 179}
{"info/global_step": 180, "train_info/time_within_train_step": 27.817201137542725, "step": 180}
{"train_info/time_between_train_steps": 0.0053293704986572266, "step": 180}
{"info/global_step": 181, "train_info/time_within_train_step": 27.794469833374023, "step": 181}
{"train_info/time_between_train_steps": 0.0054433345794677734, "step": 181}
{"info/global_step": 182, "train_info/time_within_train_step": 27.808525323867798, "step": 182}
{"train_info/time_between_train_steps": 0.010086297988891602, "step": 182}
{"info/global_step": 183, "train_info/time_within_train_step": 27.804043531417847, "step": 183}
{"train_info/time_between_train_steps": 0.007485866546630859, "step": 183}
{"info/global_step": 184, "train_info/time_within_train_step": 27.814395427703857, "step": 184}
{"train_info/time_between_train_steps": 0.005297660827636719, "step": 184}
{"info/global_step": 185, "train_info/time_within_train_step": 27.819876194000244, "step": 185}
{"train_info/time_between_train_steps": 0.005406856536865234, "step": 185}
{"info/global_step": 186, "train_info/time_within_train_step": 27.756282329559326, "step": 186}
{"train_info/time_between_train_steps": 0.0052983760833740234, "step": 186}
{"info/global_step": 187, "train_info/time_within_train_step": 27.775111198425293, "step": 187}
{"train_info/time_between_train_steps": 0.008806228637695312, "step": 187}
{"info/global_step": 188, "train_info/time_within_train_step": 27.897838830947876, "step": 188}
{"train_info/time_between_train_steps": 0.0051996707916259766, "step": 188}
{"info/global_step": 189, "train_info/time_within_train_step": 27.8088800907135, "step": 189}
{"train_info/time_between_train_steps": 0.0053675174713134766, "step": 189}
{"info/global_step": 190, "train_info/time_within_train_step": 27.77263069152832, "step": 190}
{"train_info/time_between_train_steps": 0.005246400833129883, "step": 190}
{"info/global_step": 191, "train_info/time_within_train_step": 27.81566047668457, "step": 191}
{"train_info/time_between_train_steps": 0.007913827896118164, "step": 191}
{"info/global_step": 192, "train_info/time_within_train_step": 27.809995889663696, "step": 192}
{"train_info/time_between_train_steps": 0.0053577423095703125, "step": 192}
{"info/global_step": 193, "train_info/time_within_train_step": 27.79763126373291, "step": 193}
{"train_info/time_between_train_steps": 0.005216121673583984, "step": 193}
{"info/global_step": 194, "train_info/time_within_train_step": 27.823216199874878, "step": 194}
{"train_info/time_between_train_steps": 0.005503654479980469, "step": 194}
{"info/global_step": 195, "train_info/time_within_train_step": 27.834144830703735, "step": 195}
{"train_info/time_between_train_steps": 0.0053784847259521484, "step": 195}
{"info/global_step": 196, "train_info/time_within_train_step": 27.846399068832397, "step": 196}
{"train_info/time_between_train_steps": 0.005790233612060547, "step": 196}
{"train_info/time_between_train_steps": 3.6928367614746094, "step": 196}
{"info/global_step": 197, "train_info/time_within_train_step": 27.80562686920166, "step": 197}
{"train_info/time_between_train_steps": 0.007535219192504883, "step": 197}
{"info/global_step": 198, "train_info/time_within_train_step": 27.866255283355713, "step": 198}
{"train_info/time_between_train_steps": 0.010520696640014648, "step": 198}
{"info/global_step": 199, "train_info/time_within_train_step": 27.82500696182251, "step": 199}
{"train_info/time_between_train_steps": 0.005719900131225586, "step": 199}
{"info/global_step": 200, "train_info/time_within_train_step": 27.916962385177612, "step": 200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740827515, "_runtime": 5620}, "step": 200}
{"logs": {"train/loss": 4.7657, "train/learning_rate": 0.0005555555555555556, "train/epoch": 7.0, "_timestamp": 1740827515, "_runtime": 5620}, "step": 200}
{"train_info/time_between_train_steps": 13.418500900268555, "step": 200}
{"info/global_step": 201, "train_info/time_within_train_step": 27.809272289276123, "step": 201}
{"train_info/time_between_train_steps": 0.006539106369018555, "step": 201}
{"info/global_step": 202, "train_info/time_within_train_step": 28.002063035964966, "step": 202}
{"train_info/time_between_train_steps": 0.005440711975097656, "step": 202}
{"info/global_step": 203, "train_info/time_within_train_step": 27.764480113983154, "step": 203}
{"train_info/time_between_train_steps": 0.005387306213378906, "step": 203}
{"info/global_step": 204, "train_info/time_within_train_step": 28.09516954421997, "step": 204}
{"train_info/time_between_train_steps": 0.005440235137939453, "step": 204}
{"info/global_step": 205, "train_info/time_within_train_step": 27.82693362236023, "step": 205}
{"train_info/time_between_train_steps": 0.005081892013549805, "step": 205}
{"info/global_step": 206, "train_info/time_within_train_step": 27.828951835632324, "step": 206}
{"train_info/time_between_train_steps": 0.0061299800872802734, "step": 206}
{"info/global_step": 207, "train_info/time_within_train_step": 27.7842276096344, "step": 207}
{"train_info/time_between_train_steps": 0.005281925201416016, "step": 207}
{"info/global_step": 208, "train_info/time_within_train_step": 27.7876398563385, "step": 208}
{"train_info/time_between_train_steps": 0.0051937103271484375, "step": 208}
{"info/global_step": 209, "train_info/time_within_train_step": 27.804612398147583, "step": 209}
{"train_info/time_between_train_steps": 0.005362272262573242, "step": 209}
{"info/global_step": 210, "train_info/time_within_train_step": 27.77005958557129, "step": 210}
{"train_info/time_between_train_steps": 0.005234479904174805, "step": 210}
{"info/global_step": 211, "train_info/time_within_train_step": 27.792601823806763, "step": 211}
{"train_info/time_between_train_steps": 0.005416154861450195, "step": 211}
{"info/global_step": 212, "train_info/time_within_train_step": 27.80718445777893, "step": 212}
{"train_info/time_between_train_steps": 0.005366325378417969, "step": 212}
{"info/global_step": 213, "train_info/time_within_train_step": 27.83264183998108, "step": 213}
{"train_info/time_between_train_steps": 0.0059735774993896484, "step": 213}
{"info/global_step": 214, "train_info/time_within_train_step": 27.81888461112976, "step": 214}
{"train_info/time_between_train_steps": 0.00905466079711914, "step": 214}
{"info/global_step": 215, "train_info/time_within_train_step": 27.821526527404785, "step": 215}
{"train_info/time_between_train_steps": 0.005216836929321289, "step": 215}
{"info/global_step": 216, "train_info/time_within_train_step": 27.82576298713684, "step": 216}
{"train_info/time_between_train_steps": 0.005421876907348633, "step": 216}
{"info/global_step": 217, "train_info/time_within_train_step": 27.8278067111969, "step": 217}
{"train_info/time_between_train_steps": 0.007876157760620117, "step": 217}
{"info/global_step": 218, "train_info/time_within_train_step": 27.83123755455017, "step": 218}
{"train_info/time_between_train_steps": 0.005321025848388672, "step": 218}
{"info/global_step": 219, "train_info/time_within_train_step": 27.916914463043213, "step": 219}
{"train_info/time_between_train_steps": 0.005331277847290039, "step": 219}
{"info/global_step": 220, "train_info/time_within_train_step": 27.822428464889526, "step": 220}
{"train_info/time_between_train_steps": 0.005479335784912109, "step": 220}
{"info/global_step": 221, "train_info/time_within_train_step": 27.78006410598755, "step": 221}
{"train_info/time_between_train_steps": 0.00531458854675293, "step": 221}
{"info/global_step": 222, "train_info/time_within_train_step": 27.82030153274536, "step": 222}
{"train_info/time_between_train_steps": 0.005405902862548828, "step": 222}
{"info/global_step": 223, "train_info/time_within_train_step": 27.838712215423584, "step": 223}
{"train_info/time_between_train_steps": 0.0056915283203125, "step": 223}
{"info/global_step": 224, "train_info/time_within_train_step": 27.84438991546631, "step": 224}
{"train_info/time_between_train_steps": 0.0057125091552734375, "step": 224}
{"train_info/time_between_train_steps": 3.9231619834899902, "step": 224}
{"info/global_step": 225, "train_info/time_within_train_step": 27.827130794525146, "step": 225}
{"train_info/time_between_train_steps": 0.005388975143432617, "step": 225}
{"info/global_step": 226, "train_info/time_within_train_step": 27.953911781311035, "step": 226}
{"train_info/time_between_train_steps": 0.005540132522583008, "step": 226}
{"info/global_step": 227, "train_info/time_within_train_step": 27.820146083831787, "step": 227}
{"train_info/time_between_train_steps": 0.010215282440185547, "step": 227}
{"info/global_step": 228, "train_info/time_within_train_step": 27.891865015029907, "step": 228}
{"train_info/time_between_train_steps": 0.0055086612701416016, "step": 228}
{"info/global_step": 229, "train_info/time_within_train_step": 27.87870740890503, "step": 229}
{"train_info/time_between_train_steps": 0.005299806594848633, "step": 229}
{"info/global_step": 230, "train_info/time_within_train_step": 27.93180823326111, "step": 230}
{"train_info/time_between_train_steps": 0.005284786224365234, "step": 230}
{"info/global_step": 231, "train_info/time_within_train_step": 27.84108281135559, "step": 231}
{"train_info/time_between_train_steps": 0.005652427673339844, "step": 231}
{"info/global_step": 232, "train_info/time_within_train_step": 27.874508142471313, "step": 232}
{"train_info/time_between_train_steps": 0.005423069000244141, "step": 232}
{"info/global_step": 233, "train_info/time_within_train_step": 27.7871572971344, "step": 233}
{"train_info/time_between_train_steps": 0.00521087646484375, "step": 233}
{"info/global_step": 234, "train_info/time_within_train_step": 27.82003879547119, "step": 234}
{"train_info/time_between_train_steps": 0.00526881217956543, "step": 234}
{"info/global_step": 235, "train_info/time_within_train_step": 27.887198209762573, "step": 235}
{"train_info/time_between_train_steps": 0.010209083557128906, "step": 235}
{"info/global_step": 236, "train_info/time_within_train_step": 27.823084831237793, "step": 236}
{"train_info/time_between_train_steps": 0.005202054977416992, "step": 236}
{"info/global_step": 237, "train_info/time_within_train_step": 27.81166911125183, "step": 237}
{"train_info/time_between_train_steps": 0.0063381195068359375, "step": 237}
{"info/global_step": 238, "train_info/time_within_train_step": 27.819461584091187, "step": 238}
{"train_info/time_between_train_steps": 0.005250692367553711, "step": 238}
{"info/global_step": 239, "train_info/time_within_train_step": 27.81384015083313, "step": 239}
{"train_info/time_between_train_steps": 0.005484819412231445, "step": 239}
{"info/global_step": 240, "train_info/time_within_train_step": 27.78565239906311, "step": 240}
{"train_info/time_between_train_steps": 0.00519251823425293, "step": 240}
{"info/global_step": 241, "train_info/time_within_train_step": 27.812976360321045, "step": 241}
{"train_info/time_between_train_steps": 0.005293130874633789, "step": 241}
{"info/global_step": 242, "train_info/time_within_train_step": 27.842568159103394, "step": 242}
{"train_info/time_between_train_steps": 0.0052068233489990234, "step": 242}
{"info/global_step": 243, "train_info/time_within_train_step": 27.796549558639526, "step": 243}
{"train_info/time_between_train_steps": 0.0051937103271484375, "step": 243}
{"info/global_step": 244, "train_info/time_within_train_step": 27.824290990829468, "step": 244}
{"train_info/time_between_train_steps": 0.005292415618896484, "step": 244}
{"info/global_step": 245, "train_info/time_within_train_step": 27.797576189041138, "step": 245}
{"train_info/time_between_train_steps": 0.005279541015625, "step": 245}
{"info/global_step": 246, "train_info/time_within_train_step": 27.805294275283813, "step": 246}
{"train_info/time_between_train_steps": 0.007819890975952148, "step": 246}
{"info/global_step": 247, "train_info/time_within_train_step": 27.79555368423462, "step": 247}
{"train_info/time_between_train_steps": 0.005206584930419922, "step": 247}
{"info/global_step": 248, "train_info/time_within_train_step": 27.818635940551758, "step": 248}
{"train_info/time_between_train_steps": 0.005477190017700195, "step": 248}
{"info/global_step": 249, "train_info/time_within_train_step": 27.820781469345093, "step": 249}
{"train_info/time_between_train_steps": 0.005461454391479492, "step": 249}
{"info/global_step": 250, "train_info/time_within_train_step": 27.926085710525513, "step": 250}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740828925, "_runtime": 7030}, "step": 250}
{"logs": {"train/loss": 4.6242, "train/learning_rate": 0.0005277777777777777, "train/epoch": 8.02, "_timestamp": 1740828925, "_runtime": 7030}, "step": 250}
{"train_info/time_between_train_steps": 0.009057760238647461, "step": 250}
{"info/global_step": 251, "train_info/time_within_train_step": 27.823302268981934, "step": 251}
{"train_info/time_between_train_steps": 0.006116390228271484, "step": 251}
{"info/global_step": 252, "train_info/time_within_train_step": 27.843580961227417, "step": 252}
{"train_info/time_between_train_steps": 0.007911920547485352, "step": 252}
{"train_info/time_between_train_steps": 4.121532440185547, "step": 252}
{"info/global_step": 253, "train_info/time_within_train_step": 27.811823844909668, "step": 253}
{"train_info/time_between_train_steps": 0.0055081844329833984, "step": 253}
{"info/global_step": 254, "train_info/time_within_train_step": 27.989382028579712, "step": 254}
{"train_info/time_between_train_steps": 0.0073833465576171875, "step": 254}
{"info/global_step": 255, "train_info/time_within_train_step": 27.796714305877686, "step": 255}
{"train_info/time_between_train_steps": 0.005204200744628906, "step": 255}
{"info/global_step": 256, "train_info/time_within_train_step": 27.948131799697876, "step": 256}
{"train_info/time_between_train_steps": 0.005475759506225586, "step": 256}
{"info/global_step": 257, "train_info/time_within_train_step": 27.83631920814514, "step": 257}
{"train_info/time_between_train_steps": 0.0054051876068115234, "step": 257}
{"info/global_step": 258, "train_info/time_within_train_step": 27.92336654663086, "step": 258}
{"train_info/time_between_train_steps": 0.0054433345794677734, "step": 258}
{"info/global_step": 259, "train_info/time_within_train_step": 27.82267141342163, "step": 259}
{"train_info/time_between_train_steps": 0.010913848876953125, "step": 259}
{"info/global_step": 260, "train_info/time_within_train_step": 27.89757490158081, "step": 260}
{"train_info/time_between_train_steps": 0.0078105926513671875, "step": 260}
{"info/global_step": 261, "train_info/time_within_train_step": 27.784600257873535, "step": 261}
{"train_info/time_between_train_steps": 0.005084991455078125, "step": 261}
{"info/global_step": 262, "train_info/time_within_train_step": 27.779297351837158, "step": 262}
{"train_info/time_between_train_steps": 0.005259990692138672, "step": 262}
{"info/global_step": 263, "train_info/time_within_train_step": 27.768163204193115, "step": 263}
{"train_info/time_between_train_steps": 0.009232759475708008, "step": 263}
{"info/global_step": 264, "train_info/time_within_train_step": 27.793174505233765, "step": 264}
{"train_info/time_between_train_steps": 0.005605936050415039, "step": 264}
{"info/global_step": 265, "train_info/time_within_train_step": 27.816864490509033, "step": 265}
{"train_info/time_between_train_steps": 0.005110979080200195, "step": 265}
{"info/global_step": 266, "train_info/time_within_train_step": 27.911153554916382, "step": 266}
{"train_info/time_between_train_steps": 0.006384372711181641, "step": 266}
{"info/global_step": 267, "train_info/time_within_train_step": 27.80981421470642, "step": 267}
{"train_info/time_between_train_steps": 0.00526881217956543, "step": 267}
{"info/global_step": 268, "train_info/time_within_train_step": 27.76142430305481, "step": 268}
{"train_info/time_between_train_steps": 0.005311250686645508, "step": 268}
{"info/global_step": 269, "train_info/time_within_train_step": 27.818730115890503, "step": 269}
{"train_info/time_between_train_steps": 0.010836124420166016, "step": 269}
{"info/global_step": 270, "train_info/time_within_train_step": 27.808137893676758, "step": 270}
{"train_info/time_between_train_steps": 0.005151510238647461, "step": 270}
{"info/global_step": 271, "train_info/time_within_train_step": 27.869166135787964, "step": 271}
{"train_info/time_between_train_steps": 0.005258083343505859, "step": 271}
{"info/global_step": 272, "train_info/time_within_train_step": 27.839311599731445, "step": 272}
{"train_info/time_between_train_steps": 0.0075147151947021484, "step": 272}
{"info/global_step": 273, "train_info/time_within_train_step": 27.82636833190918, "step": 273}
{"train_info/time_between_train_steps": 0.005249977111816406, "step": 273}
{"info/global_step": 274, "train_info/time_within_train_step": 27.808494329452515, "step": 274}
{"train_info/time_between_train_steps": 0.005280733108520508, "step": 274}
{"info/global_step": 275, "train_info/time_within_train_step": 27.82548689842224, "step": 275}
{"train_info/time_between_train_steps": 0.007371187210083008, "step": 275}
{"info/global_step": 276, "train_info/time_within_train_step": 27.83398699760437, "step": 276}
{"train_info/time_between_train_steps": 0.005217790603637695, "step": 276}
{"info/global_step": 277, "train_info/time_within_train_step": 27.82807993888855, "step": 277}
{"train_info/time_between_train_steps": 0.0076138973236083984, "step": 277}
{"info/global_step": 278, "train_info/time_within_train_step": 27.81234049797058, "step": 278}
{"train_info/time_between_train_steps": 0.0053713321685791016, "step": 278}
{"info/global_step": 279, "train_info/time_within_train_step": 27.824976444244385, "step": 279}
{"train_info/time_between_train_steps": 0.005880117416381836, "step": 279}
{"info/global_step": 280, "train_info/time_within_train_step": 27.848202228546143, "step": 280}
{"train_info/time_between_train_steps": 0.00586390495300293, "step": 280}
{"train_info/time_between_train_steps": 3.761810302734375, "step": 280}
{"info/global_step": 281, "train_info/time_within_train_step": 27.848044633865356, "step": 281}
{"train_info/time_between_train_steps": 0.005617856979370117, "step": 281}
{"info/global_step": 282, "train_info/time_within_train_step": 28.117014169692993, "step": 282}
{"train_info/time_between_train_steps": 0.010716438293457031, "step": 282}
{"info/global_step": 283, "train_info/time_within_train_step": 27.873979806900024, "step": 283}
{"train_info/time_between_train_steps": 0.010972023010253906, "step": 283}
{"info/global_step": 284, "train_info/time_within_train_step": 28.038569688796997, "step": 284}
{"train_info/time_between_train_steps": 0.0055692195892333984, "step": 284}
{"info/global_step": 285, "train_info/time_within_train_step": 27.858095169067383, "step": 285}
{"train_info/time_between_train_steps": 0.006086826324462891, "step": 285}
{"info/global_step": 286, "train_info/time_within_train_step": 28.03693437576294, "step": 286}
{"train_info/time_between_train_steps": 0.005663394927978516, "step": 286}
{"info/global_step": 287, "train_info/time_within_train_step": 27.85081148147583, "step": 287}
{"train_info/time_between_train_steps": 0.005891323089599609, "step": 287}
{"info/global_step": 288, "train_info/time_within_train_step": 27.94114065170288, "step": 288}
{"train_info/time_between_train_steps": 0.0065155029296875, "step": 288}
{"info/global_step": 289, "train_info/time_within_train_step": 27.802529335021973, "step": 289}
{"train_info/time_between_train_steps": 0.006826162338256836, "step": 289}
{"info/global_step": 290, "train_info/time_within_train_step": 27.820984840393066, "step": 290}
{"train_info/time_between_train_steps": 0.006310939788818359, "step": 290}
{"info/global_step": 291, "train_info/time_within_train_step": 27.814223766326904, "step": 291}
{"train_info/time_between_train_steps": 0.007433652877807617, "step": 291}
{"info/global_step": 292, "train_info/time_within_train_step": 27.793094158172607, "step": 292}
{"train_info/time_between_train_steps": 0.005419731140136719, "step": 292}
{"info/global_step": 293, "train_info/time_within_train_step": 27.815439701080322, "step": 293}
{"train_info/time_between_train_steps": 0.005192995071411133, "step": 293}
{"info/global_step": 294, "train_info/time_within_train_step": 27.81691884994507, "step": 294}
{"train_info/time_between_train_steps": 0.005277156829833984, "step": 294}
{"info/global_step": 295, "train_info/time_within_train_step": 27.811658143997192, "step": 295}
{"train_info/time_between_train_steps": 0.005199909210205078, "step": 295}
{"info/global_step": 296, "train_info/time_within_train_step": 27.797460794448853, "step": 296}
{"train_info/time_between_train_steps": 0.009759187698364258, "step": 296}
{"info/global_step": 297, "train_info/time_within_train_step": 27.8796124458313, "step": 297}
{"train_info/time_between_train_steps": 0.005412101745605469, "step": 297}
{"info/global_step": 298, "train_info/time_within_train_step": 27.800076961517334, "step": 298}
{"train_info/time_between_train_steps": 0.005415439605712891, "step": 298}
{"info/global_step": 299, "train_info/time_within_train_step": 27.783785343170166, "step": 299}
{"train_info/time_between_train_steps": 0.0051767826080322266, "step": 299}
{"info/global_step": 300, "train_info/time_within_train_step": 27.83069896697998, "step": 300}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740830325, "_runtime": 8430}, "step": 300}
{"logs": {"train/loss": 4.4779, "train/learning_rate": 0.0005, "train/epoch": 10.02, "_timestamp": 1740830325, "_runtime": 8430}, "step": 300}
{"train_info/time_between_train_steps": 13.903845071792603, "step": 300}
{"info/global_step": 301, "train_info/time_within_train_step": 27.78844666481018, "step": 301}
{"train_info/time_between_train_steps": 0.005065202713012695, "step": 301}
{"info/global_step": 302, "train_info/time_within_train_step": 27.78866696357727, "step": 302}
{"train_info/time_between_train_steps": 0.005006074905395508, "step": 302}
{"info/global_step": 303, "train_info/time_within_train_step": 27.841763257980347, "step": 303}
{"train_info/time_between_train_steps": 0.005460977554321289, "step": 303}
{"info/global_step": 304, "train_info/time_within_train_step": 27.765018701553345, "step": 304}
{"train_info/time_between_train_steps": 0.0054149627685546875, "step": 304}
{"info/global_step": 305, "train_info/time_within_train_step": 27.761534929275513, "step": 305}
{"train_info/time_between_train_steps": 0.005319118499755859, "step": 305}
{"info/global_step": 306, "train_info/time_within_train_step": 27.76868200302124, "step": 306}
{"train_info/time_between_train_steps": 0.005507707595825195, "step": 306}
{"info/global_step": 307, "train_info/time_within_train_step": 27.838423013687134, "step": 307}
{"train_info/time_between_train_steps": 0.010580301284790039, "step": 307}
{"info/global_step": 308, "train_info/time_within_train_step": 27.81758761405945, "step": 308}
{"train_info/time_between_train_steps": 0.006134748458862305, "step": 308}
{"train_info/time_between_train_steps": 3.661559820175171, "step": 308}
{"info/global_step": 309, "train_info/time_within_train_step": 27.795165538787842, "step": 309}
{"train_info/time_between_train_steps": 0.005143880844116211, "step": 309}
{"info/global_step": 310, "train_info/time_within_train_step": 27.999423503875732, "step": 310}
{"train_info/time_between_train_steps": 0.005484342575073242, "step": 310}
{"info/global_step": 311, "train_info/time_within_train_step": 27.813859462738037, "step": 311}
{"train_info/time_between_train_steps": 0.005337238311767578, "step": 311}
{"info/global_step": 312, "train_info/time_within_train_step": 27.930824756622314, "step": 312}
{"train_info/time_between_train_steps": 0.0055408477783203125, "step": 312}
{"info/global_step": 313, "train_info/time_within_train_step": 27.931779623031616, "step": 313}
{"train_info/time_between_train_steps": 0.0054471492767333984, "step": 313}
{"info/global_step": 314, "train_info/time_within_train_step": 27.97813057899475, "step": 314}
{"train_info/time_between_train_steps": 0.00546717643737793, "step": 314}
{"info/global_step": 315, "train_info/time_within_train_step": 27.808707237243652, "step": 315}
{"train_info/time_between_train_steps": 0.005301713943481445, "step": 315}
{"info/global_step": 316, "train_info/time_within_train_step": 27.902738094329834, "step": 316}
{"train_info/time_between_train_steps": 0.0052852630615234375, "step": 316}
{"info/global_step": 317, "train_info/time_within_train_step": 27.823915243148804, "step": 317}
{"train_info/time_between_train_steps": 0.005127668380737305, "step": 317}
{"info/global_step": 318, "train_info/time_within_train_step": 27.818689107894897, "step": 318}
{"train_info/time_between_train_steps": 0.006361246109008789, "step": 318}
{"info/global_step": 319, "train_info/time_within_train_step": 27.794191122055054, "step": 319}
{"train_info/time_between_train_steps": 0.00640869140625, "step": 319}
{"info/global_step": 320, "train_info/time_within_train_step": 27.811643838882446, "step": 320}
{"train_info/time_between_train_steps": 0.005207538604736328, "step": 320}
{"info/global_step": 321, "train_info/time_within_train_step": 27.81695246696472, "step": 321}
{"train_info/time_between_train_steps": 0.007711648941040039, "step": 321}
{"info/global_step": 322, "train_info/time_within_train_step": 27.84296226501465, "step": 322}
{"train_info/time_between_train_steps": 0.005304813385009766, "step": 322}
{"info/global_step": 323, "train_info/time_within_train_step": 27.82839345932007, "step": 323}
{"train_info/time_between_train_steps": 0.005267143249511719, "step": 323}
{"info/global_step": 324, "train_info/time_within_train_step": 27.816221714019775, "step": 324}
{"train_info/time_between_train_steps": 0.005320549011230469, "step": 324}
{"info/global_step": 325, "train_info/time_within_train_step": 27.8230721950531, "step": 325}
{"train_info/time_between_train_steps": 0.005298137664794922, "step": 325}
{"info/global_step": 326, "train_info/time_within_train_step": 27.771368741989136, "step": 326}
{"train_info/time_between_train_steps": 0.005594015121459961, "step": 326}
{"info/global_step": 327, "train_info/time_within_train_step": 27.819236755371094, "step": 327}
{"train_info/time_between_train_steps": 0.006115436553955078, "step": 327}
{"info/global_step": 328, "train_info/time_within_train_step": 27.937848806381226, "step": 328}
{"train_info/time_between_train_steps": 0.005316019058227539, "step": 328}
{"info/global_step": 329, "train_info/time_within_train_step": 27.803073167800903, "step": 329}
{"train_info/time_between_train_steps": 0.005259990692138672, "step": 329}
{"info/global_step": 330, "train_info/time_within_train_step": 27.794492483139038, "step": 330}
{"train_info/time_between_train_steps": 0.0053942203521728516, "step": 330}
{"info/global_step": 331, "train_info/time_within_train_step": 27.816240072250366, "step": 331}
{"train_info/time_between_train_steps": 0.0053441524505615234, "step": 331}
{"info/global_step": 332, "train_info/time_within_train_step": 27.857606172561646, "step": 332}
{"train_info/time_between_train_steps": 0.007731914520263672, "step": 332}
{"info/global_step": 333, "train_info/time_within_train_step": 27.845845222473145, "step": 333}
{"train_info/time_between_train_steps": 0.010374784469604492, "step": 333}
{"info/global_step": 334, "train_info/time_within_train_step": 27.82761549949646, "step": 334}
{"train_info/time_between_train_steps": 0.005481243133544922, "step": 334}
{"info/global_step": 335, "train_info/time_within_train_step": 27.854064226150513, "step": 335}
{"train_info/time_between_train_steps": 0.005603790283203125, "step": 335}
{"info/global_step": 336, "train_info/time_within_train_step": 27.810401439666748, "step": 336}
{"train_info/time_between_train_steps": 0.005883932113647461, "step": 336}
{"train_info/time_between_train_steps": 3.911999225616455, "step": 336}
{"info/global_step": 337, "train_info/time_within_train_step": 28.498860836029053, "step": 337}
{"train_info/time_between_train_steps": 0.005118370056152344, "step": 337}
{"info/global_step": 338, "train_info/time_within_train_step": 28.017695903778076, "step": 338}
{"train_info/time_between_train_steps": 0.005430936813354492, "step": 338}
{"info/global_step": 339, "train_info/time_within_train_step": 27.809843063354492, "step": 339}
{"train_info/time_between_train_steps": 0.005445241928100586, "step": 339}
{"info/global_step": 340, "train_info/time_within_train_step": 27.96132779121399, "step": 340}
{"train_info/time_between_train_steps": 0.005388021469116211, "step": 340}
{"info/global_step": 341, "train_info/time_within_train_step": 27.829780340194702, "step": 341}
{"train_info/time_between_train_steps": 0.005667448043823242, "step": 341}
{"info/global_step": 342, "train_info/time_within_train_step": 27.971843957901, "step": 342}
{"train_info/time_between_train_steps": 0.00546574592590332, "step": 342}
{"info/global_step": 343, "train_info/time_within_train_step": 27.79807949066162, "step": 343}
{"train_info/time_between_train_steps": 0.007794857025146484, "step": 343}
{"info/global_step": 344, "train_info/time_within_train_step": 28.047731399536133, "step": 344}
{"train_info/time_between_train_steps": 0.0054438114166259766, "step": 344}
{"info/global_step": 345, "train_info/time_within_train_step": 27.802197694778442, "step": 345}
{"train_info/time_between_train_steps": 0.005002737045288086, "step": 345}
{"info/global_step": 346, "train_info/time_within_train_step": 27.797529935836792, "step": 346}
{"train_info/time_between_train_steps": 0.00520777702331543, "step": 346}
{"info/global_step": 347, "train_info/time_within_train_step": 27.829097270965576, "step": 347}
{"train_info/time_between_train_steps": 0.0052492618560791016, "step": 347}
{"info/global_step": 348, "train_info/time_within_train_step": 27.77901816368103, "step": 348}
{"train_info/time_between_train_steps": 0.005113363265991211, "step": 348}
{"info/global_step": 349, "train_info/time_within_train_step": 27.772207260131836, "step": 349}
{"train_info/time_between_train_steps": 0.005302906036376953, "step": 349}
{"info/global_step": 350, "train_info/time_within_train_step": 27.816659450531006, "step": 350}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740831740, "_runtime": 9845}, "step": 350}
{"logs": {"train/loss": 4.2996, "train/learning_rate": 0.00047222222222222224, "train/epoch": 12.01, "_timestamp": 1740831740, "_runtime": 9845}, "step": 350}
{"train_info/time_between_train_steps": 0.011163711547851562, "step": 350}
{"info/global_step": 351, "train_info/time_within_train_step": 27.818705558776855, "step": 351}
{"train_info/time_between_train_steps": 0.005461692810058594, "step": 351}
{"info/global_step": 352, "train_info/time_within_train_step": 27.83040976524353, "step": 352}
{"train_info/time_between_train_steps": 0.005139827728271484, "step": 352}
{"info/global_step": 353, "train_info/time_within_train_step": 27.77718758583069, "step": 353}
{"train_info/time_between_train_steps": 0.005228281021118164, "step": 353}
{"info/global_step": 354, "train_info/time_within_train_step": 27.748903036117554, "step": 354}
{"train_info/time_between_train_steps": 0.005181789398193359, "step": 354}
{"info/global_step": 355, "train_info/time_within_train_step": 27.75320529937744, "step": 355}
{"train_info/time_between_train_steps": 0.010615110397338867, "step": 355}
{"info/global_step": 356, "train_info/time_within_train_step": 27.804503917694092, "step": 356}
{"train_info/time_between_train_steps": 0.009475946426391602, "step": 356}
{"info/global_step": 357, "train_info/time_within_train_step": 27.82391667366028, "step": 357}
{"train_info/time_between_train_steps": 0.005161285400390625, "step": 357}
{"info/global_step": 358, "train_info/time_within_train_step": 27.782827377319336, "step": 358}
{"train_info/time_between_train_steps": 0.006093263626098633, "step": 358}
{"info/global_step": 359, "train_info/time_within_train_step": 27.822960376739502, "step": 359}
{"train_info/time_between_train_steps": 0.005372047424316406, "step": 359}
{"info/global_step": 360, "train_info/time_within_train_step": 27.908743143081665, "step": 360}
{"train_info/time_between_train_steps": 0.01018834114074707, "step": 360}
{"info/global_step": 361, "train_info/time_within_train_step": 27.825236558914185, "step": 361}
{"train_info/time_between_train_steps": 0.010062456130981445, "step": 361}
{"info/global_step": 362, "train_info/time_within_train_step": 27.837830305099487, "step": 362}
{"train_info/time_between_train_steps": 0.0056498050689697266, "step": 362}
{"info/global_step": 363, "train_info/time_within_train_step": 27.84150743484497, "step": 363}
{"train_info/time_between_train_steps": 0.0057294368743896484, "step": 363}
{"info/global_step": 364, "train_info/time_within_train_step": 27.848509550094604, "step": 364}
{"train_info/time_between_train_steps": 0.01040029525756836, "step": 364}
{"train_info/time_between_train_steps": 4.238274097442627, "step": 364}
{"info/global_step": 365, "train_info/time_within_train_step": 27.772576570510864, "step": 365}
{"train_info/time_between_train_steps": 0.005392551422119141, "step": 365}
{"info/global_step": 366, "train_info/time_within_train_step": 27.8976628780365, "step": 366}
{"train_info/time_between_train_steps": 0.0074310302734375, "step": 366}
{"info/global_step": 367, "train_info/time_within_train_step": 27.843959093093872, "step": 367}
{"train_info/time_between_train_steps": 0.0056915283203125, "step": 367}
{"info/global_step": 368, "train_info/time_within_train_step": 27.87925386428833, "step": 368}
{"train_info/time_between_train_steps": 0.005292415618896484, "step": 368}
{"info/global_step": 369, "train_info/time_within_train_step": 27.82013773918152, "step": 369}
{"train_info/time_between_train_steps": 0.00539851188659668, "step": 369}
{"info/global_step": 370, "train_info/time_within_train_step": 28.026528358459473, "step": 370}
{"train_info/time_between_train_steps": 0.005397796630859375, "step": 370}
{"info/global_step": 371, "train_info/time_within_train_step": 27.813122272491455, "step": 371}
{"train_info/time_between_train_steps": 0.005189657211303711, "step": 371}
{"info/global_step": 372, "train_info/time_within_train_step": 27.89592170715332, "step": 372}
{"train_info/time_between_train_steps": 0.005476474761962891, "step": 372}
{"info/global_step": 373, "train_info/time_within_train_step": 27.820018529891968, "step": 373}
{"train_info/time_between_train_steps": 0.004967689514160156, "step": 373}
{"info/global_step": 374, "train_info/time_within_train_step": 27.80724787712097, "step": 374}
{"train_info/time_between_train_steps": 0.005506038665771484, "step": 374}
{"info/global_step": 375, "train_info/time_within_train_step": 27.935547351837158, "step": 375}
{"train_info/time_between_train_steps": 0.010229110717773438, "step": 375}
{"info/global_step": 376, "train_info/time_within_train_step": 27.75505781173706, "step": 376}
{"train_info/time_between_train_steps": 0.00516819953918457, "step": 376}
{"info/global_step": 377, "train_info/time_within_train_step": 27.821985483169556, "step": 377}
{"train_info/time_between_train_steps": 0.005696773529052734, "step": 377}
{"info/global_step": 378, "train_info/time_within_train_step": 27.861501932144165, "step": 378}
{"train_info/time_between_train_steps": 0.005278825759887695, "step": 378}
{"info/global_step": 379, "train_info/time_within_train_step": 27.837692975997925, "step": 379}
{"train_info/time_between_train_steps": 0.009562015533447266, "step": 379}
{"info/global_step": 380, "train_info/time_within_train_step": 27.821922779083252, "step": 380}
{"train_info/time_between_train_steps": 0.00896000862121582, "step": 380}
{"info/global_step": 381, "train_info/time_within_train_step": 27.808866500854492, "step": 381}
{"train_info/time_between_train_steps": 0.004957914352416992, "step": 381}
{"info/global_step": 382, "train_info/time_within_train_step": 27.747923612594604, "step": 382}
{"train_info/time_between_train_steps": 0.0050580501556396484, "step": 382}
{"info/global_step": 383, "train_info/time_within_train_step": 27.80599331855774, "step": 383}
{"train_info/time_between_train_steps": 0.005129814147949219, "step": 383}
{"info/global_step": 384, "train_info/time_within_train_step": 27.777913331985474, "step": 384}
{"train_info/time_between_train_steps": 0.0051784515380859375, "step": 384}
{"info/global_step": 385, "train_info/time_within_train_step": 27.795411348342896, "step": 385}
{"train_info/time_between_train_steps": 0.005185842514038086, "step": 385}
{"info/global_step": 386, "train_info/time_within_train_step": 27.81191372871399, "step": 386}
{"train_info/time_between_train_steps": 0.005458831787109375, "step": 386}
{"info/global_step": 387, "train_info/time_within_train_step": 27.803629636764526, "step": 387}
{"train_info/time_between_train_steps": 0.009408950805664062, "step": 387}
{"info/global_step": 388, "train_info/time_within_train_step": 27.768684148788452, "step": 388}
{"train_info/time_between_train_steps": 0.005213737487792969, "step": 388}
{"info/global_step": 389, "train_info/time_within_train_step": 27.79500436782837, "step": 389}
{"train_info/time_between_train_steps": 0.005029439926147461, "step": 389}
{"info/global_step": 390, "train_info/time_within_train_step": 27.796717643737793, "step": 390}
{"train_info/time_between_train_steps": 0.010134458541870117, "step": 390}
{"info/global_step": 391, "train_info/time_within_train_step": 27.897013187408447, "step": 391}
{"train_info/time_between_train_steps": 0.005170106887817383, "step": 391}
{"info/global_step": 392, "train_info/time_within_train_step": 27.825507640838623, "step": 392}
{"train_info/time_between_train_steps": 0.010344505310058594, "step": 392}
{"train_info/time_between_train_steps": 3.6825709342956543, "step": 392}
{"info/global_step": 393, "train_info/time_within_train_step": 27.792104244232178, "step": 393}
{"train_info/time_between_train_steps": 0.007442951202392578, "step": 393}
{"info/global_step": 394, "train_info/time_within_train_step": 27.978073358535767, "step": 394}
{"train_info/time_between_train_steps": 0.005191802978515625, "step": 394}
{"info/global_step": 395, "train_info/time_within_train_step": 27.81184196472168, "step": 395}
{"train_info/time_between_train_steps": 0.0054779052734375, "step": 395}
{"info/global_step": 396, "train_info/time_within_train_step": 27.926804065704346, "step": 396}
{"train_info/time_between_train_steps": 0.0053327083587646484, "step": 396}
{"info/global_step": 397, "train_info/time_within_train_step": 27.834290504455566, "step": 397}
{"train_info/time_between_train_steps": 0.005603790283203125, "step": 397}
{"info/global_step": 398, "train_info/time_within_train_step": 27.970906019210815, "step": 398}
{"train_info/time_between_train_steps": 0.005471944808959961, "step": 398}
{"info/global_step": 399, "train_info/time_within_train_step": 27.82743740081787, "step": 399}
{"train_info/time_between_train_steps": 0.006193876266479492, "step": 399}
{"info/global_step": 400, "train_info/time_within_train_step": 27.94221544265747, "step": 400}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740833140, "_runtime": 11245}, "step": 400}
{"logs": {"train/loss": 4.0981, "train/learning_rate": 0.00044444444444444436, "train/epoch": 14.01, "_timestamp": 1740833140, "_runtime": 11245}, "step": 400}
{"train_info/time_between_train_steps": 13.962942123413086, "step": 400}
{"info/global_step": 401, "train_info/time_within_train_step": 27.816324949264526, "step": 401}
{"train_info/time_between_train_steps": 0.005011558532714844, "step": 401}
{"info/global_step": 402, "train_info/time_within_train_step": 27.80419158935547, "step": 402}
{"train_info/time_between_train_steps": 0.005275249481201172, "step": 402}
{"info/global_step": 403, "train_info/time_within_train_step": 27.797324180603027, "step": 403}
{"train_info/time_between_train_steps": 0.005140542984008789, "step": 403}
{"info/global_step": 404, "train_info/time_within_train_step": 27.776463747024536, "step": 404}
{"train_info/time_between_train_steps": 0.005087852478027344, "step": 404}
{"info/global_step": 405, "train_info/time_within_train_step": 27.805121421813965, "step": 405}
{"train_info/time_between_train_steps": 0.0051805973052978516, "step": 405}
{"info/global_step": 406, "train_info/time_within_train_step": 27.765162706375122, "step": 406}
{"train_info/time_between_train_steps": 0.005120992660522461, "step": 406}
{"info/global_step": 407, "train_info/time_within_train_step": 27.874680757522583, "step": 407}
{"train_info/time_between_train_steps": 0.005329608917236328, "step": 407}
{"info/global_step": 408, "train_info/time_within_train_step": 27.83106756210327, "step": 408}
{"train_info/time_between_train_steps": 0.0051648616790771484, "step": 408}
{"info/global_step": 409, "train_info/time_within_train_step": 27.79146432876587, "step": 409}
{"train_info/time_between_train_steps": 0.005148410797119141, "step": 409}
{"info/global_step": 410, "train_info/time_within_train_step": 27.8564395904541, "step": 410}
{"train_info/time_between_train_steps": 0.005348920822143555, "step": 410}
{"info/global_step": 411, "train_info/time_within_train_step": 27.78473997116089, "step": 411}
{"train_info/time_between_train_steps": 0.005171537399291992, "step": 411}
{"info/global_step": 412, "train_info/time_within_train_step": 27.84813952445984, "step": 412}
{"train_info/time_between_train_steps": 0.005267143249511719, "step": 412}
{"info/global_step": 413, "train_info/time_within_train_step": 27.82337498664856, "step": 413}
{"train_info/time_between_train_steps": 0.00797414779663086, "step": 413}
{"info/global_step": 414, "train_info/time_within_train_step": 27.812015771865845, "step": 414}
{"train_info/time_between_train_steps": 0.006387948989868164, "step": 414}
{"info/global_step": 415, "train_info/time_within_train_step": 27.851624727249146, "step": 415}
{"train_info/time_between_train_steps": 0.005277156829833984, "step": 415}
{"info/global_step": 416, "train_info/time_within_train_step": 27.752774953842163, "step": 416}
{"train_info/time_between_train_steps": 0.0052645206451416016, "step": 416}
{"info/global_step": 417, "train_info/time_within_train_step": 27.807173490524292, "step": 417}
{"train_info/time_between_train_steps": 0.005285739898681641, "step": 417}
{"info/global_step": 418, "train_info/time_within_train_step": 27.795528650283813, "step": 418}
{"train_info/time_between_train_steps": 0.005315542221069336, "step": 418}
{"info/global_step": 419, "train_info/time_within_train_step": 27.809530019760132, "step": 419}
{"train_info/time_between_train_steps": 0.009289264678955078, "step": 419}
{"info/global_step": 420, "train_info/time_within_train_step": 27.84631061553955, "step": 420}
{"train_info/time_between_train_steps": 0.005857229232788086, "step": 420}
{"train_info/time_between_train_steps": 3.893141508102417, "step": 420}
{"info/global_step": 421, "train_info/time_within_train_step": 27.8202702999115, "step": 421}
{"train_info/time_between_train_steps": 0.009581565856933594, "step": 421}
{"info/global_step": 422, "train_info/time_within_train_step": 28.12226939201355, "step": 422}
{"train_info/time_between_train_steps": 0.005477190017700195, "step": 422}
{"info/global_step": 423, "train_info/time_within_train_step": 27.85039758682251, "step": 423}
{"train_info/time_between_train_steps": 0.005316734313964844, "step": 423}
{"info/global_step": 424, "train_info/time_within_train_step": 27.90130305290222, "step": 424}
{"train_info/time_between_train_steps": 0.005499839782714844, "step": 424}
{"info/global_step": 425, "train_info/time_within_train_step": 27.82666516304016, "step": 425}
{"train_info/time_between_train_steps": 0.005461692810058594, "step": 425}
{"info/global_step": 426, "train_info/time_within_train_step": 27.975325345993042, "step": 426}
{"train_info/time_between_train_steps": 0.006384134292602539, "step": 426}
{"info/global_step": 427, "train_info/time_within_train_step": 27.853139638900757, "step": 427}
{"train_info/time_between_train_steps": 0.0053522586822509766, "step": 427}
{"info/global_step": 428, "train_info/time_within_train_step": 27.903920650482178, "step": 428}
{"train_info/time_between_train_steps": 0.00542902946472168, "step": 428}
{"info/global_step": 429, "train_info/time_within_train_step": 27.85896372795105, "step": 429}
{"train_info/time_between_train_steps": 0.00504302978515625, "step": 429}
{"info/global_step": 430, "train_info/time_within_train_step": 27.79951286315918, "step": 430}
{"train_info/time_between_train_steps": 0.0053675174713134766, "step": 430}
{"info/global_step": 431, "train_info/time_within_train_step": 27.81152367591858, "step": 431}
{"train_info/time_between_train_steps": 0.007695198059082031, "step": 431}
{"info/global_step": 432, "train_info/time_within_train_step": 27.76431918144226, "step": 432}
{"train_info/time_between_train_steps": 0.005375385284423828, "step": 432}
{"info/global_step": 433, "train_info/time_within_train_step": 27.760913848876953, "step": 433}
{"train_info/time_between_train_steps": 0.00510716438293457, "step": 433}
{"info/global_step": 434, "train_info/time_within_train_step": 27.78481698036194, "step": 434}
{"train_info/time_between_train_steps": 0.00711369514465332, "step": 434}
{"info/global_step": 435, "train_info/time_within_train_step": 27.817137002944946, "step": 435}
{"train_info/time_between_train_steps": 0.00522923469543457, "step": 435}
{"info/global_step": 436, "train_info/time_within_train_step": 27.787460327148438, "step": 436}
{"train_info/time_between_train_steps": 0.009846925735473633, "step": 436}
{"info/global_step": 437, "train_info/time_within_train_step": 27.798141956329346, "step": 437}
{"train_info/time_between_train_steps": 0.005104780197143555, "step": 437}
{"info/global_step": 438, "train_info/time_within_train_step": 27.932321548461914, "step": 438}
{"train_info/time_between_train_steps": 0.007953166961669922, "step": 438}
{"info/global_step": 439, "train_info/time_within_train_step": 27.819528102874756, "step": 439}
{"train_info/time_between_train_steps": 0.005600690841674805, "step": 439}
{"info/global_step": 440, "train_info/time_within_train_step": 27.841899871826172, "step": 440}
{"train_info/time_between_train_steps": 0.00618743896484375, "step": 440}
{"info/global_step": 441, "train_info/time_within_train_step": 27.81983995437622, "step": 441}
{"train_info/time_between_train_steps": 0.005223989486694336, "step": 441}
{"info/global_step": 442, "train_info/time_within_train_step": 27.78586483001709, "step": 442}
{"train_info/time_between_train_steps": 0.005301475524902344, "step": 442}
{"info/global_step": 443, "train_info/time_within_train_step": 27.806952714920044, "step": 443}
{"train_info/time_between_train_steps": 0.008636713027954102, "step": 443}
{"info/global_step": 444, "train_info/time_within_train_step": 27.79621911048889, "step": 444}
{"train_info/time_between_train_steps": 0.005231142044067383, "step": 444}
{"info/global_step": 445, "train_info/time_within_train_step": 27.780028820037842, "step": 445}
{"train_info/time_between_train_steps": 0.007645845413208008, "step": 445}
{"info/global_step": 446, "train_info/time_within_train_step": 27.8197660446167, "step": 446}
{"train_info/time_between_train_steps": 0.005456686019897461, "step": 446}
{"info/global_step": 447, "train_info/time_within_train_step": 27.85206890106201, "step": 447}
{"train_info/time_between_train_steps": 0.005875349044799805, "step": 447}
{"info/global_step": 448, "train_info/time_within_train_step": 27.853067636489868, "step": 448}
{"train_info/time_between_train_steps": 0.0056116580963134766, "step": 448}
{"train_info/time_between_train_steps": 3.9857985973358154, "step": 448}
{"info/global_step": 449, "train_info/time_within_train_step": 27.829267024993896, "step": 449}
{"train_info/time_between_train_steps": 0.008216619491577148, "step": 449}
{"info/global_step": 450, "train_info/time_within_train_step": 27.927269220352173, "step": 450}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740834554, "_runtime": 12659}, "step": 450}
{"logs": {"train/loss": 3.9387, "train/learning_rate": 0.00041666666666666664, "train/epoch": 16.0, "_timestamp": 1740834554, "_runtime": 12659}, "step": 450}
{"train_info/time_between_train_steps": 0.013326168060302734, "step": 450}
{"info/global_step": 451, "train_info/time_within_train_step": 27.79821538925171, "step": 451}
{"train_info/time_between_train_steps": 0.007770061492919922, "step": 451}
{"info/global_step": 452, "train_info/time_within_train_step": 27.907159090042114, "step": 452}
{"train_info/time_between_train_steps": 0.005431413650512695, "step": 452}
{"info/global_step": 453, "train_info/time_within_train_step": 27.883275032043457, "step": 453}
{"train_info/time_between_train_steps": 0.0053560733795166016, "step": 453}
{"info/global_step": 454, "train_info/time_within_train_step": 28.003644704818726, "step": 454}
{"train_info/time_between_train_steps": 0.0054302215576171875, "step": 454}
{"info/global_step": 455, "train_info/time_within_train_step": 27.785566806793213, "step": 455}
{"train_info/time_between_train_steps": 0.005350589752197266, "step": 455}
{"info/global_step": 456, "train_info/time_within_train_step": 27.924084186553955, "step": 456}
{"train_info/time_between_train_steps": 0.0056912899017333984, "step": 456}
{"info/global_step": 457, "train_info/time_within_train_step": 27.828535079956055, "step": 457}
{"train_info/time_between_train_steps": 0.005269050598144531, "step": 457}
{"info/global_step": 458, "train_info/time_within_train_step": 27.80317783355713, "step": 458}
{"train_info/time_between_train_steps": 0.005352020263671875, "step": 458}
{"info/global_step": 459, "train_info/time_within_train_step": 27.801265239715576, "step": 459}
{"train_info/time_between_train_steps": 0.0054247379302978516, "step": 459}
{"info/global_step": 460, "train_info/time_within_train_step": 27.761361598968506, "step": 460}
{"train_info/time_between_train_steps": 0.005769491195678711, "step": 460}
{"info/global_step": 461, "train_info/time_within_train_step": 27.804556131362915, "step": 461}
{"train_info/time_between_train_steps": 0.005063533782958984, "step": 461}
{"info/global_step": 462, "train_info/time_within_train_step": 27.841058254241943, "step": 462}
{"train_info/time_between_train_steps": 0.005223989486694336, "step": 462}
{"info/global_step": 463, "train_info/time_within_train_step": 27.816059350967407, "step": 463}
{"train_info/time_between_train_steps": 0.009747028350830078, "step": 463}
{"info/global_step": 464, "train_info/time_within_train_step": 27.794799089431763, "step": 464}
{"train_info/time_between_train_steps": 0.009858369827270508, "step": 464}
{"info/global_step": 465, "train_info/time_within_train_step": 27.80543851852417, "step": 465}
{"train_info/time_between_train_steps": 0.005103349685668945, "step": 465}
{"info/global_step": 466, "train_info/time_within_train_step": 27.802227020263672, "step": 466}
{"train_info/time_between_train_steps": 0.005223989486694336, "step": 466}
{"info/global_step": 467, "train_info/time_within_train_step": 27.81628441810608, "step": 467}
{"train_info/time_between_train_steps": 0.005274295806884766, "step": 467}
{"info/global_step": 468, "train_info/time_within_train_step": 27.788817167282104, "step": 468}
{"train_info/time_between_train_steps": 0.005275726318359375, "step": 468}
{"info/global_step": 469, "train_info/time_within_train_step": 27.896835327148438, "step": 469}
{"train_info/time_between_train_steps": 0.010222911834716797, "step": 469}
{"info/global_step": 470, "train_info/time_within_train_step": 27.800848484039307, "step": 470}
{"train_info/time_between_train_steps": 0.009857177734375, "step": 470}
{"info/global_step": 471, "train_info/time_within_train_step": 27.82248592376709, "step": 471}
{"train_info/time_between_train_steps": 0.00552058219909668, "step": 471}
{"info/global_step": 472, "train_info/time_within_train_step": 27.795007467269897, "step": 472}
{"train_info/time_between_train_steps": 0.007572174072265625, "step": 472}
{"info/global_step": 473, "train_info/time_within_train_step": 27.835232257843018, "step": 473}
{"train_info/time_between_train_steps": 0.005255222320556641, "step": 473}
{"info/global_step": 474, "train_info/time_within_train_step": 27.84242010116577, "step": 474}
{"train_info/time_between_train_steps": 0.008123397827148438, "step": 474}
{"info/global_step": 475, "train_info/time_within_train_step": 27.845481872558594, "step": 475}
{"train_info/time_between_train_steps": 0.009835004806518555, "step": 475}
{"info/global_step": 476, "train_info/time_within_train_step": 27.86538076400757, "step": 476}
{"train_info/time_between_train_steps": 0.006052970886230469, "step": 476}
{"train_info/time_between_train_steps": 3.6352367401123047, "step": 476}
{"info/global_step": 477, "train_info/time_within_train_step": 27.806535959243774, "step": 477}
{"train_info/time_between_train_steps": 0.0056304931640625, "step": 477}
{"info/global_step": 478, "train_info/time_within_train_step": 27.975430011749268, "step": 478}
{"train_info/time_between_train_steps": 0.00647425651550293, "step": 478}
{"info/global_step": 479, "train_info/time_within_train_step": 27.80760407447815, "step": 479}
{"train_info/time_between_train_steps": 0.0056531429290771484, "step": 479}
{"info/global_step": 480, "train_info/time_within_train_step": 28.02502202987671, "step": 480}
{"train_info/time_between_train_steps": 0.00544428825378418, "step": 480}
{"info/global_step": 481, "train_info/time_within_train_step": 27.856618642807007, "step": 481}
{"train_info/time_between_train_steps": 0.015325784683227539, "step": 481}
{"info/global_step": 482, "train_info/time_within_train_step": 27.993900537490845, "step": 482}
{"train_info/time_between_train_steps": 0.009823799133300781, "step": 482}
{"info/global_step": 483, "train_info/time_within_train_step": 27.806763648986816, "step": 483}
{"train_info/time_between_train_steps": 0.008490562438964844, "step": 483}
{"info/global_step": 484, "train_info/time_within_train_step": 27.919288873672485, "step": 484}
{"train_info/time_between_train_steps": 0.0054705142974853516, "step": 484}
{"info/global_step": 485, "train_info/time_within_train_step": 27.942620038986206, "step": 485}
{"train_info/time_between_train_steps": 0.010010242462158203, "step": 485}
{"info/global_step": 486, "train_info/time_within_train_step": 27.785045623779297, "step": 486}
{"train_info/time_between_train_steps": 0.007460832595825195, "step": 486}
{"info/global_step": 487, "train_info/time_within_train_step": 27.796478509902954, "step": 487}
{"train_info/time_between_train_steps": 0.009807348251342773, "step": 487}
{"info/global_step": 488, "train_info/time_within_train_step": 27.800060510635376, "step": 488}
{"train_info/time_between_train_steps": 0.0051844120025634766, "step": 488}
{"info/global_step": 489, "train_info/time_within_train_step": 27.755393743515015, "step": 489}
{"train_info/time_between_train_steps": 0.005067586898803711, "step": 489}
{"info/global_step": 490, "train_info/time_within_train_step": 27.74203085899353, "step": 490}
{"train_info/time_between_train_steps": 0.005011081695556641, "step": 490}
{"info/global_step": 491, "train_info/time_within_train_step": 27.780775547027588, "step": 491}
{"train_info/time_between_train_steps": 0.005237579345703125, "step": 491}
{"info/global_step": 492, "train_info/time_within_train_step": 27.79423499107361, "step": 492}
{"train_info/time_between_train_steps": 0.00499272346496582, "step": 492}
{"info/global_step": 493, "train_info/time_within_train_step": 27.821685314178467, "step": 493}
{"train_info/time_between_train_steps": 0.009612798690795898, "step": 493}
{"info/global_step": 494, "train_info/time_within_train_step": 27.809882640838623, "step": 494}
{"train_info/time_between_train_steps": 0.005291938781738281, "step": 494}
{"info/global_step": 495, "train_info/time_within_train_step": 27.812567472457886, "step": 495}
{"train_info/time_between_train_steps": 0.005208492279052734, "step": 495}
{"info/global_step": 496, "train_info/time_within_train_step": 27.80254316329956, "step": 496}
{"train_info/time_between_train_steps": 0.0055615901947021484, "step": 496}
{"info/global_step": 497, "train_info/time_within_train_step": 27.776583671569824, "step": 497}
{"train_info/time_between_train_steps": 0.007685184478759766, "step": 497}
{"info/global_step": 498, "train_info/time_within_train_step": 27.798020362854004, "step": 498}
{"train_info/time_between_train_steps": 0.0052874088287353516, "step": 498}
{"info/global_step": 499, "train_info/time_within_train_step": 27.784963846206665, "step": 499}
{"train_info/time_between_train_steps": 0.005234241485595703, "step": 499}
{"info/global_step": 500, "train_info/time_within_train_step": 27.86127233505249, "step": 500}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740835950, "_runtime": 14055}, "step": 500}
{"logs": {"train/loss": 3.8085, "train/learning_rate": 0.00038888888888888887, "train/epoch": 17.02, "_timestamp": 1740835950, "_runtime": 14055}, "step": 500}
{"train_info/time_between_train_steps": 14.189197778701782, "step": 500}
{"info/global_step": 501, "train_info/time_within_train_step": 27.846189975738525, "step": 501}
{"train_info/time_between_train_steps": 0.005236625671386719, "step": 501}
{"info/global_step": 502, "train_info/time_within_train_step": 27.775885820388794, "step": 502}
{"train_info/time_between_train_steps": 0.0054929256439208984, "step": 502}
{"info/global_step": 503, "train_info/time_within_train_step": 27.830585718154907, "step": 503}
{"train_info/time_between_train_steps": 0.010839462280273438, "step": 503}
{"info/global_step": 504, "train_info/time_within_train_step": 27.840182781219482, "step": 504}
{"train_info/time_between_train_steps": 0.009620189666748047, "step": 504}
{"train_info/time_between_train_steps": 3.6857614517211914, "step": 504}
{"info/global_step": 505, "train_info/time_within_train_step": 27.77082633972168, "step": 505}
{"train_info/time_between_train_steps": 0.005463361740112305, "step": 505}
{"info/global_step": 506, "train_info/time_within_train_step": 27.92387056350708, "step": 506}
{"train_info/time_between_train_steps": 0.007948160171508789, "step": 506}
{"info/global_step": 507, "train_info/time_within_train_step": 27.801214933395386, "step": 507}
{"train_info/time_between_train_steps": 0.0053632259368896484, "step": 507}
{"info/global_step": 508, "train_info/time_within_train_step": 27.954480409622192, "step": 508}
{"train_info/time_between_train_steps": 0.005246400833129883, "step": 508}
{"info/global_step": 509, "train_info/time_within_train_step": 27.81925129890442, "step": 509}
{"train_info/time_between_train_steps": 0.0062177181243896484, "step": 509}
{"info/global_step": 510, "train_info/time_within_train_step": 27.948535919189453, "step": 510}
{"train_info/time_between_train_steps": 0.005423784255981445, "step": 510}
{"info/global_step": 511, "train_info/time_within_train_step": 27.82804846763611, "step": 511}
{"train_info/time_between_train_steps": 0.0052797794342041016, "step": 511}
{"info/global_step": 512, "train_info/time_within_train_step": 27.813592433929443, "step": 512}
{"train_info/time_between_train_steps": 0.005196332931518555, "step": 512}
{"info/global_step": 513, "train_info/time_within_train_step": 27.812912940979004, "step": 513}
{"train_info/time_between_train_steps": 0.005298137664794922, "step": 513}
{"info/global_step": 514, "train_info/time_within_train_step": 27.754926204681396, "step": 514}
{"train_info/time_between_train_steps": 0.00513768196105957, "step": 514}
{"info/global_step": 515, "train_info/time_within_train_step": 27.781287908554077, "step": 515}
{"train_info/time_between_train_steps": 0.005138874053955078, "step": 515}
{"info/global_step": 516, "train_info/time_within_train_step": 27.862929344177246, "step": 516}
{"train_info/time_between_train_steps": 0.0052356719970703125, "step": 516}
{"info/global_step": 517, "train_info/time_within_train_step": 27.80831289291382, "step": 517}
{"train_info/time_between_train_steps": 0.0050394535064697266, "step": 517}
{"info/global_step": 518, "train_info/time_within_train_step": 27.82653546333313, "step": 518}
{"train_info/time_between_train_steps": 0.0054051876068115234, "step": 518}
{"info/global_step": 519, "train_info/time_within_train_step": 27.825673818588257, "step": 519}
{"train_info/time_between_train_steps": 0.009766340255737305, "step": 519}
{"info/global_step": 520, "train_info/time_within_train_step": 27.79369592666626, "step": 520}
{"train_info/time_between_train_steps": 0.005113840103149414, "step": 520}
{"info/global_step": 521, "train_info/time_within_train_step": 27.8018536567688, "step": 521}
{"train_info/time_between_train_steps": 0.0052068233489990234, "step": 521}
{"info/global_step": 522, "train_info/time_within_train_step": 27.811406135559082, "step": 522}
{"train_info/time_between_train_steps": 0.0050699710845947266, "step": 522}
{"info/global_step": 523, "train_info/time_within_train_step": 27.77441930770874, "step": 523}
{"train_info/time_between_train_steps": 0.005243778228759766, "step": 523}
{"info/global_step": 524, "train_info/time_within_train_step": 27.801734447479248, "step": 524}
{"train_info/time_between_train_steps": 0.0076487064361572266, "step": 524}
{"info/global_step": 525, "train_info/time_within_train_step": 27.842828512191772, "step": 525}
{"train_info/time_between_train_steps": 0.005228281021118164, "step": 525}
{"info/global_step": 526, "train_info/time_within_train_step": 27.795531749725342, "step": 526}
{"train_info/time_between_train_steps": 0.005317211151123047, "step": 526}
{"info/global_step": 527, "train_info/time_within_train_step": 27.802194118499756, "step": 527}
{"train_info/time_between_train_steps": 0.006566286087036133, "step": 527}
{"info/global_step": 528, "train_info/time_within_train_step": 27.843257665634155, "step": 528}
{"train_info/time_between_train_steps": 0.009439468383789062, "step": 528}
{"info/global_step": 529, "train_info/time_within_train_step": 27.814422130584717, "step": 529}
{"train_info/time_between_train_steps": 0.00522923469543457, "step": 529}
{"info/global_step": 530, "train_info/time_within_train_step": 27.807762622833252, "step": 530}
{"train_info/time_between_train_steps": 0.005517721176147461, "step": 530}
{"info/global_step": 531, "train_info/time_within_train_step": 27.932082891464233, "step": 531}
{"train_info/time_between_train_steps": 0.005388498306274414, "step": 531}
{"info/global_step": 532, "train_info/time_within_train_step": 27.80071234703064, "step": 532}
{"train_info/time_between_train_steps": 0.00588536262512207, "step": 532}
{"train_info/time_between_train_steps": 3.921175241470337, "step": 532}
{"info/global_step": 533, "train_info/time_within_train_step": 27.80641508102417, "step": 533}
{"train_info/time_between_train_steps": 0.0077326297760009766, "step": 533}
{"info/global_step": 534, "train_info/time_within_train_step": 27.92051362991333, "step": 534}
{"train_info/time_between_train_steps": 0.005048036575317383, "step": 534}
{"info/global_step": 535, "train_info/time_within_train_step": 27.809017658233643, "step": 535}
{"train_info/time_between_train_steps": 0.005477190017700195, "step": 535}
{"info/global_step": 536, "train_info/time_within_train_step": 27.928197383880615, "step": 536}
{"train_info/time_between_train_steps": 0.005392789840698242, "step": 536}
{"info/global_step": 537, "train_info/time_within_train_step": 27.79922890663147, "step": 537}
{"train_info/time_between_train_steps": 0.005380392074584961, "step": 537}
{"info/global_step": 538, "train_info/time_within_train_step": 27.951085805892944, "step": 538}
{"train_info/time_between_train_steps": 0.009943008422851562, "step": 538}
{"info/global_step": 539, "train_info/time_within_train_step": 27.799713611602783, "step": 539}
{"train_info/time_between_train_steps": 0.006931781768798828, "step": 539}
{"info/global_step": 540, "train_info/time_within_train_step": 27.879247426986694, "step": 540}
{"train_info/time_between_train_steps": 0.006857872009277344, "step": 540}
{"info/global_step": 541, "train_info/time_within_train_step": 27.811657190322876, "step": 541}
{"train_info/time_between_train_steps": 0.007334709167480469, "step": 541}
{"info/global_step": 542, "train_info/time_within_train_step": 27.810797452926636, "step": 542}
{"train_info/time_between_train_steps": 0.005156517028808594, "step": 542}
{"info/global_step": 543, "train_info/time_within_train_step": 27.787402629852295, "step": 543}
{"train_info/time_between_train_steps": 0.005177974700927734, "step": 543}
{"info/global_step": 544, "train_info/time_within_train_step": 27.786525011062622, "step": 544}
{"train_info/time_between_train_steps": 0.005178213119506836, "step": 544}
{"info/global_step": 545, "train_info/time_within_train_step": 27.774317741394043, "step": 545}
{"train_info/time_between_train_steps": 0.00507664680480957, "step": 545}
{"info/global_step": 546, "train_info/time_within_train_step": 27.79187297821045, "step": 546}
{"train_info/time_between_train_steps": 0.005164146423339844, "step": 546}
{"info/global_step": 547, "train_info/time_within_train_step": 27.918724298477173, "step": 547}
{"train_info/time_between_train_steps": 0.0076122283935546875, "step": 547}
{"info/global_step": 548, "train_info/time_within_train_step": 27.769433736801147, "step": 548}
{"train_info/time_between_train_steps": 0.005136966705322266, "step": 548}
{"info/global_step": 549, "train_info/time_within_train_step": 27.797597885131836, "step": 549}
{"train_info/time_between_train_steps": 0.005051612854003906, "step": 549}
{"info/global_step": 550, "train_info/time_within_train_step": 27.810226440429688, "step": 550}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740837364, "_runtime": 15469}, "step": 550}
{"logs": {"train/loss": 3.7016, "train/learning_rate": 0.0003611111111111111, "train/epoch": 19.02, "_timestamp": 1740837364, "_runtime": 15469}, "step": 550}
{"train_info/time_between_train_steps": 0.013922929763793945, "step": 550}
{"info/global_step": 551, "train_info/time_within_train_step": 27.828412771224976, "step": 551}
{"train_info/time_between_train_steps": 0.0052759647369384766, "step": 551}
{"info/global_step": 552, "train_info/time_within_train_step": 27.840587377548218, "step": 552}
{"train_info/time_between_train_steps": 0.0051958560943603516, "step": 552}
{"info/global_step": 553, "train_info/time_within_train_step": 27.78309965133667, "step": 553}
{"train_info/time_between_train_steps": 0.005398750305175781, "step": 553}
{"info/global_step": 554, "train_info/time_within_train_step": 27.836289644241333, "step": 554}
{"train_info/time_between_train_steps": 0.00985860824584961, "step": 554}
{"info/global_step": 555, "train_info/time_within_train_step": 27.805938482284546, "step": 555}
{"train_info/time_between_train_steps": 0.0052754878997802734, "step": 555}
{"info/global_step": 556, "train_info/time_within_train_step": 27.776400566101074, "step": 556}
{"train_info/time_between_train_steps": 0.00528717041015625, "step": 556}
{"info/global_step": 557, "train_info/time_within_train_step": 27.81393027305603, "step": 557}
{"train_info/time_between_train_steps": 0.00741267204284668, "step": 557}
{"info/global_step": 558, "train_info/time_within_train_step": 27.797611951828003, "step": 558}
{"train_info/time_between_train_steps": 0.010162830352783203, "step": 558}
{"info/global_step": 559, "train_info/time_within_train_step": 27.814342737197876, "step": 559}
{"train_info/time_between_train_steps": 0.006814002990722656, "step": 559}
{"info/global_step": 560, "train_info/time_within_train_step": 27.85678505897522, "step": 560}
{"train_info/time_between_train_steps": 0.005997896194458008, "step": 560}
{"train_info/time_between_train_steps": 3.6320512294769287, "step": 560}
{"info/global_step": 561, "train_info/time_within_train_step": 27.869420051574707, "step": 561}
{"train_info/time_between_train_steps": 0.005085945129394531, "step": 561}
{"info/global_step": 562, "train_info/time_within_train_step": 27.94179606437683, "step": 562}
{"train_info/time_between_train_steps": 0.005536079406738281, "step": 562}
{"info/global_step": 563, "train_info/time_within_train_step": 27.919126749038696, "step": 563}
{"train_info/time_between_train_steps": 0.0065920352935791016, "step": 563}
{"info/global_step": 564, "train_info/time_within_train_step": 27.935136556625366, "step": 564}
{"train_info/time_between_train_steps": 0.005553007125854492, "step": 564}
{"info/global_step": 565, "train_info/time_within_train_step": 27.971998929977417, "step": 565}
{"train_info/time_between_train_steps": 0.0054607391357421875, "step": 565}
{"info/global_step": 566, "train_info/time_within_train_step": 27.96735668182373, "step": 566}
{"train_info/time_between_train_steps": 0.0055637359619140625, "step": 566}
{"info/global_step": 567, "train_info/time_within_train_step": 27.82014536857605, "step": 567}
{"train_info/time_between_train_steps": 0.005860805511474609, "step": 567}
{"info/global_step": 568, "train_info/time_within_train_step": 27.925113677978516, "step": 568}
{"train_info/time_between_train_steps": 0.0052187442779541016, "step": 568}
{"info/global_step": 569, "train_info/time_within_train_step": 27.86826491355896, "step": 569}
{"train_info/time_between_train_steps": 0.005105257034301758, "step": 569}
{"info/global_step": 570, "train_info/time_within_train_step": 27.798211574554443, "step": 570}
{"train_info/time_between_train_steps": 0.00960230827331543, "step": 570}
{"info/global_step": 571, "train_info/time_within_train_step": 27.808173179626465, "step": 571}
{"train_info/time_between_train_steps": 0.008716583251953125, "step": 571}
{"info/global_step": 572, "train_info/time_within_train_step": 27.80329418182373, "step": 572}
{"train_info/time_between_train_steps": 0.005250692367553711, "step": 572}
{"info/global_step": 573, "train_info/time_within_train_step": 27.798349380493164, "step": 573}
{"train_info/time_between_train_steps": 0.009621620178222656, "step": 573}
{"info/global_step": 574, "train_info/time_within_train_step": 27.76245903968811, "step": 574}
{"train_info/time_between_train_steps": 0.0051882266998291016, "step": 574}
{"info/global_step": 575, "train_info/time_within_train_step": 27.746220350265503, "step": 575}
{"train_info/time_between_train_steps": 0.005034685134887695, "step": 575}
{"info/global_step": 576, "train_info/time_within_train_step": 27.772531032562256, "step": 576}
{"train_info/time_between_train_steps": 0.005316019058227539, "step": 576}
{"info/global_step": 577, "train_info/time_within_train_step": 27.809699296951294, "step": 577}
{"train_info/time_between_train_steps": 0.005946636199951172, "step": 577}
{"info/global_step": 578, "train_info/time_within_train_step": 27.918071508407593, "step": 578}
{"train_info/time_between_train_steps": 0.005196809768676758, "step": 578}
{"info/global_step": 579, "train_info/time_within_train_step": 27.81370496749878, "step": 579}
{"train_info/time_between_train_steps": 0.005186796188354492, "step": 579}
{"info/global_step": 580, "train_info/time_within_train_step": 27.822216749191284, "step": 580}
{"train_info/time_between_train_steps": 0.009512662887573242, "step": 580}
{"info/global_step": 581, "train_info/time_within_train_step": 27.800208568572998, "step": 581}
{"train_info/time_between_train_steps": 0.00524592399597168, "step": 581}
{"info/global_step": 582, "train_info/time_within_train_step": 27.79184317588806, "step": 582}
{"train_info/time_between_train_steps": 0.005330562591552734, "step": 582}
{"info/global_step": 583, "train_info/time_within_train_step": 27.8177752494812, "step": 583}
{"train_info/time_between_train_steps": 0.0053865909576416016, "step": 583}
{"info/global_step": 584, "train_info/time_within_train_step": 27.814644813537598, "step": 584}
{"train_info/time_between_train_steps": 0.005282402038574219, "step": 584}
{"info/global_step": 585, "train_info/time_within_train_step": 27.791556119918823, "step": 585}
{"train_info/time_between_train_steps": 0.005332469940185547, "step": 585}
{"info/global_step": 586, "train_info/time_within_train_step": 27.819555521011353, "step": 586}
{"train_info/time_between_train_steps": 0.005488395690917969, "step": 586}
{"info/global_step": 587, "train_info/time_within_train_step": 27.84312677383423, "step": 587}
{"train_info/time_between_train_steps": 0.005765438079833984, "step": 587}
{"info/global_step": 588, "train_info/time_within_train_step": 27.850248336791992, "step": 588}
{"train_info/time_between_train_steps": 0.006056547164916992, "step": 588}
{"train_info/time_between_train_steps": 3.719479560852051, "step": 588}
{"info/global_step": 589, "train_info/time_within_train_step": 27.84113597869873, "step": 589}
{"train_info/time_between_train_steps": 0.005689382553100586, "step": 589}
{"info/global_step": 590, "train_info/time_within_train_step": 27.943331718444824, "step": 590}
{"train_info/time_between_train_steps": 0.0053331851959228516, "step": 590}
{"info/global_step": 591, "train_info/time_within_train_step": 27.833431243896484, "step": 591}
{"train_info/time_between_train_steps": 0.0052776336669921875, "step": 591}
{"info/global_step": 592, "train_info/time_within_train_step": 28.002939462661743, "step": 592}
{"train_info/time_between_train_steps": 0.005844593048095703, "step": 592}
{"info/global_step": 593, "train_info/time_within_train_step": 27.83576726913452, "step": 593}
{"train_info/time_between_train_steps": 0.005354404449462891, "step": 593}
{"info/global_step": 594, "train_info/time_within_train_step": 28.05852437019348, "step": 594}
{"train_info/time_between_train_steps": 0.010487079620361328, "step": 594}
{"info/global_step": 595, "train_info/time_within_train_step": 27.810911178588867, "step": 595}
{"train_info/time_between_train_steps": 0.01036381721496582, "step": 595}
{"info/global_step": 596, "train_info/time_within_train_step": 27.857080936431885, "step": 596}
{"train_info/time_between_train_steps": 0.005234718322753906, "step": 596}
{"info/global_step": 597, "train_info/time_within_train_step": 27.76921582221985, "step": 597}
{"train_info/time_between_train_steps": 0.007447004318237305, "step": 597}
{"info/global_step": 598, "train_info/time_within_train_step": 27.8084614276886, "step": 598}
{"train_info/time_between_train_steps": 0.005301713943481445, "step": 598}
{"info/global_step": 599, "train_info/time_within_train_step": 27.820078134536743, "step": 599}
{"train_info/time_between_train_steps": 0.00519871711730957, "step": 599}
{"info/global_step": 600, "train_info/time_within_train_step": 27.768131256103516, "step": 600}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740838764, "_runtime": 16869}, "step": 600}
{"logs": {"train/loss": 3.6041, "train/learning_rate": 0.0003333333333333333, "train/epoch": 21.01, "_timestamp": 1740838764, "_runtime": 16869}, "step": 600}
{"train_info/time_between_train_steps": 13.920995473861694, "step": 600}
{"info/global_step": 601, "train_info/time_within_train_step": 27.771422386169434, "step": 601}
{"train_info/time_between_train_steps": 0.005070686340332031, "step": 601}
{"info/global_step": 602, "train_info/time_within_train_step": 27.76831293106079, "step": 602}
{"train_info/time_between_train_steps": 0.005098819732666016, "step": 602}
{"info/global_step": 603, "train_info/time_within_train_step": 27.805000066757202, "step": 603}
{"train_info/time_between_train_steps": 0.0051479339599609375, "step": 603}
{"info/global_step": 604, "train_info/time_within_train_step": 27.824710369110107, "step": 604}
{"train_info/time_between_train_steps": 0.005010128021240234, "step": 604}
{"info/global_step": 605, "train_info/time_within_train_step": 27.807061433792114, "step": 605}
{"train_info/time_between_train_steps": 0.006101846694946289, "step": 605}
{"info/global_step": 606, "train_info/time_within_train_step": 27.775835752487183, "step": 606}
{"train_info/time_between_train_steps": 0.005261898040771484, "step": 606}
{"info/global_step": 607, "train_info/time_within_train_step": 27.800142526626587, "step": 607}
{"train_info/time_between_train_steps": 0.005156993865966797, "step": 607}
{"info/global_step": 608, "train_info/time_within_train_step": 27.807782411575317, "step": 608}
{"train_info/time_between_train_steps": 0.01013040542602539, "step": 608}
{"info/global_step": 609, "train_info/time_within_train_step": 27.79599165916443, "step": 609}
{"train_info/time_between_train_steps": 0.005100727081298828, "step": 609}
{"info/global_step": 610, "train_info/time_within_train_step": 27.911987781524658, "step": 610}
{"train_info/time_between_train_steps": 0.0052220821380615234, "step": 610}
{"info/global_step": 611, "train_info/time_within_train_step": 27.789352655410767, "step": 611}
{"train_info/time_between_train_steps": 0.005230903625488281, "step": 611}
{"info/global_step": 612, "train_info/time_within_train_step": 27.781248807907104, "step": 612}
{"train_info/time_between_train_steps": 0.0051288604736328125, "step": 612}
{"info/global_step": 613, "train_info/time_within_train_step": 27.822612762451172, "step": 613}
{"train_info/time_between_train_steps": 0.007467031478881836, "step": 613}
{"info/global_step": 614, "train_info/time_within_train_step": 27.82826828956604, "step": 614}
{"train_info/time_between_train_steps": 0.0051195621490478516, "step": 614}
{"info/global_step": 615, "train_info/time_within_train_step": 27.81863498687744, "step": 615}
{"train_info/time_between_train_steps": 0.0076694488525390625, "step": 615}
{"info/global_step": 616, "train_info/time_within_train_step": 27.83182120323181, "step": 616}
{"train_info/time_between_train_steps": 0.005635738372802734, "step": 616}
{"train_info/time_between_train_steps": 3.9341299533843994, "step": 616}
{"info/global_step": 617, "train_info/time_within_train_step": 27.82147979736328, "step": 617}
{"train_info/time_between_train_steps": 0.005327463150024414, "step": 617}
{"info/global_step": 618, "train_info/time_within_train_step": 27.914600372314453, "step": 618}
{"train_info/time_between_train_steps": 0.009990453720092773, "step": 618}
{"info/global_step": 619, "train_info/time_within_train_step": 27.80506205558777, "step": 619}
{"train_info/time_between_train_steps": 0.010230302810668945, "step": 619}
{"info/global_step": 620, "train_info/time_within_train_step": 27.970555067062378, "step": 620}
{"train_info/time_between_train_steps": 0.0054209232330322266, "step": 620}
{"info/global_step": 621, "train_info/time_within_train_step": 27.79461932182312, "step": 621}
{"train_info/time_between_train_steps": 0.005137205123901367, "step": 621}
{"info/global_step": 622, "train_info/time_within_train_step": 27.998805046081543, "step": 622}
{"train_info/time_between_train_steps": 0.008720874786376953, "step": 622}
{"info/global_step": 623, "train_info/time_within_train_step": 27.806467056274414, "step": 623}
{"train_info/time_between_train_steps": 0.005232095718383789, "step": 623}
{"info/global_step": 624, "train_info/time_within_train_step": 27.893194437026978, "step": 624}
{"train_info/time_between_train_steps": 0.006297111511230469, "step": 624}
{"info/global_step": 625, "train_info/time_within_train_step": 27.926856994628906, "step": 625}
{"train_info/time_between_train_steps": 0.007429838180541992, "step": 625}
{"info/global_step": 626, "train_info/time_within_train_step": 27.750041723251343, "step": 626}
{"train_info/time_between_train_steps": 0.005092144012451172, "step": 626}
{"info/global_step": 627, "train_info/time_within_train_step": 27.807595014572144, "step": 627}
{"train_info/time_between_train_steps": 0.0054361820220947266, "step": 627}
{"info/global_step": 628, "train_info/time_within_train_step": 27.82017731666565, "step": 628}
{"train_info/time_between_train_steps": 0.0051348209381103516, "step": 628}
{"info/global_step": 629, "train_info/time_within_train_step": 27.77102041244507, "step": 629}
{"train_info/time_between_train_steps": 0.005354404449462891, "step": 629}
{"info/global_step": 630, "train_info/time_within_train_step": 27.784446239471436, "step": 630}
{"train_info/time_between_train_steps": 0.005187034606933594, "step": 630}
{"info/global_step": 631, "train_info/time_within_train_step": 27.774232387542725, "step": 631}
{"train_info/time_between_train_steps": 0.00513911247253418, "step": 631}
{"info/global_step": 632, "train_info/time_within_train_step": 27.807467937469482, "step": 632}
{"train_info/time_between_train_steps": 0.00514674186706543, "step": 632}
{"info/global_step": 633, "train_info/time_within_train_step": 27.769604444503784, "step": 633}
{"train_info/time_between_train_steps": 0.009363412857055664, "step": 633}
{"info/global_step": 634, "train_info/time_within_train_step": 27.80651092529297, "step": 634}
{"train_info/time_between_train_steps": 0.005038022994995117, "step": 634}
{"info/global_step": 635, "train_info/time_within_train_step": 27.779109477996826, "step": 635}
{"train_info/time_between_train_steps": 0.007518291473388672, "step": 635}
{"info/global_step": 636, "train_info/time_within_train_step": 27.779987812042236, "step": 636}
{"train_info/time_between_train_steps": 0.0060350894927978516, "step": 636}
{"info/global_step": 637, "train_info/time_within_train_step": 27.821019887924194, "step": 637}
{"train_info/time_between_train_steps": 0.005188941955566406, "step": 637}
{"info/global_step": 638, "train_info/time_within_train_step": 27.78091311454773, "step": 638}
{"train_info/time_between_train_steps": 0.005172252655029297, "step": 638}
{"info/global_step": 639, "train_info/time_within_train_step": 27.778934478759766, "step": 639}
{"train_info/time_between_train_steps": 0.01067352294921875, "step": 639}
{"info/global_step": 640, "train_info/time_within_train_step": 27.815194845199585, "step": 640}
{"train_info/time_between_train_steps": 0.005170345306396484, "step": 640}
{"info/global_step": 641, "train_info/time_within_train_step": 27.949131727218628, "step": 641}
{"train_info/time_between_train_steps": 0.009999752044677734, "step": 641}
{"info/global_step": 642, "train_info/time_within_train_step": 27.825516939163208, "step": 642}
{"train_info/time_between_train_steps": 0.005336284637451172, "step": 642}
{"info/global_step": 643, "train_info/time_within_train_step": 27.852107286453247, "step": 643}
{"train_info/time_between_train_steps": 0.0054798126220703125, "step": 643}
{"info/global_step": 644, "train_info/time_within_train_step": 27.85737419128418, "step": 644}
{"train_info/time_between_train_steps": 0.005910396575927734, "step": 644}
{"train_info/time_between_train_steps": 3.6700336933135986, "step": 644}
{"info/global_step": 645, "train_info/time_within_train_step": 27.798474073410034, "step": 645}
{"train_info/time_between_train_steps": 0.004999399185180664, "step": 645}
{"info/global_step": 646, "train_info/time_within_train_step": 27.90797996520996, "step": 646}
{"train_info/time_between_train_steps": 0.006822347640991211, "step": 646}
{"info/global_step": 647, "train_info/time_within_train_step": 27.807633876800537, "step": 647}
{"train_info/time_between_train_steps": 0.009073495864868164, "step": 647}
{"info/global_step": 648, "train_info/time_within_train_step": 27.903615951538086, "step": 648}
{"train_info/time_between_train_steps": 0.005326986312866211, "step": 648}
{"info/global_step": 649, "train_info/time_within_train_step": 27.782381057739258, "step": 649}
{"train_info/time_between_train_steps": 0.006490230560302734, "step": 649}
{"info/global_step": 650, "train_info/time_within_train_step": 27.971916675567627, "step": 650}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740840177, "_runtime": 18282}, "step": 650}
{"logs": {"train/loss": 3.5193, "train/learning_rate": 0.00030555555555555555, "train/epoch": 23.0, "_timestamp": 1740840177, "_runtime": 18282}, "step": 650}
{"train_info/time_between_train_steps": 0.010270833969116211, "step": 650}
{"info/global_step": 651, "train_info/time_within_train_step": 27.834259510040283, "step": 651}
{"train_info/time_between_train_steps": 0.005231618881225586, "step": 651}
{"info/global_step": 652, "train_info/time_within_train_step": 27.887081146240234, "step": 652}
{"train_info/time_between_train_steps": 0.005460023880004883, "step": 652}
{"info/global_step": 653, "train_info/time_within_train_step": 27.811224460601807, "step": 653}
{"train_info/time_between_train_steps": 0.0050470829010009766, "step": 653}
{"info/global_step": 654, "train_info/time_within_train_step": 27.75714135169983, "step": 654}
{"train_info/time_between_train_steps": 0.00915074348449707, "step": 654}
{"info/global_step": 655, "train_info/time_within_train_step": 27.776140928268433, "step": 655}
{"train_info/time_between_train_steps": 0.006948947906494141, "step": 655}
{"info/global_step": 656, "train_info/time_within_train_step": 27.88591718673706, "step": 656}
{"train_info/time_between_train_steps": 0.005143404006958008, "step": 656}
{"info/global_step": 657, "train_info/time_within_train_step": 27.80380892753601, "step": 657}
{"train_info/time_between_train_steps": 0.005239725112915039, "step": 657}
{"info/global_step": 658, "train_info/time_within_train_step": 27.795579433441162, "step": 658}
{"train_info/time_between_train_steps": 0.007279872894287109, "step": 658}
{"info/global_step": 659, "train_info/time_within_train_step": 27.825692415237427, "step": 659}
{"train_info/time_between_train_steps": 0.005492687225341797, "step": 659}
{"info/global_step": 660, "train_info/time_within_train_step": 27.79794979095459, "step": 660}
{"train_info/time_between_train_steps": 0.005123615264892578, "step": 660}
{"info/global_step": 661, "train_info/time_within_train_step": 27.752360343933105, "step": 661}
{"train_info/time_between_train_steps": 0.0050811767578125, "step": 661}
{"info/global_step": 662, "train_info/time_within_train_step": 27.774709701538086, "step": 662}
{"train_info/time_between_train_steps": 0.005327463150024414, "step": 662}
{"info/global_step": 663, "train_info/time_within_train_step": 27.784778356552124, "step": 663}
{"train_info/time_between_train_steps": 0.0051784515380859375, "step": 663}
{"info/global_step": 664, "train_info/time_within_train_step": 27.804117679595947, "step": 664}
{"train_info/time_between_train_steps": 0.0074422359466552734, "step": 664}
{"info/global_step": 665, "train_info/time_within_train_step": 27.81522297859192, "step": 665}
{"train_info/time_between_train_steps": 0.005169868469238281, "step": 665}
{"info/global_step": 666, "train_info/time_within_train_step": 27.773992776870728, "step": 666}
{"train_info/time_between_train_steps": 0.0052530765533447266, "step": 666}
{"info/global_step": 667, "train_info/time_within_train_step": 27.841779708862305, "step": 667}
{"train_info/time_between_train_steps": 0.005146980285644531, "step": 667}
{"info/global_step": 668, "train_info/time_within_train_step": 27.79154348373413, "step": 668}
{"train_info/time_between_train_steps": 0.0052068233489990234, "step": 668}
{"info/global_step": 669, "train_info/time_within_train_step": 28.16539978981018, "step": 669}
{"train_info/time_between_train_steps": 0.005333423614501953, "step": 669}
{"info/global_step": 670, "train_info/time_within_train_step": 27.80395817756653, "step": 670}
{"train_info/time_between_train_steps": 0.010025262832641602, "step": 670}
{"info/global_step": 671, "train_info/time_within_train_step": 27.82781434059143, "step": 671}
{"train_info/time_between_train_steps": 0.005743265151977539, "step": 671}
{"info/global_step": 672, "train_info/time_within_train_step": 28.106802701950073, "step": 672}
{"train_info/time_between_train_steps": 0.005915164947509766, "step": 672}
{"train_info/time_between_train_steps": 3.8156790733337402, "step": 672}
{"info/global_step": 673, "train_info/time_within_train_step": 27.82368302345276, "step": 673}
{"train_info/time_between_train_steps": 0.005558490753173828, "step": 673}
{"info/global_step": 674, "train_info/time_within_train_step": 27.932151794433594, "step": 674}
{"train_info/time_between_train_steps": 0.0053217411041259766, "step": 674}
{"info/global_step": 675, "train_info/time_within_train_step": 27.798741817474365, "step": 675}
{"train_info/time_between_train_steps": 0.0089111328125, "step": 675}
{"info/global_step": 676, "train_info/time_within_train_step": 28.03020668029785, "step": 676}
{"train_info/time_between_train_steps": 0.007233858108520508, "step": 676}
{"info/global_step": 677, "train_info/time_within_train_step": 27.810558080673218, "step": 677}
{"train_info/time_between_train_steps": 0.0052721500396728516, "step": 677}
{"info/global_step": 678, "train_info/time_within_train_step": 27.952890872955322, "step": 678}
{"train_info/time_between_train_steps": 0.0053327083587646484, "step": 678}
{"info/global_step": 679, "train_info/time_within_train_step": 27.756752490997314, "step": 679}
{"train_info/time_between_train_steps": 0.005234479904174805, "step": 679}
{"info/global_step": 680, "train_info/time_within_train_step": 27.897463083267212, "step": 680}
{"train_info/time_between_train_steps": 0.005238771438598633, "step": 680}
{"info/global_step": 681, "train_info/time_within_train_step": 27.83367657661438, "step": 681}
{"train_info/time_between_train_steps": 0.009070396423339844, "step": 681}
{"info/global_step": 682, "train_info/time_within_train_step": 27.788614988327026, "step": 682}
{"train_info/time_between_train_steps": 0.004996538162231445, "step": 682}
{"info/global_step": 683, "train_info/time_within_train_step": 27.79777693748474, "step": 683}
{"train_info/time_between_train_steps": 0.0051727294921875, "step": 683}
{"info/global_step": 684, "train_info/time_within_train_step": 27.805476665496826, "step": 684}
{"train_info/time_between_train_steps": 0.005154609680175781, "step": 684}
{"info/global_step": 685, "train_info/time_within_train_step": 27.77130103111267, "step": 685}
{"train_info/time_between_train_steps": 0.005859851837158203, "step": 685}
{"info/global_step": 686, "train_info/time_within_train_step": 27.814821004867554, "step": 686}
{"train_info/time_between_train_steps": 0.0051767826080322266, "step": 686}
{"info/global_step": 687, "train_info/time_within_train_step": 27.7808358669281, "step": 687}
{"train_info/time_between_train_steps": 0.005177021026611328, "step": 687}
{"info/global_step": 688, "train_info/time_within_train_step": 27.894068002700806, "step": 688}
{"train_info/time_between_train_steps": 0.005213737487792969, "step": 688}
{"info/global_step": 689, "train_info/time_within_train_step": 27.809101819992065, "step": 689}
{"train_info/time_between_train_steps": 0.005194902420043945, "step": 689}
{"info/global_step": 690, "train_info/time_within_train_step": 27.80603528022766, "step": 690}
{"train_info/time_between_train_steps": 0.0052301883697509766, "step": 690}
{"info/global_step": 691, "train_info/time_within_train_step": 27.833141088485718, "step": 691}
{"train_info/time_between_train_steps": 0.010040760040283203, "step": 691}
{"info/global_step": 692, "train_info/time_within_train_step": 27.811559677124023, "step": 692}
{"train_info/time_between_train_steps": 0.005071401596069336, "step": 692}
{"info/global_step": 693, "train_info/time_within_train_step": 27.81013774871826, "step": 693}
{"train_info/time_between_train_steps": 0.005184173583984375, "step": 693}
{"info/global_step": 694, "train_info/time_within_train_step": 27.791139364242554, "step": 694}
{"train_info/time_between_train_steps": 0.00506138801574707, "step": 694}
{"info/global_step": 695, "train_info/time_within_train_step": 27.802238941192627, "step": 695}
{"train_info/time_between_train_steps": 0.010042905807495117, "step": 695}
{"info/global_step": 696, "train_info/time_within_train_step": 27.782469034194946, "step": 696}
{"train_info/time_between_train_steps": 0.0053615570068359375, "step": 696}
{"info/global_step": 697, "train_info/time_within_train_step": 27.745993852615356, "step": 697}
{"train_info/time_between_train_steps": 0.005347013473510742, "step": 697}
{"info/global_step": 698, "train_info/time_within_train_step": 27.76400876045227, "step": 698}
{"train_info/time_between_train_steps": 0.0075435638427734375, "step": 698}
{"info/global_step": 699, "train_info/time_within_train_step": 27.818974256515503, "step": 699}
{"train_info/time_between_train_steps": 0.005625009536743164, "step": 699}
{"info/global_step": 700, "train_info/time_within_train_step": 27.826781034469604, "step": 700}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740841573, "_runtime": 19678}, "step": 700}
{"logs": {"train/loss": 3.4405, "train/learning_rate": 0.0002777777777777778, "train/epoch": 24.02, "_timestamp": 1740841573, "_runtime": 19678}, "step": 700}
{"train_info/time_between_train_steps": 13.427456378936768, "step": 700}
{"train_info/time_between_train_steps": 17.18051815032959, "step": 700}
{"info/global_step": 701, "train_info/time_within_train_step": 27.789172887802124, "step": 701}
{"train_info/time_between_train_steps": 0.009477615356445312, "step": 701}
{"info/global_step": 702, "train_info/time_within_train_step": 27.96382975578308, "step": 702}
{"train_info/time_between_train_steps": 0.010021686553955078, "step": 702}
{"info/global_step": 703, "train_info/time_within_train_step": 27.93750524520874, "step": 703}
{"train_info/time_between_train_steps": 0.005352497100830078, "step": 703}
{"info/global_step": 704, "train_info/time_within_train_step": 27.970821857452393, "step": 704}
{"train_info/time_between_train_steps": 0.00534367561340332, "step": 704}
{"info/global_step": 705, "train_info/time_within_train_step": 27.818883180618286, "step": 705}
{"train_info/time_between_train_steps": 0.005410194396972656, "step": 705}
{"info/global_step": 706, "train_info/time_within_train_step": 27.963913917541504, "step": 706}
{"train_info/time_between_train_steps": 0.01032876968383789, "step": 706}
{"info/global_step": 707, "train_info/time_within_train_step": 27.813822507858276, "step": 707}
{"train_info/time_between_train_steps": 0.005179882049560547, "step": 707}
{"info/global_step": 708, "train_info/time_within_train_step": 27.88570475578308, "step": 708}
{"train_info/time_between_train_steps": 0.007630109786987305, "step": 708}
{"info/global_step": 709, "train_info/time_within_train_step": 27.82837677001953, "step": 709}
{"train_info/time_between_train_steps": 0.0048885345458984375, "step": 709}
{"info/global_step": 710, "train_info/time_within_train_step": 27.81193709373474, "step": 710}
{"train_info/time_between_train_steps": 0.005030393600463867, "step": 710}
{"info/global_step": 711, "train_info/time_within_train_step": 27.78319215774536, "step": 711}
{"train_info/time_between_train_steps": 0.009585142135620117, "step": 711}
{"info/global_step": 712, "train_info/time_within_train_step": 27.775876998901367, "step": 712}
{"train_info/time_between_train_steps": 0.00516963005065918, "step": 712}
{"info/global_step": 713, "train_info/time_within_train_step": 27.796048641204834, "step": 713}
{"train_info/time_between_train_steps": 0.0050737857818603516, "step": 713}
{"info/global_step": 714, "train_info/time_within_train_step": 27.76953625679016, "step": 714}
{"train_info/time_between_train_steps": 0.00504612922668457, "step": 714}
{"info/global_step": 715, "train_info/time_within_train_step": 27.82244038581848, "step": 715}
{"train_info/time_between_train_steps": 0.005378007888793945, "step": 715}
{"info/global_step": 716, "train_info/time_within_train_step": 27.778432607650757, "step": 716}
{"train_info/time_between_train_steps": 0.0051670074462890625, "step": 716}
{"info/global_step": 717, "train_info/time_within_train_step": 27.737014055252075, "step": 717}
{"train_info/time_between_train_steps": 0.00577092170715332, "step": 717}
{"info/global_step": 718, "train_info/time_within_train_step": 27.747223138809204, "step": 718}
{"train_info/time_between_train_steps": 0.005137443542480469, "step": 718}
{"info/global_step": 719, "train_info/time_within_train_step": 27.868901014328003, "step": 719}
{"train_info/time_between_train_steps": 0.005304813385009766, "step": 719}
{"info/global_step": 720, "train_info/time_within_train_step": 27.81447196006775, "step": 720}
{"train_info/time_between_train_steps": 0.0052034854888916016, "step": 720}
{"info/global_step": 721, "train_info/time_within_train_step": 27.792957305908203, "step": 721}
{"train_info/time_between_train_steps": 0.005140781402587891, "step": 721}
{"info/global_step": 722, "train_info/time_within_train_step": 27.80615496635437, "step": 722}
{"train_info/time_between_train_steps": 0.005071163177490234, "step": 722}
{"info/global_step": 723, "train_info/time_within_train_step": 27.795068502426147, "step": 723}
{"train_info/time_between_train_steps": 0.005163669586181641, "step": 723}
{"info/global_step": 724, "train_info/time_within_train_step": 27.82041358947754, "step": 724}
{"train_info/time_between_train_steps": 0.005097150802612305, "step": 724}
{"info/global_step": 725, "train_info/time_within_train_step": 27.823283195495605, "step": 725}
{"train_info/time_between_train_steps": 0.01004481315612793, "step": 725}
{"info/global_step": 726, "train_info/time_within_train_step": 27.847411155700684, "step": 726}
{"train_info/time_between_train_steps": 0.00533604621887207, "step": 726}
{"info/global_step": 727, "train_info/time_within_train_step": 27.82577085494995, "step": 727}
{"train_info/time_between_train_steps": 0.005582571029663086, "step": 727}
{"info/global_step": 728, "train_info/time_within_train_step": 27.847283363342285, "step": 728}
{"train_info/time_between_train_steps": 0.0057468414306640625, "step": 728}
{"train_info/time_between_train_steps": 3.507816791534424, "step": 728}
{"info/global_step": 729, "train_info/time_within_train_step": 27.783355951309204, "step": 729}
{"train_info/time_between_train_steps": 0.009767532348632812, "step": 729}
{"info/global_step": 730, "train_info/time_within_train_step": 27.932753801345825, "step": 730}
{"train_info/time_between_train_steps": 0.010049819946289062, "step": 730}
{"info/global_step": 731, "train_info/time_within_train_step": 27.8344624042511, "step": 731}
{"train_info/time_between_train_steps": 0.005441427230834961, "step": 731}
{"info/global_step": 732, "train_info/time_within_train_step": 27.919600248336792, "step": 732}
{"train_info/time_between_train_steps": 0.005309343338012695, "step": 732}
{"info/global_step": 733, "train_info/time_within_train_step": 27.853291273117065, "step": 733}
{"train_info/time_between_train_steps": 0.008070230484008789, "step": 733}
{"info/global_step": 734, "train_info/time_within_train_step": 28.070204496383667, "step": 734}
{"train_info/time_between_train_steps": 0.005886554718017578, "step": 734}
{"info/global_step": 735, "train_info/time_within_train_step": 27.811752796173096, "step": 735}
{"train_info/time_between_train_steps": 0.005643129348754883, "step": 735}
{"info/global_step": 736, "train_info/time_within_train_step": 27.848227977752686, "step": 736}
{"train_info/time_between_train_steps": 0.005094289779663086, "step": 736}
{"info/global_step": 737, "train_info/time_within_train_step": 27.79422116279602, "step": 737}
{"train_info/time_between_train_steps": 0.00513458251953125, "step": 737}
{"info/global_step": 738, "train_info/time_within_train_step": 27.829689264297485, "step": 738}
{"train_info/time_between_train_steps": 0.006136417388916016, "step": 738}
{"info/global_step": 739, "train_info/time_within_train_step": 27.76767349243164, "step": 739}
{"train_info/time_between_train_steps": 0.0050432682037353516, "step": 739}
{"info/global_step": 740, "train_info/time_within_train_step": 27.771910190582275, "step": 740}
{"train_info/time_between_train_steps": 0.010306358337402344, "step": 740}
{"info/global_step": 741, "train_info/time_within_train_step": 27.78625178337097, "step": 741}
{"train_info/time_between_train_steps": 0.0053577423095703125, "step": 741}
{"info/global_step": 742, "train_info/time_within_train_step": 27.77874517440796, "step": 742}
{"train_info/time_between_train_steps": 0.009493350982666016, "step": 742}
{"info/global_step": 743, "train_info/time_within_train_step": 27.790919303894043, "step": 743}
{"train_info/time_between_train_steps": 0.006213665008544922, "step": 743}
{"info/global_step": 744, "train_info/time_within_train_step": 27.817269325256348, "step": 744}
{"train_info/time_between_train_steps": 0.00504755973815918, "step": 744}
{"info/global_step": 745, "train_info/time_within_train_step": 27.74066138267517, "step": 745}
{"train_info/time_between_train_steps": 0.005126953125, "step": 745}
{"info/global_step": 746, "train_info/time_within_train_step": 27.816099643707275, "step": 746}
{"train_info/time_between_train_steps": 0.005110740661621094, "step": 746}
{"info/global_step": 747, "train_info/time_within_train_step": 27.768463134765625, "step": 747}
{"train_info/time_between_train_steps": 0.009332656860351562, "step": 747}
{"info/global_step": 748, "train_info/time_within_train_step": 27.807121992111206, "step": 748}
{"train_info/time_between_train_steps": 0.005142927169799805, "step": 748}
{"info/global_step": 749, "train_info/time_within_train_step": 27.78801941871643, "step": 749}
{"train_info/time_between_train_steps": 0.005074977874755859, "step": 749}
{"info/global_step": 750, "train_info/time_within_train_step": 27.908727645874023, "step": 750}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740842986, "_runtime": 21091}, "step": 750}
{"logs": {"train/loss": 3.3724, "train/learning_rate": 0.00025, "train/epoch": 26.02, "_timestamp": 1740842986, "_runtime": 21091}, "step": 750}
{"train_info/time_between_train_steps": 0.013231992721557617, "step": 750}
{"info/global_step": 751, "train_info/time_within_train_step": 27.777912139892578, "step": 751}
{"train_info/time_between_train_steps": 0.005091190338134766, "step": 751}
{"info/global_step": 752, "train_info/time_within_train_step": 27.814412832260132, "step": 752}
{"train_info/time_between_train_steps": 0.010114908218383789, "step": 752}
{"info/global_step": 753, "train_info/time_within_train_step": 27.83700466156006, "step": 753}
{"train_info/time_between_train_steps": 0.009968757629394531, "step": 753}
{"info/global_step": 754, "train_info/time_within_train_step": 27.796993732452393, "step": 754}
{"train_info/time_between_train_steps": 0.005394935607910156, "step": 754}
{"info/global_step": 755, "train_info/time_within_train_step": 27.82188391685486, "step": 755}
{"train_info/time_between_train_steps": 0.0057353973388671875, "step": 755}
{"info/global_step": 756, "train_info/time_within_train_step": 27.824808359146118, "step": 756}
{"train_info/time_between_train_steps": 0.00610041618347168, "step": 756}
{"train_info/time_between_train_steps": 3.649829864501953, "step": 756}
{"info/global_step": 757, "train_info/time_within_train_step": 27.803032875061035, "step": 757}
{"train_info/time_between_train_steps": 0.010546207427978516, "step": 757}
{"info/global_step": 758, "train_info/time_within_train_step": 27.931596279144287, "step": 758}
{"train_info/time_between_train_steps": 0.00527644157409668, "step": 758}
{"info/global_step": 759, "train_info/time_within_train_step": 27.830218076705933, "step": 759}
{"train_info/time_between_train_steps": 0.005320310592651367, "step": 759}
{"info/global_step": 760, "train_info/time_within_train_step": 27.91835618019104, "step": 760}
{"train_info/time_between_train_steps": 0.005997419357299805, "step": 760}
{"info/global_step": 761, "train_info/time_within_train_step": 27.822797060012817, "step": 761}
{"train_info/time_between_train_steps": 0.010235071182250977, "step": 761}
{"info/global_step": 762, "train_info/time_within_train_step": 27.95533037185669, "step": 762}
{"train_info/time_between_train_steps": 0.010050535202026367, "step": 762}
{"info/global_step": 763, "train_info/time_within_train_step": 27.769165515899658, "step": 763}
{"train_info/time_between_train_steps": 0.005416154861450195, "step": 763}
{"info/global_step": 764, "train_info/time_within_train_step": 27.846973419189453, "step": 764}
{"train_info/time_between_train_steps": 0.005128145217895508, "step": 764}
{"info/global_step": 765, "train_info/time_within_train_step": 27.840988159179688, "step": 765}
{"train_info/time_between_train_steps": 0.0052814483642578125, "step": 765}
{"info/global_step": 766, "train_info/time_within_train_step": 27.882741451263428, "step": 766}
{"train_info/time_between_train_steps": 0.005002021789550781, "step": 766}
{"info/global_step": 767, "train_info/time_within_train_step": 27.74442982673645, "step": 767}
{"train_info/time_between_train_steps": 0.00506591796875, "step": 767}
{"info/global_step": 768, "train_info/time_within_train_step": 27.795570611953735, "step": 768}
{"train_info/time_between_train_steps": 0.0051822662353515625, "step": 768}
{"info/global_step": 769, "train_info/time_within_train_step": 27.800164699554443, "step": 769}
{"train_info/time_between_train_steps": 0.005050182342529297, "step": 769}
{"info/global_step": 770, "train_info/time_within_train_step": 27.80761432647705, "step": 770}
{"train_info/time_between_train_steps": 0.005332231521606445, "step": 770}
{"info/global_step": 771, "train_info/time_within_train_step": 27.810274839401245, "step": 771}
{"train_info/time_between_train_steps": 0.006469011306762695, "step": 771}
{"info/global_step": 772, "train_info/time_within_train_step": 28.04605484008789, "step": 772}
{"train_info/time_between_train_steps": 0.0075817108154296875, "step": 772}
{"info/global_step": 773, "train_info/time_within_train_step": 27.80141592025757, "step": 773}
{"train_info/time_between_train_steps": 0.005067348480224609, "step": 773}
{"info/global_step": 774, "train_info/time_within_train_step": 27.800655841827393, "step": 774}
{"train_info/time_between_train_steps": 0.005118608474731445, "step": 774}
{"info/global_step": 775, "train_info/time_within_train_step": 27.80028510093689, "step": 775}
{"train_info/time_between_train_steps": 0.009973764419555664, "step": 775}
{"info/global_step": 776, "train_info/time_within_train_step": 27.816051483154297, "step": 776}
{"train_info/time_between_train_steps": 0.005057573318481445, "step": 776}
{"info/global_step": 777, "train_info/time_within_train_step": 27.778882265090942, "step": 777}
{"train_info/time_between_train_steps": 0.00632786750793457, "step": 777}
{"info/global_step": 778, "train_info/time_within_train_step": 27.789703845977783, "step": 778}
{"train_info/time_between_train_steps": 0.005105733871459961, "step": 778}
{"info/global_step": 779, "train_info/time_within_train_step": 27.812096118927002, "step": 779}
{"train_info/time_between_train_steps": 0.005279064178466797, "step": 779}
{"info/global_step": 780, "train_info/time_within_train_step": 27.79128408432007, "step": 780}
{"train_info/time_between_train_steps": 0.005118370056152344, "step": 780}
{"info/global_step": 781, "train_info/time_within_train_step": 27.89992666244507, "step": 781}
{"train_info/time_between_train_steps": 0.005127429962158203, "step": 781}
{"info/global_step": 782, "train_info/time_within_train_step": 27.805580377578735, "step": 782}
{"train_info/time_between_train_steps": 0.0054166316986083984, "step": 782}
{"info/global_step": 783, "train_info/time_within_train_step": 27.836586952209473, "step": 783}
{"train_info/time_between_train_steps": 0.005735635757446289, "step": 783}
{"info/global_step": 784, "train_info/time_within_train_step": 27.81577777862549, "step": 784}
{"train_info/time_between_train_steps": 0.010630130767822266, "step": 784}
{"train_info/time_between_train_steps": 3.765937566757202, "step": 784}
{"info/global_step": 785, "train_info/time_within_train_step": 27.826398372650146, "step": 785}
{"train_info/time_between_train_steps": 0.004926204681396484, "step": 785}
{"info/global_step": 786, "train_info/time_within_train_step": 27.91554594039917, "step": 786}
{"train_info/time_between_train_steps": 0.005002021789550781, "step": 786}
{"info/global_step": 787, "train_info/time_within_train_step": 27.800671577453613, "step": 787}
{"train_info/time_between_train_steps": 0.010329246520996094, "step": 787}
{"info/global_step": 788, "train_info/time_within_train_step": 27.928186893463135, "step": 788}
{"train_info/time_between_train_steps": 0.005436897277832031, "step": 788}
{"info/global_step": 789, "train_info/time_within_train_step": 27.803858041763306, "step": 789}
{"train_info/time_between_train_steps": 0.005321502685546875, "step": 789}
{"info/global_step": 790, "train_info/time_within_train_step": 27.977768659591675, "step": 790}
{"train_info/time_between_train_steps": 0.005397796630859375, "step": 790}
{"info/global_step": 791, "train_info/time_within_train_step": 27.78369975090027, "step": 791}
{"train_info/time_between_train_steps": 0.005188941955566406, "step": 791}
{"info/global_step": 792, "train_info/time_within_train_step": 27.870489358901978, "step": 792}
{"train_info/time_between_train_steps": 0.007342815399169922, "step": 792}
{"info/global_step": 793, "train_info/time_within_train_step": 27.79274606704712, "step": 793}
{"train_info/time_between_train_steps": 0.005151033401489258, "step": 793}
{"info/global_step": 794, "train_info/time_within_train_step": 27.755462646484375, "step": 794}
{"train_info/time_between_train_steps": 0.0051038265228271484, "step": 794}
{"info/global_step": 795, "train_info/time_within_train_step": 27.78397297859192, "step": 795}
{"train_info/time_between_train_steps": 0.009809494018554688, "step": 795}
{"info/global_step": 796, "train_info/time_within_train_step": 27.751744031906128, "step": 796}
{"train_info/time_between_train_steps": 0.009885549545288086, "step": 796}
{"info/global_step": 797, "train_info/time_within_train_step": 27.910775661468506, "step": 797}
{"train_info/time_between_train_steps": 0.005166769027709961, "step": 797}
{"info/global_step": 798, "train_info/time_within_train_step": 27.826347827911377, "step": 798}
{"train_info/time_between_train_steps": 0.005141496658325195, "step": 798}
{"info/global_step": 799, "train_info/time_within_train_step": 27.79386591911316, "step": 799}
{"train_info/time_between_train_steps": 0.007367134094238281, "step": 799}
{"info/global_step": 800, "train_info/time_within_train_step": 27.783908367156982, "step": 800}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740844385, "_runtime": 22490}, "step": 800}
{"logs": {"train/loss": 3.3084, "train/learning_rate": 0.00022222222222222218, "train/epoch": 28.01, "_timestamp": 1740844385, "_runtime": 22490}, "step": 800}
{"train_info/time_between_train_steps": 13.331582307815552, "step": 800}
{"info/global_step": 801, "train_info/time_within_train_step": 27.815171241760254, "step": 801}
{"train_info/time_between_train_steps": 0.00504302978515625, "step": 801}
{"info/global_step": 802, "train_info/time_within_train_step": 27.797075986862183, "step": 802}
{"train_info/time_between_train_steps": 0.009684085845947266, "step": 802}
{"info/global_step": 803, "train_info/time_within_train_step": 27.817859649658203, "step": 803}
{"train_info/time_between_train_steps": 0.009929180145263672, "step": 803}
{"info/global_step": 804, "train_info/time_within_train_step": 27.805962324142456, "step": 804}
{"train_info/time_between_train_steps": 0.009891986846923828, "step": 804}
{"info/global_step": 805, "train_info/time_within_train_step": 27.809054374694824, "step": 805}
{"train_info/time_between_train_steps": 0.009587287902832031, "step": 805}
{"info/global_step": 806, "train_info/time_within_train_step": 27.82260012626648, "step": 806}
{"train_info/time_between_train_steps": 0.00509953498840332, "step": 806}
{"info/global_step": 807, "train_info/time_within_train_step": 27.764647483825684, "step": 807}
{"train_info/time_between_train_steps": 0.0053253173828125, "step": 807}
{"info/global_step": 808, "train_info/time_within_train_step": 27.758989095687866, "step": 808}
{"train_info/time_between_train_steps": 0.006128549575805664, "step": 808}
{"info/global_step": 809, "train_info/time_within_train_step": 27.793578147888184, "step": 809}
{"train_info/time_between_train_steps": 0.0061304569244384766, "step": 809}
{"info/global_step": 810, "train_info/time_within_train_step": 27.815589666366577, "step": 810}
{"train_info/time_between_train_steps": 0.0052759647369384766, "step": 810}
{"info/global_step": 811, "train_info/time_within_train_step": 27.811185836791992, "step": 811}
{"train_info/time_between_train_steps": 0.005522012710571289, "step": 811}
{"info/global_step": 812, "train_info/time_within_train_step": 27.829410314559937, "step": 812}
{"train_info/time_between_train_steps": 0.005884647369384766, "step": 812}
{"train_info/time_between_train_steps": 3.6739447116851807, "step": 812}
{"info/global_step": 813, "train_info/time_within_train_step": 27.889627933502197, "step": 813}
{"train_info/time_between_train_steps": 0.005125284194946289, "step": 813}
{"info/global_step": 814, "train_info/time_within_train_step": 27.949331760406494, "step": 814}
{"train_info/time_between_train_steps": 0.007421255111694336, "step": 814}
{"info/global_step": 815, "train_info/time_within_train_step": 27.83479142189026, "step": 815}
{"train_info/time_between_train_steps": 0.005350351333618164, "step": 815}
{"info/global_step": 816, "train_info/time_within_train_step": 27.924528121948242, "step": 816}
{"train_info/time_between_train_steps": 0.00908207893371582, "step": 816}
{"info/global_step": 817, "train_info/time_within_train_step": 27.7817165851593, "step": 817}
{"train_info/time_between_train_steps": 0.005576610565185547, "step": 817}
{"info/global_step": 818, "train_info/time_within_train_step": 28.005776166915894, "step": 818}
{"train_info/time_between_train_steps": 0.009482145309448242, "step": 818}
{"info/global_step": 819, "train_info/time_within_train_step": 27.79744267463684, "step": 819}
{"train_info/time_between_train_steps": 0.010282754898071289, "step": 819}
{"info/global_step": 820, "train_info/time_within_train_step": 27.877026081085205, "step": 820}
{"train_info/time_between_train_steps": 0.005360126495361328, "step": 820}
{"info/global_step": 821, "train_info/time_within_train_step": 27.79757857322693, "step": 821}
{"train_info/time_between_train_steps": 0.0049285888671875, "step": 821}
{"info/global_step": 822, "train_info/time_within_train_step": 27.801762342453003, "step": 822}
{"train_info/time_between_train_steps": 0.005142927169799805, "step": 822}
{"info/global_step": 823, "train_info/time_within_train_step": 27.78050208091736, "step": 823}
{"train_info/time_between_train_steps": 0.005085945129394531, "step": 823}
{"info/global_step": 824, "train_info/time_within_train_step": 27.78557848930359, "step": 824}
{"train_info/time_between_train_steps": 0.005391836166381836, "step": 824}
{"info/global_step": 825, "train_info/time_within_train_step": 27.80602240562439, "step": 825}
{"train_info/time_between_train_steps": 0.006417751312255859, "step": 825}
{"info/global_step": 826, "train_info/time_within_train_step": 27.80216336250305, "step": 826}
{"train_info/time_between_train_steps": 0.005382537841796875, "step": 826}
{"info/global_step": 827, "train_info/time_within_train_step": 27.772672176361084, "step": 827}
{"train_info/time_between_train_steps": 0.00518798828125, "step": 827}
{"info/global_step": 828, "train_info/time_within_train_step": 27.880825519561768, "step": 828}
{"train_info/time_between_train_steps": 0.005080223083496094, "step": 828}
{"info/global_step": 829, "train_info/time_within_train_step": 27.760875701904297, "step": 829}
{"train_info/time_between_train_steps": 0.005219936370849609, "step": 829}
{"info/global_step": 830, "train_info/time_within_train_step": 27.796047687530518, "step": 830}
{"train_info/time_between_train_steps": 0.005308628082275391, "step": 830}
{"info/global_step": 831, "train_info/time_within_train_step": 27.768691539764404, "step": 831}
{"train_info/time_between_train_steps": 0.00503230094909668, "step": 831}
{"info/global_step": 832, "train_info/time_within_train_step": 27.814356327056885, "step": 832}
{"train_info/time_between_train_steps": 0.005395174026489258, "step": 832}
{"info/global_step": 833, "train_info/time_within_train_step": 27.797957181930542, "step": 833}
{"train_info/time_between_train_steps": 0.00547027587890625, "step": 833}
{"info/global_step": 834, "train_info/time_within_train_step": 27.79698133468628, "step": 834}
{"train_info/time_between_train_steps": 0.010577201843261719, "step": 834}
{"info/global_step": 835, "train_info/time_within_train_step": 27.77055335044861, "step": 835}
{"train_info/time_between_train_steps": 0.005216360092163086, "step": 835}
{"info/global_step": 836, "train_info/time_within_train_step": 27.74602723121643, "step": 836}
{"train_info/time_between_train_steps": 0.005255937576293945, "step": 836}
{"info/global_step": 837, "train_info/time_within_train_step": 27.816629648208618, "step": 837}
{"train_info/time_between_train_steps": 0.0053555965423583984, "step": 837}
{"info/global_step": 838, "train_info/time_within_train_step": 27.823554515838623, "step": 838}
{"train_info/time_between_train_steps": 0.005496978759765625, "step": 838}
{"info/global_step": 839, "train_info/time_within_train_step": 27.80610156059265, "step": 839}
{"train_info/time_between_train_steps": 0.005636692047119141, "step": 839}
{"info/global_step": 840, "train_info/time_within_train_step": 27.817264556884766, "step": 840}
{"train_info/time_between_train_steps": 0.005534172058105469, "step": 840}
{"train_info/time_between_train_steps": 3.602080821990967, "step": 840}
{"info/global_step": 841, "train_info/time_within_train_step": 27.787774562835693, "step": 841}
{"train_info/time_between_train_steps": 0.0053501129150390625, "step": 841}
{"info/global_step": 842, "train_info/time_within_train_step": 27.950938940048218, "step": 842}
{"train_info/time_between_train_steps": 0.00533747673034668, "step": 842}
{"info/global_step": 843, "train_info/time_within_train_step": 27.821473836898804, "step": 843}
{"train_info/time_between_train_steps": 0.005301713943481445, "step": 843}
{"info/global_step": 844, "train_info/time_within_train_step": 28.068676948547363, "step": 844}
{"train_info/time_between_train_steps": 0.005277156829833984, "step": 844}
{"info/global_step": 845, "train_info/time_within_train_step": 27.839383840560913, "step": 845}
{"train_info/time_between_train_steps": 0.005370616912841797, "step": 845}
{"info/global_step": 846, "train_info/time_within_train_step": 27.941660165786743, "step": 846}
{"train_info/time_between_train_steps": 0.006078958511352539, "step": 846}
{"info/global_step": 847, "train_info/time_within_train_step": 27.81775164604187, "step": 847}
{"train_info/time_between_train_steps": 0.005440711975097656, "step": 847}
{"info/global_step": 848, "train_info/time_within_train_step": 27.85343885421753, "step": 848}
{"train_info/time_between_train_steps": 0.005135536193847656, "step": 848}
{"info/global_step": 849, "train_info/time_within_train_step": 27.82539939880371, "step": 849}
{"train_info/time_between_train_steps": 0.005163908004760742, "step": 849}
{"info/global_step": 850, "train_info/time_within_train_step": 27.774280309677124, "step": 850}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740845798, "_runtime": 23903}, "step": 850}
{"logs": {"train/loss": 3.2513, "train/learning_rate": 0.00019444444444444443, "train/epoch": 30.01, "_timestamp": 1740845798, "_runtime": 23903}, "step": 850}
{"train_info/time_between_train_steps": 0.014502763748168945, "step": 850}
{"info/global_step": 851, "train_info/time_within_train_step": 27.779783010482788, "step": 851}
{"train_info/time_between_train_steps": 0.006043195724487305, "step": 851}
{"info/global_step": 852, "train_info/time_within_train_step": 27.781611919403076, "step": 852}
{"train_info/time_between_train_steps": 0.005231618881225586, "step": 852}
{"info/global_step": 853, "train_info/time_within_train_step": 27.792511463165283, "step": 853}
{"train_info/time_between_train_steps": 0.005077362060546875, "step": 853}
{"info/global_step": 854, "train_info/time_within_train_step": 27.768744468688965, "step": 854}
{"train_info/time_between_train_steps": 0.005534172058105469, "step": 854}
{"info/global_step": 855, "train_info/time_within_train_step": 27.786739587783813, "step": 855}
{"train_info/time_between_train_steps": 0.005227088928222656, "step": 855}
{"info/global_step": 856, "train_info/time_within_train_step": 27.83011269569397, "step": 856}
{"train_info/time_between_train_steps": 0.005056858062744141, "step": 856}
{"info/global_step": 857, "train_info/time_within_train_step": 27.816922187805176, "step": 857}
{"train_info/time_between_train_steps": 0.008924484252929688, "step": 857}
{"info/global_step": 858, "train_info/time_within_train_step": 27.813412189483643, "step": 858}
{"train_info/time_between_train_steps": 0.009894371032714844, "step": 858}
{"info/global_step": 859, "train_info/time_within_train_step": 27.90840435028076, "step": 859}
{"train_info/time_between_train_steps": 0.010251760482788086, "step": 859}
{"info/global_step": 860, "train_info/time_within_train_step": 27.754768133163452, "step": 860}
{"train_info/time_between_train_steps": 0.007320880889892578, "step": 860}
{"info/global_step": 861, "train_info/time_within_train_step": 27.806090593338013, "step": 861}
{"train_info/time_between_train_steps": 0.00507354736328125, "step": 861}
{"info/global_step": 862, "train_info/time_within_train_step": 27.807101011276245, "step": 862}
{"train_info/time_between_train_steps": 0.005254983901977539, "step": 862}
{"info/global_step": 863, "train_info/time_within_train_step": 27.79873538017273, "step": 863}
{"train_info/time_between_train_steps": 0.005144357681274414, "step": 863}
{"info/global_step": 864, "train_info/time_within_train_step": 27.8170428276062, "step": 864}
{"train_info/time_between_train_steps": 0.005220174789428711, "step": 864}
{"info/global_step": 865, "train_info/time_within_train_step": 27.825976610183716, "step": 865}
{"train_info/time_between_train_steps": 0.00523066520690918, "step": 865}
{"info/global_step": 866, "train_info/time_within_train_step": 27.830644369125366, "step": 866}
{"train_info/time_between_train_steps": 0.0051784515380859375, "step": 866}
{"info/global_step": 867, "train_info/time_within_train_step": 27.787928104400635, "step": 867}
{"train_info/time_between_train_steps": 0.0056493282318115234, "step": 867}
{"info/global_step": 868, "train_info/time_within_train_step": 27.81781840324402, "step": 868}
{"train_info/time_between_train_steps": 0.00543665885925293, "step": 868}
{"train_info/time_between_train_steps": 3.92742919921875, "step": 868}
{"info/global_step": 869, "train_info/time_within_train_step": 27.826733350753784, "step": 869}
{"train_info/time_between_train_steps": 0.0052547454833984375, "step": 869}
{"info/global_step": 870, "train_info/time_within_train_step": 27.988781929016113, "step": 870}
{"train_info/time_between_train_steps": 0.0051724910736083984, "step": 870}
{"info/global_step": 871, "train_info/time_within_train_step": 27.82254981994629, "step": 871}
{"train_info/time_between_train_steps": 0.010415315628051758, "step": 871}
{"info/global_step": 872, "train_info/time_within_train_step": 27.946834802627563, "step": 872}
{"train_info/time_between_train_steps": 0.005204916000366211, "step": 872}
{"info/global_step": 873, "train_info/time_within_train_step": 27.791164875030518, "step": 873}
{"train_info/time_between_train_steps": 0.006341457366943359, "step": 873}
{"info/global_step": 874, "train_info/time_within_train_step": 27.96312117576599, "step": 874}
{"train_info/time_between_train_steps": 0.005364179611206055, "step": 874}
{"info/global_step": 875, "train_info/time_within_train_step": 27.929577350616455, "step": 875}
{"train_info/time_between_train_steps": 0.00713801383972168, "step": 875}
{"info/global_step": 876, "train_info/time_within_train_step": 27.87396812438965, "step": 876}
{"train_info/time_between_train_steps": 0.005312442779541016, "step": 876}
{"info/global_step": 877, "train_info/time_within_train_step": 27.840601682662964, "step": 877}
{"train_info/time_between_train_steps": 0.004899263381958008, "step": 877}
{"info/global_step": 878, "train_info/time_within_train_step": 27.778520107269287, "step": 878}
{"train_info/time_between_train_steps": 0.007894515991210938, "step": 878}
{"info/global_step": 879, "train_info/time_within_train_step": 27.797609090805054, "step": 879}
{"train_info/time_between_train_steps": 0.004996061325073242, "step": 879}
{"info/global_step": 880, "train_info/time_within_train_step": 27.822654724121094, "step": 880}
{"train_info/time_between_train_steps": 0.0051727294921875, "step": 880}
{"info/global_step": 881, "train_info/time_within_train_step": 27.79343891143799, "step": 881}
{"train_info/time_between_train_steps": 0.006979227066040039, "step": 881}
{"info/global_step": 882, "train_info/time_within_train_step": 27.79534077644348, "step": 882}
{"train_info/time_between_train_steps": 0.0050504207611083984, "step": 882}
{"info/global_step": 883, "train_info/time_within_train_step": 27.804940223693848, "step": 883}
{"train_info/time_between_train_steps": 0.005146026611328125, "step": 883}
{"info/global_step": 884, "train_info/time_within_train_step": 27.806639194488525, "step": 884}
{"train_info/time_between_train_steps": 0.005029201507568359, "step": 884}
{"info/global_step": 885, "train_info/time_within_train_step": 27.7902615070343, "step": 885}
{"train_info/time_between_train_steps": 0.005139589309692383, "step": 885}
{"info/global_step": 886, "train_info/time_within_train_step": 27.825030088424683, "step": 886}
{"train_info/time_between_train_steps": 0.0072286128997802734, "step": 886}
{"info/global_step": 887, "train_info/time_within_train_step": 27.791860103607178, "step": 887}
{"train_info/time_between_train_steps": 0.005155086517333984, "step": 887}
{"info/global_step": 888, "train_info/time_within_train_step": 27.778164625167847, "step": 888}
{"train_info/time_between_train_steps": 0.005144834518432617, "step": 888}
{"info/global_step": 889, "train_info/time_within_train_step": 27.80255937576294, "step": 889}
{"train_info/time_between_train_steps": 0.005038261413574219, "step": 889}
{"info/global_step": 890, "train_info/time_within_train_step": 27.789037942886353, "step": 890}
{"train_info/time_between_train_steps": 0.005386829376220703, "step": 890}
{"info/global_step": 891, "train_info/time_within_train_step": 27.882071495056152, "step": 891}
{"train_info/time_between_train_steps": 0.005560159683227539, "step": 891}
{"info/global_step": 892, "train_info/time_within_train_step": 27.816217184066772, "step": 892}
{"train_info/time_between_train_steps": 0.005226850509643555, "step": 892}
{"info/global_step": 893, "train_info/time_within_train_step": 27.78996515274048, "step": 893}
{"train_info/time_between_train_steps": 0.005359172821044922, "step": 893}
{"info/global_step": 894, "train_info/time_within_train_step": 27.832528352737427, "step": 894}
{"train_info/time_between_train_steps": 0.005184650421142578, "step": 894}
{"info/global_step": 895, "train_info/time_within_train_step": 27.835477352142334, "step": 895}
{"train_info/time_between_train_steps": 0.005609750747680664, "step": 895}
{"info/global_step": 896, "train_info/time_within_train_step": 27.839439392089844, "step": 896}
{"train_info/time_between_train_steps": 0.005732059478759766, "step": 896}
{"train_info/time_between_train_steps": 3.5666065216064453, "step": 896}
{"info/global_step": 897, "train_info/time_within_train_step": 28.03475308418274, "step": 897}
{"train_info/time_between_train_steps": 0.005509138107299805, "step": 897}
{"info/global_step": 898, "train_info/time_within_train_step": 27.941555976867676, "step": 898}
{"train_info/time_between_train_steps": 0.0065114498138427734, "step": 898}
{"info/global_step": 899, "train_info/time_within_train_step": 27.788424015045166, "step": 899}
{"train_info/time_between_train_steps": 0.005125284194946289, "step": 899}
{"info/global_step": 900, "train_info/time_within_train_step": 28.024222373962402, "step": 900}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740847198, "_runtime": 25303}, "step": 900}
{"logs": {"train/loss": 3.1985, "train/learning_rate": 0.00016666666666666666, "train/epoch": 32.0, "_timestamp": 1740847198, "_runtime": 25303}, "step": 900}
{"train_info/time_between_train_steps": 13.488787412643433, "step": 900}
{"info/global_step": 901, "train_info/time_within_train_step": 27.80029821395874, "step": 901}
{"train_info/time_between_train_steps": 0.005253791809082031, "step": 901}
{"info/global_step": 902, "train_info/time_within_train_step": 27.958417654037476, "step": 902}
{"train_info/time_between_train_steps": 0.010503530502319336, "step": 902}
{"info/global_step": 903, "train_info/time_within_train_step": 27.813990592956543, "step": 903}
{"train_info/time_between_train_steps": 0.005425214767456055, "step": 903}
{"info/global_step": 904, "train_info/time_within_train_step": 27.879138469696045, "step": 904}
{"train_info/time_between_train_steps": 0.005883693695068359, "step": 904}
{"info/global_step": 905, "train_info/time_within_train_step": 27.83625626564026, "step": 905}
{"train_info/time_between_train_steps": 0.005300045013427734, "step": 905}
{"info/global_step": 906, "train_info/time_within_train_step": 27.884889841079712, "step": 906}
{"train_info/time_between_train_steps": 0.006067991256713867, "step": 906}
{"info/global_step": 907, "train_info/time_within_train_step": 27.800758123397827, "step": 907}
{"train_info/time_between_train_steps": 0.005175352096557617, "step": 907}
{"info/global_step": 908, "train_info/time_within_train_step": 27.803606510162354, "step": 908}
{"train_info/time_between_train_steps": 0.005335807800292969, "step": 908}
{"info/global_step": 909, "train_info/time_within_train_step": 27.742476224899292, "step": 909}
{"train_info/time_between_train_steps": 0.005254268646240234, "step": 909}
{"info/global_step": 910, "train_info/time_within_train_step": 27.773006677627563, "step": 910}
{"train_info/time_between_train_steps": 0.005244731903076172, "step": 910}
{"info/global_step": 911, "train_info/time_within_train_step": 27.79761576652527, "step": 911}
{"train_info/time_between_train_steps": 0.005316257476806641, "step": 911}
{"info/global_step": 912, "train_info/time_within_train_step": 27.737325191497803, "step": 912}
{"train_info/time_between_train_steps": 0.005421638488769531, "step": 912}
{"info/global_step": 913, "train_info/time_within_train_step": 27.796973705291748, "step": 913}
{"train_info/time_between_train_steps": 0.0052947998046875, "step": 913}
{"info/global_step": 914, "train_info/time_within_train_step": 27.8092303276062, "step": 914}
{"train_info/time_between_train_steps": 0.005370378494262695, "step": 914}
{"info/global_step": 915, "train_info/time_within_train_step": 27.78830337524414, "step": 915}
{"train_info/time_between_train_steps": 0.005377769470214844, "step": 915}
{"info/global_step": 916, "train_info/time_within_train_step": 27.821372270584106, "step": 916}
{"train_info/time_between_train_steps": 0.006257534027099609, "step": 916}
{"info/global_step": 917, "train_info/time_within_train_step": 27.802674770355225, "step": 917}
{"train_info/time_between_train_steps": 0.00865793228149414, "step": 917}
{"info/global_step": 918, "train_info/time_within_train_step": 27.796701192855835, "step": 918}
{"train_info/time_between_train_steps": 0.005183696746826172, "step": 918}
{"info/global_step": 919, "train_info/time_within_train_step": 27.799126148223877, "step": 919}
{"train_info/time_between_train_steps": 0.005396604537963867, "step": 919}
{"info/global_step": 920, "train_info/time_within_train_step": 27.801652193069458, "step": 920}
{"train_info/time_between_train_steps": 0.005214214324951172, "step": 920}
{"info/global_step": 921, "train_info/time_within_train_step": 27.808385610580444, "step": 921}
{"train_info/time_between_train_steps": 0.011578559875488281, "step": 921}
{"info/global_step": 922, "train_info/time_within_train_step": 27.897895336151123, "step": 922}
{"train_info/time_between_train_steps": 0.007706880569458008, "step": 922}
{"info/global_step": 923, "train_info/time_within_train_step": 27.83286738395691, "step": 923}
{"train_info/time_between_train_steps": 0.00549769401550293, "step": 923}
{"info/global_step": 924, "train_info/time_within_train_step": 27.85170006752014, "step": 924}
{"train_info/time_between_train_steps": 0.005771160125732422, "step": 924}
{"train_info/time_between_train_steps": 3.5394625663757324, "step": 924}
{"info/global_step": 925, "train_info/time_within_train_step": 27.77313756942749, "step": 925}
{"train_info/time_between_train_steps": 0.005038738250732422, "step": 925}
{"info/global_step": 926, "train_info/time_within_train_step": 27.963019609451294, "step": 926}
{"train_info/time_between_train_steps": 0.010211944580078125, "step": 926}
{"info/global_step": 927, "train_info/time_within_train_step": 27.785832405090332, "step": 927}
{"train_info/time_between_train_steps": 0.005201578140258789, "step": 927}
{"info/global_step": 928, "train_info/time_within_train_step": 27.913321256637573, "step": 928}
{"train_info/time_between_train_steps": 0.005307197570800781, "step": 928}
{"info/global_step": 929, "train_info/time_within_train_step": 27.82679510116577, "step": 929}
{"train_info/time_between_train_steps": 0.005667448043823242, "step": 929}
{"info/global_step": 930, "train_info/time_within_train_step": 27.88853168487549, "step": 930}
{"train_info/time_between_train_steps": 0.007101774215698242, "step": 930}
{"info/global_step": 931, "train_info/time_within_train_step": 27.76750349998474, "step": 931}
{"train_info/time_between_train_steps": 0.0055463314056396484, "step": 931}
{"info/global_step": 932, "train_info/time_within_train_step": 27.91986918449402, "step": 932}
{"train_info/time_between_train_steps": 0.005347013473510742, "step": 932}
{"info/global_step": 933, "train_info/time_within_train_step": 27.81987953186035, "step": 933}
{"train_info/time_between_train_steps": 0.005129098892211914, "step": 933}
{"info/global_step": 934, "train_info/time_within_train_step": 27.783358097076416, "step": 934}
{"train_info/time_between_train_steps": 0.005364894866943359, "step": 934}
{"info/global_step": 935, "train_info/time_within_train_step": 27.789673805236816, "step": 935}
{"train_info/time_between_train_steps": 0.0050809383392333984, "step": 935}
{"info/global_step": 936, "train_info/time_within_train_step": 27.812650203704834, "step": 936}
{"train_info/time_between_train_steps": 0.005281925201416016, "step": 936}
{"info/global_step": 937, "train_info/time_within_train_step": 27.88978362083435, "step": 937}
{"train_info/time_between_train_steps": 0.005113124847412109, "step": 937}
{"info/global_step": 938, "train_info/time_within_train_step": 27.791118621826172, "step": 938}
{"train_info/time_between_train_steps": 0.008219718933105469, "step": 938}
{"info/global_step": 939, "train_info/time_within_train_step": 27.776747941970825, "step": 939}
{"train_info/time_between_train_steps": 0.005171060562133789, "step": 939}
{"info/global_step": 940, "train_info/time_within_train_step": 27.755221843719482, "step": 940}
{"train_info/time_between_train_steps": 0.008355855941772461, "step": 940}
{"info/global_step": 941, "train_info/time_within_train_step": 27.773802995681763, "step": 941}
{"train_info/time_between_train_steps": 0.0054399967193603516, "step": 941}
{"info/global_step": 942, "train_info/time_within_train_step": 27.783995151519775, "step": 942}
{"train_info/time_between_train_steps": 0.005008697509765625, "step": 942}
{"info/global_step": 943, "train_info/time_within_train_step": 27.79673480987549, "step": 943}
{"train_info/time_between_train_steps": 0.005257844924926758, "step": 943}
{"info/global_step": 944, "train_info/time_within_train_step": 27.77338671684265, "step": 944}
{"train_info/time_between_train_steps": 0.005239725112915039, "step": 944}
{"info/global_step": 945, "train_info/time_within_train_step": 27.785480976104736, "step": 945}
{"train_info/time_between_train_steps": 0.005159854888916016, "step": 945}
{"info/global_step": 946, "train_info/time_within_train_step": 27.77534008026123, "step": 946}
{"train_info/time_between_train_steps": 0.005264759063720703, "step": 946}
{"info/global_step": 947, "train_info/time_within_train_step": 27.818764686584473, "step": 947}
{"train_info/time_between_train_steps": 0.005230903625488281, "step": 947}
{"info/global_step": 948, "train_info/time_within_train_step": 27.77895736694336, "step": 948}
{"train_info/time_between_train_steps": 0.007662773132324219, "step": 948}
{"info/global_step": 949, "train_info/time_within_train_step": 27.799118757247925, "step": 949}
{"train_info/time_between_train_steps": 0.007194995880126953, "step": 949}
{"info/global_step": 950, "train_info/time_within_train_step": 27.816554307937622, "step": 950}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740848606, "_runtime": 26711}, "step": 950}
{"logs": {"train/loss": 3.1481, "train/learning_rate": 0.0001388888888888889, "train/epoch": 33.02, "_timestamp": 1740848606, "_runtime": 26711}, "step": 950}
{"train_info/time_between_train_steps": 0.008621454238891602, "step": 950}
{"info/global_step": 951, "train_info/time_within_train_step": 27.85353708267212, "step": 951}
{"train_info/time_between_train_steps": 0.005742788314819336, "step": 951}
{"info/global_step": 952, "train_info/time_within_train_step": 27.82388973236084, "step": 952}
{"train_info/time_between_train_steps": 0.00561833381652832, "step": 952}
{"train_info/time_between_train_steps": 3.7892978191375732, "step": 952}
{"info/global_step": 953, "train_info/time_within_train_step": 27.923347234725952, "step": 953}
{"train_info/time_between_train_steps": 0.005591392517089844, "step": 953}
{"info/global_step": 954, "train_info/time_within_train_step": 27.990670680999756, "step": 954}
{"train_info/time_between_train_steps": 0.0052683353424072266, "step": 954}
{"info/global_step": 955, "train_info/time_within_train_step": 27.81978988647461, "step": 955}
{"train_info/time_between_train_steps": 0.005274534225463867, "step": 955}
{"info/global_step": 956, "train_info/time_within_train_step": 27.974513053894043, "step": 956}
{"train_info/time_between_train_steps": 0.005433797836303711, "step": 956}
{"info/global_step": 957, "train_info/time_within_train_step": 27.832216024398804, "step": 957}
{"train_info/time_between_train_steps": 0.005328655242919922, "step": 957}
{"info/global_step": 958, "train_info/time_within_train_step": 27.958030939102173, "step": 958}
{"train_info/time_between_train_steps": 0.0054073333740234375, "step": 958}
{"info/global_step": 959, "train_info/time_within_train_step": 27.805023431777954, "step": 959}
{"train_info/time_between_train_steps": 0.00768589973449707, "step": 959}
{"info/global_step": 960, "train_info/time_within_train_step": 27.88135266304016, "step": 960}
{"train_info/time_between_train_steps": 0.005156517028808594, "step": 960}
{"info/global_step": 961, "train_info/time_within_train_step": 27.78261685371399, "step": 961}
{"train_info/time_between_train_steps": 0.005141735076904297, "step": 961}
{"info/global_step": 962, "train_info/time_within_train_step": 27.78256320953369, "step": 962}
{"train_info/time_between_train_steps": 0.005103349685668945, "step": 962}
{"info/global_step": 963, "train_info/time_within_train_step": 27.76496171951294, "step": 963}
{"train_info/time_between_train_steps": 0.005020618438720703, "step": 963}
{"info/global_step": 964, "train_info/time_within_train_step": 27.835005283355713, "step": 964}
{"train_info/time_between_train_steps": 0.007820844650268555, "step": 964}
{"info/global_step": 965, "train_info/time_within_train_step": 27.80876851081848, "step": 965}
{"train_info/time_between_train_steps": 0.005089759826660156, "step": 965}
{"info/global_step": 966, "train_info/time_within_train_step": 27.771737337112427, "step": 966}
{"train_info/time_between_train_steps": 0.007665872573852539, "step": 966}
{"info/global_step": 967, "train_info/time_within_train_step": 27.767638683319092, "step": 967}
{"train_info/time_between_train_steps": 0.005036354064941406, "step": 967}
{"info/global_step": 968, "train_info/time_within_train_step": 27.80823540687561, "step": 968}
{"train_info/time_between_train_steps": 0.009910106658935547, "step": 968}
{"info/global_step": 969, "train_info/time_within_train_step": 27.888181447982788, "step": 969}
{"train_info/time_between_train_steps": 0.007254600524902344, "step": 969}
{"info/global_step": 970, "train_info/time_within_train_step": 27.772504091262817, "step": 970}
{"train_info/time_between_train_steps": 0.005984783172607422, "step": 970}
{"info/global_step": 971, "train_info/time_within_train_step": 27.78868055343628, "step": 971}
{"train_info/time_between_train_steps": 0.005319356918334961, "step": 971}
{"info/global_step": 972, "train_info/time_within_train_step": 27.812945127487183, "step": 972}
{"train_info/time_between_train_steps": 0.010073184967041016, "step": 972}
{"info/global_step": 973, "train_info/time_within_train_step": 27.7794668674469, "step": 973}
{"train_info/time_between_train_steps": 0.005313873291015625, "step": 973}
{"info/global_step": 974, "train_info/time_within_train_step": 27.83791708946228, "step": 974}
{"train_info/time_between_train_steps": 0.005103111267089844, "step": 974}
{"info/global_step": 975, "train_info/time_within_train_step": 27.797060251235962, "step": 975}
{"train_info/time_between_train_steps": 0.005099058151245117, "step": 975}
{"info/global_step": 976, "train_info/time_within_train_step": 27.815797090530396, "step": 976}
{"train_info/time_between_train_steps": 0.005207538604736328, "step": 976}
{"info/global_step": 977, "train_info/time_within_train_step": 27.791017293930054, "step": 977}
{"train_info/time_between_train_steps": 0.00523829460144043, "step": 977}
{"info/global_step": 978, "train_info/time_within_train_step": 27.822373151779175, "step": 978}
{"train_info/time_between_train_steps": 0.0054242610931396484, "step": 978}
{"info/global_step": 979, "train_info/time_within_train_step": 27.812434673309326, "step": 979}
{"train_info/time_between_train_steps": 0.005525112152099609, "step": 979}
{"info/global_step": 980, "train_info/time_within_train_step": 27.95112133026123, "step": 980}
{"train_info/time_between_train_steps": 0.005766630172729492, "step": 980}
{"train_info/time_between_train_steps": 3.8412868976593018, "step": 980}
{"info/global_step": 981, "train_info/time_within_train_step": 27.82179093360901, "step": 981}
{"train_info/time_between_train_steps": 0.005106687545776367, "step": 981}
{"info/global_step": 982, "train_info/time_within_train_step": 27.879409074783325, "step": 982}
{"train_info/time_between_train_steps": 0.009994268417358398, "step": 982}
{"info/global_step": 983, "train_info/time_within_train_step": 27.78145933151245, "step": 983}
{"train_info/time_between_train_steps": 0.0051479339599609375, "step": 983}
{"info/global_step": 984, "train_info/time_within_train_step": 28.03062677383423, "step": 984}
{"train_info/time_between_train_steps": 0.005342960357666016, "step": 984}
{"info/global_step": 985, "train_info/time_within_train_step": 27.81710982322693, "step": 985}
{"train_info/time_between_train_steps": 0.005228996276855469, "step": 985}
{"info/global_step": 986, "train_info/time_within_train_step": 27.975682497024536, "step": 986}
{"train_info/time_between_train_steps": 0.00795888900756836, "step": 986}
{"info/global_step": 987, "train_info/time_within_train_step": 27.84501028060913, "step": 987}
{"train_info/time_between_train_steps": 0.005124807357788086, "step": 987}
{"info/global_step": 988, "train_info/time_within_train_step": 27.875107526779175, "step": 988}
{"train_info/time_between_train_steps": 0.00809931755065918, "step": 988}
{"info/global_step": 989, "train_info/time_within_train_step": 27.825499057769775, "step": 989}
{"train_info/time_between_train_steps": 0.005212068557739258, "step": 989}
{"info/global_step": 990, "train_info/time_within_train_step": 27.789788722991943, "step": 990}
{"train_info/time_between_train_steps": 0.009276151657104492, "step": 990}
{"info/global_step": 991, "train_info/time_within_train_step": 27.818296909332275, "step": 991}
{"train_info/time_between_train_steps": 0.009976863861083984, "step": 991}
{"info/global_step": 992, "train_info/time_within_train_step": 27.7970712184906, "step": 992}
{"train_info/time_between_train_steps": 0.005123138427734375, "step": 992}
{"info/global_step": 993, "train_info/time_within_train_step": 27.76610565185547, "step": 993}
{"train_info/time_between_train_steps": 0.008022785186767578, "step": 993}
{"info/global_step": 994, "train_info/time_within_train_step": 27.81228756904602, "step": 994}
{"train_info/time_between_train_steps": 0.005157470703125, "step": 994}
{"info/global_step": 995, "train_info/time_within_train_step": 27.931204319000244, "step": 995}
{"train_info/time_between_train_steps": 0.006086587905883789, "step": 995}
{"info/global_step": 996, "train_info/time_within_train_step": 27.80522608757019, "step": 996}
{"train_info/time_between_train_steps": 0.005204916000366211, "step": 996}
{"info/global_step": 997, "train_info/time_within_train_step": 27.801093101501465, "step": 997}
{"train_info/time_between_train_steps": 0.005127429962158203, "step": 997}
{"info/global_step": 998, "train_info/time_within_train_step": 27.80565357208252, "step": 998}
{"train_info/time_between_train_steps": 0.006573677062988281, "step": 998}
{"info/global_step": 999, "train_info/time_within_train_step": 27.82584238052368, "step": 999}
{"train_info/time_between_train_steps": 0.005001068115234375, "step": 999}
{"info/global_step": 1000, "train_info/time_within_train_step": 27.902139902114868, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740850006, "_runtime": 28111}, "step": 1000}
{"logs": {"train/loss": 3.1052, "train/learning_rate": 0.00011111111111111109, "train/epoch": 35.02, "_timestamp": 1740850006, "_runtime": 28111}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740850010, "_runtime": 28115}, "step": 1000}
{"logs": {"eval/loss": 4.192286014556885, "eval/runtime": 4.0507, "eval/samples_per_second": 50.362, "eval/steps_per_second": 3.209, "train/epoch": 35.02, "_timestamp": 1740850010, "_runtime": 28115}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740850010, "_runtime": 28115}, "step": 1000}
{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.192286014556885, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 66.173892666178, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 4.0507, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 50.362, "train/epoch": 35.02, "_timestamp": 1740850010, "_runtime": 28115}, "step": 1000}
{"train_info/time_between_train_steps": 17.62525510787964, "step": 1000}
{"info/global_step": 1001, "train_info/time_within_train_step": 27.79902982711792, "step": 1001}
{"train_info/time_between_train_steps": 0.005092144012451172, "step": 1001}
{"info/global_step": 1002, "train_info/time_within_train_step": 27.778061628341675, "step": 1002}
{"train_info/time_between_train_steps": 0.0048427581787109375, "step": 1002}
{"info/global_step": 1003, "train_info/time_within_train_step": 27.803203344345093, "step": 1003}
{"train_info/time_between_train_steps": 0.0051958560943603516, "step": 1003}
{"info/global_step": 1004, "train_info/time_within_train_step": 27.8296480178833, "step": 1004}
{"train_info/time_between_train_steps": 0.005156278610229492, "step": 1004}
{"info/global_step": 1005, "train_info/time_within_train_step": 27.824047088623047, "step": 1005}
{"train_info/time_between_train_steps": 0.0053255558013916016, "step": 1005}
{"info/global_step": 1006, "train_info/time_within_train_step": 27.81929922103882, "step": 1006}
{"train_info/time_between_train_steps": 0.0052645206451416016, "step": 1006}
{"info/global_step": 1007, "train_info/time_within_train_step": 27.79573369026184, "step": 1007}
{"train_info/time_between_train_steps": 0.0055010318756103516, "step": 1007}
{"info/global_step": 1008, "train_info/time_within_train_step": 27.87290048599243, "step": 1008}
{"train_info/time_between_train_steps": 0.007962703704833984, "step": 1008}
{"train_info/time_between_train_steps": 3.4945106506347656, "step": 1008}
{"info/global_step": 1009, "train_info/time_within_train_step": 27.805139780044556, "step": 1009}
{"train_info/time_between_train_steps": 0.0049822330474853516, "step": 1009}
{"info/global_step": 1010, "train_info/time_within_train_step": 27.951339721679688, "step": 1010}
{"train_info/time_between_train_steps": 0.008006572723388672, "step": 1010}
{"info/global_step": 1011, "train_info/time_within_train_step": 27.832637548446655, "step": 1011}
{"train_info/time_between_train_steps": 0.005393028259277344, "step": 1011}
{"info/global_step": 1012, "train_info/time_within_train_step": 27.99678897857666, "step": 1012}
{"train_info/time_between_train_steps": 0.0052950382232666016, "step": 1012}
{"info/global_step": 1013, "train_info/time_within_train_step": 27.82842993736267, "step": 1013}
{"train_info/time_between_train_steps": 0.0056285858154296875, "step": 1013}
{"info/global_step": 1014, "train_info/time_within_train_step": 27.960533142089844, "step": 1014}
{"train_info/time_between_train_steps": 0.006482362747192383, "step": 1014}
{"info/global_step": 1015, "train_info/time_within_train_step": 27.822892665863037, "step": 1015}
{"train_info/time_between_train_steps": 0.010093450546264648, "step": 1015}
{"info/global_step": 1016, "train_info/time_within_train_step": 28.001711130142212, "step": 1016}
{"train_info/time_between_train_steps": 0.00545191764831543, "step": 1016}
{"info/global_step": 1017, "train_info/time_within_train_step": 27.768479824066162, "step": 1017}
{"train_info/time_between_train_steps": 0.005064725875854492, "step": 1017}
{"info/global_step": 1018, "train_info/time_within_train_step": 27.786784410476685, "step": 1018}
{"train_info/time_between_train_steps": 0.0051043033599853516, "step": 1018}
{"info/global_step": 1019, "train_info/time_within_train_step": 27.81742763519287, "step": 1019}
{"train_info/time_between_train_steps": 0.005181074142456055, "step": 1019}
{"info/global_step": 1020, "train_info/time_within_train_step": 27.80805468559265, "step": 1020}
{"train_info/time_between_train_steps": 0.009898662567138672, "step": 1020}
{"info/global_step": 1021, "train_info/time_within_train_step": 27.783999919891357, "step": 1021}
{"train_info/time_between_train_steps": 0.0052642822265625, "step": 1021}
{"info/global_step": 1022, "train_info/time_within_train_step": 27.80102038383484, "step": 1022}
{"train_info/time_between_train_steps": 0.00575566291809082, "step": 1022}
{"info/global_step": 1023, "train_info/time_within_train_step": 27.741875648498535, "step": 1023}
{"train_info/time_between_train_steps": 0.0054013729095458984, "step": 1023}
{"info/global_step": 1024, "train_info/time_within_train_step": 27.757972955703735, "step": 1024}
{"train_info/time_between_train_steps": 0.0052394866943359375, "step": 1024}
{"info/global_step": 1025, "train_info/time_within_train_step": 27.79252290725708, "step": 1025}
{"train_info/time_between_train_steps": 0.0052051544189453125, "step": 1025}
{"info/global_step": 1026, "train_info/time_within_train_step": 27.784467458724976, "step": 1026}
{"train_info/time_between_train_steps": 0.005227565765380859, "step": 1026}
{"info/global_step": 1027, "train_info/time_within_train_step": 27.794239282608032, "step": 1027}
{"train_info/time_between_train_steps": 0.009796142578125, "step": 1027}
{"info/global_step": 1028, "train_info/time_within_train_step": 27.79904270172119, "step": 1028}
{"train_info/time_between_train_steps": 0.007761240005493164, "step": 1028}
{"info/global_step": 1029, "train_info/time_within_train_step": 27.806519269943237, "step": 1029}
{"train_info/time_between_train_steps": 0.005164146423339844, "step": 1029}
{"info/global_step": 1030, "train_info/time_within_train_step": 27.79438090324402, "step": 1030}
{"train_info/time_between_train_steps": 0.005097866058349609, "step": 1030}
{"info/global_step": 1031, "train_info/time_within_train_step": 27.900270223617554, "step": 1031}
{"train_info/time_between_train_steps": 0.007833242416381836, "step": 1031}
{"info/global_step": 1032, "train_info/time_within_train_step": 27.799601316452026, "step": 1032}
{"train_info/time_between_train_steps": 0.00540471076965332, "step": 1032}
{"info/global_step": 1033, "train_info/time_within_train_step": 27.81529998779297, "step": 1033}
{"train_info/time_between_train_steps": 0.005276918411254883, "step": 1033}
{"info/global_step": 1034, "train_info/time_within_train_step": 27.79812979698181, "step": 1034}
{"train_info/time_between_train_steps": 0.005212306976318359, "step": 1034}
{"info/global_step": 1035, "train_info/time_within_train_step": 27.856907606124878, "step": 1035}
{"train_info/time_between_train_steps": 0.005673408508300781, "step": 1035}
{"info/global_step": 1036, "train_info/time_within_train_step": 27.85163116455078, "step": 1036}
{"train_info/time_between_train_steps": 0.005742311477661133, "step": 1036}
{"train_info/time_between_train_steps": 3.72320818901062, "step": 1036}
{"info/global_step": 1037, "train_info/time_within_train_step": 27.77842402458191, "step": 1037}
{"train_info/time_between_train_steps": 0.0053119659423828125, "step": 1037}
{"info/global_step": 1038, "train_info/time_within_train_step": 27.944751024246216, "step": 1038}
{"train_info/time_between_train_steps": 0.005292415618896484, "step": 1038}
{"info/global_step": 1039, "train_info/time_within_train_step": 27.79897427558899, "step": 1039}
{"train_info/time_between_train_steps": 0.0070230960845947266, "step": 1039}
{"info/global_step": 1040, "train_info/time_within_train_step": 27.93561029434204, "step": 1040}
{"train_info/time_between_train_steps": 0.005303144454956055, "step": 1040}
{"info/global_step": 1041, "train_info/time_within_train_step": 27.844220638275146, "step": 1041}
{"train_info/time_between_train_steps": 0.005441904067993164, "step": 1041}
{"info/global_step": 1042, "train_info/time_within_train_step": 27.9650776386261, "step": 1042}
{"train_info/time_between_train_steps": 0.00997161865234375, "step": 1042}
{"info/global_step": 1043, "train_info/time_within_train_step": 27.84111213684082, "step": 1043}
{"train_info/time_between_train_steps": 0.008271932601928711, "step": 1043}
{"info/global_step": 1044, "train_info/time_within_train_step": 27.890879154205322, "step": 1044}
{"train_info/time_between_train_steps": 0.005179166793823242, "step": 1044}
{"info/global_step": 1045, "train_info/time_within_train_step": 27.860912084579468, "step": 1045}
{"train_info/time_between_train_steps": 0.00498652458190918, "step": 1045}
{"info/global_step": 1046, "train_info/time_within_train_step": 27.77652072906494, "step": 1046}
{"train_info/time_between_train_steps": 0.005089282989501953, "step": 1046}
{"info/global_step": 1047, "train_info/time_within_train_step": 27.880277395248413, "step": 1047}
{"train_info/time_between_train_steps": 0.005125761032104492, "step": 1047}
{"info/global_step": 1048, "train_info/time_within_train_step": 27.80481719970703, "step": 1048}
{"train_info/time_between_train_steps": 0.0051801204681396484, "step": 1048}
{"info/global_step": 1049, "train_info/time_within_train_step": 27.81621265411377, "step": 1049}
{"train_info/time_between_train_steps": 0.008748054504394531, "step": 1049}
{"info/global_step": 1050, "train_info/time_within_train_step": 27.813483953475952, "step": 1050}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740851423, "_runtime": 29528}, "step": 1050}
{"logs": {"train/loss": 3.0653, "train/learning_rate": 8.333333333333333e-05, "train/epoch": 37.01, "_timestamp": 1740851423, "_runtime": 29528}, "step": 1050}
{"train_info/time_between_train_steps": 0.009258747100830078, "step": 1050}
{"info/global_step": 1051, "train_info/time_within_train_step": 27.80109405517578, "step": 1051}
{"train_info/time_between_train_steps": 0.005189418792724609, "step": 1051}
{"info/global_step": 1052, "train_info/time_within_train_step": 27.80058264732361, "step": 1052}
{"train_info/time_between_train_steps": 0.0050313472747802734, "step": 1052}
{"info/global_step": 1053, "train_info/time_within_train_step": 27.808229207992554, "step": 1053}
{"train_info/time_between_train_steps": 0.008627891540527344, "step": 1053}
{"info/global_step": 1054, "train_info/time_within_train_step": 27.794918060302734, "step": 1054}
{"train_info/time_between_train_steps": 0.005314826965332031, "step": 1054}
{"info/global_step": 1055, "train_info/time_within_train_step": 27.8187153339386, "step": 1055}
{"train_info/time_between_train_steps": 0.00803828239440918, "step": 1055}
{"info/global_step": 1056, "train_info/time_within_train_step": 27.8390474319458, "step": 1056}
{"train_info/time_between_train_steps": 0.00982213020324707, "step": 1056}
{"info/global_step": 1057, "train_info/time_within_train_step": 27.782208919525146, "step": 1057}
{"train_info/time_between_train_steps": 0.009766578674316406, "step": 1057}
{"info/global_step": 1058, "train_info/time_within_train_step": 27.82338833808899, "step": 1058}
{"train_info/time_between_train_steps": 0.010067224502563477, "step": 1058}
{"info/global_step": 1059, "train_info/time_within_train_step": 27.819578886032104, "step": 1059}
{"train_info/time_between_train_steps": 0.0051004886627197266, "step": 1059}
{"info/global_step": 1060, "train_info/time_within_train_step": 27.81588339805603, "step": 1060}
{"train_info/time_between_train_steps": 0.005317211151123047, "step": 1060}
{"info/global_step": 1061, "train_info/time_within_train_step": 27.847298860549927, "step": 1061}
{"train_info/time_between_train_steps": 0.009914398193359375, "step": 1061}
{"info/global_step": 1062, "train_info/time_within_train_step": 27.927939414978027, "step": 1062}
{"train_info/time_between_train_steps": 0.00528407096862793, "step": 1062}
{"info/global_step": 1063, "train_info/time_within_train_step": 27.838690996170044, "step": 1063}
{"train_info/time_between_train_steps": 0.00556182861328125, "step": 1063}
{"info/global_step": 1064, "train_info/time_within_train_step": 27.872633457183838, "step": 1064}
{"train_info/time_between_train_steps": 0.006244659423828125, "step": 1064}
{"train_info/time_between_train_steps": 3.8721182346343994, "step": 1064}
{"info/global_step": 1065, "train_info/time_within_train_step": 27.810487508773804, "step": 1065}
{"train_info/time_between_train_steps": 0.005637645721435547, "step": 1065}
{"info/global_step": 1066, "train_info/time_within_train_step": 28.034790515899658, "step": 1066}
{"train_info/time_between_train_steps": 0.0055539608001708984, "step": 1066}
{"info/global_step": 1067, "train_info/time_within_train_step": 27.846205234527588, "step": 1067}
{"train_info/time_between_train_steps": 0.005630016326904297, "step": 1067}
{"info/global_step": 1068, "train_info/time_within_train_step": 28.007869482040405, "step": 1068}
{"train_info/time_between_train_steps": 0.005454063415527344, "step": 1068}
{"info/global_step": 1069, "train_info/time_within_train_step": 27.830490589141846, "step": 1069}
{"train_info/time_between_train_steps": 0.008845090866088867, "step": 1069}
{"info/global_step": 1070, "train_info/time_within_train_step": 27.98770546913147, "step": 1070}
{"train_info/time_between_train_steps": 0.007795810699462891, "step": 1070}
{"info/global_step": 1071, "train_info/time_within_train_step": 27.827953577041626, "step": 1071}
{"train_info/time_between_train_steps": 0.009459972381591797, "step": 1071}
{"info/global_step": 1072, "train_info/time_within_train_step": 27.954997062683105, "step": 1072}
{"train_info/time_between_train_steps": 0.0056018829345703125, "step": 1072}
{"info/global_step": 1073, "train_info/time_within_train_step": 27.838211059570312, "step": 1073}
{"train_info/time_between_train_steps": 0.00690007209777832, "step": 1073}
{"info/global_step": 1074, "train_info/time_within_train_step": 27.76661705970764, "step": 1074}
{"train_info/time_between_train_steps": 0.009442806243896484, "step": 1074}
{"info/global_step": 1075, "train_info/time_within_train_step": 27.7876558303833, "step": 1075}
{"train_info/time_between_train_steps": 0.005827426910400391, "step": 1075}
{"info/global_step": 1076, "train_info/time_within_train_step": 27.779203414916992, "step": 1076}
{"train_info/time_between_train_steps": 0.00529789924621582, "step": 1076}
{"info/global_step": 1077, "train_info/time_within_train_step": 27.802456378936768, "step": 1077}
{"train_info/time_between_train_steps": 0.005429983139038086, "step": 1077}
{"info/global_step": 1078, "train_info/time_within_train_step": 27.933249950408936, "step": 1078}
{"train_info/time_between_train_steps": 0.0054168701171875, "step": 1078}
{"info/global_step": 1079, "train_info/time_within_train_step": 27.775091409683228, "step": 1079}
{"train_info/time_between_train_steps": 0.0051763057708740234, "step": 1079}
{"info/global_step": 1080, "train_info/time_within_train_step": 27.859294652938843, "step": 1080}
{"train_info/time_between_train_steps": 0.005239009857177734, "step": 1080}
{"info/global_step": 1081, "train_info/time_within_train_step": 27.83651566505432, "step": 1081}
{"train_info/time_between_train_steps": 0.00497889518737793, "step": 1081}
{"info/global_step": 1082, "train_info/time_within_train_step": 27.795670747756958, "step": 1082}
{"train_info/time_between_train_steps": 0.005182027816772461, "step": 1082}
{"info/global_step": 1083, "train_info/time_within_train_step": 27.785676956176758, "step": 1083}
{"train_info/time_between_train_steps": 0.0050716400146484375, "step": 1083}
{"info/global_step": 1084, "train_info/time_within_train_step": 28.11453628540039, "step": 1084}
{"train_info/time_between_train_steps": 0.005275249481201172, "step": 1084}
{"info/global_step": 1085, "train_info/time_within_train_step": 27.80505132675171, "step": 1085}
{"train_info/time_between_train_steps": 0.005112886428833008, "step": 1085}
{"info/global_step": 1086, "train_info/time_within_train_step": 27.844565629959106, "step": 1086}
{"train_info/time_between_train_steps": 0.010042428970336914, "step": 1086}
{"info/global_step": 1087, "train_info/time_within_train_step": 27.758373737335205, "step": 1087}
{"train_info/time_between_train_steps": 0.005144834518432617, "step": 1087}
{"info/global_step": 1088, "train_info/time_within_train_step": 27.8255832195282, "step": 1088}
{"train_info/time_between_train_steps": 0.00535893440246582, "step": 1088}
{"info/global_step": 1089, "train_info/time_within_train_step": 27.823697566986084, "step": 1089}
{"train_info/time_between_train_steps": 0.005223512649536133, "step": 1089}
{"info/global_step": 1090, "train_info/time_within_train_step": 27.824263095855713, "step": 1090}
{"train_info/time_between_train_steps": 0.005315303802490234, "step": 1090}
{"info/global_step": 1091, "train_info/time_within_train_step": 27.78979516029358, "step": 1091}
{"train_info/time_between_train_steps": 0.005524158477783203, "step": 1091}
{"info/global_step": 1092, "train_info/time_within_train_step": 27.786406993865967, "step": 1092}
{"train_info/time_between_train_steps": 0.005567312240600586, "step": 1092}
{"train_info/time_between_train_steps": 3.4654877185821533, "step": 1092}
{"info/global_step": 1093, "train_info/time_within_train_step": 27.784501314163208, "step": 1093}
{"train_info/time_between_train_steps": 0.005496978759765625, "step": 1093}
{"info/global_step": 1094, "train_info/time_within_train_step": 28.00702404975891, "step": 1094}
{"train_info/time_between_train_steps": 0.005539894104003906, "step": 1094}
{"info/global_step": 1095, "train_info/time_within_train_step": 27.800817251205444, "step": 1095}
{"train_info/time_between_train_steps": 0.007026195526123047, "step": 1095}
{"info/global_step": 1096, "train_info/time_within_train_step": 27.891108512878418, "step": 1096}
{"train_info/time_between_train_steps": 0.005974769592285156, "step": 1096}
{"info/global_step": 1097, "train_info/time_within_train_step": 27.807618379592896, "step": 1097}
{"train_info/time_between_train_steps": 0.0055124759674072266, "step": 1097}
{"info/global_step": 1098, "train_info/time_within_train_step": 27.880183935165405, "step": 1098}
{"train_info/time_between_train_steps": 0.005313396453857422, "step": 1098}
{"info/global_step": 1099, "train_info/time_within_train_step": 27.8280668258667, "step": 1099}
{"train_info/time_between_train_steps": 0.00556492805480957, "step": 1099}
{"info/global_step": 1100, "train_info/time_within_train_step": 27.88570213317871, "step": 1100}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740852823, "_runtime": 30928}, "step": 1100}
{"logs": {"train/loss": 3.0302, "train/learning_rate": 5.5555555555555545e-05, "train/epoch": 39.01, "_timestamp": 1740852823, "_runtime": 30928}, "step": 1100}
{"train_info/time_between_train_steps": 13.97428560256958, "step": 1100}
{"info/global_step": 1101, "train_info/time_within_train_step": 27.816577434539795, "step": 1101}
{"train_info/time_between_train_steps": 0.005232572555541992, "step": 1101}
{"info/global_step": 1102, "train_info/time_within_train_step": 27.82252597808838, "step": 1102}
{"train_info/time_between_train_steps": 0.00509333610534668, "step": 1102}
{"info/global_step": 1103, "train_info/time_within_train_step": 27.792673110961914, "step": 1103}
{"train_info/time_between_train_steps": 0.005030155181884766, "step": 1103}
{"info/global_step": 1104, "train_info/time_within_train_step": 27.793988704681396, "step": 1104}
{"train_info/time_between_train_steps": 0.005240678787231445, "step": 1104}
{"info/global_step": 1105, "train_info/time_within_train_step": 27.810800552368164, "step": 1105}
{"train_info/time_between_train_steps": 0.00894618034362793, "step": 1105}
{"info/global_step": 1106, "train_info/time_within_train_step": 27.815096616744995, "step": 1106}
{"train_info/time_between_train_steps": 0.005105733871459961, "step": 1106}
{"info/global_step": 1107, "train_info/time_within_train_step": 27.806565761566162, "step": 1107}
{"train_info/time_between_train_steps": 0.009732484817504883, "step": 1107}
{"info/global_step": 1108, "train_info/time_within_train_step": 27.82137131690979, "step": 1108}
{"train_info/time_between_train_steps": 0.005343437194824219, "step": 1108}
{"info/global_step": 1109, "train_info/time_within_train_step": 27.91968011856079, "step": 1109}
{"train_info/time_between_train_steps": 0.0053653717041015625, "step": 1109}
{"info/global_step": 1110, "train_info/time_within_train_step": 27.82554531097412, "step": 1110}
{"train_info/time_between_train_steps": 0.00545501708984375, "step": 1110}
{"info/global_step": 1111, "train_info/time_within_train_step": 27.793237447738647, "step": 1111}
{"train_info/time_between_train_steps": 0.005248546600341797, "step": 1111}
{"info/global_step": 1112, "train_info/time_within_train_step": 27.84116244316101, "step": 1112}
{"train_info/time_between_train_steps": 0.0054738521575927734, "step": 1112}
{"info/global_step": 1113, "train_info/time_within_train_step": 27.830729961395264, "step": 1113}
{"train_info/time_between_train_steps": 0.005397319793701172, "step": 1113}
{"info/global_step": 1114, "train_info/time_within_train_step": 27.81604290008545, "step": 1114}
{"train_info/time_between_train_steps": 0.005500078201293945, "step": 1114}
{"info/global_step": 1115, "train_info/time_within_train_step": 27.84122323989868, "step": 1115}
{"train_info/time_between_train_steps": 0.005317211151123047, "step": 1115}
{"info/global_step": 1116, "train_info/time_within_train_step": 27.77157187461853, "step": 1116}
{"train_info/time_between_train_steps": 0.010173559188842773, "step": 1116}
{"info/global_step": 1117, "train_info/time_within_train_step": 27.79380512237549, "step": 1117}
{"train_info/time_between_train_steps": 0.005597114562988281, "step": 1117}
{"info/global_step": 1118, "train_info/time_within_train_step": 27.80533742904663, "step": 1118}
{"train_info/time_between_train_steps": 0.008254766464233398, "step": 1118}
{"info/global_step": 1119, "train_info/time_within_train_step": 27.81784176826477, "step": 1119}
{"train_info/time_between_train_steps": 0.0056879520416259766, "step": 1119}
{"info/global_step": 1120, "train_info/time_within_train_step": 27.826703310012817, "step": 1120}
{"train_info/time_between_train_steps": 0.006154775619506836, "step": 1120}
{"train_info/time_between_train_steps": 3.698732614517212, "step": 1120}
{"info/global_step": 1121, "train_info/time_within_train_step": 27.797924757003784, "step": 1121}
{"train_info/time_between_train_steps": 0.00542140007019043, "step": 1121}
{"info/global_step": 1122, "train_info/time_within_train_step": 27.963257789611816, "step": 1122}
{"train_info/time_between_train_steps": 0.005353212356567383, "step": 1122}
{"info/global_step": 1123, "train_info/time_within_train_step": 27.822998523712158, "step": 1123}
{"train_info/time_between_train_steps": 0.005491018295288086, "step": 1123}
{"info/global_step": 1124, "train_info/time_within_train_step": 27.95958375930786, "step": 1124}
{"train_info/time_between_train_steps": 0.010190486907958984, "step": 1124}
{"info/global_step": 1125, "train_info/time_within_train_step": 27.88796639442444, "step": 1125}
{"train_info/time_between_train_steps": 0.00575709342956543, "step": 1125}
{"info/global_step": 1126, "train_info/time_within_train_step": 27.943564653396606, "step": 1126}
{"train_info/time_between_train_steps": 0.010042190551757812, "step": 1126}
{"info/global_step": 1127, "train_info/time_within_train_step": 27.84993290901184, "step": 1127}
{"train_info/time_between_train_steps": 0.010520696640014648, "step": 1127}
{"info/global_step": 1128, "train_info/time_within_train_step": 27.926679372787476, "step": 1128}
{"train_info/time_between_train_steps": 0.005769968032836914, "step": 1128}
{"info/global_step": 1129, "train_info/time_within_train_step": 27.81141233444214, "step": 1129}
{"train_info/time_between_train_steps": 0.005322456359863281, "step": 1129}
{"info/global_step": 1130, "train_info/time_within_train_step": 27.77386236190796, "step": 1130}
{"train_info/time_between_train_steps": 0.006048679351806641, "step": 1130}
{"info/global_step": 1131, "train_info/time_within_train_step": 27.80385112762451, "step": 1131}
{"train_info/time_between_train_steps": 0.00913858413696289, "step": 1131}
{"info/global_step": 1132, "train_info/time_within_train_step": 27.815276861190796, "step": 1132}
{"train_info/time_between_train_steps": 0.005308866500854492, "step": 1132}
{"info/global_step": 1133, "train_info/time_within_train_step": 27.797411680221558, "step": 1133}
{"train_info/time_between_train_steps": 0.005188941955566406, "step": 1133}
{"info/global_step": 1134, "train_info/time_within_train_step": 27.798914194107056, "step": 1134}
{"train_info/time_between_train_steps": 0.00747227668762207, "step": 1134}
{"info/global_step": 1135, "train_info/time_within_train_step": 27.808561086654663, "step": 1135}
{"train_info/time_between_train_steps": 0.005192995071411133, "step": 1135}
{"info/global_step": 1136, "train_info/time_within_train_step": 27.751624584197998, "step": 1136}
{"train_info/time_between_train_steps": 0.00527191162109375, "step": 1136}
{"info/global_step": 1137, "train_info/time_within_train_step": 27.755836248397827, "step": 1137}
{"train_info/time_between_train_steps": 0.005304098129272461, "step": 1137}
{"info/global_step": 1138, "train_info/time_within_train_step": 27.821805953979492, "step": 1138}
{"train_info/time_between_train_steps": 0.009427309036254883, "step": 1138}
{"info/global_step": 1139, "train_info/time_within_train_step": 27.844618320465088, "step": 1139}
{"train_info/time_between_train_steps": 0.005365610122680664, "step": 1139}
{"info/global_step": 1140, "train_info/time_within_train_step": 27.911228895187378, "step": 1140}
{"train_info/time_between_train_steps": 0.0052068233489990234, "step": 1140}
{"info/global_step": 1141, "train_info/time_within_train_step": 27.818846940994263, "step": 1141}
{"train_info/time_between_train_steps": 0.009424448013305664, "step": 1141}
{"info/global_step": 1142, "train_info/time_within_train_step": 27.771101713180542, "step": 1142}
{"train_info/time_between_train_steps": 0.007310152053833008, "step": 1142}
{"info/global_step": 1143, "train_info/time_within_train_step": 27.79176378250122, "step": 1143}
{"train_info/time_between_train_steps": 0.00530552864074707, "step": 1143}
{"info/global_step": 1144, "train_info/time_within_train_step": 27.789071321487427, "step": 1144}
{"train_info/time_between_train_steps": 0.005308866500854492, "step": 1144}
{"info/global_step": 1145, "train_info/time_within_train_step": 27.794540405273438, "step": 1145}
{"train_info/time_between_train_steps": 0.005239248275756836, "step": 1145}
{"info/global_step": 1146, "train_info/time_within_train_step": 27.79960584640503, "step": 1146}
{"train_info/time_between_train_steps": 0.0051915645599365234, "step": 1146}
{"info/global_step": 1147, "train_info/time_within_train_step": 27.76937508583069, "step": 1147}
{"train_info/time_between_train_steps": 0.005500078201293945, "step": 1147}
{"info/global_step": 1148, "train_info/time_within_train_step": 27.849714994430542, "step": 1148}
{"train_info/time_between_train_steps": 0.005942106246948242, "step": 1148}
{"train_info/time_between_train_steps": 3.825277090072632, "step": 1148}
{"info/global_step": 1149, "train_info/time_within_train_step": 27.833155632019043, "step": 1149}
{"train_info/time_between_train_steps": 0.005087137222290039, "step": 1149}
{"info/global_step": 1150, "train_info/time_within_train_step": 27.975826501846313, "step": 1150}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740854236, "_runtime": 32341}, "step": 1150}
{"logs": {"train/loss": 3.001, "train/learning_rate": 2.7777777777777772e-05, "train/epoch": 41.0, "_timestamp": 1740854236, "_runtime": 32341}, "step": 1150}
{"train_info/time_between_train_steps": 0.009183168411254883, "step": 1150}
{"info/global_step": 1151, "train_info/time_within_train_step": 27.800992727279663, "step": 1151}
{"train_info/time_between_train_steps": 0.010259628295898438, "step": 1151}
{"info/global_step": 1152, "train_info/time_within_train_step": 27.89049005508423, "step": 1152}
{"train_info/time_between_train_steps": 0.005165815353393555, "step": 1152}
{"info/global_step": 1153, "train_info/time_within_train_step": 27.789488554000854, "step": 1153}
{"train_info/time_between_train_steps": 0.005637645721435547, "step": 1153}
{"info/global_step": 1154, "train_info/time_within_train_step": 27.96065402030945, "step": 1154}
{"train_info/time_between_train_steps": 0.005232334136962891, "step": 1154}
{"info/global_step": 1155, "train_info/time_within_train_step": 27.76510214805603, "step": 1155}
{"train_info/time_between_train_steps": 0.005315065383911133, "step": 1155}
{"info/global_step": 1156, "train_info/time_within_train_step": 28.0059494972229, "step": 1156}
{"train_info/time_between_train_steps": 0.005381107330322266, "step": 1156}
{"info/global_step": 1157, "train_info/time_within_train_step": 27.813976049423218, "step": 1157}
{"train_info/time_between_train_steps": 0.005232095718383789, "step": 1157}
{"info/global_step": 1158, "train_info/time_within_train_step": 27.80465292930603, "step": 1158}
{"train_info/time_between_train_steps": 0.006296634674072266, "step": 1158}
{"info/global_step": 1159, "train_info/time_within_train_step": 27.791571140289307, "step": 1159}
{"train_info/time_between_train_steps": 0.005073070526123047, "step": 1159}
{"info/global_step": 1160, "train_info/time_within_train_step": 27.749158143997192, "step": 1160}
{"train_info/time_between_train_steps": 0.005021572113037109, "step": 1160}
{"info/global_step": 1161, "train_info/time_within_train_step": 27.781271934509277, "step": 1161}
{"train_info/time_between_train_steps": 0.00535273551940918, "step": 1161}
{"info/global_step": 1162, "train_info/time_within_train_step": 27.76425075531006, "step": 1162}
{"train_info/time_between_train_steps": 0.005108356475830078, "step": 1162}
{"info/global_step": 1163, "train_info/time_within_train_step": 27.833186149597168, "step": 1163}
{"train_info/time_between_train_steps": 0.005311250686645508, "step": 1163}
{"info/global_step": 1164, "train_info/time_within_train_step": 27.784329414367676, "step": 1164}
{"train_info/time_between_train_steps": 0.007626056671142578, "step": 1164}
{"info/global_step": 1165, "train_info/time_within_train_step": 27.7837553024292, "step": 1165}
{"train_info/time_between_train_steps": 0.005234479904174805, "step": 1165}
{"info/global_step": 1166, "train_info/time_within_train_step": 27.779184341430664, "step": 1166}
{"train_info/time_between_train_steps": 0.005273103713989258, "step": 1166}
{"info/global_step": 1167, "train_info/time_within_train_step": 27.83307456970215, "step": 1167}
{"train_info/time_between_train_steps": 0.005368471145629883, "step": 1167}
{"info/global_step": 1168, "train_info/time_within_train_step": 27.79749870300293, "step": 1168}
{"train_info/time_between_train_steps": 0.005359172821044922, "step": 1168}
{"info/global_step": 1169, "train_info/time_within_train_step": 27.793476819992065, "step": 1169}
{"train_info/time_between_train_steps": 0.005344390869140625, "step": 1169}
{"info/global_step": 1170, "train_info/time_within_train_step": 27.818201541900635, "step": 1170}
{"train_info/time_between_train_steps": 0.005415678024291992, "step": 1170}
{"info/global_step": 1171, "train_info/time_within_train_step": 27.817407369613647, "step": 1171}
{"train_info/time_between_train_steps": 0.005377531051635742, "step": 1171}
{"info/global_step": 1172, "train_info/time_within_train_step": 27.89783525466919, "step": 1172}
{"train_info/time_between_train_steps": 0.005368947982788086, "step": 1172}
{"info/global_step": 1173, "train_info/time_within_train_step": 27.80613398551941, "step": 1173}
{"train_info/time_between_train_steps": 0.010289192199707031, "step": 1173}
{"info/global_step": 1174, "train_info/time_within_train_step": 27.79181671142578, "step": 1174}
{"train_info/time_between_train_steps": 0.005469083786010742, "step": 1174}
{"info/global_step": 1175, "train_info/time_within_train_step": 27.83210515975952, "step": 1175}
{"train_info/time_between_train_steps": 0.0064656734466552734, "step": 1175}
{"info/global_step": 1176, "train_info/time_within_train_step": 27.848377227783203, "step": 1176}
{"train_info/time_between_train_steps": 0.006265163421630859, "step": 1176}
{"train_info/time_between_train_steps": 3.538677453994751, "step": 1176}
{"info/global_step": 1177, "train_info/time_within_train_step": 27.826403379440308, "step": 1177}
{"train_info/time_between_train_steps": 0.005336284637451172, "step": 1177}
{"info/global_step": 1178, "train_info/time_within_train_step": 27.92079734802246, "step": 1178}
{"train_info/time_between_train_steps": 0.005483150482177734, "step": 1178}
{"info/global_step": 1179, "train_info/time_within_train_step": 27.83755350112915, "step": 1179}
{"train_info/time_between_train_steps": 0.010384082794189453, "step": 1179}
{"info/global_step": 1180, "train_info/time_within_train_step": 27.987401962280273, "step": 1180}
{"train_info/time_between_train_steps": 0.005453348159790039, "step": 1180}
{"info/global_step": 1181, "train_info/time_within_train_step": 27.83491039276123, "step": 1181}
{"train_info/time_between_train_steps": 0.00799417495727539, "step": 1181}
{"info/global_step": 1182, "train_info/time_within_train_step": 27.997958660125732, "step": 1182}
{"train_info/time_between_train_steps": 0.005391836166381836, "step": 1182}
{"info/global_step": 1183, "train_info/time_within_train_step": 27.801268339157104, "step": 1183}
{"train_info/time_between_train_steps": 0.0052564144134521484, "step": 1183}
{"info/global_step": 1184, "train_info/time_within_train_step": 27.91610884666443, "step": 1184}
{"train_info/time_between_train_steps": 0.008068561553955078, "step": 1184}
{"info/global_step": 1185, "train_info/time_within_train_step": 27.81396770477295, "step": 1185}
{"train_info/time_between_train_steps": 0.00975942611694336, "step": 1185}
{"info/global_step": 1186, "train_info/time_within_train_step": 27.797860860824585, "step": 1186}
{"train_info/time_between_train_steps": 0.005269289016723633, "step": 1186}
{"info/global_step": 1187, "train_info/time_within_train_step": 28.232648849487305, "step": 1187}
{"train_info/time_between_train_steps": 0.008191823959350586, "step": 1187}
{"info/global_step": 1188, "train_info/time_within_train_step": 27.792732000350952, "step": 1188}
{"train_info/time_between_train_steps": 0.007239103317260742, "step": 1188}
{"info/global_step": 1189, "train_info/time_within_train_step": 27.778307676315308, "step": 1189}
{"train_info/time_between_train_steps": 0.005064725875854492, "step": 1189}
{"info/global_step": 1190, "train_info/time_within_train_step": 27.75729990005493, "step": 1190}
{"train_info/time_between_train_steps": 0.0053102970123291016, "step": 1190}
{"info/global_step": 1191, "train_info/time_within_train_step": 27.796148538589478, "step": 1191}
{"train_info/time_between_train_steps": 0.005058765411376953, "step": 1191}
{"info/global_step": 1192, "train_info/time_within_train_step": 27.79399299621582, "step": 1192}
{"train_info/time_between_train_steps": 0.009864330291748047, "step": 1192}
{"info/global_step": 1193, "train_info/time_within_train_step": 27.771926879882812, "step": 1193}
{"train_info/time_between_train_steps": 0.009743928909301758, "step": 1193}
{"info/global_step": 1194, "train_info/time_within_train_step": 27.777860164642334, "step": 1194}
{"train_info/time_between_train_steps": 0.005017518997192383, "step": 1194}
{"info/global_step": 1195, "train_info/time_within_train_step": 27.839017629623413, "step": 1195}
{"train_info/time_between_train_steps": 0.005201101303100586, "step": 1195}
{"info/global_step": 1196, "train_info/time_within_train_step": 27.79917025566101, "step": 1196}
{"train_info/time_between_train_steps": 0.0050907135009765625, "step": 1196}
{"info/global_step": 1197, "train_info/time_within_train_step": 27.81654119491577, "step": 1197}
{"train_info/time_between_train_steps": 0.007686138153076172, "step": 1197}
{"info/global_step": 1198, "train_info/time_within_train_step": 27.814350128173828, "step": 1198}
{"train_info/time_between_train_steps": 0.005034446716308594, "step": 1198}
{"info/global_step": 1199, "train_info/time_within_train_step": 27.79250144958496, "step": 1199}
{"train_info/time_between_train_steps": 0.005432844161987305, "step": 1199}
{"info/global_step": 1200, "train_info/time_within_train_step": 27.782989740371704, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740855632, "_runtime": 33737}, "step": 1200}
{"logs": {"train/loss": 2.9765, "train/learning_rate": 0.0, "train/epoch": 42.02, "_timestamp": 1740855632, "_runtime": 33737}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740855646, "_runtime": 33751}, "step": 1200}
{"logs": {"train/train_runtime": 33751.3496, "train/train_samples_per_second": 18.204, "train/train_steps_per_second": 0.036, "train/total_flos": 3.21251237167104e+17, "train/train_loss": 3.9283212423324585, "train/epoch": 42.02, "_timestamp": 1740855646, "_runtime": 33751}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740855654, "_runtime": 33759}, "step": 1200}
{"logs": {"eval/loss": 4.2149577140808105, "eval/runtime": 3.988, "eval/samples_per_second": 51.153, "eval/steps_per_second": 3.26, "train/epoch": 42.02, "_timestamp": 1740855654, "_runtime": 33759}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740855654, "_runtime": 33759}, "step": 1200}
{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.2149577140808105, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 67.69130342142533, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 3.988, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 51.153, "train/epoch": 42.02, "_timestamp": 1740855654, "_runtime": 33759}, "step": 1200}