shuffle_local3_EN53 / metrics.json
xiulinyang's picture
Adding model checkpoints and config files
3bd0946
Invalid JSON: Unexpected non-whitespace character after JSONat line 2, column 1
{"num_parameters": 124439808, "trainable_parameters": 124439808, "step": 0}
{"train_info/time_between_train_steps": 3.305532455444336, "step": 0}
{"info/global_step": 1, "train_info/time_within_train_step": 37.56768226623535, "step": 1}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 19761.71484375, "train_info/memory_reserved": 22624.0, "train_info/memory_max_reserved": 22624.0, "_timestamp": 1733687155, "_runtime": 44}, "step": 1}
{"logs": {"train/loss": 11.0182, "train/learning_rate": 4.9999999999999996e-06, "train/epoch": 0.0, "_timestamp": 1733687155, "_runtime": 44}, "step": 1}
{"train_info/time_between_train_steps": 0.12585067749023438, "step": 1}
{"info/global_step": 2, "train_info/time_within_train_step": 37.25658130645752, "step": 2}
{"train_info/time_between_train_steps": 0.005544185638427734, "step": 2}
{"info/global_step": 3, "train_info/time_within_train_step": 37.105878829956055, "step": 3}
{"train_info/time_between_train_steps": 0.005793094635009766, "step": 3}
{"info/global_step": 4, "train_info/time_within_train_step": 37.28779911994934, "step": 4}
{"train_info/time_between_train_steps": 0.005553245544433594, "step": 4}
{"info/global_step": 5, "train_info/time_within_train_step": 37.355743646621704, "step": 5}
{"train_info/time_between_train_steps": 0.0057675838470458984, "step": 5}
{"info/global_step": 6, "train_info/time_within_train_step": 37.142465114593506, "step": 6}
{"train_info/time_between_train_steps": 0.0057926177978515625, "step": 6}
{"info/global_step": 7, "train_info/time_within_train_step": 37.2636296749115, "step": 7}
{"train_info/time_between_train_steps": 0.005975008010864258, "step": 7}
{"info/global_step": 8, "train_info/time_within_train_step": 37.20551919937134, "step": 8}
{"train_info/time_between_train_steps": 0.0057184696197509766, "step": 8}
{"info/global_step": 9, "train_info/time_within_train_step": 36.99384617805481, "step": 9}
{"train_info/time_between_train_steps": 0.00529932975769043, "step": 9}
{"info/global_step": 10, "train_info/time_within_train_step": 36.91899633407593, "step": 10}
{"train_info/time_between_train_steps": 0.005202531814575195, "step": 10}
{"info/global_step": 11, "train_info/time_within_train_step": 36.56480312347412, "step": 11}
{"train_info/time_between_train_steps": 0.00791478157043457, "step": 11}
{"info/global_step": 12, "train_info/time_within_train_step": 36.87714385986328, "step": 12}
{"train_info/time_between_train_steps": 0.009951591491699219, "step": 12}
{"info/global_step": 13, "train_info/time_within_train_step": 36.734025716781616, "step": 13}
{"train_info/time_between_train_steps": 0.00532984733581543, "step": 13}
{"info/global_step": 14, "train_info/time_within_train_step": 37.15535235404968, "step": 14}
{"train_info/time_between_train_steps": 0.00604248046875, "step": 14}
{"info/global_step": 15, "train_info/time_within_train_step": 36.98492980003357, "step": 15}
{"train_info/time_between_train_steps": 0.0055103302001953125, "step": 15}
{"info/global_step": 16, "train_info/time_within_train_step": 37.422340393066406, "step": 16}
{"train_info/time_between_train_steps": 0.005247592926025391, "step": 16}
{"info/global_step": 17, "train_info/time_within_train_step": 36.84571599960327, "step": 17}
{"train_info/time_between_train_steps": 0.005360841751098633, "step": 17}
{"info/global_step": 18, "train_info/time_within_train_step": 36.92981743812561, "step": 18}
{"train_info/time_between_train_steps": 0.0052967071533203125, "step": 18}
{"info/global_step": 19, "train_info/time_within_train_step": 36.93381190299988, "step": 19}
{"train_info/time_between_train_steps": 0.005281925201416016, "step": 19}
{"info/global_step": 20, "train_info/time_within_train_step": 36.97473406791687, "step": 20}
{"train_info/time_between_train_steps": 0.0052988529205322266, "step": 20}
{"info/global_step": 21, "train_info/time_within_train_step": 37.12398982048035, "step": 21}
{"train_info/time_between_train_steps": 0.005362510681152344, "step": 21}
{"info/global_step": 22, "train_info/time_within_train_step": 37.27206563949585, "step": 22}
{"train_info/time_between_train_steps": 0.005208492279052734, "step": 22}
{"info/global_step": 23, "train_info/time_within_train_step": 36.9516806602478, "step": 23}
{"train_info/time_between_train_steps": 0.005250692367553711, "step": 23}
{"info/global_step": 24, "train_info/time_within_train_step": 37.34328866004944, "step": 24}
{"train_info/time_between_train_steps": 0.010568618774414062, "step": 24}
{"info/global_step": 25, "train_info/time_within_train_step": 37.05659532546997, "step": 25}
{"train_info/time_between_train_steps": 0.009963274002075195, "step": 25}
{"info/global_step": 26, "train_info/time_within_train_step": 37.18834733963013, "step": 26}
{"train_info/time_between_train_steps": 0.005765199661254883, "step": 26}
{"info/global_step": 27, "train_info/time_within_train_step": 36.63203573226929, "step": 27}
{"train_info/time_between_train_steps": 0.011049509048461914, "step": 27}
{"train_info/time_between_train_steps": 26.19924521446228, "step": 27}
{"info/global_step": 28, "train_info/time_within_train_step": 36.687071800231934, "step": 28}
{"train_info/time_between_train_steps": 0.006062984466552734, "step": 28}
{"info/global_step": 29, "train_info/time_within_train_step": 37.07667279243469, "step": 29}
{"train_info/time_between_train_steps": 0.005641460418701172, "step": 29}
{"info/global_step": 30, "train_info/time_within_train_step": 36.94907093048096, "step": 30}
{"train_info/time_between_train_steps": 0.005342245101928711, "step": 30}
{"info/global_step": 31, "train_info/time_within_train_step": 37.208707332611084, "step": 31}
{"train_info/time_between_train_steps": 0.0055179595947265625, "step": 31}
{"info/global_step": 32, "train_info/time_within_train_step": 36.90923023223877, "step": 32}
{"train_info/time_between_train_steps": 0.006143093109130859, "step": 32}
{"info/global_step": 33, "train_info/time_within_train_step": 37.225669145584106, "step": 33}
{"train_info/time_between_train_steps": 0.005608797073364258, "step": 33}
{"info/global_step": 34, "train_info/time_within_train_step": 37.13282871246338, "step": 34}
{"train_info/time_between_train_steps": 0.005728483200073242, "step": 34}
{"info/global_step": 35, "train_info/time_within_train_step": 36.9979453086853, "step": 35}
{"train_info/time_between_train_steps": 0.005419015884399414, "step": 35}
{"info/global_step": 36, "train_info/time_within_train_step": 36.92385196685791, "step": 36}
{"train_info/time_between_train_steps": 0.010780096054077148, "step": 36}
{"info/global_step": 37, "train_info/time_within_train_step": 37.22185158729553, "step": 37}
{"train_info/time_between_train_steps": 0.010071754455566406, "step": 37}
{"info/global_step": 38, "train_info/time_within_train_step": 36.87276792526245, "step": 38}
{"train_info/time_between_train_steps": 0.00523066520690918, "step": 38}
{"info/global_step": 39, "train_info/time_within_train_step": 36.72222375869751, "step": 39}
{"train_info/time_between_train_steps": 0.005124092102050781, "step": 39}
{"info/global_step": 40, "train_info/time_within_train_step": 36.709068298339844, "step": 40}
{"train_info/time_between_train_steps": 0.005522251129150391, "step": 40}
{"info/global_step": 41, "train_info/time_within_train_step": 36.658042669296265, "step": 41}
{"train_info/time_between_train_steps": 0.005566596984863281, "step": 41}
{"info/global_step": 42, "train_info/time_within_train_step": 36.79260182380676, "step": 42}
{"train_info/time_between_train_steps": 0.0052678585052490234, "step": 42}
{"info/global_step": 43, "train_info/time_within_train_step": 37.22409963607788, "step": 43}
{"train_info/time_between_train_steps": 0.0052525997161865234, "step": 43}
{"info/global_step": 44, "train_info/time_within_train_step": 37.11901593208313, "step": 44}
{"train_info/time_between_train_steps": 0.009228944778442383, "step": 44}
{"info/global_step": 45, "train_info/time_within_train_step": 36.86217665672302, "step": 45}
{"train_info/time_between_train_steps": 0.005307197570800781, "step": 45}
{"info/global_step": 46, "train_info/time_within_train_step": 36.863877058029175, "step": 46}
{"train_info/time_between_train_steps": 0.005359649658203125, "step": 46}
{"info/global_step": 47, "train_info/time_within_train_step": 37.26547312736511, "step": 47}
{"train_info/time_between_train_steps": 0.005342721939086914, "step": 47}
{"info/global_step": 48, "train_info/time_within_train_step": 37.05137848854065, "step": 48}
{"train_info/time_between_train_steps": 0.005480766296386719, "step": 48}
{"info/global_step": 49, "train_info/time_within_train_step": 37.011255741119385, "step": 49}
{"train_info/time_between_train_steps": 0.005366086959838867, "step": 49}
{"info/global_step": 50, "train_info/time_within_train_step": 36.88498330116272, "step": 50}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733688995, "_runtime": 1884}, "step": 50}
{"logs": {"train/loss": 8.1282, "train/learning_rate": 0.00025, "train/epoch": 1.02, "_timestamp": 1733688995, "_runtime": 1884}, "step": 50}
{"train_info/time_between_train_steps": 0.00722956657409668, "step": 50}
{"info/global_step": 51, "train_info/time_within_train_step": 36.985023498535156, "step": 51}
{"train_info/time_between_train_steps": 0.005667924880981445, "step": 51}
{"info/global_step": 52, "train_info/time_within_train_step": 36.60629749298096, "step": 52}
{"train_info/time_between_train_steps": 0.0054242610931396484, "step": 52}
{"info/global_step": 53, "train_info/time_within_train_step": 37.295215368270874, "step": 53}
{"train_info/time_between_train_steps": 0.005872011184692383, "step": 53}
{"info/global_step": 54, "train_info/time_within_train_step": 36.989238023757935, "step": 54}
{"train_info/time_between_train_steps": 0.006262540817260742, "step": 54}
{"train_info/time_between_train_steps": 26.416640758514404, "step": 54}
{"info/global_step": 55, "train_info/time_within_train_step": 36.89104604721069, "step": 55}
{"train_info/time_between_train_steps": 0.007743120193481445, "step": 55}
{"info/global_step": 56, "train_info/time_within_train_step": 37.62112307548523, "step": 56}
{"train_info/time_between_train_steps": 0.010442018508911133, "step": 56}
{"info/global_step": 57, "train_info/time_within_train_step": 36.98421764373779, "step": 57}
{"train_info/time_between_train_steps": 0.010928153991699219, "step": 57}
{"info/global_step": 58, "train_info/time_within_train_step": 37.11110019683838, "step": 58}
{"train_info/time_between_train_steps": 0.006121397018432617, "step": 58}
{"info/global_step": 59, "train_info/time_within_train_step": 37.288368701934814, "step": 59}
{"train_info/time_between_train_steps": 0.0058214664459228516, "step": 59}
{"info/global_step": 60, "train_info/time_within_train_step": 37.04699897766113, "step": 60}
{"train_info/time_between_train_steps": 0.005510807037353516, "step": 60}
{"info/global_step": 61, "train_info/time_within_train_step": 36.988808155059814, "step": 61}
{"train_info/time_between_train_steps": 0.005790233612060547, "step": 61}
{"info/global_step": 62, "train_info/time_within_train_step": 37.50537180900574, "step": 62}
{"train_info/time_between_train_steps": 0.005526304244995117, "step": 62}
{"info/global_step": 63, "train_info/time_within_train_step": 37.04291033744812, "step": 63}
{"train_info/time_between_train_steps": 0.005673646926879883, "step": 63}
{"info/global_step": 64, "train_info/time_within_train_step": 37.034071922302246, "step": 64}
{"train_info/time_between_train_steps": 0.010267496109008789, "step": 64}
{"info/global_step": 65, "train_info/time_within_train_step": 37.04934048652649, "step": 65}
{"train_info/time_between_train_steps": 0.005573272705078125, "step": 65}
{"info/global_step": 66, "train_info/time_within_train_step": 37.164143085479736, "step": 66}
{"train_info/time_between_train_steps": 0.005429506301879883, "step": 66}
{"info/global_step": 67, "train_info/time_within_train_step": 36.94400930404663, "step": 67}
{"train_info/time_between_train_steps": 0.005423545837402344, "step": 67}
{"info/global_step": 68, "train_info/time_within_train_step": 37.2547767162323, "step": 68}
{"train_info/time_between_train_steps": 0.005312204360961914, "step": 68}
{"info/global_step": 69, "train_info/time_within_train_step": 36.878443241119385, "step": 69}
{"train_info/time_between_train_steps": 0.010216236114501953, "step": 69}
{"info/global_step": 70, "train_info/time_within_train_step": 37.06665372848511, "step": 70}
{"train_info/time_between_train_steps": 0.010195732116699219, "step": 70}
{"info/global_step": 71, "train_info/time_within_train_step": 37.121002435684204, "step": 71}
{"train_info/time_between_train_steps": 0.005213499069213867, "step": 71}
{"info/global_step": 72, "train_info/time_within_train_step": 36.40369367599487, "step": 72}
{"train_info/time_between_train_steps": 0.005289554595947266, "step": 72}
{"info/global_step": 73, "train_info/time_within_train_step": 36.8427574634552, "step": 73}
{"train_info/time_between_train_steps": 0.0053327083587646484, "step": 73}
{"info/global_step": 74, "train_info/time_within_train_step": 37.26875615119934, "step": 74}
{"train_info/time_between_train_steps": 0.005627632141113281, "step": 74}
{"info/global_step": 75, "train_info/time_within_train_step": 36.605491161346436, "step": 75}
{"train_info/time_between_train_steps": 0.005543231964111328, "step": 75}
{"info/global_step": 76, "train_info/time_within_train_step": 36.805354833602905, "step": 76}
{"train_info/time_between_train_steps": 0.010105371475219727, "step": 76}
{"info/global_step": 77, "train_info/time_within_train_step": 37.103936195373535, "step": 77}
{"train_info/time_between_train_steps": 0.010236024856567383, "step": 77}
{"info/global_step": 78, "train_info/time_within_train_step": 36.69197130203247, "step": 78}
{"train_info/time_between_train_steps": 0.0053272247314453125, "step": 78}
{"info/global_step": 79, "train_info/time_within_train_step": 36.52396297454834, "step": 79}
{"train_info/time_between_train_steps": 0.010595560073852539, "step": 79}
{"info/global_step": 80, "train_info/time_within_train_step": 36.840559005737305, "step": 80}
{"train_info/time_between_train_steps": 0.005609273910522461, "step": 80}
{"info/global_step": 81, "train_info/time_within_train_step": 37.06740760803223, "step": 81}
{"train_info/time_between_train_steps": 0.0059816837310791016, "step": 81}
{"train_info/time_between_train_steps": 26.192055463790894, "step": 81}
{"info/global_step": 82, "train_info/time_within_train_step": 37.06825113296509, "step": 82}
{"train_info/time_between_train_steps": 0.005635976791381836, "step": 82}
{"info/global_step": 83, "train_info/time_within_train_step": 36.63032627105713, "step": 83}
{"train_info/time_between_train_steps": 0.005454301834106445, "step": 83}
{"info/global_step": 84, "train_info/time_within_train_step": 37.06622362136841, "step": 84}
{"train_info/time_between_train_steps": 0.0053441524505615234, "step": 84}
{"info/global_step": 85, "train_info/time_within_train_step": 37.1888382434845, "step": 85}
{"train_info/time_between_train_steps": 0.005646467208862305, "step": 85}
{"info/global_step": 86, "train_info/time_within_train_step": 37.18291902542114, "step": 86}
{"train_info/time_between_train_steps": 0.0054645538330078125, "step": 86}
{"info/global_step": 87, "train_info/time_within_train_step": 36.53674101829529, "step": 87}
{"train_info/time_between_train_steps": 0.006443977355957031, "step": 87}
{"info/global_step": 88, "train_info/time_within_train_step": 36.61099863052368, "step": 88}
{"train_info/time_between_train_steps": 0.005814075469970703, "step": 88}
{"info/global_step": 89, "train_info/time_within_train_step": 37.04363131523132, "step": 89}
{"train_info/time_between_train_steps": 0.010314702987670898, "step": 89}
{"info/global_step": 90, "train_info/time_within_train_step": 37.07141852378845, "step": 90}
{"train_info/time_between_train_steps": 0.005333423614501953, "step": 90}
{"info/global_step": 91, "train_info/time_within_train_step": 36.976367712020874, "step": 91}
{"train_info/time_between_train_steps": 0.0053730010986328125, "step": 91}
{"info/global_step": 92, "train_info/time_within_train_step": 37.00233292579651, "step": 92}
{"train_info/time_between_train_steps": 0.010172843933105469, "step": 92}
{"info/global_step": 93, "train_info/time_within_train_step": 36.76292824745178, "step": 93}
{"train_info/time_between_train_steps": 0.005173206329345703, "step": 93}
{"info/global_step": 94, "train_info/time_within_train_step": 37.01774024963379, "step": 94}
{"train_info/time_between_train_steps": 0.009956121444702148, "step": 94}
{"info/global_step": 95, "train_info/time_within_train_step": 36.793742179870605, "step": 95}
{"train_info/time_between_train_steps": 0.005350589752197266, "step": 95}
{"info/global_step": 96, "train_info/time_within_train_step": 36.94390630722046, "step": 96}
{"train_info/time_between_train_steps": 0.008559465408325195, "step": 96}
{"info/global_step": 97, "train_info/time_within_train_step": 37.001068115234375, "step": 97}
{"train_info/time_between_train_steps": 0.0053462982177734375, "step": 97}
{"info/global_step": 98, "train_info/time_within_train_step": 36.98036813735962, "step": 98}
{"train_info/time_between_train_steps": 0.005335092544555664, "step": 98}
{"info/global_step": 99, "train_info/time_within_train_step": 36.92941498756409, "step": 99}
{"train_info/time_between_train_steps": 0.00512385368347168, "step": 99}
{"info/global_step": 100, "train_info/time_within_train_step": 36.85865879058838, "step": 100}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733690897, "_runtime": 3786}, "step": 100}
{"logs": {"train/loss": 6.6185, "train/learning_rate": 0.0005, "train/epoch": 3.02, "_timestamp": 1733690897, "_runtime": 3786}, "step": 100}
{"train_info/time_between_train_steps": 2.4459481239318848, "step": 100}
{"info/global_step": 101, "train_info/time_within_train_step": 37.04670834541321, "step": 101}
{"train_info/time_between_train_steps": 0.005408048629760742, "step": 101}
{"info/global_step": 102, "train_info/time_within_train_step": 36.93933391571045, "step": 102}
{"train_info/time_between_train_steps": 0.005485057830810547, "step": 102}
{"info/global_step": 103, "train_info/time_within_train_step": 36.92428016662598, "step": 103}
{"train_info/time_between_train_steps": 0.005476951599121094, "step": 103}
{"info/global_step": 104, "train_info/time_within_train_step": 36.664480447769165, "step": 104}
{"train_info/time_between_train_steps": 0.005257844924926758, "step": 104}
{"info/global_step": 105, "train_info/time_within_train_step": 36.97857880592346, "step": 105}
{"train_info/time_between_train_steps": 0.006813764572143555, "step": 105}
{"info/global_step": 106, "train_info/time_within_train_step": 36.95964860916138, "step": 106}
{"train_info/time_between_train_steps": 0.005490303039550781, "step": 106}
{"info/global_step": 107, "train_info/time_within_train_step": 37.062185764312744, "step": 107}
{"train_info/time_between_train_steps": 0.0062444210052490234, "step": 107}
{"info/global_step": 108, "train_info/time_within_train_step": 36.95916676521301, "step": 108}
{"train_info/time_between_train_steps": 0.006083011627197266, "step": 108}
{"train_info/time_between_train_steps": 26.246516942977905, "step": 108}
{"info/global_step": 109, "train_info/time_within_train_step": 36.987948417663574, "step": 109}
{"train_info/time_between_train_steps": 0.0056209564208984375, "step": 109}
{"info/global_step": 110, "train_info/time_within_train_step": 37.042200326919556, "step": 110}
{"train_info/time_between_train_steps": 0.0055999755859375, "step": 110}
{"info/global_step": 111, "train_info/time_within_train_step": 37.07652711868286, "step": 111}
{"train_info/time_between_train_steps": 0.0053555965423583984, "step": 111}
{"info/global_step": 112, "train_info/time_within_train_step": 37.19007897377014, "step": 112}
{"train_info/time_between_train_steps": 0.005297183990478516, "step": 112}
{"info/global_step": 113, "train_info/time_within_train_step": 37.0700478553772, "step": 113}
{"train_info/time_between_train_steps": 0.005441904067993164, "step": 113}
{"info/global_step": 114, "train_info/time_within_train_step": 36.966007709503174, "step": 114}
{"train_info/time_between_train_steps": 0.01037287712097168, "step": 114}
{"info/global_step": 115, "train_info/time_within_train_step": 36.88615870475769, "step": 115}
{"train_info/time_between_train_steps": 0.0059549808502197266, "step": 115}
{"info/global_step": 116, "train_info/time_within_train_step": 37.055357456207275, "step": 116}
{"train_info/time_between_train_steps": 0.005621910095214844, "step": 116}
{"info/global_step": 117, "train_info/time_within_train_step": 36.91941475868225, "step": 117}
{"train_info/time_between_train_steps": 0.005396842956542969, "step": 117}
{"info/global_step": 118, "train_info/time_within_train_step": 36.74212646484375, "step": 118}
{"train_info/time_between_train_steps": 0.00987863540649414, "step": 118}
{"info/global_step": 119, "train_info/time_within_train_step": 36.83319091796875, "step": 119}
{"train_info/time_between_train_steps": 0.005274295806884766, "step": 119}
{"info/global_step": 120, "train_info/time_within_train_step": 36.82252264022827, "step": 120}
{"train_info/time_between_train_steps": 0.005175113677978516, "step": 120}
{"info/global_step": 121, "train_info/time_within_train_step": 36.893317461013794, "step": 121}
{"train_info/time_between_train_steps": 0.0050737857818603516, "step": 121}
{"info/global_step": 122, "train_info/time_within_train_step": 36.56512498855591, "step": 122}
{"train_info/time_between_train_steps": 0.005368232727050781, "step": 122}
{"info/global_step": 123, "train_info/time_within_train_step": 36.87240815162659, "step": 123}
{"train_info/time_between_train_steps": 0.005300998687744141, "step": 123}
{"info/global_step": 124, "train_info/time_within_train_step": 36.65332245826721, "step": 124}
{"train_info/time_between_train_steps": 0.0052912235260009766, "step": 124}
{"info/global_step": 125, "train_info/time_within_train_step": 36.481019496917725, "step": 125}
{"train_info/time_between_train_steps": 0.005407571792602539, "step": 125}
{"info/global_step": 126, "train_info/time_within_train_step": 36.63286304473877, "step": 126}
{"train_info/time_between_train_steps": 0.00524449348449707, "step": 126}
{"info/global_step": 127, "train_info/time_within_train_step": 36.845850706100464, "step": 127}
{"train_info/time_between_train_steps": 0.005444526672363281, "step": 127}
{"info/global_step": 128, "train_info/time_within_train_step": 36.816797971725464, "step": 128}
{"train_info/time_between_train_steps": 0.005228281021118164, "step": 128}
{"info/global_step": 129, "train_info/time_within_train_step": 36.937922954559326, "step": 129}
{"train_info/time_between_train_steps": 0.005455970764160156, "step": 129}
{"info/global_step": 130, "train_info/time_within_train_step": 37.51517462730408, "step": 130}
{"train_info/time_between_train_steps": 0.005384683609008789, "step": 130}
{"info/global_step": 131, "train_info/time_within_train_step": 36.961714029312134, "step": 131}
{"train_info/time_between_train_steps": 0.010164499282836914, "step": 131}
{"info/global_step": 132, "train_info/time_within_train_step": 36.9299840927124, "step": 132}
{"train_info/time_between_train_steps": 0.0053594112396240234, "step": 132}
{"info/global_step": 133, "train_info/time_within_train_step": 36.68817186355591, "step": 133}
{"train_info/time_between_train_steps": 0.0056803226470947266, "step": 133}
{"info/global_step": 134, "train_info/time_within_train_step": 36.87792205810547, "step": 134}
{"train_info/time_between_train_steps": 0.005408763885498047, "step": 134}
{"info/global_step": 135, "train_info/time_within_train_step": 36.859529972076416, "step": 135}
{"train_info/time_between_train_steps": 0.011239051818847656, "step": 135}
{"train_info/time_between_train_steps": 26.061124563217163, "step": 135}
{"info/global_step": 136, "train_info/time_within_train_step": 36.86337351799011, "step": 136}
{"train_info/time_between_train_steps": 0.005745649337768555, "step": 136}
{"info/global_step": 137, "train_info/time_within_train_step": 37.06308197975159, "step": 137}
{"train_info/time_between_train_steps": 0.005573749542236328, "step": 137}
{"info/global_step": 138, "train_info/time_within_train_step": 37.7585551738739, "step": 138}
{"train_info/time_between_train_steps": 0.005503416061401367, "step": 138}
{"info/global_step": 139, "train_info/time_within_train_step": 37.02869272232056, "step": 139}
{"train_info/time_between_train_steps": 0.0053997039794921875, "step": 139}
{"info/global_step": 140, "train_info/time_within_train_step": 36.857747077941895, "step": 140}
{"train_info/time_between_train_steps": 0.010129690170288086, "step": 140}
{"info/global_step": 141, "train_info/time_within_train_step": 37.2378249168396, "step": 141}
{"train_info/time_between_train_steps": 0.005753517150878906, "step": 141}
{"info/global_step": 142, "train_info/time_within_train_step": 36.8606493473053, "step": 142}
{"train_info/time_between_train_steps": 0.01054692268371582, "step": 142}
{"info/global_step": 143, "train_info/time_within_train_step": 36.85635733604431, "step": 143}
{"train_info/time_between_train_steps": 0.010950803756713867, "step": 143}
{"info/global_step": 144, "train_info/time_within_train_step": 36.860130310058594, "step": 144}
{"train_info/time_between_train_steps": 0.01001429557800293, "step": 144}
{"info/global_step": 145, "train_info/time_within_train_step": 36.584686517715454, "step": 145}
{"train_info/time_between_train_steps": 0.010064125061035156, "step": 145}
{"info/global_step": 146, "train_info/time_within_train_step": 37.186410427093506, "step": 146}
{"train_info/time_between_train_steps": 0.005071401596069336, "step": 146}
{"info/global_step": 147, "train_info/time_within_train_step": 36.42175531387329, "step": 147}
{"train_info/time_between_train_steps": 0.0052530765533447266, "step": 147}
{"info/global_step": 148, "train_info/time_within_train_step": 36.63218641281128, "step": 148}
{"train_info/time_between_train_steps": 0.005167961120605469, "step": 148}
{"info/global_step": 149, "train_info/time_within_train_step": 36.66201591491699, "step": 149}
{"train_info/time_between_train_steps": 0.005399465560913086, "step": 149}
{"info/global_step": 150, "train_info/time_within_train_step": 36.831032037734985, "step": 150}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733692797, "_runtime": 5686}, "step": 150}
{"logs": {"train/loss": 6.3455, "train/learning_rate": 0.0005833333333333333, "train/epoch": 5.01, "_timestamp": 1733692797, "_runtime": 5686}, "step": 150}
{"train_info/time_between_train_steps": 0.007654905319213867, "step": 150}
{"info/global_step": 151, "train_info/time_within_train_step": 36.292614698410034, "step": 151}
{"train_info/time_between_train_steps": 0.005183696746826172, "step": 151}
{"info/global_step": 152, "train_info/time_within_train_step": 37.38573145866394, "step": 152}
{"train_info/time_between_train_steps": 0.005385160446166992, "step": 152}
{"info/global_step": 153, "train_info/time_within_train_step": 36.63115620613098, "step": 153}
{"train_info/time_between_train_steps": 0.005369663238525391, "step": 153}
{"info/global_step": 154, "train_info/time_within_train_step": 37.03403091430664, "step": 154}
{"train_info/time_between_train_steps": 0.00533747673034668, "step": 154}
{"info/global_step": 155, "train_info/time_within_train_step": 36.83953046798706, "step": 155}
{"train_info/time_between_train_steps": 0.00979924201965332, "step": 155}
{"info/global_step": 156, "train_info/time_within_train_step": 36.716899394989014, "step": 156}
{"train_info/time_between_train_steps": 0.005327463150024414, "step": 156}
{"info/global_step": 157, "train_info/time_within_train_step": 37.651514291763306, "step": 157}
{"train_info/time_between_train_steps": 0.009142875671386719, "step": 157}
{"info/global_step": 158, "train_info/time_within_train_step": 36.744598627090454, "step": 158}
{"train_info/time_between_train_steps": 0.0053708553314208984, "step": 158}
{"info/global_step": 159, "train_info/time_within_train_step": 36.73069214820862, "step": 159}
{"train_info/time_between_train_steps": 0.005701303482055664, "step": 159}
{"info/global_step": 160, "train_info/time_within_train_step": 36.781455993652344, "step": 160}
{"train_info/time_between_train_steps": 0.00567173957824707, "step": 160}
{"info/global_step": 161, "train_info/time_within_train_step": 36.72890615463257, "step": 161}
{"train_info/time_between_train_steps": 0.006139993667602539, "step": 161}
{"info/global_step": 162, "train_info/time_within_train_step": 37.65891098976135, "step": 162}
{"train_info/time_between_train_steps": 0.010905027389526367, "step": 162}
{"train_info/time_between_train_steps": 25.998289346694946, "step": 162}
{"info/global_step": 163, "train_info/time_within_train_step": 36.84667110443115, "step": 163}
{"train_info/time_between_train_steps": 0.006097555160522461, "step": 163}
{"info/global_step": 164, "train_info/time_within_train_step": 36.685352087020874, "step": 164}
{"train_info/time_between_train_steps": 0.010251998901367188, "step": 164}
{"info/global_step": 165, "train_info/time_within_train_step": 37.56737470626831, "step": 165}
{"train_info/time_between_train_steps": 0.005914926528930664, "step": 165}
{"info/global_step": 166, "train_info/time_within_train_step": 36.92732524871826, "step": 166}
{"train_info/time_between_train_steps": 0.005481719970703125, "step": 166}
{"info/global_step": 167, "train_info/time_within_train_step": 36.881712436676025, "step": 167}
{"train_info/time_between_train_steps": 0.005678892135620117, "step": 167}
{"info/global_step": 168, "train_info/time_within_train_step": 36.91366171836853, "step": 168}
{"train_info/time_between_train_steps": 0.005301952362060547, "step": 168}
{"info/global_step": 169, "train_info/time_within_train_step": 37.10736846923828, "step": 169}
{"train_info/time_between_train_steps": 0.005548715591430664, "step": 169}
{"info/global_step": 170, "train_info/time_within_train_step": 37.39237952232361, "step": 170}
{"train_info/time_between_train_steps": 0.010201692581176758, "step": 170}
{"info/global_step": 171, "train_info/time_within_train_step": 36.65463089942932, "step": 171}
{"train_info/time_between_train_steps": 0.010042190551757812, "step": 171}
{"info/global_step": 172, "train_info/time_within_train_step": 36.691577196121216, "step": 172}
{"train_info/time_between_train_steps": 0.005140542984008789, "step": 172}
{"info/global_step": 173, "train_info/time_within_train_step": 36.80294847488403, "step": 173}
{"train_info/time_between_train_steps": 0.00998067855834961, "step": 173}
{"info/global_step": 174, "train_info/time_within_train_step": 32.99726319313049, "step": 174}
{"train_info/time_between_train_steps": 0.005094766616821289, "step": 174}
{"info/global_step": 175, "train_info/time_within_train_step": 27.874863386154175, "step": 175}
{"train_info/time_between_train_steps": 0.005175352096557617, "step": 175}
{"info/global_step": 176, "train_info/time_within_train_step": 27.94229531288147, "step": 176}
{"train_info/time_between_train_steps": 0.005117654800415039, "step": 176}
{"info/global_step": 177, "train_info/time_within_train_step": 27.77641725540161, "step": 177}
{"train_info/time_between_train_steps": 0.0052890777587890625, "step": 177}
{"info/global_step": 178, "train_info/time_within_train_step": 27.770034074783325, "step": 178}
{"train_info/time_between_train_steps": 0.00514674186706543, "step": 178}
{"info/global_step": 179, "train_info/time_within_train_step": 27.799763202667236, "step": 179}
{"train_info/time_between_train_steps": 0.009192705154418945, "step": 179}
{"info/global_step": 180, "train_info/time_within_train_step": 32.45149517059326, "step": 180}
{"train_info/time_between_train_steps": 0.005208730697631836, "step": 180}
{"info/global_step": 181, "train_info/time_within_train_step": 35.98384475708008, "step": 181}
{"train_info/time_between_train_steps": 0.005362510681152344, "step": 181}
{"info/global_step": 182, "train_info/time_within_train_step": 36.18116760253906, "step": 182}
{"train_info/time_between_train_steps": 0.014997005462646484, "step": 182}
{"info/global_step": 183, "train_info/time_within_train_step": 36.85701394081116, "step": 183}
{"train_info/time_between_train_steps": 0.005431413650512695, "step": 183}
{"info/global_step": 184, "train_info/time_within_train_step": 35.89996385574341, "step": 184}
{"train_info/time_between_train_steps": 0.005267143249511719, "step": 184}
{"info/global_step": 185, "train_info/time_within_train_step": 35.716304302215576, "step": 185}
{"train_info/time_between_train_steps": 0.005378246307373047, "step": 185}
{"info/global_step": 186, "train_info/time_within_train_step": 38.165409564971924, "step": 186}
{"train_info/time_between_train_steps": 0.00545501708984375, "step": 186}
{"info/global_step": 187, "train_info/time_within_train_step": 38.073650598526, "step": 187}
{"train_info/time_between_train_steps": 0.005591154098510742, "step": 187}
{"info/global_step": 188, "train_info/time_within_train_step": 38.12036418914795, "step": 188}
{"train_info/time_between_train_steps": 0.010808229446411133, "step": 188}
{"info/global_step": 189, "train_info/time_within_train_step": 38.110140323638916, "step": 189}
{"train_info/time_between_train_steps": 0.0059697628021240234, "step": 189}
{"train_info/time_between_train_steps": 27.209683656692505, "step": 189}
{"info/global_step": 190, "train_info/time_within_train_step": 37.98987674713135, "step": 190}
{"train_info/time_between_train_steps": 0.005148410797119141, "step": 190}
{"info/global_step": 191, "train_info/time_within_train_step": 38.21374845504761, "step": 191}
{"train_info/time_between_train_steps": 0.005354881286621094, "step": 191}
{"info/global_step": 192, "train_info/time_within_train_step": 38.05084562301636, "step": 192}
{"train_info/time_between_train_steps": 0.005370140075683594, "step": 192}
{"info/global_step": 193, "train_info/time_within_train_step": 38.1448929309845, "step": 193}
{"train_info/time_between_train_steps": 0.010419607162475586, "step": 193}
{"info/global_step": 194, "train_info/time_within_train_step": 37.99287009239197, "step": 194}
{"train_info/time_between_train_steps": 0.005526065826416016, "step": 194}
{"info/global_step": 195, "train_info/time_within_train_step": 38.288920402526855, "step": 195}
{"train_info/time_between_train_steps": 0.0057485103607177734, "step": 195}
{"info/global_step": 196, "train_info/time_within_train_step": 37.92543625831604, "step": 196}
{"train_info/time_between_train_steps": 0.005246400833129883, "step": 196}
{"info/global_step": 197, "train_info/time_within_train_step": 38.301652908325195, "step": 197}
{"train_info/time_between_train_steps": 0.005430459976196289, "step": 197}
{"info/global_step": 198, "train_info/time_within_train_step": 38.16812515258789, "step": 198}
{"train_info/time_between_train_steps": 0.0053217411041259766, "step": 198}
{"info/global_step": 199, "train_info/time_within_train_step": 38.26629972457886, "step": 199}
{"train_info/time_between_train_steps": 0.0051577091217041016, "step": 199}
{"info/global_step": 200, "train_info/time_within_train_step": 38.049236536026, "step": 200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733694658, "_runtime": 7547}, "step": 200}
{"logs": {"train/loss": 6.178, "train/learning_rate": 0.0005555555555555556, "train/epoch": 7.01, "_timestamp": 1733694658, "_runtime": 7547}, "step": 200}
{"train_info/time_between_train_steps": 2.4909591674804688, "step": 200}
{"info/global_step": 201, "train_info/time_within_train_step": 38.044983863830566, "step": 201}
{"train_info/time_between_train_steps": 0.005060434341430664, "step": 201}
{"info/global_step": 202, "train_info/time_within_train_step": 38.192378997802734, "step": 202}
{"train_info/time_between_train_steps": 0.00546574592590332, "step": 202}
{"info/global_step": 203, "train_info/time_within_train_step": 38.20013070106506, "step": 203}
{"train_info/time_between_train_steps": 0.005402803421020508, "step": 203}
{"info/global_step": 204, "train_info/time_within_train_step": 37.89155554771423, "step": 204}
{"train_info/time_between_train_steps": 0.005403757095336914, "step": 204}
{"info/global_step": 205, "train_info/time_within_train_step": 38.055535316467285, "step": 205}
{"train_info/time_between_train_steps": 0.005647420883178711, "step": 205}
{"info/global_step": 206, "train_info/time_within_train_step": 38.16044592857361, "step": 206}
{"train_info/time_between_train_steps": 0.010181903839111328, "step": 206}
{"info/global_step": 207, "train_info/time_within_train_step": 38.08557653427124, "step": 207}
{"train_info/time_between_train_steps": 0.005250692367553711, "step": 207}
{"info/global_step": 208, "train_info/time_within_train_step": 38.07206153869629, "step": 208}
{"train_info/time_between_train_steps": 0.005446195602416992, "step": 208}
{"info/global_step": 209, "train_info/time_within_train_step": 38.016767501831055, "step": 209}
{"train_info/time_between_train_steps": 0.005316972732543945, "step": 209}
{"info/global_step": 210, "train_info/time_within_train_step": 38.11078119277954, "step": 210}
{"train_info/time_between_train_steps": 0.005303621292114258, "step": 210}
{"info/global_step": 211, "train_info/time_within_train_step": 38.069408655166626, "step": 211}
{"train_info/time_between_train_steps": 0.0053598880767822266, "step": 211}
{"info/global_step": 212, "train_info/time_within_train_step": 38.25405502319336, "step": 212}
{"train_info/time_between_train_steps": 0.0052449703216552734, "step": 212}
{"info/global_step": 213, "train_info/time_within_train_step": 37.992775440216064, "step": 213}
{"train_info/time_between_train_steps": 0.0055081844329833984, "step": 213}
{"info/global_step": 214, "train_info/time_within_train_step": 38.158637285232544, "step": 214}
{"train_info/time_between_train_steps": 0.005489349365234375, "step": 214}
{"info/global_step": 215, "train_info/time_within_train_step": 38.285881996154785, "step": 215}
{"train_info/time_between_train_steps": 0.0058383941650390625, "step": 215}
{"info/global_step": 216, "train_info/time_within_train_step": 38.038187980651855, "step": 216}
{"train_info/time_between_train_steps": 0.00580906867980957, "step": 216}
{"train_info/time_between_train_steps": 27.076931953430176, "step": 216}
{"info/global_step": 217, "train_info/time_within_train_step": 38.05593276023865, "step": 217}
{"train_info/time_between_train_steps": 0.005395412445068359, "step": 217}
{"info/global_step": 218, "train_info/time_within_train_step": 38.25037980079651, "step": 218}
{"train_info/time_between_train_steps": 0.010901451110839844, "step": 218}
{"info/global_step": 219, "train_info/time_within_train_step": 38.12347173690796, "step": 219}
{"train_info/time_between_train_steps": 0.005728244781494141, "step": 219}
{"info/global_step": 220, "train_info/time_within_train_step": 38.450364112854004, "step": 220}
{"train_info/time_between_train_steps": 0.006615161895751953, "step": 220}
{"info/global_step": 221, "train_info/time_within_train_step": 38.07170534133911, "step": 221}
{"train_info/time_between_train_steps": 0.005808353424072266, "step": 221}
{"info/global_step": 222, "train_info/time_within_train_step": 38.21503281593323, "step": 222}
{"train_info/time_between_train_steps": 0.00565648078918457, "step": 222}
{"info/global_step": 223, "train_info/time_within_train_step": 38.18809986114502, "step": 223}
{"train_info/time_between_train_steps": 0.0054590702056884766, "step": 223}
{"info/global_step": 224, "train_info/time_within_train_step": 38.15575575828552, "step": 224}
{"train_info/time_between_train_steps": 0.01684284210205078, "step": 224}
{"info/global_step": 225, "train_info/time_within_train_step": 38.23685145378113, "step": 225}
{"train_info/time_between_train_steps": 0.005305290222167969, "step": 225}
{"info/global_step": 226, "train_info/time_within_train_step": 37.959020137786865, "step": 226}
{"train_info/time_between_train_steps": 0.005108356475830078, "step": 226}
{"info/global_step": 227, "train_info/time_within_train_step": 37.97039723396301, "step": 227}
{"train_info/time_between_train_steps": 0.00519251823425293, "step": 227}
{"info/global_step": 228, "train_info/time_within_train_step": 38.334389448165894, "step": 228}
{"train_info/time_between_train_steps": 0.0049779415130615234, "step": 228}
{"info/global_step": 229, "train_info/time_within_train_step": 38.12607932090759, "step": 229}
{"train_info/time_between_train_steps": 0.005213499069213867, "step": 229}
{"info/global_step": 230, "train_info/time_within_train_step": 38.46728467941284, "step": 230}
{"train_info/time_between_train_steps": 0.010680198669433594, "step": 230}
{"info/global_step": 231, "train_info/time_within_train_step": 38.09563708305359, "step": 231}
{"train_info/time_between_train_steps": 0.0051555633544921875, "step": 231}
{"info/global_step": 232, "train_info/time_within_train_step": 38.17962169647217, "step": 232}
{"train_info/time_between_train_steps": 0.005129575729370117, "step": 232}
{"info/global_step": 233, "train_info/time_within_train_step": 38.27677249908447, "step": 233}
{"train_info/time_between_train_steps": 0.010414600372314453, "step": 233}
{"info/global_step": 234, "train_info/time_within_train_step": 37.875316858291626, "step": 234}
{"train_info/time_between_train_steps": 0.0051496028900146484, "step": 234}
{"info/global_step": 235, "train_info/time_within_train_step": 38.14283227920532, "step": 235}
{"train_info/time_between_train_steps": 0.0063190460205078125, "step": 235}
{"info/global_step": 236, "train_info/time_within_train_step": 37.9433798789978, "step": 236}
{"train_info/time_between_train_steps": 0.005191326141357422, "step": 236}
{"info/global_step": 237, "train_info/time_within_train_step": 38.119606256484985, "step": 237}
{"train_info/time_between_train_steps": 0.005128145217895508, "step": 237}
{"info/global_step": 238, "train_info/time_within_train_step": 38.22804093360901, "step": 238}
{"train_info/time_between_train_steps": 0.007586479187011719, "step": 238}
{"info/global_step": 239, "train_info/time_within_train_step": 38.01687431335449, "step": 239}
{"train_info/time_between_train_steps": 0.005079030990600586, "step": 239}
{"info/global_step": 240, "train_info/time_within_train_step": 38.206382751464844, "step": 240}
{"train_info/time_between_train_steps": 0.010805130004882812, "step": 240}
{"info/global_step": 241, "train_info/time_within_train_step": 38.327964782714844, "step": 241}
{"train_info/time_between_train_steps": 0.00551295280456543, "step": 241}
{"info/global_step": 242, "train_info/time_within_train_step": 38.14648628234863, "step": 242}
{"train_info/time_between_train_steps": 0.01032257080078125, "step": 242}
{"info/global_step": 243, "train_info/time_within_train_step": 38.38426446914673, "step": 243}
{"train_info/time_between_train_steps": 0.0058438777923583984, "step": 243}
{"train_info/time_between_train_steps": 27.077028274536133, "step": 243}
{"info/global_step": 244, "train_info/time_within_train_step": 38.004032611846924, "step": 244}
{"train_info/time_between_train_steps": 0.005959510803222656, "step": 244}
{"info/global_step": 245, "train_info/time_within_train_step": 38.57767701148987, "step": 245}
{"train_info/time_between_train_steps": 0.0055696964263916016, "step": 245}
{"info/global_step": 246, "train_info/time_within_train_step": 38.1271071434021, "step": 246}
{"train_info/time_between_train_steps": 0.010190248489379883, "step": 246}
{"info/global_step": 247, "train_info/time_within_train_step": 38.27557563781738, "step": 247}
{"train_info/time_between_train_steps": 0.005368232727050781, "step": 247}
{"info/global_step": 248, "train_info/time_within_train_step": 37.866668939590454, "step": 248}
{"train_info/time_between_train_steps": 0.008774757385253906, "step": 248}
{"info/global_step": 249, "train_info/time_within_train_step": 38.294979095458984, "step": 249}
{"train_info/time_between_train_steps": 0.005733489990234375, "step": 249}
{"info/global_step": 250, "train_info/time_within_train_step": 38.33638596534729, "step": 250}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733696622, "_runtime": 9511}, "step": 250}
{"logs": {"train/loss": 5.9419, "train/learning_rate": 0.0005277777777777777, "train/epoch": 9.01, "_timestamp": 1733696622, "_runtime": 9511}, "step": 250}
{"train_info/time_between_train_steps": 0.007416963577270508, "step": 250}
{"info/global_step": 251, "train_info/time_within_train_step": 38.262922286987305, "step": 251}
{"train_info/time_between_train_steps": 0.011273384094238281, "step": 251}
{"info/global_step": 252, "train_info/time_within_train_step": 38.075687408447266, "step": 252}
{"train_info/time_between_train_steps": 0.005200386047363281, "step": 252}
{"info/global_step": 253, "train_info/time_within_train_step": 37.82823061943054, "step": 253}
{"train_info/time_between_train_steps": 0.0049822330474853516, "step": 253}
{"info/global_step": 254, "train_info/time_within_train_step": 38.2977135181427, "step": 254}
{"train_info/time_between_train_steps": 0.00855875015258789, "step": 254}
{"info/global_step": 255, "train_info/time_within_train_step": 38.023287773132324, "step": 255}
{"train_info/time_between_train_steps": 0.00489354133605957, "step": 255}
{"info/global_step": 256, "train_info/time_within_train_step": 38.04891633987427, "step": 256}
{"train_info/time_between_train_steps": 0.004957675933837891, "step": 256}
{"info/global_step": 257, "train_info/time_within_train_step": 38.0110125541687, "step": 257}
{"train_info/time_between_train_steps": 0.005250453948974609, "step": 257}
{"info/global_step": 258, "train_info/time_within_train_step": 38.11624217033386, "step": 258}
{"train_info/time_between_train_steps": 0.0050127506256103516, "step": 258}
{"info/global_step": 259, "train_info/time_within_train_step": 38.0488703250885, "step": 259}
{"train_info/time_between_train_steps": 0.00501704216003418, "step": 259}
{"info/global_step": 260, "train_info/time_within_train_step": 38.29648208618164, "step": 260}
{"train_info/time_between_train_steps": 0.004807472229003906, "step": 260}
{"info/global_step": 261, "train_info/time_within_train_step": 38.12542414665222, "step": 261}
{"train_info/time_between_train_steps": 0.00958704948425293, "step": 261}
{"info/global_step": 262, "train_info/time_within_train_step": 38.031140089035034, "step": 262}
{"train_info/time_between_train_steps": 0.004901885986328125, "step": 262}
{"info/global_step": 263, "train_info/time_within_train_step": 37.86141753196716, "step": 263}
{"train_info/time_between_train_steps": 0.0051157474517822266, "step": 263}
{"info/global_step": 264, "train_info/time_within_train_step": 38.07550001144409, "step": 264}
{"train_info/time_between_train_steps": 0.0049741268157958984, "step": 264}
{"info/global_step": 265, "train_info/time_within_train_step": 38.101598262786865, "step": 265}
{"train_info/time_between_train_steps": 0.009611368179321289, "step": 265}
{"info/global_step": 266, "train_info/time_within_train_step": 38.07823443412781, "step": 266}
{"train_info/time_between_train_steps": 0.009724617004394531, "step": 266}
{"info/global_step": 267, "train_info/time_within_train_step": 38.06837439537048, "step": 267}
{"train_info/time_between_train_steps": 0.010521888732910156, "step": 267}
{"info/global_step": 268, "train_info/time_within_train_step": 38.169617652893066, "step": 268}
{"train_info/time_between_train_steps": 0.005275249481201172, "step": 268}
{"info/global_step": 269, "train_info/time_within_train_step": 38.075183629989624, "step": 269}
{"train_info/time_between_train_steps": 0.005380153656005859, "step": 269}
{"info/global_step": 270, "train_info/time_within_train_step": 38.05015158653259, "step": 270}
{"train_info/time_between_train_steps": 0.005373954772949219, "step": 270}
{"train_info/time_between_train_steps": 26.906641483306885, "step": 270}
{"info/global_step": 271, "train_info/time_within_train_step": 38.058775424957275, "step": 271}
{"train_info/time_between_train_steps": 0.0057146549224853516, "step": 271}
{"info/global_step": 272, "train_info/time_within_train_step": 38.316388845443726, "step": 272}
{"train_info/time_between_train_steps": 0.005459785461425781, "step": 272}
{"info/global_step": 273, "train_info/time_within_train_step": 37.9904899597168, "step": 273}
{"train_info/time_between_train_steps": 0.005221366882324219, "step": 273}
{"info/global_step": 274, "train_info/time_within_train_step": 38.387725591659546, "step": 274}
{"train_info/time_between_train_steps": 0.010759592056274414, "step": 274}
{"info/global_step": 275, "train_info/time_within_train_step": 38.489150524139404, "step": 275}
{"train_info/time_between_train_steps": 0.005896091461181641, "step": 275}
{"info/global_step": 276, "train_info/time_within_train_step": 38.33473587036133, "step": 276}
{"train_info/time_between_train_steps": 0.005966663360595703, "step": 276}
{"info/global_step": 277, "train_info/time_within_train_step": 38.19249200820923, "step": 277}
{"train_info/time_between_train_steps": 0.006036043167114258, "step": 277}
{"info/global_step": 278, "train_info/time_within_train_step": 38.16216826438904, "step": 278}
{"train_info/time_between_train_steps": 0.0061435699462890625, "step": 278}
{"info/global_step": 279, "train_info/time_within_train_step": 38.1587975025177, "step": 279}
{"train_info/time_between_train_steps": 0.005597114562988281, "step": 279}
{"info/global_step": 280, "train_info/time_within_train_step": 38.60794806480408, "step": 280}
{"train_info/time_between_train_steps": 0.005502939224243164, "step": 280}
{"info/global_step": 281, "train_info/time_within_train_step": 38.08213257789612, "step": 281}
{"train_info/time_between_train_steps": 0.006196737289428711, "step": 281}
{"info/global_step": 282, "train_info/time_within_train_step": 38.17371916770935, "step": 282}
{"train_info/time_between_train_steps": 0.0070269107818603516, "step": 282}
{"info/global_step": 283, "train_info/time_within_train_step": 38.2808039188385, "step": 283}
{"train_info/time_between_train_steps": 0.00936579704284668, "step": 283}
{"info/global_step": 284, "train_info/time_within_train_step": 38.08581900596619, "step": 284}
{"train_info/time_between_train_steps": 0.00606846809387207, "step": 284}
{"info/global_step": 285, "train_info/time_within_train_step": 38.1133086681366, "step": 285}
{"train_info/time_between_train_steps": 0.01006174087524414, "step": 285}
{"info/global_step": 286, "train_info/time_within_train_step": 38.19284248352051, "step": 286}
{"train_info/time_between_train_steps": 0.00559234619140625, "step": 286}
{"info/global_step": 287, "train_info/time_within_train_step": 38.12731647491455, "step": 287}
{"train_info/time_between_train_steps": 0.005388736724853516, "step": 287}
{"info/global_step": 288, "train_info/time_within_train_step": 38.20029854774475, "step": 288}
{"train_info/time_between_train_steps": 0.005254983901977539, "step": 288}
{"info/global_step": 289, "train_info/time_within_train_step": 38.23696732521057, "step": 289}
{"train_info/time_between_train_steps": 0.005434513092041016, "step": 289}
{"info/global_step": 290, "train_info/time_within_train_step": 38.11381769180298, "step": 290}
{"train_info/time_between_train_steps": 0.005421876907348633, "step": 290}
{"info/global_step": 291, "train_info/time_within_train_step": 38.35515093803406, "step": 291}
{"train_info/time_between_train_steps": 0.005254983901977539, "step": 291}
{"info/global_step": 292, "train_info/time_within_train_step": 38.39768695831299, "step": 292}
{"train_info/time_between_train_steps": 0.005499839782714844, "step": 292}
{"info/global_step": 293, "train_info/time_within_train_step": 37.98329401016235, "step": 293}
{"train_info/time_between_train_steps": 0.005294322967529297, "step": 293}
{"info/global_step": 294, "train_info/time_within_train_step": 38.20191168785095, "step": 294}
{"train_info/time_between_train_steps": 0.0106964111328125, "step": 294}
{"info/global_step": 295, "train_info/time_within_train_step": 38.09756064414978, "step": 295}
{"train_info/time_between_train_steps": 0.006168842315673828, "step": 295}
{"info/global_step": 296, "train_info/time_within_train_step": 38.195539712905884, "step": 296}
{"train_info/time_between_train_steps": 0.00571751594543457, "step": 296}
{"info/global_step": 297, "train_info/time_within_train_step": 38.09455728530884, "step": 297}
{"train_info/time_between_train_steps": 0.006214141845703125, "step": 297}
{"train_info/time_between_train_steps": 27.20600724220276, "step": 297}
{"info/global_step": 298, "train_info/time_within_train_step": 38.32488965988159, "step": 298}
{"train_info/time_between_train_steps": 0.006055593490600586, "step": 298}
{"info/global_step": 299, "train_info/time_within_train_step": 38.483213663101196, "step": 299}
{"train_info/time_between_train_steps": 0.005488872528076172, "step": 299}
{"info/global_step": 300, "train_info/time_within_train_step": 38.19405651092529, "step": 300}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733698585, "_runtime": 11474}, "step": 300}
{"logs": {"train/loss": 5.6175, "train/learning_rate": 0.0005, "train/epoch": 11.0, "_timestamp": 1733698585, "_runtime": 11474}, "step": 300}
{"train_info/time_between_train_steps": 3.0751307010650635, "step": 300}
{"info/global_step": 301, "train_info/time_within_train_step": 38.33628582954407, "step": 301}
{"train_info/time_between_train_steps": 0.005891323089599609, "step": 301}
{"info/global_step": 302, "train_info/time_within_train_step": 38.12257385253906, "step": 302}
{"train_info/time_between_train_steps": 0.00623631477355957, "step": 302}
{"info/global_step": 303, "train_info/time_within_train_step": 38.37046980857849, "step": 303}
{"train_info/time_between_train_steps": 0.006044864654541016, "step": 303}
{"info/global_step": 304, "train_info/time_within_train_step": 38.75762724876404, "step": 304}
{"train_info/time_between_train_steps": 0.007096767425537109, "step": 304}
{"info/global_step": 305, "train_info/time_within_train_step": 38.19355082511902, "step": 305}
{"train_info/time_between_train_steps": 0.005997657775878906, "step": 305}
{"info/global_step": 306, "train_info/time_within_train_step": 38.330724000930786, "step": 306}
{"train_info/time_between_train_steps": 0.011330842971801758, "step": 306}
{"info/global_step": 307, "train_info/time_within_train_step": 38.265419244766235, "step": 307}
{"train_info/time_between_train_steps": 0.005730390548706055, "step": 307}
{"info/global_step": 308, "train_info/time_within_train_step": 38.114824056625366, "step": 308}
{"train_info/time_between_train_steps": 0.006269693374633789, "step": 308}
{"info/global_step": 309, "train_info/time_within_train_step": 38.445149660110474, "step": 309}
{"train_info/time_between_train_steps": 0.00592494010925293, "step": 309}
{"info/global_step": 310, "train_info/time_within_train_step": 37.88769006729126, "step": 310}
{"train_info/time_between_train_steps": 0.005300045013427734, "step": 310}
{"info/global_step": 311, "train_info/time_within_train_step": 37.982192277908325, "step": 311}
{"train_info/time_between_train_steps": 0.005880594253540039, "step": 311}
{"info/global_step": 312, "train_info/time_within_train_step": 37.954705238342285, "step": 312}
{"train_info/time_between_train_steps": 0.015297174453735352, "step": 312}
{"info/global_step": 313, "train_info/time_within_train_step": 38.39408612251282, "step": 313}
{"train_info/time_between_train_steps": 0.005778789520263672, "step": 313}
{"info/global_step": 314, "train_info/time_within_train_step": 38.109251737594604, "step": 314}
{"train_info/time_between_train_steps": 0.010584831237792969, "step": 314}
{"info/global_step": 315, "train_info/time_within_train_step": 38.01689171791077, "step": 315}
{"train_info/time_between_train_steps": 0.005530118942260742, "step": 315}
{"info/global_step": 316, "train_info/time_within_train_step": 37.99798822402954, "step": 316}
{"train_info/time_between_train_steps": 0.006699323654174805, "step": 316}
{"info/global_step": 317, "train_info/time_within_train_step": 38.034663915634155, "step": 317}
{"train_info/time_between_train_steps": 0.005782604217529297, "step": 317}
{"info/global_step": 318, "train_info/time_within_train_step": 38.444631814956665, "step": 318}
{"train_info/time_between_train_steps": 0.005500316619873047, "step": 318}
{"info/global_step": 319, "train_info/time_within_train_step": 38.12262940406799, "step": 319}
{"train_info/time_between_train_steps": 0.005785226821899414, "step": 319}
{"info/global_step": 320, "train_info/time_within_train_step": 38.02841901779175, "step": 320}
{"train_info/time_between_train_steps": 0.005577564239501953, "step": 320}
{"info/global_step": 321, "train_info/time_within_train_step": 38.256863832473755, "step": 321}
{"train_info/time_between_train_steps": 0.0064089298248291016, "step": 321}
{"info/global_step": 322, "train_info/time_within_train_step": 38.649060010910034, "step": 322}
{"train_info/time_between_train_steps": 0.0056803226470947266, "step": 322}
{"info/global_step": 323, "train_info/time_within_train_step": 37.36003589630127, "step": 323}
{"train_info/time_between_train_steps": 0.006280422210693359, "step": 323}
{"info/global_step": 324, "train_info/time_within_train_step": 37.918822288513184, "step": 324}
{"train_info/time_between_train_steps": 0.006522178649902344, "step": 324}
{"train_info/time_between_train_steps": 27.427732706069946, "step": 324}
{"info/global_step": 325, "train_info/time_within_train_step": 38.07412338256836, "step": 325}
{"train_info/time_between_train_steps": 0.006912946701049805, "step": 325}
{"info/global_step": 326, "train_info/time_within_train_step": 38.24715805053711, "step": 326}
{"train_info/time_between_train_steps": 0.005860090255737305, "step": 326}
{"info/global_step": 327, "train_info/time_within_train_step": 38.48783326148987, "step": 327}
{"train_info/time_between_train_steps": 0.005806922912597656, "step": 327}
{"info/global_step": 328, "train_info/time_within_train_step": 38.187798738479614, "step": 328}
{"train_info/time_between_train_steps": 0.005722999572753906, "step": 328}
{"info/global_step": 329, "train_info/time_within_train_step": 38.09533190727234, "step": 329}
{"train_info/time_between_train_steps": 0.005788564682006836, "step": 329}
{"info/global_step": 330, "train_info/time_within_train_step": 38.85364532470703, "step": 330}
{"train_info/time_between_train_steps": 0.005495786666870117, "step": 330}
{"info/global_step": 331, "train_info/time_within_train_step": 38.030946016311646, "step": 331}
{"train_info/time_between_train_steps": 0.006403207778930664, "step": 331}
{"info/global_step": 332, "train_info/time_within_train_step": 38.0911808013916, "step": 332}
{"train_info/time_between_train_steps": 0.01138448715209961, "step": 332}
{"info/global_step": 333, "train_info/time_within_train_step": 38.535595655441284, "step": 333}
{"train_info/time_between_train_steps": 0.006971597671508789, "step": 333}
{"info/global_step": 334, "train_info/time_within_train_step": 37.94685626029968, "step": 334}
{"train_info/time_between_train_steps": 0.005631923675537109, "step": 334}
{"info/global_step": 335, "train_info/time_within_train_step": 38.08712387084961, "step": 335}
{"train_info/time_between_train_steps": 0.00649261474609375, "step": 335}
{"info/global_step": 336, "train_info/time_within_train_step": 38.53069186210632, "step": 336}
{"train_info/time_between_train_steps": 0.010367870330810547, "step": 336}
{"info/global_step": 337, "train_info/time_within_train_step": 38.15481662750244, "step": 337}
{"train_info/time_between_train_steps": 0.00547027587890625, "step": 337}
{"info/global_step": 338, "train_info/time_within_train_step": 37.77186036109924, "step": 338}
{"train_info/time_between_train_steps": 0.0060040950775146484, "step": 338}
{"info/global_step": 339, "train_info/time_within_train_step": 38.41983366012573, "step": 339}
{"train_info/time_between_train_steps": 0.006002664566040039, "step": 339}
{"info/global_step": 340, "train_info/time_within_train_step": 37.897791385650635, "step": 340}
{"train_info/time_between_train_steps": 0.005225419998168945, "step": 340}
{"info/global_step": 341, "train_info/time_within_train_step": 38.03848600387573, "step": 341}
{"train_info/time_between_train_steps": 0.005661964416503906, "step": 341}
{"info/global_step": 342, "train_info/time_within_train_step": 38.30417251586914, "step": 342}
{"train_info/time_between_train_steps": 0.010336875915527344, "step": 342}
{"info/global_step": 343, "train_info/time_within_train_step": 37.87443804740906, "step": 343}
{"train_info/time_between_train_steps": 0.005578041076660156, "step": 343}
{"info/global_step": 344, "train_info/time_within_train_step": 38.24914503097534, "step": 344}
{"train_info/time_between_train_steps": 0.0057506561279296875, "step": 344}
{"info/global_step": 345, "train_info/time_within_train_step": 37.76273798942566, "step": 345}
{"train_info/time_between_train_steps": 0.005372524261474609, "step": 345}
{"info/global_step": 346, "train_info/time_within_train_step": 38.00505995750427, "step": 346}
{"train_info/time_between_train_steps": 0.01005864143371582, "step": 346}
{"info/global_step": 347, "train_info/time_within_train_step": 38.41270589828491, "step": 347}
{"train_info/time_between_train_steps": 0.0061147212982177734, "step": 347}
{"info/global_step": 348, "train_info/time_within_train_step": 37.951396226882935, "step": 348}
{"train_info/time_between_train_steps": 0.005811214447021484, "step": 348}
{"info/global_step": 349, "train_info/time_within_train_step": 38.4422345161438, "step": 349}
{"train_info/time_between_train_steps": 0.005724668502807617, "step": 349}
{"info/global_step": 350, "train_info/time_within_train_step": 37.859580278396606, "step": 350}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733700525, "_runtime": 13414}, "step": 350}
{"logs": {"train/loss": 5.206, "train/learning_rate": 0.00047222222222222224, "train/epoch": 12.02, "_timestamp": 1733700525, "_runtime": 13414}, "step": 350}
{"train_info/time_between_train_steps": 0.008239030838012695, "step": 350}
{"info/global_step": 351, "train_info/time_within_train_step": 38.02564239501953, "step": 351}
{"train_info/time_between_train_steps": 0.006176948547363281, "step": 351}
{"train_info/time_between_train_steps": 27.20397686958313, "step": 351}
{"info/global_step": 352, "train_info/time_within_train_step": 37.99637699127197, "step": 352}
{"train_info/time_between_train_steps": 0.010611534118652344, "step": 352}
{"info/global_step": 353, "train_info/time_within_train_step": 38.56142210960388, "step": 353}
{"train_info/time_between_train_steps": 0.005285978317260742, "step": 353}
{"info/global_step": 354, "train_info/time_within_train_step": 37.858073472976685, "step": 354}
{"train_info/time_between_train_steps": 0.010154485702514648, "step": 354}
{"info/global_step": 355, "train_info/time_within_train_step": 38.055474042892456, "step": 355}
{"train_info/time_between_train_steps": 0.010265350341796875, "step": 355}
{"info/global_step": 356, "train_info/time_within_train_step": 38.20325303077698, "step": 356}
{"train_info/time_between_train_steps": 0.006307840347290039, "step": 356}
{"info/global_step": 357, "train_info/time_within_train_step": 38.11839985847473, "step": 357}
{"train_info/time_between_train_steps": 0.010297775268554688, "step": 357}
{"info/global_step": 358, "train_info/time_within_train_step": 38.46646165847778, "step": 358}
{"train_info/time_between_train_steps": 0.005589723587036133, "step": 358}
{"info/global_step": 359, "train_info/time_within_train_step": 37.83801984786987, "step": 359}
{"train_info/time_between_train_steps": 0.005165815353393555, "step": 359}
{"info/global_step": 360, "train_info/time_within_train_step": 37.733076095581055, "step": 360}
{"train_info/time_between_train_steps": 0.005152225494384766, "step": 360}
{"info/global_step": 361, "train_info/time_within_train_step": 38.391207456588745, "step": 361}
{"train_info/time_between_train_steps": 0.005035400390625, "step": 361}
{"info/global_step": 362, "train_info/time_within_train_step": 37.703691482543945, "step": 362}
{"train_info/time_between_train_steps": 0.008132457733154297, "step": 362}
{"info/global_step": 363, "train_info/time_within_train_step": 38.333253145217896, "step": 363}
{"train_info/time_between_train_steps": 0.009768486022949219, "step": 363}
{"info/global_step": 364, "train_info/time_within_train_step": 37.89440846443176, "step": 364}
{"train_info/time_between_train_steps": 0.005724668502807617, "step": 364}
{"info/global_step": 365, "train_info/time_within_train_step": 38.32552719116211, "step": 365}
{"train_info/time_between_train_steps": 0.00975346565246582, "step": 365}
{"info/global_step": 366, "train_info/time_within_train_step": 37.665934801101685, "step": 366}
{"train_info/time_between_train_steps": 0.005120277404785156, "step": 366}
{"info/global_step": 367, "train_info/time_within_train_step": 37.977630376815796, "step": 367}
{"train_info/time_between_train_steps": 0.005097150802612305, "step": 367}
{"info/global_step": 368, "train_info/time_within_train_step": 38.24496507644653, "step": 368}
{"train_info/time_between_train_steps": 0.005494356155395508, "step": 368}
{"info/global_step": 369, "train_info/time_within_train_step": 37.88554883003235, "step": 369}
{"train_info/time_between_train_steps": 0.00497126579284668, "step": 369}
{"info/global_step": 370, "train_info/time_within_train_step": 38.342963218688965, "step": 370}
{"train_info/time_between_train_steps": 0.0051271915435791016, "step": 370}
{"info/global_step": 371, "train_info/time_within_train_step": 37.92615866661072, "step": 371}
{"train_info/time_between_train_steps": 0.009329080581665039, "step": 371}
{"info/global_step": 372, "train_info/time_within_train_step": 38.61772680282593, "step": 372}
{"train_info/time_between_train_steps": 0.010313272476196289, "step": 372}
{"info/global_step": 373, "train_info/time_within_train_step": 37.90510606765747, "step": 373}
{"train_info/time_between_train_steps": 0.005069732666015625, "step": 373}
{"info/global_step": 374, "train_info/time_within_train_step": 38.53185987472534, "step": 374}
{"train_info/time_between_train_steps": 0.005212306976318359, "step": 374}
{"info/global_step": 375, "train_info/time_within_train_step": 37.812185525894165, "step": 375}
{"train_info/time_between_train_steps": 0.010241985321044922, "step": 375}
{"info/global_step": 376, "train_info/time_within_train_step": 37.83656096458435, "step": 376}
{"train_info/time_between_train_steps": 0.005282878875732422, "step": 376}
{"info/global_step": 377, "train_info/time_within_train_step": 38.48602271080017, "step": 377}
{"train_info/time_between_train_steps": 0.005556821823120117, "step": 377}
{"info/global_step": 378, "train_info/time_within_train_step": 37.79046654701233, "step": 378}
{"train_info/time_between_train_steps": 0.00571441650390625, "step": 378}
{"train_info/time_between_train_steps": 27.25270962715149, "step": 378}
{"info/global_step": 379, "train_info/time_within_train_step": 37.74354839324951, "step": 379}
{"train_info/time_between_train_steps": 0.00959920883178711, "step": 379}
{"info/global_step": 380, "train_info/time_within_train_step": 38.416764974594116, "step": 380}
{"train_info/time_between_train_steps": 0.005135297775268555, "step": 380}
{"info/global_step": 381, "train_info/time_within_train_step": 37.7980694770813, "step": 381}
{"train_info/time_between_train_steps": 0.00508880615234375, "step": 381}
{"info/global_step": 382, "train_info/time_within_train_step": 38.69846296310425, "step": 382}
{"train_info/time_between_train_steps": 0.00539088249206543, "step": 382}
{"info/global_step": 383, "train_info/time_within_train_step": 37.7698495388031, "step": 383}
{"train_info/time_between_train_steps": 0.0050411224365234375, "step": 383}
{"info/global_step": 384, "train_info/time_within_train_step": 38.69284176826477, "step": 384}
{"train_info/time_between_train_steps": 0.0051114559173583984, "step": 384}
{"info/global_step": 385, "train_info/time_within_train_step": 37.81735801696777, "step": 385}
{"train_info/time_between_train_steps": 0.0052471160888671875, "step": 385}
{"info/global_step": 386, "train_info/time_within_train_step": 38.34298777580261, "step": 386}
{"train_info/time_between_train_steps": 0.005249738693237305, "step": 386}
{"info/global_step": 387, "train_info/time_within_train_step": 37.55411767959595, "step": 387}
{"train_info/time_between_train_steps": 0.004912853240966797, "step": 387}
{"info/global_step": 388, "train_info/time_within_train_step": 38.373058795928955, "step": 388}
{"train_info/time_between_train_steps": 0.004950761795043945, "step": 388}
{"info/global_step": 389, "train_info/time_within_train_step": 38.03339695930481, "step": 389}
{"train_info/time_between_train_steps": 0.00513768196105957, "step": 389}
{"info/global_step": 390, "train_info/time_within_train_step": 38.472761392593384, "step": 390}
{"train_info/time_between_train_steps": 0.004952430725097656, "step": 390}
{"info/global_step": 391, "train_info/time_within_train_step": 37.788562536239624, "step": 391}
{"train_info/time_between_train_steps": 0.009667158126831055, "step": 391}
{"info/global_step": 392, "train_info/time_within_train_step": 38.25941467285156, "step": 392}
{"train_info/time_between_train_steps": 0.005154848098754883, "step": 392}
{"info/global_step": 393, "train_info/time_within_train_step": 37.81497263908386, "step": 393}
{"train_info/time_between_train_steps": 0.004962444305419922, "step": 393}
{"info/global_step": 394, "train_info/time_within_train_step": 37.788050413131714, "step": 394}
{"train_info/time_between_train_steps": 0.004889011383056641, "step": 394}
{"info/global_step": 395, "train_info/time_within_train_step": 38.471429109573364, "step": 395}
{"train_info/time_between_train_steps": 0.0051686763763427734, "step": 395}
{"info/global_step": 396, "train_info/time_within_train_step": 37.63517189025879, "step": 396}
{"train_info/time_between_train_steps": 0.004990339279174805, "step": 396}
{"info/global_step": 397, "train_info/time_within_train_step": 38.4140682220459, "step": 397}
{"train_info/time_between_train_steps": 0.005079984664916992, "step": 397}
{"info/global_step": 398, "train_info/time_within_train_step": 37.98316407203674, "step": 398}
{"train_info/time_between_train_steps": 0.005067110061645508, "step": 398}
{"info/global_step": 399, "train_info/time_within_train_step": 38.31161451339722, "step": 399}
{"train_info/time_between_train_steps": 0.005074024200439453, "step": 399}
{"info/global_step": 400, "train_info/time_within_train_step": 37.68264412879944, "step": 400}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733702484, "_runtime": 15373}, "step": 400}
{"logs": {"train/loss": 4.9591, "train/learning_rate": 0.00044444444444444436, "train/epoch": 14.02, "_timestamp": 1733702484, "_runtime": 15373}, "step": 400}
{"train_info/time_between_train_steps": 2.2482261657714844, "step": 400}
{"info/global_step": 401, "train_info/time_within_train_step": 38.48475241661072, "step": 401}
{"train_info/time_between_train_steps": 0.005456447601318359, "step": 401}
{"info/global_step": 402, "train_info/time_within_train_step": 37.833104610443115, "step": 402}
{"train_info/time_between_train_steps": 0.005568504333496094, "step": 402}
{"info/global_step": 403, "train_info/time_within_train_step": 38.32212257385254, "step": 403}
{"train_info/time_between_train_steps": 0.005591154098510742, "step": 403}
{"info/global_step": 404, "train_info/time_within_train_step": 37.70335841178894, "step": 404}
{"train_info/time_between_train_steps": 0.005756855010986328, "step": 404}
{"info/global_step": 405, "train_info/time_within_train_step": 38.25199055671692, "step": 405}
{"train_info/time_between_train_steps": 0.010329008102416992, "step": 405}
{"train_info/time_between_train_steps": 26.899012327194214, "step": 405}
{"info/global_step": 406, "train_info/time_within_train_step": 38.07394862174988, "step": 406}
{"train_info/time_between_train_steps": 0.004984855651855469, "step": 406}
{"info/global_step": 407, "train_info/time_within_train_step": 38.30349946022034, "step": 407}
{"train_info/time_between_train_steps": 0.004967689514160156, "step": 407}
{"info/global_step": 408, "train_info/time_within_train_step": 37.77900195121765, "step": 408}
{"train_info/time_between_train_steps": 0.004883527755737305, "step": 408}
{"info/global_step": 409, "train_info/time_within_train_step": 38.5407772064209, "step": 409}
{"train_info/time_between_train_steps": 0.005536556243896484, "step": 409}
{"info/global_step": 410, "train_info/time_within_train_step": 37.59358096122742, "step": 410}
{"train_info/time_between_train_steps": 0.0052928924560546875, "step": 410}
{"info/global_step": 411, "train_info/time_within_train_step": 38.48497653007507, "step": 411}
{"train_info/time_between_train_steps": 0.00537562370300293, "step": 411}
{"info/global_step": 412, "train_info/time_within_train_step": 37.679537773132324, "step": 412}
{"train_info/time_between_train_steps": 0.0055637359619140625, "step": 412}
{"info/global_step": 413, "train_info/time_within_train_step": 38.478891372680664, "step": 413}
{"train_info/time_between_train_steps": 0.0054242610931396484, "step": 413}
{"info/global_step": 414, "train_info/time_within_train_step": 37.68219232559204, "step": 414}
{"train_info/time_between_train_steps": 0.004972934722900391, "step": 414}
{"info/global_step": 415, "train_info/time_within_train_step": 38.3980770111084, "step": 415}
{"train_info/time_between_train_steps": 0.005049228668212891, "step": 415}
{"info/global_step": 416, "train_info/time_within_train_step": 37.64945316314697, "step": 416}
{"train_info/time_between_train_steps": 0.005098104476928711, "step": 416}
{"info/global_step": 417, "train_info/time_within_train_step": 38.425328493118286, "step": 417}
{"train_info/time_between_train_steps": 0.005078315734863281, "step": 417}
{"info/global_step": 418, "train_info/time_within_train_step": 37.700029611587524, "step": 418}
{"train_info/time_between_train_steps": 0.00509190559387207, "step": 418}
{"info/global_step": 419, "train_info/time_within_train_step": 38.419657945632935, "step": 419}
{"train_info/time_between_train_steps": 0.005196809768676758, "step": 419}
{"info/global_step": 420, "train_info/time_within_train_step": 37.78588628768921, "step": 420}
{"train_info/time_between_train_steps": 0.005221843719482422, "step": 420}
{"info/global_step": 421, "train_info/time_within_train_step": 38.46073627471924, "step": 421}
{"train_info/time_between_train_steps": 0.005094051361083984, "step": 421}
{"info/global_step": 422, "train_info/time_within_train_step": 38.40254998207092, "step": 422}
{"train_info/time_between_train_steps": 0.00503849983215332, "step": 422}
{"info/global_step": 423, "train_info/time_within_train_step": 37.671517848968506, "step": 423}
{"train_info/time_between_train_steps": 0.004931211471557617, "step": 423}
{"info/global_step": 424, "train_info/time_within_train_step": 38.48318600654602, "step": 424}
{"train_info/time_between_train_steps": 0.005322456359863281, "step": 424}
{"info/global_step": 425, "train_info/time_within_train_step": 37.64844727516174, "step": 425}
{"train_info/time_between_train_steps": 0.005113840103149414, "step": 425}
{"info/global_step": 426, "train_info/time_within_train_step": 38.39401841163635, "step": 426}
{"train_info/time_between_train_steps": 0.009489774703979492, "step": 426}
{"info/global_step": 427, "train_info/time_within_train_step": 37.52535104751587, "step": 427}
{"train_info/time_between_train_steps": 0.005055904388427734, "step": 427}
{"info/global_step": 428, "train_info/time_within_train_step": 38.40097165107727, "step": 428}
{"train_info/time_between_train_steps": 0.005258083343505859, "step": 428}
{"info/global_step": 429, "train_info/time_within_train_step": 38.03896975517273, "step": 429}
{"train_info/time_between_train_steps": 0.005400419235229492, "step": 429}
{"info/global_step": 430, "train_info/time_within_train_step": 38.360864877700806, "step": 430}
{"train_info/time_between_train_steps": 0.0056803226470947266, "step": 430}
{"info/global_step": 431, "train_info/time_within_train_step": 37.63060235977173, "step": 431}
{"train_info/time_between_train_steps": 0.005281686782836914, "step": 431}
{"info/global_step": 432, "train_info/time_within_train_step": 38.31300187110901, "step": 432}
{"train_info/time_between_train_steps": 0.005692958831787109, "step": 432}
{"train_info/time_between_train_steps": 27.060678720474243, "step": 432}
{"info/global_step": 433, "train_info/time_within_train_step": 37.44627356529236, "step": 433}
{"train_info/time_between_train_steps": 0.004921674728393555, "step": 433}
{"info/global_step": 434, "train_info/time_within_train_step": 38.45175552368164, "step": 434}
{"train_info/time_between_train_steps": 0.0051348209381103516, "step": 434}
{"info/global_step": 435, "train_info/time_within_train_step": 37.68667769432068, "step": 435}
{"train_info/time_between_train_steps": 0.005103588104248047, "step": 435}
{"info/global_step": 436, "train_info/time_within_train_step": 38.56371212005615, "step": 436}
{"train_info/time_between_train_steps": 0.005276679992675781, "step": 436}
{"info/global_step": 437, "train_info/time_within_train_step": 38.37545394897461, "step": 437}
{"train_info/time_between_train_steps": 0.005784273147583008, "step": 437}
{"info/global_step": 438, "train_info/time_within_train_step": 37.81862783432007, "step": 438}
{"train_info/time_between_train_steps": 0.009490966796875, "step": 438}
{"info/global_step": 439, "train_info/time_within_train_step": 38.428871631622314, "step": 439}
{"train_info/time_between_train_steps": 0.00535893440246582, "step": 439}
{"info/global_step": 440, "train_info/time_within_train_step": 37.62326407432556, "step": 440}
{"train_info/time_between_train_steps": 0.005280971527099609, "step": 440}
{"info/global_step": 441, "train_info/time_within_train_step": 38.20225691795349, "step": 441}
{"train_info/time_between_train_steps": 0.004851341247558594, "step": 441}
{"info/global_step": 442, "train_info/time_within_train_step": 37.47977375984192, "step": 442}
{"train_info/time_between_train_steps": 0.004888772964477539, "step": 442}
{"info/global_step": 443, "train_info/time_within_train_step": 38.427738189697266, "step": 443}
{"train_info/time_between_train_steps": 0.005007028579711914, "step": 443}
{"info/global_step": 444, "train_info/time_within_train_step": 38.687655210494995, "step": 444}
{"train_info/time_between_train_steps": 0.005009889602661133, "step": 444}
{"info/global_step": 445, "train_info/time_within_train_step": 37.653188943862915, "step": 445}
{"train_info/time_between_train_steps": 0.0051496028900146484, "step": 445}
{"info/global_step": 446, "train_info/time_within_train_step": 38.36767625808716, "step": 446}
{"train_info/time_between_train_steps": 0.0052509307861328125, "step": 446}
{"info/global_step": 447, "train_info/time_within_train_step": 37.717007637023926, "step": 447}
{"train_info/time_between_train_steps": 0.005096435546875, "step": 447}
{"info/global_step": 448, "train_info/time_within_train_step": 38.446394205093384, "step": 448}
{"train_info/time_between_train_steps": 0.005128622055053711, "step": 448}
{"info/global_step": 449, "train_info/time_within_train_step": 38.46570873260498, "step": 449}
{"train_info/time_between_train_steps": 0.005014181137084961, "step": 449}
{"info/global_step": 450, "train_info/time_within_train_step": 37.513752937316895, "step": 450}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733704445, "_runtime": 17334}, "step": 450}
{"logs": {"train/loss": 4.7012, "train/learning_rate": 0.00041666666666666664, "train/epoch": 16.02, "_timestamp": 1733704445, "_runtime": 17334}, "step": 450}
{"train_info/time_between_train_steps": 0.006991147994995117, "step": 450}
{"info/global_step": 451, "train_info/time_within_train_step": 38.22387194633484, "step": 451}
{"train_info/time_between_train_steps": 0.00504302978515625, "step": 451}
{"info/global_step": 452, "train_info/time_within_train_step": 37.669955253601074, "step": 452}
{"train_info/time_between_train_steps": 0.004972696304321289, "step": 452}
{"info/global_step": 453, "train_info/time_within_train_step": 38.451425313949585, "step": 453}
{"train_info/time_between_train_steps": 0.005254030227661133, "step": 453}
{"info/global_step": 454, "train_info/time_within_train_step": 37.64792084693909, "step": 454}
{"train_info/time_between_train_steps": 0.005084514617919922, "step": 454}
{"info/global_step": 455, "train_info/time_within_train_step": 38.258878231048584, "step": 455}
{"train_info/time_between_train_steps": 0.005274295806884766, "step": 455}
{"info/global_step": 456, "train_info/time_within_train_step": 38.32478094100952, "step": 456}
{"train_info/time_between_train_steps": 0.005233049392700195, "step": 456}
{"info/global_step": 457, "train_info/time_within_train_step": 37.56517004966736, "step": 457}
{"train_info/time_between_train_steps": 0.005063533782958984, "step": 457}
{"info/global_step": 458, "train_info/time_within_train_step": 38.278738498687744, "step": 458}
{"train_info/time_between_train_steps": 0.00541234016418457, "step": 458}
{"info/global_step": 459, "train_info/time_within_train_step": 37.80143594741821, "step": 459}
{"train_info/time_between_train_steps": 0.005564689636230469, "step": 459}
{"train_info/time_between_train_steps": 27.1374409198761, "step": 459}
{"info/global_step": 460, "train_info/time_within_train_step": 38.44696593284607, "step": 460}
{"train_info/time_between_train_steps": 0.010172128677368164, "step": 460}
{"info/global_step": 461, "train_info/time_within_train_step": 37.793795347213745, "step": 461}
{"train_info/time_between_train_steps": 0.005240440368652344, "step": 461}
{"info/global_step": 462, "train_info/time_within_train_step": 38.112133741378784, "step": 462}
{"train_info/time_between_train_steps": 0.00513911247253418, "step": 462}
{"info/global_step": 463, "train_info/time_within_train_step": 38.23997712135315, "step": 463}
{"train_info/time_between_train_steps": 0.010350704193115234, "step": 463}
{"info/global_step": 464, "train_info/time_within_train_step": 37.59597110748291, "step": 464}
{"train_info/time_between_train_steps": 0.00518798828125, "step": 464}
{"info/global_step": 465, "train_info/time_within_train_step": 38.49082326889038, "step": 465}
{"train_info/time_between_train_steps": 0.00559234619140625, "step": 465}
{"info/global_step": 466, "train_info/time_within_train_step": 37.66032290458679, "step": 466}
{"train_info/time_between_train_steps": 0.005483865737915039, "step": 466}
{"info/global_step": 467, "train_info/time_within_train_step": 38.46740794181824, "step": 467}
{"train_info/time_between_train_steps": 0.005265951156616211, "step": 467}
{"info/global_step": 468, "train_info/time_within_train_step": 38.28790092468262, "step": 468}
{"train_info/time_between_train_steps": 0.005181550979614258, "step": 468}
{"info/global_step": 469, "train_info/time_within_train_step": 37.48175597190857, "step": 469}
{"train_info/time_between_train_steps": 0.004969120025634766, "step": 469}
{"info/global_step": 470, "train_info/time_within_train_step": 38.4068169593811, "step": 470}
{"train_info/time_between_train_steps": 0.005133152008056641, "step": 470}
{"info/global_step": 471, "train_info/time_within_train_step": 37.5042290687561, "step": 471}
{"train_info/time_between_train_steps": 0.004973173141479492, "step": 471}
{"info/global_step": 472, "train_info/time_within_train_step": 38.26225709915161, "step": 472}
{"train_info/time_between_train_steps": 0.005028724670410156, "step": 472}
{"info/global_step": 473, "train_info/time_within_train_step": 38.44081425666809, "step": 473}
{"train_info/time_between_train_steps": 0.005062580108642578, "step": 473}
{"info/global_step": 474, "train_info/time_within_train_step": 37.90310978889465, "step": 474}
{"train_info/time_between_train_steps": 0.005038261413574219, "step": 474}
{"info/global_step": 475, "train_info/time_within_train_step": 38.32544493675232, "step": 475}
{"train_info/time_between_train_steps": 0.009748697280883789, "step": 475}
{"info/global_step": 476, "train_info/time_within_train_step": 37.540053367614746, "step": 476}
{"train_info/time_between_train_steps": 0.009844064712524414, "step": 476}
{"info/global_step": 477, "train_info/time_within_train_step": 38.36300826072693, "step": 477}
{"train_info/time_between_train_steps": 0.005196809768676758, "step": 477}
{"info/global_step": 478, "train_info/time_within_train_step": 38.13516974449158, "step": 478}
{"train_info/time_between_train_steps": 0.0052797794342041016, "step": 478}
{"info/global_step": 479, "train_info/time_within_train_step": 37.61718535423279, "step": 479}
{"train_info/time_between_train_steps": 0.005158901214599609, "step": 479}
{"info/global_step": 480, "train_info/time_within_train_step": 38.319281339645386, "step": 480}
{"train_info/time_between_train_steps": 0.00517725944519043, "step": 480}
{"info/global_step": 481, "train_info/time_within_train_step": 38.40346646308899, "step": 481}
{"train_info/time_between_train_steps": 0.00742340087890625, "step": 481}
{"info/global_step": 482, "train_info/time_within_train_step": 37.64585518836975, "step": 482}
{"train_info/time_between_train_steps": 0.013733386993408203, "step": 482}
{"info/global_step": 483, "train_info/time_within_train_step": 38.30148386955261, "step": 483}
{"train_info/time_between_train_steps": 0.005596637725830078, "step": 483}
{"info/global_step": 484, "train_info/time_within_train_step": 37.39821195602417, "step": 484}
{"train_info/time_between_train_steps": 0.005341291427612305, "step": 484}
{"info/global_step": 485, "train_info/time_within_train_step": 38.37417221069336, "step": 485}
{"train_info/time_between_train_steps": 0.0059545040130615234, "step": 485}
{"info/global_step": 486, "train_info/time_within_train_step": 38.53730893135071, "step": 486}
{"train_info/time_between_train_steps": 0.0058345794677734375, "step": 486}
{"train_info/time_between_train_steps": 26.166860818862915, "step": 486}
{"info/global_step": 487, "train_info/time_within_train_step": 38.295063734054565, "step": 487}
{"train_info/time_between_train_steps": 0.005550861358642578, "step": 487}
{"info/global_step": 488, "train_info/time_within_train_step": 38.48375582695007, "step": 488}
{"train_info/time_between_train_steps": 0.0052640438079833984, "step": 488}
{"info/global_step": 489, "train_info/time_within_train_step": 37.80569934844971, "step": 489}
{"train_info/time_between_train_steps": 0.005534648895263672, "step": 489}
{"info/global_step": 490, "train_info/time_within_train_step": 38.642232179641724, "step": 490}
{"train_info/time_between_train_steps": 0.005292654037475586, "step": 490}
{"info/global_step": 491, "train_info/time_within_train_step": 38.136207818984985, "step": 491}
{"train_info/time_between_train_steps": 0.005647182464599609, "step": 491}
{"info/global_step": 492, "train_info/time_within_train_step": 37.99000287055969, "step": 492}
{"train_info/time_between_train_steps": 0.005370616912841797, "step": 492}
{"info/global_step": 493, "train_info/time_within_train_step": 38.45606446266174, "step": 493}
{"train_info/time_between_train_steps": 0.005507707595825195, "step": 493}
{"info/global_step": 494, "train_info/time_within_train_step": 37.489924907684326, "step": 494}
{"train_info/time_between_train_steps": 0.0051670074462890625, "step": 494}
{"info/global_step": 495, "train_info/time_within_train_step": 38.366944313049316, "step": 495}
{"train_info/time_between_train_steps": 0.005255937576293945, "step": 495}
{"info/global_step": 496, "train_info/time_within_train_step": 38.345271587371826, "step": 496}
{"train_info/time_between_train_steps": 0.005021095275878906, "step": 496}
{"info/global_step": 497, "train_info/time_within_train_step": 37.451215505599976, "step": 497}
{"train_info/time_between_train_steps": 0.011932134628295898, "step": 497}
{"info/global_step": 498, "train_info/time_within_train_step": 38.306739807128906, "step": 498}
{"train_info/time_between_train_steps": 0.00506281852722168, "step": 498}
{"info/global_step": 499, "train_info/time_within_train_step": 38.53729438781738, "step": 499}
{"train_info/time_between_train_steps": 0.005245685577392578, "step": 499}
{"info/global_step": 500, "train_info/time_within_train_step": 37.43404030799866, "step": 500}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733706402, "_runtime": 19291}, "step": 500}
{"logs": {"train/loss": 4.4919, "train/learning_rate": 0.00038888888888888887, "train/epoch": 18.01, "_timestamp": 1733706402, "_runtime": 19291}, "step": 500}
{"train_info/time_between_train_steps": 2.380805015563965, "step": 500}
{"info/global_step": 501, "train_info/time_within_train_step": 38.350409746170044, "step": 501}
{"train_info/time_between_train_steps": 0.005192756652832031, "step": 501}
{"info/global_step": 502, "train_info/time_within_train_step": 37.60729169845581, "step": 502}
{"train_info/time_between_train_steps": 0.005228281021118164, "step": 502}
{"info/global_step": 503, "train_info/time_within_train_step": 38.57371640205383, "step": 503}
{"train_info/time_between_train_steps": 0.013716936111450195, "step": 503}
{"info/global_step": 504, "train_info/time_within_train_step": 38.37633442878723, "step": 504}
{"train_info/time_between_train_steps": 0.0051152706146240234, "step": 504}
{"info/global_step": 505, "train_info/time_within_train_step": 37.734882831573486, "step": 505}
{"train_info/time_between_train_steps": 0.010079145431518555, "step": 505}
{"info/global_step": 506, "train_info/time_within_train_step": 38.40309381484985, "step": 506}
{"train_info/time_between_train_steps": 0.015068531036376953, "step": 506}
{"info/global_step": 507, "train_info/time_within_train_step": 38.46753907203674, "step": 507}
{"train_info/time_between_train_steps": 0.0051496028900146484, "step": 507}
{"info/global_step": 508, "train_info/time_within_train_step": 37.484381675720215, "step": 508}
{"train_info/time_between_train_steps": 0.0051898956298828125, "step": 508}
{"info/global_step": 509, "train_info/time_within_train_step": 38.27276682853699, "step": 509}
{"train_info/time_between_train_steps": 0.005414009094238281, "step": 509}
{"info/global_step": 510, "train_info/time_within_train_step": 38.37947154045105, "step": 510}
{"train_info/time_between_train_steps": 0.005554914474487305, "step": 510}
{"info/global_step": 511, "train_info/time_within_train_step": 37.40973424911499, "step": 511}
{"train_info/time_between_train_steps": 0.0053348541259765625, "step": 511}
{"info/global_step": 512, "train_info/time_within_train_step": 38.367960691452026, "step": 512}
{"train_info/time_between_train_steps": 0.00574946403503418, "step": 512}
{"info/global_step": 513, "train_info/time_within_train_step": 38.46510028839111, "step": 513}
{"train_info/time_between_train_steps": 0.005616426467895508, "step": 513}
{"train_info/time_between_train_steps": 26.27292490005493, "step": 513}
{"info/global_step": 514, "train_info/time_within_train_step": 38.42897152900696, "step": 514}
{"train_info/time_between_train_steps": 0.010525703430175781, "step": 514}
{"info/global_step": 515, "train_info/time_within_train_step": 38.51241755485535, "step": 515}
{"train_info/time_between_train_steps": 0.005308866500854492, "step": 515}
{"info/global_step": 516, "train_info/time_within_train_step": 37.43651223182678, "step": 516}
{"train_info/time_between_train_steps": 0.005268096923828125, "step": 516}
{"info/global_step": 517, "train_info/time_within_train_step": 35.338197231292725, "step": 517}
{"train_info/time_between_train_steps": 0.0052340030670166016, "step": 517}
{"info/global_step": 518, "train_info/time_within_train_step": 27.74600386619568, "step": 518}
{"train_info/time_between_train_steps": 0.0055735111236572266, "step": 518}
{"info/global_step": 519, "train_info/time_within_train_step": 27.956321001052856, "step": 519}
{"train_info/time_between_train_steps": 0.0053517818450927734, "step": 519}
{"info/global_step": 520, "train_info/time_within_train_step": 27.909276723861694, "step": 520}
{"train_info/time_between_train_steps": 0.00556182861328125, "step": 520}
{"info/global_step": 521, "train_info/time_within_train_step": 27.868164777755737, "step": 521}
{"train_info/time_between_train_steps": 0.01038813591003418, "step": 521}
{"info/global_step": 522, "train_info/time_within_train_step": 27.88509178161621, "step": 522}
{"train_info/time_between_train_steps": 0.005066394805908203, "step": 522}
{"info/global_step": 523, "train_info/time_within_train_step": 36.79111409187317, "step": 523}
{"train_info/time_between_train_steps": 0.0050203800201416016, "step": 523}
{"info/global_step": 524, "train_info/time_within_train_step": 38.88663339614868, "step": 524}
{"train_info/time_between_train_steps": 0.010847091674804688, "step": 524}
{"info/global_step": 525, "train_info/time_within_train_step": 36.38038611412048, "step": 525}
{"train_info/time_between_train_steps": 0.005192995071411133, "step": 525}
{"info/global_step": 526, "train_info/time_within_train_step": 38.73355674743652, "step": 526}
{"train_info/time_between_train_steps": 0.004907369613647461, "step": 526}
{"info/global_step": 527, "train_info/time_within_train_step": 38.945637464523315, "step": 527}
{"train_info/time_between_train_steps": 0.005192279815673828, "step": 527}
{"info/global_step": 528, "train_info/time_within_train_step": 39.07197165489197, "step": 528}
{"train_info/time_between_train_steps": 0.005143165588378906, "step": 528}
{"info/global_step": 529, "train_info/time_within_train_step": 28.64887285232544, "step": 529}
{"train_info/time_between_train_steps": 0.0051229000091552734, "step": 529}
{"info/global_step": 530, "train_info/time_within_train_step": 27.767078399658203, "step": 530}
{"train_info/time_between_train_steps": 0.006017446517944336, "step": 530}
{"info/global_step": 531, "train_info/time_within_train_step": 27.718331336975098, "step": 531}
{"train_info/time_between_train_steps": 0.005152463912963867, "step": 531}
{"info/global_step": 532, "train_info/time_within_train_step": 27.762320518493652, "step": 532}
{"train_info/time_between_train_steps": 0.005061149597167969, "step": 532}
{"info/global_step": 533, "train_info/time_within_train_step": 27.745726108551025, "step": 533}
{"train_info/time_between_train_steps": 0.0072345733642578125, "step": 533}
{"info/global_step": 534, "train_info/time_within_train_step": 27.797380208969116, "step": 534}
{"train_info/time_between_train_steps": 0.005102872848510742, "step": 534}
{"info/global_step": 535, "train_info/time_within_train_step": 27.84581708908081, "step": 535}
{"train_info/time_between_train_steps": 0.00966787338256836, "step": 535}
{"info/global_step": 536, "train_info/time_within_train_step": 27.77159094810486, "step": 536}
{"train_info/time_between_train_steps": 0.009623527526855469, "step": 536}
{"info/global_step": 537, "train_info/time_within_train_step": 27.73066806793213, "step": 537}
{"train_info/time_between_train_steps": 0.00516819953918457, "step": 537}
{"info/global_step": 538, "train_info/time_within_train_step": 27.739271640777588, "step": 538}
{"train_info/time_between_train_steps": 0.005141019821166992, "step": 538}
{"info/global_step": 539, "train_info/time_within_train_step": 27.799827575683594, "step": 539}
{"train_info/time_between_train_steps": 0.005452394485473633, "step": 539}
{"info/global_step": 540, "train_info/time_within_train_step": 27.77248454093933, "step": 540}
{"train_info/time_between_train_steps": 0.0057201385498046875, "step": 540}
{"train_info/time_between_train_steps": 20.776631116867065, "step": 540}
{"info/global_step": 541, "train_info/time_within_train_step": 27.800010919570923, "step": 541}
{"train_info/time_between_train_steps": 0.009841442108154297, "step": 541}
{"info/global_step": 542, "train_info/time_within_train_step": 27.90664768218994, "step": 542}
{"train_info/time_between_train_steps": 0.004964113235473633, "step": 542}
{"info/global_step": 543, "train_info/time_within_train_step": 27.769459009170532, "step": 543}
{"train_info/time_between_train_steps": 0.004899024963378906, "step": 543}
{"info/global_step": 544, "train_info/time_within_train_step": 27.870576858520508, "step": 544}
{"train_info/time_between_train_steps": 0.004960298538208008, "step": 544}
{"info/global_step": 545, "train_info/time_within_train_step": 27.750564336776733, "step": 545}
{"train_info/time_between_train_steps": 0.0050809383392333984, "step": 545}
{"info/global_step": 546, "train_info/time_within_train_step": 27.89166569709778, "step": 546}
{"train_info/time_between_train_steps": 0.005278825759887695, "step": 546}
{"info/global_step": 547, "train_info/time_within_train_step": 27.775656700134277, "step": 547}
{"train_info/time_between_train_steps": 0.005108356475830078, "step": 547}
{"info/global_step": 548, "train_info/time_within_train_step": 27.81204652786255, "step": 548}
{"train_info/time_between_train_steps": 0.005173921585083008, "step": 548}
{"info/global_step": 549, "train_info/time_within_train_step": 27.742393016815186, "step": 549}
{"train_info/time_between_train_steps": 0.00496220588684082, "step": 549}
{"info/global_step": 550, "train_info/time_within_train_step": 27.879333019256592, "step": 550}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733708078, "_runtime": 20967}, "step": 550}
{"logs": {"train/loss": 4.323, "train/learning_rate": 0.0003611111111111111, "train/epoch": 20.01, "_timestamp": 1733708078, "_runtime": 20967}, "step": 550}
{"train_info/time_between_train_steps": 0.006883382797241211, "step": 550}
{"info/global_step": 551, "train_info/time_within_train_step": 27.807863473892212, "step": 551}
{"train_info/time_between_train_steps": 0.004964351654052734, "step": 551}
{"info/global_step": 552, "train_info/time_within_train_step": 27.755377531051636, "step": 552}
{"train_info/time_between_train_steps": 0.00937032699584961, "step": 552}
{"info/global_step": 553, "train_info/time_within_train_step": 27.77844786643982, "step": 553}
{"train_info/time_between_train_steps": 0.004885673522949219, "step": 553}
{"info/global_step": 554, "train_info/time_within_train_step": 27.76058030128479, "step": 554}
{"train_info/time_between_train_steps": 0.005040884017944336, "step": 554}
{"info/global_step": 555, "train_info/time_within_train_step": 27.761868476867676, "step": 555}
{"train_info/time_between_train_steps": 0.005075931549072266, "step": 555}
{"info/global_step": 556, "train_info/time_within_train_step": 27.74788999557495, "step": 556}
{"train_info/time_between_train_steps": 0.004909515380859375, "step": 556}
{"info/global_step": 557, "train_info/time_within_train_step": 27.771223545074463, "step": 557}
{"train_info/time_between_train_steps": 0.004992008209228516, "step": 557}
{"info/global_step": 558, "train_info/time_within_train_step": 27.74686861038208, "step": 558}
{"train_info/time_between_train_steps": 0.009532928466796875, "step": 558}
{"info/global_step": 559, "train_info/time_within_train_step": 27.73803472518921, "step": 559}
{"train_info/time_between_train_steps": 0.009704113006591797, "step": 559}
{"info/global_step": 560, "train_info/time_within_train_step": 27.791505813598633, "step": 560}
{"train_info/time_between_train_steps": 0.0050928592681884766, "step": 560}
{"info/global_step": 561, "train_info/time_within_train_step": 27.787635326385498, "step": 561}
{"train_info/time_between_train_steps": 0.005636930465698242, "step": 561}
{"info/global_step": 562, "train_info/time_within_train_step": 27.756022930145264, "step": 562}
{"train_info/time_between_train_steps": 0.0049800872802734375, "step": 562}
{"info/global_step": 563, "train_info/time_within_train_step": 27.79373598098755, "step": 563}
{"train_info/time_between_train_steps": 0.005096435546875, "step": 563}
{"info/global_step": 564, "train_info/time_within_train_step": 27.78128218650818, "step": 564}
{"train_info/time_between_train_steps": 0.005238533020019531, "step": 564}
{"info/global_step": 565, "train_info/time_within_train_step": 27.75809645652771, "step": 565}
{"train_info/time_between_train_steps": 0.005407571792602539, "step": 565}
{"info/global_step": 566, "train_info/time_within_train_step": 27.896962881088257, "step": 566}
{"train_info/time_between_train_steps": 0.0054378509521484375, "step": 566}
{"info/global_step": 567, "train_info/time_within_train_step": 27.79349446296692, "step": 567}
{"train_info/time_between_train_steps": 0.0056264400482177734, "step": 567}
{"train_info/time_between_train_steps": 20.34293246269226, "step": 567}
{"info/global_step": 568, "train_info/time_within_train_step": 27.756662607192993, "step": 568}
{"train_info/time_between_train_steps": 0.005367755889892578, "step": 568}
{"info/global_step": 569, "train_info/time_within_train_step": 27.93135976791382, "step": 569}
{"train_info/time_between_train_steps": 0.005272865295410156, "step": 569}
{"info/global_step": 570, "train_info/time_within_train_step": 27.79439902305603, "step": 570}
{"train_info/time_between_train_steps": 0.0052928924560546875, "step": 570}
{"info/global_step": 571, "train_info/time_within_train_step": 27.90722131729126, "step": 571}
{"train_info/time_between_train_steps": 0.005208492279052734, "step": 571}
{"info/global_step": 572, "train_info/time_within_train_step": 27.78431510925293, "step": 572}
{"train_info/time_between_train_steps": 0.00509190559387207, "step": 572}
{"info/global_step": 573, "train_info/time_within_train_step": 27.92939305305481, "step": 573}
{"train_info/time_between_train_steps": 0.009448528289794922, "step": 573}
{"info/global_step": 574, "train_info/time_within_train_step": 27.793753147125244, "step": 574}
{"train_info/time_between_train_steps": 0.0054700374603271484, "step": 574}
{"info/global_step": 575, "train_info/time_within_train_step": 27.841153621673584, "step": 575}
{"train_info/time_between_train_steps": 0.0051403045654296875, "step": 575}
{"info/global_step": 576, "train_info/time_within_train_step": 27.777313709259033, "step": 576}
{"train_info/time_between_train_steps": 0.0051157474517822266, "step": 576}
{"info/global_step": 577, "train_info/time_within_train_step": 27.76002025604248, "step": 577}
{"train_info/time_between_train_steps": 0.0050258636474609375, "step": 577}
{"info/global_step": 578, "train_info/time_within_train_step": 27.752168893814087, "step": 578}
{"train_info/time_between_train_steps": 0.005072832107543945, "step": 578}
{"info/global_step": 579, "train_info/time_within_train_step": 27.771592140197754, "step": 579}
{"train_info/time_between_train_steps": 0.005240440368652344, "step": 579}
{"info/global_step": 580, "train_info/time_within_train_step": 27.779151439666748, "step": 580}
{"train_info/time_between_train_steps": 0.0051462650299072266, "step": 580}
{"info/global_step": 581, "train_info/time_within_train_step": 27.875625133514404, "step": 581}
{"train_info/time_between_train_steps": 0.0050885677337646484, "step": 581}
{"info/global_step": 582, "train_info/time_within_train_step": 27.78668522834778, "step": 582}
{"train_info/time_between_train_steps": 0.009844303131103516, "step": 582}
{"info/global_step": 583, "train_info/time_within_train_step": 27.777088403701782, "step": 583}
{"train_info/time_between_train_steps": 0.008312225341796875, "step": 583}
{"info/global_step": 584, "train_info/time_within_train_step": 27.773412227630615, "step": 584}
{"train_info/time_between_train_steps": 0.005174160003662109, "step": 584}
{"info/global_step": 585, "train_info/time_within_train_step": 27.731494903564453, "step": 585}
{"train_info/time_between_train_steps": 0.004965066909790039, "step": 585}
{"info/global_step": 586, "train_info/time_within_train_step": 27.746325969696045, "step": 586}
{"train_info/time_between_train_steps": 0.006013393402099609, "step": 586}
{"info/global_step": 587, "train_info/time_within_train_step": 27.748615264892578, "step": 587}
{"train_info/time_between_train_steps": 0.0049495697021484375, "step": 587}
{"info/global_step": 588, "train_info/time_within_train_step": 27.736070156097412, "step": 588}
{"train_info/time_between_train_steps": 0.005023479461669922, "step": 588}
{"info/global_step": 589, "train_info/time_within_train_step": 27.725579023361206, "step": 589}
{"train_info/time_between_train_steps": 0.005301952362060547, "step": 589}
{"info/global_step": 590, "train_info/time_within_train_step": 27.74281883239746, "step": 590}
{"train_info/time_between_train_steps": 0.005057573318481445, "step": 590}
{"info/global_step": 591, "train_info/time_within_train_step": 27.74739670753479, "step": 591}
{"train_info/time_between_train_steps": 0.010155439376831055, "step": 591}
{"info/global_step": 592, "train_info/time_within_train_step": 27.754408359527588, "step": 592}
{"train_info/time_between_train_steps": 0.010066032409667969, "step": 592}
{"info/global_step": 593, "train_info/time_within_train_step": 27.912235498428345, "step": 593}
{"train_info/time_between_train_steps": 0.010439872741699219, "step": 593}
{"info/global_step": 594, "train_info/time_within_train_step": 27.779058694839478, "step": 594}
{"train_info/time_between_train_steps": 0.005601644515991211, "step": 594}
{"train_info/time_between_train_steps": 20.55850601196289, "step": 594}
{"info/global_step": 595, "train_info/time_within_train_step": 27.730579376220703, "step": 595}
{"train_info/time_between_train_steps": 0.010265111923217773, "step": 595}
{"info/global_step": 596, "train_info/time_within_train_step": 27.97420310974121, "step": 596}
{"train_info/time_between_train_steps": 0.010267019271850586, "step": 596}
{"info/global_step": 597, "train_info/time_within_train_step": 27.790801286697388, "step": 597}
{"train_info/time_between_train_steps": 0.005200624465942383, "step": 597}
{"info/global_step": 598, "train_info/time_within_train_step": 27.94940757751465, "step": 598}
{"train_info/time_between_train_steps": 0.005373716354370117, "step": 598}
{"info/global_step": 599, "train_info/time_within_train_step": 27.793458461761475, "step": 599}
{"train_info/time_between_train_steps": 0.005300760269165039, "step": 599}
{"info/global_step": 600, "train_info/time_within_train_step": 28.044199228286743, "step": 600}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733709509, "_runtime": 22398}, "step": 600}
{"logs": {"train/loss": 4.1768, "train/learning_rate": 0.0003333333333333333, "train/epoch": 22.0, "_timestamp": 1733709509, "_runtime": 22398}, "step": 600}
{"train_info/time_between_train_steps": 2.2948155403137207, "step": 600}
{"info/global_step": 601, "train_info/time_within_train_step": 27.769065856933594, "step": 601}
{"train_info/time_between_train_steps": 0.005604267120361328, "step": 601}
{"info/global_step": 602, "train_info/time_within_train_step": 27.81279706954956, "step": 602}
{"train_info/time_between_train_steps": 0.005178689956665039, "step": 602}
{"info/global_step": 603, "train_info/time_within_train_step": 27.765363931655884, "step": 603}
{"train_info/time_between_train_steps": 0.009655952453613281, "step": 603}
{"info/global_step": 604, "train_info/time_within_train_step": 27.720419883728027, "step": 604}
{"train_info/time_between_train_steps": 0.005009174346923828, "step": 604}
{"info/global_step": 605, "train_info/time_within_train_step": 27.72052788734436, "step": 605}
{"train_info/time_between_train_steps": 0.004939079284667969, "step": 605}
{"info/global_step": 606, "train_info/time_within_train_step": 27.719173431396484, "step": 606}
{"train_info/time_between_train_steps": 0.0049114227294921875, "step": 606}
{"info/global_step": 607, "train_info/time_within_train_step": 27.732892990112305, "step": 607}
{"train_info/time_between_train_steps": 0.00495457649230957, "step": 607}
{"info/global_step": 608, "train_info/time_within_train_step": 27.716776371002197, "step": 608}
{"train_info/time_between_train_steps": 0.004946708679199219, "step": 608}
{"info/global_step": 609, "train_info/time_within_train_step": 27.724302291870117, "step": 609}
{"train_info/time_between_train_steps": 0.004942417144775391, "step": 609}
{"info/global_step": 610, "train_info/time_within_train_step": 28.0209858417511, "step": 610}
{"train_info/time_between_train_steps": 0.004888057708740234, "step": 610}
{"info/global_step": 611, "train_info/time_within_train_step": 27.729285955429077, "step": 611}
{"train_info/time_between_train_steps": 0.00973820686340332, "step": 611}
{"info/global_step": 612, "train_info/time_within_train_step": 27.822223901748657, "step": 612}
{"train_info/time_between_train_steps": 0.005052804946899414, "step": 612}
{"info/global_step": 613, "train_info/time_within_train_step": 27.73978281021118, "step": 613}
{"train_info/time_between_train_steps": 0.009724617004394531, "step": 613}
{"info/global_step": 614, "train_info/time_within_train_step": 27.745355367660522, "step": 614}
{"train_info/time_between_train_steps": 0.004983186721801758, "step": 614}
{"info/global_step": 615, "train_info/time_within_train_step": 27.723092317581177, "step": 615}
{"train_info/time_between_train_steps": 0.00497126579284668, "step": 615}
{"info/global_step": 616, "train_info/time_within_train_step": 28.170215368270874, "step": 616}
{"train_info/time_between_train_steps": 0.00960683822631836, "step": 616}
{"info/global_step": 617, "train_info/time_within_train_step": 27.854368686676025, "step": 617}
{"train_info/time_between_train_steps": 0.005097150802612305, "step": 617}
{"info/global_step": 618, "train_info/time_within_train_step": 27.74959421157837, "step": 618}
{"train_info/time_between_train_steps": 0.0051534175872802734, "step": 618}
{"info/global_step": 619, "train_info/time_within_train_step": 27.738068103790283, "step": 619}
{"train_info/time_between_train_steps": 0.0053577423095703125, "step": 619}
{"info/global_step": 620, "train_info/time_within_train_step": 27.894102573394775, "step": 620}
{"train_info/time_between_train_steps": 0.009743213653564453, "step": 620}
{"info/global_step": 621, "train_info/time_within_train_step": 27.782708168029785, "step": 621}
{"train_info/time_between_train_steps": 0.005548715591430664, "step": 621}
{"train_info/time_between_train_steps": 20.660372018814087, "step": 621}
{"info/global_step": 622, "train_info/time_within_train_step": 27.730696439743042, "step": 622}
{"train_info/time_between_train_steps": 0.005255937576293945, "step": 622}
{"info/global_step": 623, "train_info/time_within_train_step": 27.912712335586548, "step": 623}
{"train_info/time_between_train_steps": 0.005344867706298828, "step": 623}
{"info/global_step": 624, "train_info/time_within_train_step": 27.74170756340027, "step": 624}
{"train_info/time_between_train_steps": 0.0049860477447509766, "step": 624}
{"info/global_step": 625, "train_info/time_within_train_step": 27.931774377822876, "step": 625}
{"train_info/time_between_train_steps": 0.0051152706146240234, "step": 625}
{"info/global_step": 626, "train_info/time_within_train_step": 27.735053062438965, "step": 626}
{"train_info/time_between_train_steps": 0.005330324172973633, "step": 626}
{"info/global_step": 627, "train_info/time_within_train_step": 27.99443817138672, "step": 627}
{"train_info/time_between_train_steps": 0.005278348922729492, "step": 627}
{"info/global_step": 628, "train_info/time_within_train_step": 27.753771781921387, "step": 628}
{"train_info/time_between_train_steps": 0.00523686408996582, "step": 628}
{"info/global_step": 629, "train_info/time_within_train_step": 27.82356023788452, "step": 629}
{"train_info/time_between_train_steps": 0.005212306976318359, "step": 629}
{"info/global_step": 630, "train_info/time_within_train_step": 27.75337529182434, "step": 630}
{"train_info/time_between_train_steps": 0.005106449127197266, "step": 630}
{"info/global_step": 631, "train_info/time_within_train_step": 27.725106716156006, "step": 631}
{"train_info/time_between_train_steps": 0.005006551742553711, "step": 631}
{"info/global_step": 632, "train_info/time_within_train_step": 27.7359299659729, "step": 632}
{"train_info/time_between_train_steps": 0.009868621826171875, "step": 632}
{"info/global_step": 633, "train_info/time_within_train_step": 27.761916875839233, "step": 633}
{"train_info/time_between_train_steps": 0.005119800567626953, "step": 633}
{"info/global_step": 634, "train_info/time_within_train_step": 27.731351375579834, "step": 634}
{"train_info/time_between_train_steps": 0.005158901214599609, "step": 634}
{"info/global_step": 635, "train_info/time_within_train_step": 27.72994112968445, "step": 635}
{"train_info/time_between_train_steps": 0.00512242317199707, "step": 635}
{"info/global_step": 636, "train_info/time_within_train_step": 27.725136518478394, "step": 636}
{"train_info/time_between_train_steps": 0.004975557327270508, "step": 636}
{"info/global_step": 637, "train_info/time_within_train_step": 27.799412965774536, "step": 637}
{"train_info/time_between_train_steps": 0.009741783142089844, "step": 637}
{"info/global_step": 638, "train_info/time_within_train_step": 27.805433750152588, "step": 638}
{"train_info/time_between_train_steps": 0.005217790603637695, "step": 638}
{"info/global_step": 639, "train_info/time_within_train_step": 27.78012990951538, "step": 639}
{"train_info/time_between_train_steps": 0.005226850509643555, "step": 639}
{"info/global_step": 640, "train_info/time_within_train_step": 27.745830297470093, "step": 640}
{"train_info/time_between_train_steps": 0.0051212310791015625, "step": 640}
{"info/global_step": 641, "train_info/time_within_train_step": 27.84509825706482, "step": 641}
{"train_info/time_between_train_steps": 0.014852046966552734, "step": 641}
{"info/global_step": 642, "train_info/time_within_train_step": 27.798112154006958, "step": 642}
{"train_info/time_between_train_steps": 0.0051975250244140625, "step": 642}
{"info/global_step": 643, "train_info/time_within_train_step": 27.7318754196167, "step": 643}
{"train_info/time_between_train_steps": 0.0050678253173828125, "step": 643}
{"info/global_step": 644, "train_info/time_within_train_step": 27.77196717262268, "step": 644}
{"train_info/time_between_train_steps": 0.005663394927978516, "step": 644}
{"info/global_step": 645, "train_info/time_within_train_step": 27.803290367126465, "step": 645}
{"train_info/time_between_train_steps": 0.005301237106323242, "step": 645}
{"info/global_step": 646, "train_info/time_within_train_step": 27.739213705062866, "step": 646}
{"train_info/time_between_train_steps": 0.010453939437866211, "step": 646}
{"info/global_step": 647, "train_info/time_within_train_step": 27.741843938827515, "step": 647}
{"train_info/time_between_train_steps": 0.005456447601318359, "step": 647}
{"info/global_step": 648, "train_info/time_within_train_step": 27.76271104812622, "step": 648}
{"train_info/time_between_train_steps": 0.005718708038330078, "step": 648}
{"train_info/time_between_train_steps": 20.312819480895996, "step": 648}
{"info/global_step": 649, "train_info/time_within_train_step": 27.761129140853882, "step": 649}
{"train_info/time_between_train_steps": 0.005534172058105469, "step": 649}
{"info/global_step": 650, "train_info/time_within_train_step": 27.93407368659973, "step": 650}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733710942, "_runtime": 23831}, "step": 650}
{"logs": {"train/loss": 4.06, "train/learning_rate": 0.00030555555555555555, "train/epoch": 24.0, "_timestamp": 1733710942, "_runtime": 23831}, "step": 650}
{"train_info/time_between_train_steps": 0.0070726871490478516, "step": 650}
{"info/global_step": 651, "train_info/time_within_train_step": 27.737892389297485, "step": 651}
{"train_info/time_between_train_steps": 0.005242824554443359, "step": 651}
{"info/global_step": 652, "train_info/time_within_train_step": 27.94392228126526, "step": 652}
{"train_info/time_between_train_steps": 0.005202054977416992, "step": 652}
{"info/global_step": 653, "train_info/time_within_train_step": 27.782952547073364, "step": 653}
{"train_info/time_between_train_steps": 0.005475759506225586, "step": 653}
{"info/global_step": 654, "train_info/time_within_train_step": 27.922109365463257, "step": 654}
{"train_info/time_between_train_steps": 0.005246639251708984, "step": 654}
{"info/global_step": 655, "train_info/time_within_train_step": 27.743444442749023, "step": 655}
{"train_info/time_between_train_steps": 0.005515575408935547, "step": 655}
{"info/global_step": 656, "train_info/time_within_train_step": 27.79679298400879, "step": 656}
{"train_info/time_between_train_steps": 0.008013725280761719, "step": 656}
{"info/global_step": 657, "train_info/time_within_train_step": 27.82749366760254, "step": 657}
{"train_info/time_between_train_steps": 0.009926795959472656, "step": 657}
{"info/global_step": 658, "train_info/time_within_train_step": 27.74341630935669, "step": 658}
{"train_info/time_between_train_steps": 0.0049054622650146484, "step": 658}
{"info/global_step": 659, "train_info/time_within_train_step": 27.743324756622314, "step": 659}
{"train_info/time_between_train_steps": 0.005011081695556641, "step": 659}
{"info/global_step": 660, "train_info/time_within_train_step": 27.73909330368042, "step": 660}
{"train_info/time_between_train_steps": 0.005059480667114258, "step": 660}
{"info/global_step": 661, "train_info/time_within_train_step": 27.72397494316101, "step": 661}
{"train_info/time_between_train_steps": 0.005120038986206055, "step": 661}
{"info/global_step": 662, "train_info/time_within_train_step": 27.717169046401978, "step": 662}
{"train_info/time_between_train_steps": 0.009715080261230469, "step": 662}
{"info/global_step": 663, "train_info/time_within_train_step": 27.951386213302612, "step": 663}
{"train_info/time_between_train_steps": 0.005510091781616211, "step": 663}
{"info/global_step": 664, "train_info/time_within_train_step": 27.79557752609253, "step": 664}
{"train_info/time_between_train_steps": 0.0056002140045166016, "step": 664}
{"info/global_step": 665, "train_info/time_within_train_step": 27.79748225212097, "step": 665}
{"train_info/time_between_train_steps": 0.005186796188354492, "step": 665}
{"info/global_step": 666, "train_info/time_within_train_step": 27.748673677444458, "step": 666}
{"train_info/time_between_train_steps": 0.0052068233489990234, "step": 666}
{"info/global_step": 667, "train_info/time_within_train_step": 27.761369228363037, "step": 667}
{"train_info/time_between_train_steps": 0.004897356033325195, "step": 667}
{"info/global_step": 668, "train_info/time_within_train_step": 27.74596333503723, "step": 668}
{"train_info/time_between_train_steps": 0.009717226028442383, "step": 668}
{"info/global_step": 669, "train_info/time_within_train_step": 27.77782392501831, "step": 669}
{"train_info/time_between_train_steps": 0.010507345199584961, "step": 669}
{"info/global_step": 670, "train_info/time_within_train_step": 27.778644561767578, "step": 670}
{"train_info/time_between_train_steps": 0.005096435546875, "step": 670}
{"info/global_step": 671, "train_info/time_within_train_step": 27.74852156639099, "step": 671}
{"train_info/time_between_train_steps": 0.005118131637573242, "step": 671}
{"info/global_step": 672, "train_info/time_within_train_step": 27.7373104095459, "step": 672}
{"train_info/time_between_train_steps": 0.005471467971801758, "step": 672}
{"info/global_step": 673, "train_info/time_within_train_step": 27.82885432243347, "step": 673}
{"train_info/time_between_train_steps": 0.0052530765533447266, "step": 673}
{"info/global_step": 674, "train_info/time_within_train_step": 27.77017569541931, "step": 674}
{"train_info/time_between_train_steps": 0.01062774658203125, "step": 674}
{"info/global_step": 675, "train_info/time_within_train_step": 27.767754554748535, "step": 675}
{"train_info/time_between_train_steps": 0.005682706832885742, "step": 675}
{"train_info/time_between_train_steps": 20.523484468460083, "step": 675}
{"info/global_step": 676, "train_info/time_within_train_step": 27.80510926246643, "step": 676}
{"train_info/time_between_train_steps": 0.005422353744506836, "step": 676}
{"info/global_step": 677, "train_info/time_within_train_step": 27.95992374420166, "step": 677}
{"train_info/time_between_train_steps": 0.009992122650146484, "step": 677}
{"info/global_step": 678, "train_info/time_within_train_step": 27.77140212059021, "step": 678}
{"train_info/time_between_train_steps": 0.010134220123291016, "step": 678}
{"info/global_step": 679, "train_info/time_within_train_step": 27.988311290740967, "step": 679}
{"train_info/time_between_train_steps": 0.00519251823425293, "step": 679}
{"info/global_step": 680, "train_info/time_within_train_step": 27.737353086471558, "step": 680}
{"train_info/time_between_train_steps": 0.005475044250488281, "step": 680}
{"info/global_step": 681, "train_info/time_within_train_step": 28.010967254638672, "step": 681}
{"train_info/time_between_train_steps": 0.005573749542236328, "step": 681}
{"info/global_step": 682, "train_info/time_within_train_step": 27.832047939300537, "step": 682}
{"train_info/time_between_train_steps": 0.0051021575927734375, "step": 682}
{"info/global_step": 683, "train_info/time_within_train_step": 27.8659725189209, "step": 683}
{"train_info/time_between_train_steps": 0.005281686782836914, "step": 683}
{"info/global_step": 684, "train_info/time_within_train_step": 27.744741201400757, "step": 684}
{"train_info/time_between_train_steps": 0.0052378177642822266, "step": 684}
{"info/global_step": 685, "train_info/time_within_train_step": 27.732083082199097, "step": 685}
{"train_info/time_between_train_steps": 0.005105495452880859, "step": 685}
{"info/global_step": 686, "train_info/time_within_train_step": 27.75086760520935, "step": 686}
{"train_info/time_between_train_steps": 0.005083560943603516, "step": 686}
{"info/global_step": 687, "train_info/time_within_train_step": 27.725483179092407, "step": 687}
{"train_info/time_between_train_steps": 0.004872322082519531, "step": 687}
{"info/global_step": 688, "train_info/time_within_train_step": 27.846137285232544, "step": 688}
{"train_info/time_between_train_steps": 0.006087541580200195, "step": 688}
{"info/global_step": 689, "train_info/time_within_train_step": 27.736010789871216, "step": 689}
{"train_info/time_between_train_steps": 0.004924297332763672, "step": 689}
{"info/global_step": 690, "train_info/time_within_train_step": 27.723135948181152, "step": 690}
{"train_info/time_between_train_steps": 0.004933834075927734, "step": 690}
{"info/global_step": 691, "train_info/time_within_train_step": 27.72514009475708, "step": 691}
{"train_info/time_between_train_steps": 0.005276679992675781, "step": 691}
{"info/global_step": 692, "train_info/time_within_train_step": 27.72648787498474, "step": 692}
{"train_info/time_between_train_steps": 0.004997968673706055, "step": 692}
{"info/global_step": 693, "train_info/time_within_train_step": 27.73972988128662, "step": 693}
{"train_info/time_between_train_steps": 0.00505518913269043, "step": 693}
{"info/global_step": 694, "train_info/time_within_train_step": 27.78529977798462, "step": 694}
{"train_info/time_between_train_steps": 0.005040645599365234, "step": 694}
{"info/global_step": 695, "train_info/time_within_train_step": 27.81084680557251, "step": 695}
{"train_info/time_between_train_steps": 0.005101919174194336, "step": 695}
{"info/global_step": 696, "train_info/time_within_train_step": 27.73995041847229, "step": 696}
{"train_info/time_between_train_steps": 0.01003885269165039, "step": 696}
{"info/global_step": 697, "train_info/time_within_train_step": 27.748756647109985, "step": 697}
{"train_info/time_between_train_steps": 0.005121707916259766, "step": 697}
{"info/global_step": 698, "train_info/time_within_train_step": 27.76257586479187, "step": 698}
{"train_info/time_between_train_steps": 0.005231142044067383, "step": 698}
{"info/global_step": 699, "train_info/time_within_train_step": 27.864941835403442, "step": 699}
{"train_info/time_between_train_steps": 0.009796380996704102, "step": 699}
{"info/global_step": 700, "train_info/time_within_train_step": 27.82843327522278, "step": 700}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733712353, "_runtime": 25242}, "step": 700}
{"logs": {"train/loss": 3.9095, "train/learning_rate": 0.0002777777777777778, "train/epoch": 25.02, "_timestamp": 1733712353, "_runtime": 25242}, "step": 700}
{"train_info/time_between_train_steps": 2.2317988872528076, "step": 700}
{"info/global_step": 701, "train_info/time_within_train_step": 27.810170888900757, "step": 701}
{"train_info/time_between_train_steps": 0.006227016448974609, "step": 701}
{"info/global_step": 702, "train_info/time_within_train_step": 27.773563385009766, "step": 702}
{"train_info/time_between_train_steps": 0.005888223648071289, "step": 702}
{"train_info/time_between_train_steps": 20.562382698059082, "step": 702}
{"info/global_step": 703, "train_info/time_within_train_step": 27.908376693725586, "step": 703}
{"train_info/time_between_train_steps": 0.005598306655883789, "step": 703}
{"info/global_step": 704, "train_info/time_within_train_step": 27.939062356948853, "step": 704}
{"train_info/time_between_train_steps": 0.0050754547119140625, "step": 704}
{"info/global_step": 705, "train_info/time_within_train_step": 27.792919874191284, "step": 705}
{"train_info/time_between_train_steps": 0.005170583724975586, "step": 705}
{"info/global_step": 706, "train_info/time_within_train_step": 27.924243927001953, "step": 706}
{"train_info/time_between_train_steps": 0.005324602127075195, "step": 706}
{"info/global_step": 707, "train_info/time_within_train_step": 27.75016498565674, "step": 707}
{"train_info/time_between_train_steps": 0.005554676055908203, "step": 707}
{"info/global_step": 708, "train_info/time_within_train_step": 27.932002782821655, "step": 708}
{"train_info/time_between_train_steps": 0.0053026676177978516, "step": 708}
{"info/global_step": 709, "train_info/time_within_train_step": 27.732150077819824, "step": 709}
{"train_info/time_between_train_steps": 0.005265235900878906, "step": 709}
{"info/global_step": 710, "train_info/time_within_train_step": 27.826282739639282, "step": 710}
{"train_info/time_between_train_steps": 0.005218982696533203, "step": 710}
{"info/global_step": 711, "train_info/time_within_train_step": 27.741053819656372, "step": 711}
{"train_info/time_between_train_steps": 0.004888772964477539, "step": 711}
{"info/global_step": 712, "train_info/time_within_train_step": 27.728917121887207, "step": 712}
{"train_info/time_between_train_steps": 0.004945039749145508, "step": 712}
{"info/global_step": 713, "train_info/time_within_train_step": 27.764711141586304, "step": 713}
{"train_info/time_between_train_steps": 0.004981040954589844, "step": 713}
{"info/global_step": 714, "train_info/time_within_train_step": 27.733898878097534, "step": 714}
{"train_info/time_between_train_steps": 0.004973888397216797, "step": 714}
{"info/global_step": 715, "train_info/time_within_train_step": 27.725891828536987, "step": 715}
{"train_info/time_between_train_steps": 0.004980564117431641, "step": 715}
{"info/global_step": 716, "train_info/time_within_train_step": 27.798224449157715, "step": 716}
{"train_info/time_between_train_steps": 0.004980325698852539, "step": 716}
{"info/global_step": 717, "train_info/time_within_train_step": 27.77056360244751, "step": 717}
{"train_info/time_between_train_steps": 0.0049381256103515625, "step": 717}
{"info/global_step": 718, "train_info/time_within_train_step": 27.748422622680664, "step": 718}
{"train_info/time_between_train_steps": 0.0052449703216552734, "step": 718}
{"info/global_step": 719, "train_info/time_within_train_step": 27.90636157989502, "step": 719}
{"train_info/time_between_train_steps": 0.0051081180572509766, "step": 719}
{"info/global_step": 720, "train_info/time_within_train_step": 27.74673891067505, "step": 720}
{"train_info/time_between_train_steps": 0.005164146423339844, "step": 720}
{"info/global_step": 721, "train_info/time_within_train_step": 27.794116497039795, "step": 721}
{"train_info/time_between_train_steps": 0.005000114440917969, "step": 721}
{"info/global_step": 722, "train_info/time_within_train_step": 27.753920793533325, "step": 722}
{"train_info/time_between_train_steps": 0.005158185958862305, "step": 722}
{"info/global_step": 723, "train_info/time_within_train_step": 27.764888286590576, "step": 723}
{"train_info/time_between_train_steps": 0.00564885139465332, "step": 723}
{"info/global_step": 724, "train_info/time_within_train_step": 27.73707413673401, "step": 724}
{"train_info/time_between_train_steps": 0.005169868469238281, "step": 724}
{"info/global_step": 725, "train_info/time_within_train_step": 27.735971927642822, "step": 725}
{"train_info/time_between_train_steps": 0.00512385368347168, "step": 725}
{"info/global_step": 726, "train_info/time_within_train_step": 27.733691692352295, "step": 726}
{"train_info/time_between_train_steps": 0.005291461944580078, "step": 726}
{"info/global_step": 727, "train_info/time_within_train_step": 27.77467679977417, "step": 727}
{"train_info/time_between_train_steps": 0.005294084548950195, "step": 727}
{"info/global_step": 728, "train_info/time_within_train_step": 27.759932041168213, "step": 728}
{"train_info/time_between_train_steps": 0.006579160690307617, "step": 728}
{"info/global_step": 729, "train_info/time_within_train_step": 27.754197359085083, "step": 729}
{"train_info/time_between_train_steps": 0.005591869354248047, "step": 729}
{"train_info/time_between_train_steps": 20.390228271484375, "step": 729}
{"info/global_step": 730, "train_info/time_within_train_step": 27.757381439208984, "step": 730}
{"train_info/time_between_train_steps": 0.005480051040649414, "step": 730}
{"info/global_step": 731, "train_info/time_within_train_step": 27.903918027877808, "step": 731}
{"train_info/time_between_train_steps": 0.0052547454833984375, "step": 731}
{"info/global_step": 732, "train_info/time_within_train_step": 27.743619918823242, "step": 732}
{"train_info/time_between_train_steps": 0.005373239517211914, "step": 732}
{"info/global_step": 733, "train_info/time_within_train_step": 27.881761074066162, "step": 733}
{"train_info/time_between_train_steps": 0.010762214660644531, "step": 733}
{"info/global_step": 734, "train_info/time_within_train_step": 27.823755741119385, "step": 734}
{"train_info/time_between_train_steps": 0.0051898956298828125, "step": 734}
{"info/global_step": 735, "train_info/time_within_train_step": 27.916663885116577, "step": 735}
{"train_info/time_between_train_steps": 0.0054361820220947266, "step": 735}
{"info/global_step": 736, "train_info/time_within_train_step": 27.762048721313477, "step": 736}
{"train_info/time_between_train_steps": 0.01621222496032715, "step": 736}
{"info/global_step": 737, "train_info/time_within_train_step": 27.77504324913025, "step": 737}
{"train_info/time_between_train_steps": 0.005305767059326172, "step": 737}
{"info/global_step": 738, "train_info/time_within_train_step": 27.74943470954895, "step": 738}
{"train_info/time_between_train_steps": 0.004940032958984375, "step": 738}
{"info/global_step": 739, "train_info/time_within_train_step": 27.732990503311157, "step": 739}
{"train_info/time_between_train_steps": 0.004930257797241211, "step": 739}
{"info/global_step": 740, "train_info/time_within_train_step": 27.76683211326599, "step": 740}
{"train_info/time_between_train_steps": 0.005079746246337891, "step": 740}
{"info/global_step": 741, "train_info/time_within_train_step": 27.736160039901733, "step": 741}
{"train_info/time_between_train_steps": 0.009834766387939453, "step": 741}
{"info/global_step": 742, "train_info/time_within_train_step": 27.766501903533936, "step": 742}
{"train_info/time_between_train_steps": 0.005002737045288086, "step": 742}
{"info/global_step": 743, "train_info/time_within_train_step": 27.74095106124878, "step": 743}
{"train_info/time_between_train_steps": 0.005070686340332031, "step": 743}
{"info/global_step": 744, "train_info/time_within_train_step": 27.79858088493347, "step": 744}
{"train_info/time_between_train_steps": 0.009718656539916992, "step": 744}
{"info/global_step": 745, "train_info/time_within_train_step": 27.754772186279297, "step": 745}
{"train_info/time_between_train_steps": 0.0051233768463134766, "step": 745}
{"info/global_step": 746, "train_info/time_within_train_step": 27.794233083724976, "step": 746}
{"train_info/time_between_train_steps": 0.009931325912475586, "step": 746}
{"info/global_step": 747, "train_info/time_within_train_step": 27.872669219970703, "step": 747}
{"train_info/time_between_train_steps": 0.005090951919555664, "step": 747}
{"info/global_step": 748, "train_info/time_within_train_step": 27.75768232345581, "step": 748}
{"train_info/time_between_train_steps": 0.005207538604736328, "step": 748}
{"info/global_step": 749, "train_info/time_within_train_step": 27.827285289764404, "step": 749}
{"train_info/time_between_train_steps": 0.0052738189697265625, "step": 749}
{"info/global_step": 750, "train_info/time_within_train_step": 27.75991678237915, "step": 750}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733713786, "_runtime": 26675}, "step": 750}
{"logs": {"train/loss": 3.8755, "train/learning_rate": 0.00025, "train/epoch": 27.02, "_timestamp": 1733713786, "_runtime": 26675}, "step": 750}
{"train_info/time_between_train_steps": 0.006995201110839844, "step": 750}
{"info/global_step": 751, "train_info/time_within_train_step": 27.787877798080444, "step": 751}
{"train_info/time_between_train_steps": 0.005099058151245117, "step": 751}
{"info/global_step": 752, "train_info/time_within_train_step": 27.777555227279663, "step": 752}
{"train_info/time_between_train_steps": 0.005087852478027344, "step": 752}
{"info/global_step": 753, "train_info/time_within_train_step": 27.755293607711792, "step": 753}
{"train_info/time_between_train_steps": 0.008285760879516602, "step": 753}
{"info/global_step": 754, "train_info/time_within_train_step": 27.769490242004395, "step": 754}
{"train_info/time_between_train_steps": 0.005283832550048828, "step": 754}
{"info/global_step": 755, "train_info/time_within_train_step": 27.79166269302368, "step": 755}
{"train_info/time_between_train_steps": 0.005557060241699219, "step": 755}
{"info/global_step": 756, "train_info/time_within_train_step": 27.76967144012451, "step": 756}
{"train_info/time_between_train_steps": 0.01592421531677246, "step": 756}
{"train_info/time_between_train_steps": 20.475857496261597, "step": 756}
{"info/global_step": 757, "train_info/time_within_train_step": 27.70934796333313, "step": 757}
{"train_info/time_between_train_steps": 0.005507230758666992, "step": 757}
{"info/global_step": 758, "train_info/time_within_train_step": 27.85675621032715, "step": 758}
{"train_info/time_between_train_steps": 0.005226612091064453, "step": 758}
{"info/global_step": 759, "train_info/time_within_train_step": 27.747132539749146, "step": 759}
{"train_info/time_between_train_steps": 0.005135059356689453, "step": 759}
{"info/global_step": 760, "train_info/time_within_train_step": 27.874979972839355, "step": 760}
{"train_info/time_between_train_steps": 0.005171537399291992, "step": 760}
{"info/global_step": 761, "train_info/time_within_train_step": 27.738040685653687, "step": 761}
{"train_info/time_between_train_steps": 0.005624055862426758, "step": 761}
{"info/global_step": 762, "train_info/time_within_train_step": 27.899692058563232, "step": 762}
{"train_info/time_between_train_steps": 0.0052928924560546875, "step": 762}
{"info/global_step": 763, "train_info/time_within_train_step": 27.71297335624695, "step": 763}
{"train_info/time_between_train_steps": 0.00507807731628418, "step": 763}
{"info/global_step": 764, "train_info/time_within_train_step": 27.904111623764038, "step": 764}
{"train_info/time_between_train_steps": 0.0052454471588134766, "step": 764}
{"info/global_step": 765, "train_info/time_within_train_step": 27.705394983291626, "step": 765}
{"train_info/time_between_train_steps": 0.009814739227294922, "step": 765}
{"info/global_step": 766, "train_info/time_within_train_step": 27.717728853225708, "step": 766}
{"train_info/time_between_train_steps": 0.0050356388092041016, "step": 766}
{"info/global_step": 767, "train_info/time_within_train_step": 27.724799156188965, "step": 767}
{"train_info/time_between_train_steps": 0.005048990249633789, "step": 767}
{"info/global_step": 768, "train_info/time_within_train_step": 27.761461973190308, "step": 768}
{"train_info/time_between_train_steps": 0.00502467155456543, "step": 768}
{"info/global_step": 769, "train_info/time_within_train_step": 27.90429949760437, "step": 769}
{"train_info/time_between_train_steps": 0.00979471206665039, "step": 769}
{"info/global_step": 770, "train_info/time_within_train_step": 27.766674518585205, "step": 770}
{"train_info/time_between_train_steps": 0.010080099105834961, "step": 770}
{"info/global_step": 771, "train_info/time_within_train_step": 27.761996507644653, "step": 771}
{"train_info/time_between_train_steps": 0.0051038265228271484, "step": 771}
{"info/global_step": 772, "train_info/time_within_train_step": 27.723172664642334, "step": 772}
{"train_info/time_between_train_steps": 0.005189180374145508, "step": 772}
{"info/global_step": 773, "train_info/time_within_train_step": 27.79213857650757, "step": 773}
{"train_info/time_between_train_steps": 0.004953622817993164, "step": 773}
{"info/global_step": 774, "train_info/time_within_train_step": 27.738049507141113, "step": 774}
{"train_info/time_between_train_steps": 0.005045175552368164, "step": 774}
{"info/global_step": 775, "train_info/time_within_train_step": 27.732205390930176, "step": 775}
{"train_info/time_between_train_steps": 0.004935741424560547, "step": 775}
{"info/global_step": 776, "train_info/time_within_train_step": 27.735947132110596, "step": 776}
{"train_info/time_between_train_steps": 0.009839296340942383, "step": 776}
{"info/global_step": 777, "train_info/time_within_train_step": 27.722466468811035, "step": 777}
{"train_info/time_between_train_steps": 0.00502777099609375, "step": 777}
{"info/global_step": 778, "train_info/time_within_train_step": 27.722760915756226, "step": 778}
{"train_info/time_between_train_steps": 0.009679079055786133, "step": 778}
{"info/global_step": 779, "train_info/time_within_train_step": 27.751768350601196, "step": 779}
{"train_info/time_between_train_steps": 0.009930133819580078, "step": 779}
{"info/global_step": 780, "train_info/time_within_train_step": 28.075591564178467, "step": 780}
{"train_info/time_between_train_steps": 0.0054438114166259766, "step": 780}
{"info/global_step": 781, "train_info/time_within_train_step": 27.74714732170105, "step": 781}
{"train_info/time_between_train_steps": 0.005179643630981445, "step": 781}
{"info/global_step": 782, "train_info/time_within_train_step": 27.734503030776978, "step": 782}
{"train_info/time_between_train_steps": 0.005360841751098633, "step": 782}
{"info/global_step": 783, "train_info/time_within_train_step": 27.734605312347412, "step": 783}
{"train_info/time_between_train_steps": 0.005555391311645508, "step": 783}
{"train_info/time_between_train_steps": 20.58989429473877, "step": 783}
{"info/global_step": 784, "train_info/time_within_train_step": 27.722477436065674, "step": 784}
{"train_info/time_between_train_steps": 0.004907846450805664, "step": 784}
{"info/global_step": 785, "train_info/time_within_train_step": 27.829953908920288, "step": 785}
{"train_info/time_between_train_steps": 0.004975557327270508, "step": 785}
{"info/global_step": 786, "train_info/time_within_train_step": 27.72521185874939, "step": 786}
{"train_info/time_between_train_steps": 0.005186319351196289, "step": 786}
{"info/global_step": 787, "train_info/time_within_train_step": 27.92698073387146, "step": 787}
{"train_info/time_between_train_steps": 0.0052874088287353516, "step": 787}
{"info/global_step": 788, "train_info/time_within_train_step": 27.7392475605011, "step": 788}
{"train_info/time_between_train_steps": 0.005389690399169922, "step": 788}
{"info/global_step": 789, "train_info/time_within_train_step": 27.89896059036255, "step": 789}
{"train_info/time_between_train_steps": 0.005269050598144531, "step": 789}
{"info/global_step": 790, "train_info/time_within_train_step": 27.747467041015625, "step": 790}
{"train_info/time_between_train_steps": 0.0056154727935791016, "step": 790}
{"info/global_step": 791, "train_info/time_within_train_step": 27.83594799041748, "step": 791}
{"train_info/time_between_train_steps": 0.005235195159912109, "step": 791}
{"info/global_step": 792, "train_info/time_within_train_step": 27.721369743347168, "step": 792}
{"train_info/time_between_train_steps": 0.0048983097076416016, "step": 792}
{"info/global_step": 793, "train_info/time_within_train_step": 27.91850447654724, "step": 793}
{"train_info/time_between_train_steps": 0.004992485046386719, "step": 793}
{"info/global_step": 794, "train_info/time_within_train_step": 27.720670223236084, "step": 794}
{"train_info/time_between_train_steps": 0.009456872940063477, "step": 794}
{"info/global_step": 795, "train_info/time_within_train_step": 27.839693307876587, "step": 795}
{"train_info/time_between_train_steps": 0.009981870651245117, "step": 795}
{"info/global_step": 796, "train_info/time_within_train_step": 27.743095636367798, "step": 796}
{"train_info/time_between_train_steps": 0.004902362823486328, "step": 796}
{"info/global_step": 797, "train_info/time_within_train_step": 27.73072600364685, "step": 797}
{"train_info/time_between_train_steps": 0.004886150360107422, "step": 797}
{"info/global_step": 798, "train_info/time_within_train_step": 27.728447675704956, "step": 798}
{"train_info/time_between_train_steps": 0.0052013397216796875, "step": 798}
{"info/global_step": 799, "train_info/time_within_train_step": 27.774332761764526, "step": 799}
{"train_info/time_between_train_steps": 0.005066871643066406, "step": 799}
{"info/global_step": 800, "train_info/time_within_train_step": 27.723167181015015, "step": 800}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733715216, "_runtime": 28105}, "step": 800}
{"logs": {"train/loss": 3.7958, "train/learning_rate": 0.00022222222222222218, "train/epoch": 29.01, "_timestamp": 1733715216, "_runtime": 28105}, "step": 800}
{"train_info/time_between_train_steps": 2.205549716949463, "step": 800}
{"info/global_step": 801, "train_info/time_within_train_step": 27.76022505760193, "step": 801}
{"train_info/time_between_train_steps": 0.005002260208129883, "step": 801}
{"info/global_step": 802, "train_info/time_within_train_step": 27.748178243637085, "step": 802}
{"train_info/time_between_train_steps": 0.005094766616821289, "step": 802}
{"info/global_step": 803, "train_info/time_within_train_step": 27.75632071495056, "step": 803}
{"train_info/time_between_train_steps": 0.005112409591674805, "step": 803}
{"info/global_step": 804, "train_info/time_within_train_step": 27.78942346572876, "step": 804}
{"train_info/time_between_train_steps": 0.005110979080200195, "step": 804}
{"info/global_step": 805, "train_info/time_within_train_step": 27.73046040534973, "step": 805}
{"train_info/time_between_train_steps": 0.004993915557861328, "step": 805}
{"info/global_step": 806, "train_info/time_within_train_step": 27.76440191268921, "step": 806}
{"train_info/time_between_train_steps": 0.005078554153442383, "step": 806}
{"info/global_step": 807, "train_info/time_within_train_step": 27.77944302558899, "step": 807}
{"train_info/time_between_train_steps": 0.0052947998046875, "step": 807}
{"info/global_step": 808, "train_info/time_within_train_step": 27.755126953125, "step": 808}
{"train_info/time_between_train_steps": 0.005399227142333984, "step": 808}
{"info/global_step": 809, "train_info/time_within_train_step": 27.764241933822632, "step": 809}
{"train_info/time_between_train_steps": 0.005651712417602539, "step": 809}
{"info/global_step": 810, "train_info/time_within_train_step": 27.851664543151855, "step": 810}
{"train_info/time_between_train_steps": 0.005494832992553711, "step": 810}
{"train_info/time_between_train_steps": 20.325941801071167, "step": 810}
{"info/global_step": 811, "train_info/time_within_train_step": 27.789501905441284, "step": 811}
{"train_info/time_between_train_steps": 0.005624055862426758, "step": 811}
{"info/global_step": 812, "train_info/time_within_train_step": 27.918530225753784, "step": 812}
{"train_info/time_between_train_steps": 0.005295276641845703, "step": 812}
{"info/global_step": 813, "train_info/time_within_train_step": 27.783551692962646, "step": 813}
{"train_info/time_between_train_steps": 0.0054645538330078125, "step": 813}
{"info/global_step": 814, "train_info/time_within_train_step": 28.054149627685547, "step": 814}
{"train_info/time_between_train_steps": 0.005368947982788086, "step": 814}
{"info/global_step": 815, "train_info/time_within_train_step": 27.83423376083374, "step": 815}
{"train_info/time_between_train_steps": 0.005518198013305664, "step": 815}
{"info/global_step": 816, "train_info/time_within_train_step": 27.907285451889038, "step": 816}
{"train_info/time_between_train_steps": 0.005202293395996094, "step": 816}
{"info/global_step": 817, "train_info/time_within_train_step": 27.791210412979126, "step": 817}
{"train_info/time_between_train_steps": 0.005591154098510742, "step": 817}
{"info/global_step": 818, "train_info/time_within_train_step": 27.799635648727417, "step": 818}
{"train_info/time_between_train_steps": 0.0051958560943603516, "step": 818}
{"info/global_step": 819, "train_info/time_within_train_step": 27.760782957077026, "step": 819}
{"train_info/time_between_train_steps": 0.004947662353515625, "step": 819}
{"info/global_step": 820, "train_info/time_within_train_step": 27.72799253463745, "step": 820}
{"train_info/time_between_train_steps": 0.004919290542602539, "step": 820}
{"info/global_step": 821, "train_info/time_within_train_step": 27.730619192123413, "step": 821}
{"train_info/time_between_train_steps": 0.004992008209228516, "step": 821}
{"info/global_step": 822, "train_info/time_within_train_step": 27.740065574645996, "step": 822}
{"train_info/time_between_train_steps": 0.010015487670898438, "step": 822}
{"info/global_step": 823, "train_info/time_within_train_step": 27.73943328857422, "step": 823}
{"train_info/time_between_train_steps": 0.009963035583496094, "step": 823}
{"info/global_step": 824, "train_info/time_within_train_step": 27.729437828063965, "step": 824}
{"train_info/time_between_train_steps": 0.005172014236450195, "step": 824}
{"info/global_step": 825, "train_info/time_within_train_step": 27.795557260513306, "step": 825}
{"train_info/time_between_train_steps": 0.006175994873046875, "step": 825}
{"info/global_step": 826, "train_info/time_within_train_step": 27.713051319122314, "step": 826}
{"train_info/time_between_train_steps": 0.004995107650756836, "step": 826}
{"info/global_step": 827, "train_info/time_within_train_step": 27.705605268478394, "step": 827}
{"train_info/time_between_train_steps": 0.005152463912963867, "step": 827}
{"info/global_step": 828, "train_info/time_within_train_step": 27.701843976974487, "step": 828}
{"train_info/time_between_train_steps": 0.005079507827758789, "step": 828}
{"info/global_step": 829, "train_info/time_within_train_step": 27.73487615585327, "step": 829}
{"train_info/time_between_train_steps": 0.005068778991699219, "step": 829}
{"info/global_step": 830, "train_info/time_within_train_step": 27.730942964553833, "step": 830}
{"train_info/time_between_train_steps": 0.009874820709228516, "step": 830}
{"info/global_step": 831, "train_info/time_within_train_step": 27.710366249084473, "step": 831}
{"train_info/time_between_train_steps": 0.0050792694091796875, "step": 831}
{"info/global_step": 832, "train_info/time_within_train_step": 27.713176488876343, "step": 832}
{"train_info/time_between_train_steps": 0.005037546157836914, "step": 832}
{"info/global_step": 833, "train_info/time_within_train_step": 28.01250672340393, "step": 833}
{"train_info/time_between_train_steps": 0.004963874816894531, "step": 833}
{"info/global_step": 834, "train_info/time_within_train_step": 27.732420206069946, "step": 834}
{"train_info/time_between_train_steps": 0.005366325378417969, "step": 834}
{"info/global_step": 835, "train_info/time_within_train_step": 27.70892596244812, "step": 835}
{"train_info/time_between_train_steps": 0.009644746780395508, "step": 835}
{"info/global_step": 836, "train_info/time_within_train_step": 27.736096382141113, "step": 836}
{"train_info/time_between_train_steps": 0.0066759586334228516, "step": 836}
{"info/global_step": 837, "train_info/time_within_train_step": 27.871622323989868, "step": 837}
{"train_info/time_between_train_steps": 0.015737295150756836, "step": 837}
{"train_info/time_between_train_steps": 20.462361574172974, "step": 837}
{"info/global_step": 838, "train_info/time_within_train_step": 27.72900676727295, "step": 838}
{"train_info/time_between_train_steps": 0.005644321441650391, "step": 838}
{"info/global_step": 839, "train_info/time_within_train_step": 27.970431327819824, "step": 839}
{"train_info/time_between_train_steps": 0.0052623748779296875, "step": 839}
{"info/global_step": 840, "train_info/time_within_train_step": 27.866634845733643, "step": 840}
{"train_info/time_between_train_steps": 0.005210161209106445, "step": 840}
{"info/global_step": 841, "train_info/time_within_train_step": 27.931886672973633, "step": 841}
{"train_info/time_between_train_steps": 0.0054209232330322266, "step": 841}
{"info/global_step": 842, "train_info/time_within_train_step": 27.808806657791138, "step": 842}
{"train_info/time_between_train_steps": 0.0052678585052490234, "step": 842}
{"info/global_step": 843, "train_info/time_within_train_step": 27.967466592788696, "step": 843}
{"train_info/time_between_train_steps": 0.00536036491394043, "step": 843}
{"info/global_step": 844, "train_info/time_within_train_step": 27.802881240844727, "step": 844}
{"train_info/time_between_train_steps": 0.005560159683227539, "step": 844}
{"info/global_step": 845, "train_info/time_within_train_step": 27.825573921203613, "step": 845}
{"train_info/time_between_train_steps": 0.005094289779663086, "step": 845}
{"info/global_step": 846, "train_info/time_within_train_step": 27.74584436416626, "step": 846}
{"train_info/time_between_train_steps": 0.008097410202026367, "step": 846}
{"info/global_step": 847, "train_info/time_within_train_step": 27.726070880889893, "step": 847}
{"train_info/time_between_train_steps": 0.004908561706542969, "step": 847}
{"info/global_step": 848, "train_info/time_within_train_step": 27.740153789520264, "step": 848}
{"train_info/time_between_train_steps": 0.005003213882446289, "step": 848}
{"info/global_step": 849, "train_info/time_within_train_step": 27.716015577316284, "step": 849}
{"train_info/time_between_train_steps": 0.00500178337097168, "step": 849}
{"info/global_step": 850, "train_info/time_within_train_step": 27.71400499343872, "step": 850}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733716649, "_runtime": 29538}, "step": 850}
{"logs": {"train/loss": 3.7265, "train/learning_rate": 0.00019444444444444443, "train/epoch": 31.01, "_timestamp": 1733716649, "_runtime": 29538}, "step": 850}
{"train_info/time_between_train_steps": 0.006962299346923828, "step": 850}
{"info/global_step": 851, "train_info/time_within_train_step": 27.711469411849976, "step": 851}
{"train_info/time_between_train_steps": 0.0051691532135009766, "step": 851}
{"info/global_step": 852, "train_info/time_within_train_step": 27.719529390335083, "step": 852}
{"train_info/time_between_train_steps": 0.0051839351654052734, "step": 852}
{"info/global_step": 853, "train_info/time_within_train_step": 27.947423219680786, "step": 853}
{"train_info/time_between_train_steps": 0.014630556106567383, "step": 853}
{"info/global_step": 854, "train_info/time_within_train_step": 27.734187602996826, "step": 854}
{"train_info/time_between_train_steps": 0.00517725944519043, "step": 854}
{"info/global_step": 855, "train_info/time_within_train_step": 27.70017910003662, "step": 855}
{"train_info/time_between_train_steps": 0.005007266998291016, "step": 855}
{"info/global_step": 856, "train_info/time_within_train_step": 27.834468603134155, "step": 856}
{"train_info/time_between_train_steps": 0.005035400390625, "step": 856}
{"info/global_step": 857, "train_info/time_within_train_step": 27.71995759010315, "step": 857}
{"train_info/time_between_train_steps": 0.005072593688964844, "step": 857}
{"info/global_step": 858, "train_info/time_within_train_step": 27.744977951049805, "step": 858}
{"train_info/time_between_train_steps": 0.0052034854888916016, "step": 858}
{"info/global_step": 859, "train_info/time_within_train_step": 27.714545965194702, "step": 859}
{"train_info/time_between_train_steps": 0.0051784515380859375, "step": 859}
{"info/global_step": 860, "train_info/time_within_train_step": 27.72805690765381, "step": 860}
{"train_info/time_between_train_steps": 0.009775400161743164, "step": 860}
{"info/global_step": 861, "train_info/time_within_train_step": 27.7793071269989, "step": 861}
{"train_info/time_between_train_steps": 0.0053827762603759766, "step": 861}
{"info/global_step": 862, "train_info/time_within_train_step": 27.71979522705078, "step": 862}
{"train_info/time_between_train_steps": 0.010245561599731445, "step": 862}
{"info/global_step": 863, "train_info/time_within_train_step": 27.831526279449463, "step": 863}
{"train_info/time_between_train_steps": 0.01037287712097168, "step": 863}
{"info/global_step": 864, "train_info/time_within_train_step": 28.151416778564453, "step": 864}
{"train_info/time_between_train_steps": 0.005588054656982422, "step": 864}
{"train_info/time_between_train_steps": 20.64278244972229, "step": 864}
{"info/global_step": 865, "train_info/time_within_train_step": 27.73288917541504, "step": 865}
{"train_info/time_between_train_steps": 0.010633707046508789, "step": 865}
{"info/global_step": 866, "train_info/time_within_train_step": 27.924200296401978, "step": 866}
{"train_info/time_between_train_steps": 0.006567478179931641, "step": 866}
{"info/global_step": 867, "train_info/time_within_train_step": 27.924057245254517, "step": 867}
{"train_info/time_between_train_steps": 0.005634307861328125, "step": 867}
{"info/global_step": 868, "train_info/time_within_train_step": 28.04706621170044, "step": 868}
{"train_info/time_between_train_steps": 0.005365610122680664, "step": 868}
{"info/global_step": 869, "train_info/time_within_train_step": 27.73886013031006, "step": 869}
{"train_info/time_between_train_steps": 0.006140708923339844, "step": 869}
{"info/global_step": 870, "train_info/time_within_train_step": 28.03182315826416, "step": 870}
{"train_info/time_between_train_steps": 0.005602836608886719, "step": 870}
{"info/global_step": 871, "train_info/time_within_train_step": 27.860767602920532, "step": 871}
{"train_info/time_between_train_steps": 0.005512237548828125, "step": 871}
{"info/global_step": 872, "train_info/time_within_train_step": 27.8009352684021, "step": 872}
{"train_info/time_between_train_steps": 0.0052220821380615234, "step": 872}
{"info/global_step": 873, "train_info/time_within_train_step": 27.731201171875, "step": 873}
{"train_info/time_between_train_steps": 0.005197286605834961, "step": 873}
{"info/global_step": 874, "train_info/time_within_train_step": 27.766886472702026, "step": 874}
{"train_info/time_between_train_steps": 0.005062103271484375, "step": 874}
{"info/global_step": 875, "train_info/time_within_train_step": 27.711591243743896, "step": 875}
{"train_info/time_between_train_steps": 0.005216836929321289, "step": 875}
{"info/global_step": 876, "train_info/time_within_train_step": 27.72003173828125, "step": 876}
{"train_info/time_between_train_steps": 0.004950523376464844, "step": 876}
{"info/global_step": 877, "train_info/time_within_train_step": 27.767447233200073, "step": 877}
{"train_info/time_between_train_steps": 0.005196094512939453, "step": 877}
{"info/global_step": 878, "train_info/time_within_train_step": 27.701395988464355, "step": 878}
{"train_info/time_between_train_steps": 0.005035400390625, "step": 878}
{"info/global_step": 879, "train_info/time_within_train_step": 27.72297430038452, "step": 879}
{"train_info/time_between_train_steps": 0.005120754241943359, "step": 879}
{"info/global_step": 880, "train_info/time_within_train_step": 27.71203875541687, "step": 880}
{"train_info/time_between_train_steps": 0.005125761032104492, "step": 880}
{"info/global_step": 881, "train_info/time_within_train_step": 27.71765446662903, "step": 881}
{"train_info/time_between_train_steps": 0.004941225051879883, "step": 881}
{"info/global_step": 882, "train_info/time_within_train_step": 27.70330548286438, "step": 882}
{"train_info/time_between_train_steps": 0.0051727294921875, "step": 882}
{"info/global_step": 883, "train_info/time_within_train_step": 27.710264444351196, "step": 883}
{"train_info/time_between_train_steps": 0.0051114559173583984, "step": 883}
{"info/global_step": 884, "train_info/time_within_train_step": 27.742812395095825, "step": 884}
{"train_info/time_between_train_steps": 0.0049779415130615234, "step": 884}
{"info/global_step": 885, "train_info/time_within_train_step": 27.712215662002563, "step": 885}
{"train_info/time_between_train_steps": 0.014586448669433594, "step": 885}
{"info/global_step": 886, "train_info/time_within_train_step": 27.721153497695923, "step": 886}
{"train_info/time_between_train_steps": 0.005057573318481445, "step": 886}
{"info/global_step": 887, "train_info/time_within_train_step": 27.821155309677124, "step": 887}
{"train_info/time_between_train_steps": 0.005003452301025391, "step": 887}
{"info/global_step": 888, "train_info/time_within_train_step": 27.70161533355713, "step": 888}
{"train_info/time_between_train_steps": 0.005099296569824219, "step": 888}
{"info/global_step": 889, "train_info/time_within_train_step": 27.703938961029053, "step": 889}
{"train_info/time_between_train_steps": 0.0049440860748291016, "step": 889}
{"info/global_step": 890, "train_info/time_within_train_step": 27.750370502471924, "step": 890}
{"train_info/time_between_train_steps": 0.0055844783782958984, "step": 890}
{"info/global_step": 891, "train_info/time_within_train_step": 27.7386953830719, "step": 891}
{"train_info/time_between_train_steps": 0.0075762271881103516, "step": 891}
{"train_info/time_between_train_steps": 20.40406584739685, "step": 891}
{"info/global_step": 892, "train_info/time_within_train_step": 27.75487518310547, "step": 892}
{"train_info/time_between_train_steps": 0.005663394927978516, "step": 892}
{"info/global_step": 893, "train_info/time_within_train_step": 28.34470295906067, "step": 893}
{"train_info/time_between_train_steps": 0.004979610443115234, "step": 893}
{"info/global_step": 894, "train_info/time_within_train_step": 27.722283840179443, "step": 894}
{"train_info/time_between_train_steps": 0.0054779052734375, "step": 894}
{"info/global_step": 895, "train_info/time_within_train_step": 27.874066829681396, "step": 895}
{"train_info/time_between_train_steps": 0.010184288024902344, "step": 895}
{"info/global_step": 896, "train_info/time_within_train_step": 27.75307607650757, "step": 896}
{"train_info/time_between_train_steps": 0.0053904056549072266, "step": 896}
{"info/global_step": 897, "train_info/time_within_train_step": 27.868252992630005, "step": 897}
{"train_info/time_between_train_steps": 0.005307435989379883, "step": 897}
{"info/global_step": 898, "train_info/time_within_train_step": 27.73880887031555, "step": 898}
{"train_info/time_between_train_steps": 0.0052928924560546875, "step": 898}
{"info/global_step": 899, "train_info/time_within_train_step": 27.7532377243042, "step": 899}
{"train_info/time_between_train_steps": 0.0051381587982177734, "step": 899}
{"info/global_step": 900, "train_info/time_within_train_step": 27.710609197616577, "step": 900}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733718080, "_runtime": 30969}, "step": 900}
{"logs": {"train/loss": 3.6637, "train/learning_rate": 0.00016666666666666666, "train/epoch": 33.01, "_timestamp": 1733718080, "_runtime": 30969}, "step": 900}
{"train_info/time_between_train_steps": 2.2302613258361816, "step": 900}
{"info/global_step": 901, "train_info/time_within_train_step": 27.717439889907837, "step": 901}
{"train_info/time_between_train_steps": 0.004999876022338867, "step": 901}
{"info/global_step": 902, "train_info/time_within_train_step": 27.86817955970764, "step": 902}
{"train_info/time_between_train_steps": 0.005144357681274414, "step": 902}
{"info/global_step": 903, "train_info/time_within_train_step": 27.903985261917114, "step": 903}
{"train_info/time_between_train_steps": 0.005113840103149414, "step": 903}
{"info/global_step": 904, "train_info/time_within_train_step": 27.74162483215332, "step": 904}
{"train_info/time_between_train_steps": 0.009600639343261719, "step": 904}
{"info/global_step": 905, "train_info/time_within_train_step": 27.721954345703125, "step": 905}
{"train_info/time_between_train_steps": 0.005068063735961914, "step": 905}
{"info/global_step": 906, "train_info/time_within_train_step": 27.73103904724121, "step": 906}
{"train_info/time_between_train_steps": 0.004923582077026367, "step": 906}
{"info/global_step": 907, "train_info/time_within_train_step": 27.71013569831848, "step": 907}
{"train_info/time_between_train_steps": 0.005023002624511719, "step": 907}
{"info/global_step": 908, "train_info/time_within_train_step": 27.69783115386963, "step": 908}
{"train_info/time_between_train_steps": 0.005005836486816406, "step": 908}
{"info/global_step": 909, "train_info/time_within_train_step": 27.736561059951782, "step": 909}
{"train_info/time_between_train_steps": 0.004915714263916016, "step": 909}
{"info/global_step": 910, "train_info/time_within_train_step": 27.71394157409668, "step": 910}
{"train_info/time_between_train_steps": 0.005121707916259766, "step": 910}
{"info/global_step": 911, "train_info/time_within_train_step": 27.75740957260132, "step": 911}
{"train_info/time_between_train_steps": 0.005249977111816406, "step": 911}
{"info/global_step": 912, "train_info/time_within_train_step": 27.795924186706543, "step": 912}
{"train_info/time_between_train_steps": 0.005151987075805664, "step": 912}
{"info/global_step": 913, "train_info/time_within_train_step": 27.73706579208374, "step": 913}
{"train_info/time_between_train_steps": 0.0051500797271728516, "step": 913}
{"info/global_step": 914, "train_info/time_within_train_step": 27.726046562194824, "step": 914}
{"train_info/time_between_train_steps": 0.0050623416900634766, "step": 914}
{"info/global_step": 915, "train_info/time_within_train_step": 27.789567708969116, "step": 915}
{"train_info/time_between_train_steps": 0.009974241256713867, "step": 915}
{"info/global_step": 916, "train_info/time_within_train_step": 27.7273108959198, "step": 916}
{"train_info/time_between_train_steps": 0.005219936370849609, "step": 916}
{"info/global_step": 917, "train_info/time_within_train_step": 27.888763189315796, "step": 917}
{"train_info/time_between_train_steps": 0.005603313446044922, "step": 917}
{"info/global_step": 918, "train_info/time_within_train_step": 27.879773139953613, "step": 918}
{"train_info/time_between_train_steps": 0.005483865737915039, "step": 918}
{"train_info/time_between_train_steps": 20.402026653289795, "step": 918}
{"info/global_step": 919, "train_info/time_within_train_step": 27.766384601593018, "step": 919}
{"train_info/time_between_train_steps": 0.004924774169921875, "step": 919}
{"info/global_step": 920, "train_info/time_within_train_step": 27.907426834106445, "step": 920}
{"train_info/time_between_train_steps": 0.005356311798095703, "step": 920}
{"info/global_step": 921, "train_info/time_within_train_step": 27.792561054229736, "step": 921}
{"train_info/time_between_train_steps": 0.005573272705078125, "step": 921}
{"info/global_step": 922, "train_info/time_within_train_step": 27.89029049873352, "step": 922}
{"train_info/time_between_train_steps": 0.005259990692138672, "step": 922}
{"info/global_step": 923, "train_info/time_within_train_step": 27.8155415058136, "step": 923}
{"train_info/time_between_train_steps": 0.005248308181762695, "step": 923}
{"info/global_step": 924, "train_info/time_within_train_step": 27.891696214675903, "step": 924}
{"train_info/time_between_train_steps": 0.010205268859863281, "step": 924}
{"info/global_step": 925, "train_info/time_within_train_step": 27.75565266609192, "step": 925}
{"train_info/time_between_train_steps": 0.005608558654785156, "step": 925}
{"info/global_step": 926, "train_info/time_within_train_step": 27.82451868057251, "step": 926}
{"train_info/time_between_train_steps": 0.005382061004638672, "step": 926}
{"info/global_step": 927, "train_info/time_within_train_step": 27.773369789123535, "step": 927}
{"train_info/time_between_train_steps": 0.005212306976318359, "step": 927}
{"info/global_step": 928, "train_info/time_within_train_step": 27.718685388565063, "step": 928}
{"train_info/time_between_train_steps": 0.004923105239868164, "step": 928}
{"info/global_step": 929, "train_info/time_within_train_step": 27.766822576522827, "step": 929}
{"train_info/time_between_train_steps": 0.005538225173950195, "step": 929}
{"info/global_step": 930, "train_info/time_within_train_step": 27.751800060272217, "step": 930}
{"train_info/time_between_train_steps": 0.005089998245239258, "step": 930}
{"info/global_step": 931, "train_info/time_within_train_step": 27.74960207939148, "step": 931}
{"train_info/time_between_train_steps": 0.010140657424926758, "step": 931}
{"info/global_step": 932, "train_info/time_within_train_step": 27.94522261619568, "step": 932}
{"train_info/time_between_train_steps": 0.009829044342041016, "step": 932}
{"info/global_step": 933, "train_info/time_within_train_step": 27.908477067947388, "step": 933}
{"train_info/time_between_train_steps": 0.009999752044677734, "step": 933}
{"info/global_step": 934, "train_info/time_within_train_step": 27.78176522254944, "step": 934}
{"train_info/time_between_train_steps": 0.005120515823364258, "step": 934}
{"info/global_step": 935, "train_info/time_within_train_step": 27.739867210388184, "step": 935}
{"train_info/time_between_train_steps": 0.005221843719482422, "step": 935}
{"info/global_step": 936, "train_info/time_within_train_step": 27.734850883483887, "step": 936}
{"train_info/time_between_train_steps": 0.00497889518737793, "step": 936}
{"info/global_step": 937, "train_info/time_within_train_step": 27.72270131111145, "step": 937}
{"train_info/time_between_train_steps": 0.005103349685668945, "step": 937}
{"info/global_step": 938, "train_info/time_within_train_step": 27.73833465576172, "step": 938}
{"train_info/time_between_train_steps": 0.0050771236419677734, "step": 938}
{"info/global_step": 939, "train_info/time_within_train_step": 27.75187635421753, "step": 939}
{"train_info/time_between_train_steps": 0.0052411556243896484, "step": 939}
{"info/global_step": 940, "train_info/time_within_train_step": 27.739800214767456, "step": 940}
{"train_info/time_between_train_steps": 0.005091428756713867, "step": 940}
{"info/global_step": 941, "train_info/time_within_train_step": 27.760770559310913, "step": 941}
{"train_info/time_between_train_steps": 0.005076408386230469, "step": 941}
{"info/global_step": 942, "train_info/time_within_train_step": 27.76490569114685, "step": 942}
{"train_info/time_between_train_steps": 0.005514383316040039, "step": 942}
{"info/global_step": 943, "train_info/time_within_train_step": 27.7442147731781, "step": 943}
{"train_info/time_between_train_steps": 0.005320310592651367, "step": 943}
{"info/global_step": 944, "train_info/time_within_train_step": 27.740784883499146, "step": 944}
{"train_info/time_between_train_steps": 0.005728006362915039, "step": 944}
{"info/global_step": 945, "train_info/time_within_train_step": 27.778006076812744, "step": 945}
{"train_info/time_between_train_steps": 0.0054759979248046875, "step": 945}
{"train_info/time_between_train_steps": 20.552776098251343, "step": 945}
{"info/global_step": 946, "train_info/time_within_train_step": 27.732436180114746, "step": 946}
{"train_info/time_between_train_steps": 0.004860877990722656, "step": 946}
{"info/global_step": 947, "train_info/time_within_train_step": 27.93380880355835, "step": 947}
{"train_info/time_between_train_steps": 0.005039691925048828, "step": 947}
{"info/global_step": 948, "train_info/time_within_train_step": 27.72029733657837, "step": 948}
{"train_info/time_between_train_steps": 0.0051844120025634766, "step": 948}
{"info/global_step": 949, "train_info/time_within_train_step": 27.84953808784485, "step": 949}
{"train_info/time_between_train_steps": 0.005157470703125, "step": 949}
{"info/global_step": 950, "train_info/time_within_train_step": 27.769633531570435, "step": 950}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733719512, "_runtime": 32401}, "step": 950}
{"logs": {"train/loss": 3.6063, "train/learning_rate": 0.0001388888888888889, "train/epoch": 35.0, "_timestamp": 1733719512, "_runtime": 32401}, "step": 950}
{"train_info/time_between_train_steps": 0.006909847259521484, "step": 950}
{"info/global_step": 951, "train_info/time_within_train_step": 27.82872176170349, "step": 951}
{"train_info/time_between_train_steps": 0.010039567947387695, "step": 951}
{"info/global_step": 952, "train_info/time_within_train_step": 27.744431972503662, "step": 952}
{"train_info/time_between_train_steps": 0.005321502685546875, "step": 952}
{"info/global_step": 953, "train_info/time_within_train_step": 27.780563831329346, "step": 953}
{"train_info/time_between_train_steps": 0.005228519439697266, "step": 953}
{"info/global_step": 954, "train_info/time_within_train_step": 27.75871181488037, "step": 954}
{"train_info/time_between_train_steps": 0.00491786003112793, "step": 954}
{"info/global_step": 955, "train_info/time_within_train_step": 27.816804885864258, "step": 955}
{"train_info/time_between_train_steps": 0.005047321319580078, "step": 955}
{"info/global_step": 956, "train_info/time_within_train_step": 27.71284008026123, "step": 956}
{"train_info/time_between_train_steps": 0.01001119613647461, "step": 956}
{"info/global_step": 957, "train_info/time_within_train_step": 27.714195489883423, "step": 957}
{"train_info/time_between_train_steps": 0.005078554153442383, "step": 957}
{"info/global_step": 958, "train_info/time_within_train_step": 27.705259084701538, "step": 958}
{"train_info/time_between_train_steps": 0.009818077087402344, "step": 958}
{"info/global_step": 959, "train_info/time_within_train_step": 27.72949981689453, "step": 959}
{"train_info/time_between_train_steps": 0.009908437728881836, "step": 959}
{"info/global_step": 960, "train_info/time_within_train_step": 27.74699878692627, "step": 960}
{"train_info/time_between_train_steps": 0.00510096549987793, "step": 960}
{"info/global_step": 961, "train_info/time_within_train_step": 27.730856895446777, "step": 961}
{"train_info/time_between_train_steps": 0.005176067352294922, "step": 961}
{"info/global_step": 962, "train_info/time_within_train_step": 27.716304540634155, "step": 962}
{"train_info/time_between_train_steps": 0.005219697952270508, "step": 962}
{"info/global_step": 963, "train_info/time_within_train_step": 27.825742959976196, "step": 963}
{"train_info/time_between_train_steps": 0.004893064498901367, "step": 963}
{"info/global_step": 964, "train_info/time_within_train_step": 27.70690608024597, "step": 964}
{"train_info/time_between_train_steps": 0.004981517791748047, "step": 964}
{"info/global_step": 965, "train_info/time_within_train_step": 27.711451768875122, "step": 965}
{"train_info/time_between_train_steps": 0.005075693130493164, "step": 965}
{"info/global_step": 966, "train_info/time_within_train_step": 27.714987754821777, "step": 966}
{"train_info/time_between_train_steps": 0.0050542354583740234, "step": 966}
{"info/global_step": 967, "train_info/time_within_train_step": 27.729580879211426, "step": 967}
{"train_info/time_between_train_steps": 0.005266427993774414, "step": 967}
{"info/global_step": 968, "train_info/time_within_train_step": 27.73889970779419, "step": 968}
{"train_info/time_between_train_steps": 0.00516510009765625, "step": 968}
{"info/global_step": 969, "train_info/time_within_train_step": 27.758843660354614, "step": 969}
{"train_info/time_between_train_steps": 0.005438804626464844, "step": 969}
{"info/global_step": 970, "train_info/time_within_train_step": 27.76294708251953, "step": 970}
{"train_info/time_between_train_steps": 0.005095720291137695, "step": 970}
{"info/global_step": 971, "train_info/time_within_train_step": 27.73504090309143, "step": 971}
{"train_info/time_between_train_steps": 0.005642414093017578, "step": 971}
{"info/global_step": 972, "train_info/time_within_train_step": 27.74698567390442, "step": 972}
{"train_info/time_between_train_steps": 0.006754398345947266, "step": 972}
{"train_info/time_between_train_steps": 20.673145055770874, "step": 972}
{"info/global_step": 973, "train_info/time_within_train_step": 27.78062081336975, "step": 973}
{"train_info/time_between_train_steps": 0.005954742431640625, "step": 973}
{"info/global_step": 974, "train_info/time_within_train_step": 27.906920671463013, "step": 974}
{"train_info/time_between_train_steps": 0.0054738521575927734, "step": 974}
{"info/global_step": 975, "train_info/time_within_train_step": 27.726618766784668, "step": 975}
{"train_info/time_between_train_steps": 0.005158662796020508, "step": 975}
{"info/global_step": 976, "train_info/time_within_train_step": 27.915189266204834, "step": 976}
{"train_info/time_between_train_steps": 0.005345344543457031, "step": 976}
{"info/global_step": 977, "train_info/time_within_train_step": 27.772154569625854, "step": 977}
{"train_info/time_between_train_steps": 0.010063648223876953, "step": 977}
{"info/global_step": 978, "train_info/time_within_train_step": 27.9952175617218, "step": 978}
{"train_info/time_between_train_steps": 0.005265474319458008, "step": 978}
{"info/global_step": 979, "train_info/time_within_train_step": 27.768432140350342, "step": 979}
{"train_info/time_between_train_steps": 0.005507230758666992, "step": 979}
{"info/global_step": 980, "train_info/time_within_train_step": 27.808415174484253, "step": 980}
{"train_info/time_between_train_steps": 0.0052220821380615234, "step": 980}
{"info/global_step": 981, "train_info/time_within_train_step": 27.75856041908264, "step": 981}
{"train_info/time_between_train_steps": 0.009850740432739258, "step": 981}
{"info/global_step": 982, "train_info/time_within_train_step": 27.713550806045532, "step": 982}
{"train_info/time_between_train_steps": 0.0049343109130859375, "step": 982}
{"info/global_step": 983, "train_info/time_within_train_step": 27.72117519378662, "step": 983}
{"train_info/time_between_train_steps": 0.009969472885131836, "step": 983}
{"info/global_step": 984, "train_info/time_within_train_step": 27.70388698577881, "step": 984}
{"train_info/time_between_train_steps": 0.0049245357513427734, "step": 984}
{"info/global_step": 985, "train_info/time_within_train_step": 27.739664316177368, "step": 985}
{"train_info/time_between_train_steps": 0.009700298309326172, "step": 985}
{"info/global_step": 986, "train_info/time_within_train_step": 27.711057662963867, "step": 986}
{"train_info/time_between_train_steps": 0.0049877166748046875, "step": 986}
{"info/global_step": 987, "train_info/time_within_train_step": 27.719268083572388, "step": 987}
{"train_info/time_between_train_steps": 0.0050389766693115234, "step": 987}
{"info/global_step": 988, "train_info/time_within_train_step": 27.78330969810486, "step": 988}
{"train_info/time_between_train_steps": 0.005132436752319336, "step": 988}
{"info/global_step": 989, "train_info/time_within_train_step": 27.797218561172485, "step": 989}
{"train_info/time_between_train_steps": 0.005122661590576172, "step": 989}
{"info/global_step": 990, "train_info/time_within_train_step": 27.771557807922363, "step": 990}
{"train_info/time_between_train_steps": 0.013197660446166992, "step": 990}
{"info/global_step": 991, "train_info/time_within_train_step": 27.744916915893555, "step": 991}
{"train_info/time_between_train_steps": 0.014278650283813477, "step": 991}
{"info/global_step": 992, "train_info/time_within_train_step": 27.978660583496094, "step": 992}
{"train_info/time_between_train_steps": 0.012099981307983398, "step": 992}
{"info/global_step": 993, "train_info/time_within_train_step": 27.731463193893433, "step": 993}
{"train_info/time_between_train_steps": 0.004978179931640625, "step": 993}
{"info/global_step": 994, "train_info/time_within_train_step": 27.83297348022461, "step": 994}
{"train_info/time_between_train_steps": 0.005085468292236328, "step": 994}
{"info/global_step": 995, "train_info/time_within_train_step": 27.71954345703125, "step": 995}
{"train_info/time_between_train_steps": 0.005003690719604492, "step": 995}
{"info/global_step": 996, "train_info/time_within_train_step": 27.767013549804688, "step": 996}
{"train_info/time_between_train_steps": 0.005197048187255859, "step": 996}
{"info/global_step": 997, "train_info/time_within_train_step": 27.77447819709778, "step": 997}
{"train_info/time_between_train_steps": 0.005070924758911133, "step": 997}
{"info/global_step": 998, "train_info/time_within_train_step": 27.74242067337036, "step": 998}
{"train_info/time_between_train_steps": 0.005674600601196289, "step": 998}
{"info/global_step": 999, "train_info/time_within_train_step": 27.747557401657104, "step": 999}
{"train_info/time_between_train_steps": 0.01027226448059082, "step": 999}
{"train_info/time_between_train_steps": 20.422119140625, "step": 999}
{"info/global_step": 1000, "train_info/time_within_train_step": 27.749995708465576, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1733720942, "_runtime": 33831}, "step": 1000}
{"logs": {"train/loss": 3.5555, "train/learning_rate": 0.00011111111111111109, "train/epoch": 37.0, "_timestamp": 1733720942, "_runtime": 33831}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733720944, "_runtime": 33833}, "step": 1000}
{"logs": {"eval/loss": 4.463772773742676, "eval/runtime": 1.9775, "eval/samples_per_second": 50.57, "eval/steps_per_second": 3.54, "train/epoch": 37.0, "_timestamp": 1733720944, "_runtime": 33833}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733720944, "_runtime": 33833}, "step": 1000}
{"logs": {"eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_loss": 4.463772773742676, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_ppl": 86.81442319841803, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_runtime": 1.9775, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_samples_per_second": 50.57, "train/epoch": 37.0, "_timestamp": 1733720944, "_runtime": 33833}, "step": 1000}
{"train_info/time_between_train_steps": 4.17415452003479, "step": 1000}
{"info/global_step": 1001, "train_info/time_within_train_step": 27.991593837738037, "step": 1001}
{"train_info/time_between_train_steps": 0.005219459533691406, "step": 1001}
{"info/global_step": 1002, "train_info/time_within_train_step": 27.745720863342285, "step": 1002}
{"train_info/time_between_train_steps": 0.005284309387207031, "step": 1002}
{"info/global_step": 1003, "train_info/time_within_train_step": 27.927810192108154, "step": 1003}
{"train_info/time_between_train_steps": 0.00554656982421875, "step": 1003}
{"info/global_step": 1004, "train_info/time_within_train_step": 27.749001026153564, "step": 1004}
{"train_info/time_between_train_steps": 0.005475044250488281, "step": 1004}
{"info/global_step": 1005, "train_info/time_within_train_step": 27.954286098480225, "step": 1005}
{"train_info/time_between_train_steps": 0.005254983901977539, "step": 1005}
{"info/global_step": 1006, "train_info/time_within_train_step": 27.77864694595337, "step": 1006}
{"train_info/time_between_train_steps": 0.009961843490600586, "step": 1006}
{"info/global_step": 1007, "train_info/time_within_train_step": 27.815456867218018, "step": 1007}
{"train_info/time_between_train_steps": 0.005338907241821289, "step": 1007}
{"info/global_step": 1008, "train_info/time_within_train_step": 27.7758572101593, "step": 1008}
{"train_info/time_between_train_steps": 0.005122184753417969, "step": 1008}
{"info/global_step": 1009, "train_info/time_within_train_step": 27.84366011619568, "step": 1009}
{"train_info/time_between_train_steps": 0.005027055740356445, "step": 1009}
{"info/global_step": 1010, "train_info/time_within_train_step": 27.721818447113037, "step": 1010}
{"train_info/time_between_train_steps": 0.005094289779663086, "step": 1010}
{"info/global_step": 1011, "train_info/time_within_train_step": 27.73899269104004, "step": 1011}
{"train_info/time_between_train_steps": 0.0049626827239990234, "step": 1011}
{"info/global_step": 1012, "train_info/time_within_train_step": 27.77725839614868, "step": 1012}
{"train_info/time_between_train_steps": 0.0051229000091552734, "step": 1012}
{"info/global_step": 1013, "train_info/time_within_train_step": 27.732489585876465, "step": 1013}
{"train_info/time_between_train_steps": 0.005312919616699219, "step": 1013}
{"info/global_step": 1014, "train_info/time_within_train_step": 27.72848105430603, "step": 1014}
{"train_info/time_between_train_steps": 0.005142688751220703, "step": 1014}
{"info/global_step": 1015, "train_info/time_within_train_step": 27.72519850730896, "step": 1015}
{"train_info/time_between_train_steps": 0.005167484283447266, "step": 1015}
{"info/global_step": 1016, "train_info/time_within_train_step": 27.76703429222107, "step": 1016}
{"train_info/time_between_train_steps": 0.00882863998413086, "step": 1016}
{"info/global_step": 1017, "train_info/time_within_train_step": 27.802080392837524, "step": 1017}
{"train_info/time_between_train_steps": 0.004950761795043945, "step": 1017}
{"info/global_step": 1018, "train_info/time_within_train_step": 27.8357150554657, "step": 1018}
{"train_info/time_between_train_steps": 0.012461423873901367, "step": 1018}
{"info/global_step": 1019, "train_info/time_within_train_step": 27.7370548248291, "step": 1019}
{"train_info/time_between_train_steps": 0.005002498626708984, "step": 1019}
{"info/global_step": 1020, "train_info/time_within_train_step": 27.729429244995117, "step": 1020}
{"train_info/time_between_train_steps": 0.0049936771392822266, "step": 1020}
{"info/global_step": 1021, "train_info/time_within_train_step": 27.741766214370728, "step": 1021}
{"train_info/time_between_train_steps": 0.004937171936035156, "step": 1021}
{"info/global_step": 1022, "train_info/time_within_train_step": 27.777987241744995, "step": 1022}
{"train_info/time_between_train_steps": 0.005203723907470703, "step": 1022}
{"info/global_step": 1023, "train_info/time_within_train_step": 27.738245248794556, "step": 1023}
{"train_info/time_between_train_steps": 0.005335092544555664, "step": 1023}
{"info/global_step": 1024, "train_info/time_within_train_step": 27.864444255828857, "step": 1024}
{"train_info/time_between_train_steps": 0.005197286605834961, "step": 1024}
{"info/global_step": 1025, "train_info/time_within_train_step": 27.775732278823853, "step": 1025}
{"train_info/time_between_train_steps": 0.005827426910400391, "step": 1025}
{"info/global_step": 1026, "train_info/time_within_train_step": 27.992831707000732, "step": 1026}
{"train_info/time_between_train_steps": 0.005486011505126953, "step": 1026}
{"train_info/time_between_train_steps": 20.711559534072876, "step": 1026}
{"info/global_step": 1027, "train_info/time_within_train_step": 27.731252670288086, "step": 1027}
{"train_info/time_between_train_steps": 0.004859447479248047, "step": 1027}
{"info/global_step": 1028, "train_info/time_within_train_step": 27.931817531585693, "step": 1028}
{"train_info/time_between_train_steps": 0.0051386356353759766, "step": 1028}
{"info/global_step": 1029, "train_info/time_within_train_step": 27.786075592041016, "step": 1029}
{"train_info/time_between_train_steps": 0.005092144012451172, "step": 1029}
{"info/global_step": 1030, "train_info/time_within_train_step": 27.956151723861694, "step": 1030}
{"train_info/time_between_train_steps": 0.0050811767578125, "step": 1030}
{"info/global_step": 1031, "train_info/time_within_train_step": 27.739866971969604, "step": 1031}
{"train_info/time_between_train_steps": 0.005114078521728516, "step": 1031}
{"info/global_step": 1032, "train_info/time_within_train_step": 27.956751346588135, "step": 1032}
{"train_info/time_between_train_steps": 0.010126829147338867, "step": 1032}
{"info/global_step": 1033, "train_info/time_within_train_step": 27.751357316970825, "step": 1033}
{"train_info/time_between_train_steps": 0.005181550979614258, "step": 1033}
{"info/global_step": 1034, "train_info/time_within_train_step": 27.77585768699646, "step": 1034}
{"train_info/time_between_train_steps": 0.0050716400146484375, "step": 1034}
{"info/global_step": 1035, "train_info/time_within_train_step": 27.73640203475952, "step": 1035}
{"train_info/time_between_train_steps": 0.00486302375793457, "step": 1035}
{"info/global_step": 1036, "train_info/time_within_train_step": 27.821069478988647, "step": 1036}
{"train_info/time_between_train_steps": 0.004953145980834961, "step": 1036}
{"info/global_step": 1037, "train_info/time_within_train_step": 27.731759071350098, "step": 1037}
{"train_info/time_between_train_steps": 0.0050029754638671875, "step": 1037}
{"info/global_step": 1038, "train_info/time_within_train_step": 27.771746158599854, "step": 1038}
{"train_info/time_between_train_steps": 0.0049724578857421875, "step": 1038}
{"info/global_step": 1039, "train_info/time_within_train_step": 27.798981189727783, "step": 1039}
{"train_info/time_between_train_steps": 0.0049474239349365234, "step": 1039}
{"info/global_step": 1040, "train_info/time_within_train_step": 27.714587688446045, "step": 1040}
{"train_info/time_between_train_steps": 0.004990339279174805, "step": 1040}
{"info/global_step": 1041, "train_info/time_within_train_step": 27.732833862304688, "step": 1041}
{"train_info/time_between_train_steps": 0.0051991939544677734, "step": 1041}
{"info/global_step": 1042, "train_info/time_within_train_step": 27.775938272476196, "step": 1042}
{"train_info/time_between_train_steps": 0.005074739456176758, "step": 1042}
{"info/global_step": 1043, "train_info/time_within_train_step": 27.997113466262817, "step": 1043}
{"train_info/time_between_train_steps": 0.009951591491699219, "step": 1043}
{"info/global_step": 1044, "train_info/time_within_train_step": 27.7270724773407, "step": 1044}
{"train_info/time_between_train_steps": 0.014493227005004883, "step": 1044}
{"info/global_step": 1045, "train_info/time_within_train_step": 27.881389617919922, "step": 1045}
{"train_info/time_between_train_steps": 0.005152702331542969, "step": 1045}
{"info/global_step": 1046, "train_info/time_within_train_step": 27.72917652130127, "step": 1046}
{"train_info/time_between_train_steps": 0.004954338073730469, "step": 1046}
{"info/global_step": 1047, "train_info/time_within_train_step": 27.721304655075073, "step": 1047}
{"train_info/time_between_train_steps": 0.009722709655761719, "step": 1047}
{"info/global_step": 1048, "train_info/time_within_train_step": 27.737181901931763, "step": 1048}
{"train_info/time_between_train_steps": 0.005473613739013672, "step": 1048}
{"info/global_step": 1049, "train_info/time_within_train_step": 27.772560834884644, "step": 1049}
{"train_info/time_between_train_steps": 0.004973411560058594, "step": 1049}
{"info/global_step": 1050, "train_info/time_within_train_step": 27.752525091171265, "step": 1050}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733722357, "_runtime": 35246}, "step": 1050}
{"logs": {"train/loss": 3.4698, "train/learning_rate": 8.333333333333333e-05, "train/epoch": 38.02, "_timestamp": 1733722357, "_runtime": 35246}, "step": 1050}
{"train_info/time_between_train_steps": 0.012894153594970703, "step": 1050}
{"info/global_step": 1051, "train_info/time_within_train_step": 27.735488653182983, "step": 1051}
{"train_info/time_between_train_steps": 0.005217313766479492, "step": 1051}
{"info/global_step": 1052, "train_info/time_within_train_step": 27.87801742553711, "step": 1052}
{"train_info/time_between_train_steps": 0.014874458312988281, "step": 1052}
{"info/global_step": 1053, "train_info/time_within_train_step": 27.770021438598633, "step": 1053}
{"train_info/time_between_train_steps": 0.010504007339477539, "step": 1053}
{"train_info/time_between_train_steps": 20.743542671203613, "step": 1053}
{"info/global_step": 1054, "train_info/time_within_train_step": 27.844751596450806, "step": 1054}
{"train_info/time_between_train_steps": 0.0055999755859375, "step": 1054}
{"info/global_step": 1055, "train_info/time_within_train_step": 28.02283501625061, "step": 1055}
{"train_info/time_between_train_steps": 0.005312204360961914, "step": 1055}
{"info/global_step": 1056, "train_info/time_within_train_step": 27.79671812057495, "step": 1056}
{"train_info/time_between_train_steps": 0.0051386356353759766, "step": 1056}
{"info/global_step": 1057, "train_info/time_within_train_step": 28.010501384735107, "step": 1057}
{"train_info/time_between_train_steps": 0.005328178405761719, "step": 1057}
{"info/global_step": 1058, "train_info/time_within_train_step": 27.73310685157776, "step": 1058}
{"train_info/time_between_train_steps": 0.0052182674407958984, "step": 1058}
{"info/global_step": 1059, "train_info/time_within_train_step": 28.060102939605713, "step": 1059}
{"train_info/time_between_train_steps": 0.005334377288818359, "step": 1059}
{"info/global_step": 1060, "train_info/time_within_train_step": 27.80209255218506, "step": 1060}
{"train_info/time_between_train_steps": 0.005445003509521484, "step": 1060}
{"info/global_step": 1061, "train_info/time_within_train_step": 27.839007139205933, "step": 1061}
{"train_info/time_between_train_steps": 0.009923934936523438, "step": 1061}
{"info/global_step": 1062, "train_info/time_within_train_step": 27.73200798034668, "step": 1062}
{"train_info/time_between_train_steps": 0.004990577697753906, "step": 1062}
{"info/global_step": 1063, "train_info/time_within_train_step": 27.734421253204346, "step": 1063}
{"train_info/time_between_train_steps": 0.004995822906494141, "step": 1063}
{"info/global_step": 1064, "train_info/time_within_train_step": 27.7232186794281, "step": 1064}
{"train_info/time_between_train_steps": 0.0049364566802978516, "step": 1064}
{"info/global_step": 1065, "train_info/time_within_train_step": 27.73325777053833, "step": 1065}
{"train_info/time_between_train_steps": 0.00504612922668457, "step": 1065}
{"info/global_step": 1066, "train_info/time_within_train_step": 27.73606562614441, "step": 1066}
{"train_info/time_between_train_steps": 0.004914760589599609, "step": 1066}
{"info/global_step": 1067, "train_info/time_within_train_step": 27.738201141357422, "step": 1067}
{"train_info/time_between_train_steps": 0.009801626205444336, "step": 1067}
{"info/global_step": 1068, "train_info/time_within_train_step": 27.86996364593506, "step": 1068}
{"train_info/time_between_train_steps": 0.008728265762329102, "step": 1068}
{"info/global_step": 1069, "train_info/time_within_train_step": 27.760778188705444, "step": 1069}
{"train_info/time_between_train_steps": 0.005825519561767578, "step": 1069}
{"info/global_step": 1070, "train_info/time_within_train_step": 27.874186754226685, "step": 1070}
{"train_info/time_between_train_steps": 0.005445241928100586, "step": 1070}
{"info/global_step": 1071, "train_info/time_within_train_step": 27.71488046646118, "step": 1071}
{"train_info/time_between_train_steps": 0.005337953567504883, "step": 1071}
{"info/global_step": 1072, "train_info/time_within_train_step": 27.72305917739868, "step": 1072}
{"train_info/time_between_train_steps": 0.005236387252807617, "step": 1072}
{"info/global_step": 1073, "train_info/time_within_train_step": 27.73171305656433, "step": 1073}
{"train_info/time_between_train_steps": 0.005153179168701172, "step": 1073}
{"info/global_step": 1074, "train_info/time_within_train_step": 27.752735137939453, "step": 1074}
{"train_info/time_between_train_steps": 0.00545811653137207, "step": 1074}
{"info/global_step": 1075, "train_info/time_within_train_step": 27.723724603652954, "step": 1075}
{"train_info/time_between_train_steps": 0.005612611770629883, "step": 1075}
{"info/global_step": 1076, "train_info/time_within_train_step": 27.72422981262207, "step": 1076}
{"train_info/time_between_train_steps": 0.005243778228759766, "step": 1076}
{"info/global_step": 1077, "train_info/time_within_train_step": 27.732285737991333, "step": 1077}
{"train_info/time_between_train_steps": 0.005746603012084961, "step": 1077}
{"info/global_step": 1078, "train_info/time_within_train_step": 27.803054809570312, "step": 1078}
{"train_info/time_between_train_steps": 0.005701303482055664, "step": 1078}
{"info/global_step": 1079, "train_info/time_within_train_step": 27.747830867767334, "step": 1079}
{"train_info/time_between_train_steps": 0.005709171295166016, "step": 1079}
{"info/global_step": 1080, "train_info/time_within_train_step": 27.77984094619751, "step": 1080}
{"train_info/time_between_train_steps": 0.006214141845703125, "step": 1080}
{"train_info/time_between_train_steps": 20.590466737747192, "step": 1080}
{"info/global_step": 1081, "train_info/time_within_train_step": 27.783493518829346, "step": 1081}
{"train_info/time_between_train_steps": 0.009607791900634766, "step": 1081}
{"info/global_step": 1082, "train_info/time_within_train_step": 27.84639549255371, "step": 1082}
{"train_info/time_between_train_steps": 0.0050029754638671875, "step": 1082}
{"info/global_step": 1083, "train_info/time_within_train_step": 27.808008670806885, "step": 1083}
{"train_info/time_between_train_steps": 0.00592494010925293, "step": 1083}
{"info/global_step": 1084, "train_info/time_within_train_step": 27.927143096923828, "step": 1084}
{"train_info/time_between_train_steps": 0.00539708137512207, "step": 1084}
{"info/global_step": 1085, "train_info/time_within_train_step": 28.02059054374695, "step": 1085}
{"train_info/time_between_train_steps": 0.005728721618652344, "step": 1085}
{"info/global_step": 1086, "train_info/time_within_train_step": 27.93469524383545, "step": 1086}
{"train_info/time_between_train_steps": 0.005421876907348633, "step": 1086}
{"info/global_step": 1087, "train_info/time_within_train_step": 28.019818544387817, "step": 1087}
{"train_info/time_between_train_steps": 0.009821176528930664, "step": 1087}
{"info/global_step": 1088, "train_info/time_within_train_step": 28.02836775779724, "step": 1088}
{"train_info/time_between_train_steps": 0.006028175354003906, "step": 1088}
{"info/global_step": 1089, "train_info/time_within_train_step": 27.736282110214233, "step": 1089}
{"train_info/time_between_train_steps": 0.00518488883972168, "step": 1089}
{"info/global_step": 1090, "train_info/time_within_train_step": 27.8039333820343, "step": 1090}
{"train_info/time_between_train_steps": 0.0054149627685546875, "step": 1090}
{"info/global_step": 1091, "train_info/time_within_train_step": 27.751394748687744, "step": 1091}
{"train_info/time_between_train_steps": 0.005066871643066406, "step": 1091}
{"info/global_step": 1092, "train_info/time_within_train_step": 27.765512704849243, "step": 1092}
{"train_info/time_between_train_steps": 0.0051975250244140625, "step": 1092}
{"info/global_step": 1093, "train_info/time_within_train_step": 27.761812448501587, "step": 1093}
{"train_info/time_between_train_steps": 0.005250215530395508, "step": 1093}
{"info/global_step": 1094, "train_info/time_within_train_step": 27.7618567943573, "step": 1094}
{"train_info/time_between_train_steps": 0.005236625671386719, "step": 1094}
{"info/global_step": 1095, "train_info/time_within_train_step": 27.78457522392273, "step": 1095}
{"train_info/time_between_train_steps": 0.005249738693237305, "step": 1095}
{"info/global_step": 1096, "train_info/time_within_train_step": 27.755897521972656, "step": 1096}
{"train_info/time_between_train_steps": 0.009884357452392578, "step": 1096}
{"info/global_step": 1097, "train_info/time_within_train_step": 27.754717111587524, "step": 1097}
{"train_info/time_between_train_steps": 0.01003122329711914, "step": 1097}
{"info/global_step": 1098, "train_info/time_within_train_step": 27.75508999824524, "step": 1098}
{"train_info/time_between_train_steps": 0.005212068557739258, "step": 1098}
{"info/global_step": 1099, "train_info/time_within_train_step": 27.75355839729309, "step": 1099}
{"train_info/time_between_train_steps": 0.005335330963134766, "step": 1099}
{"info/global_step": 1100, "train_info/time_within_train_step": 27.85081696510315, "step": 1100}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733723789, "_runtime": 36678}, "step": 1100}
{"logs": {"train/loss": 3.4747, "train/learning_rate": 5.5555555555555545e-05, "train/epoch": 40.02, "_timestamp": 1733723789, "_runtime": 36678}, "step": 1100}
{"train_info/time_between_train_steps": 2.773588180541992, "step": 1100}
{"info/global_step": 1101, "train_info/time_within_train_step": 27.770954370498657, "step": 1101}
{"train_info/time_between_train_steps": 0.0052509307861328125, "step": 1101}
{"info/global_step": 1102, "train_info/time_within_train_step": 27.75339126586914, "step": 1102}
{"train_info/time_between_train_steps": 0.005370140075683594, "step": 1102}
{"info/global_step": 1103, "train_info/time_within_train_step": 27.7463698387146, "step": 1103}
{"train_info/time_between_train_steps": 0.005217313766479492, "step": 1103}
{"info/global_step": 1104, "train_info/time_within_train_step": 27.752886056900024, "step": 1104}
{"train_info/time_between_train_steps": 0.014444828033447266, "step": 1104}
{"info/global_step": 1105, "train_info/time_within_train_step": 27.92673134803772, "step": 1105}
{"train_info/time_between_train_steps": 0.005487203598022461, "step": 1105}
{"info/global_step": 1106, "train_info/time_within_train_step": 27.763165712356567, "step": 1106}
{"train_info/time_between_train_steps": 0.005783796310424805, "step": 1106}
{"info/global_step": 1107, "train_info/time_within_train_step": 27.76275372505188, "step": 1107}
{"train_info/time_between_train_steps": 0.005758047103881836, "step": 1107}
{"train_info/time_between_train_steps": 20.531879425048828, "step": 1107}
{"info/global_step": 1108, "train_info/time_within_train_step": 27.749075889587402, "step": 1108}
{"train_info/time_between_train_steps": 0.005650520324707031, "step": 1108}
{"info/global_step": 1109, "train_info/time_within_train_step": 27.944307565689087, "step": 1109}
{"train_info/time_between_train_steps": 0.005466461181640625, "step": 1109}
{"info/global_step": 1110, "train_info/time_within_train_step": 27.89180827140808, "step": 1110}
{"train_info/time_between_train_steps": 0.005216121673583984, "step": 1110}
{"info/global_step": 1111, "train_info/time_within_train_step": 27.836729049682617, "step": 1111}
{"train_info/time_between_train_steps": 0.005219459533691406, "step": 1111}
{"info/global_step": 1112, "train_info/time_within_train_step": 27.820615768432617, "step": 1112}
{"train_info/time_between_train_steps": 0.005724906921386719, "step": 1112}
{"info/global_step": 1113, "train_info/time_within_train_step": 27.905596017837524, "step": 1113}
{"train_info/time_between_train_steps": 0.005454301834106445, "step": 1113}
{"info/global_step": 1114, "train_info/time_within_train_step": 27.75635838508606, "step": 1114}
{"train_info/time_between_train_steps": 0.005450010299682617, "step": 1114}
{"info/global_step": 1115, "train_info/time_within_train_step": 27.926457166671753, "step": 1115}
{"train_info/time_between_train_steps": 0.005171537399291992, "step": 1115}
{"info/global_step": 1116, "train_info/time_within_train_step": 27.732614994049072, "step": 1116}
{"train_info/time_between_train_steps": 0.005179166793823242, "step": 1116}
{"info/global_step": 1117, "train_info/time_within_train_step": 27.7216317653656, "step": 1117}
{"train_info/time_between_train_steps": 0.0055201053619384766, "step": 1117}
{"info/global_step": 1118, "train_info/time_within_train_step": 27.717243909835815, "step": 1118}
{"train_info/time_between_train_steps": 0.005150794982910156, "step": 1118}
{"info/global_step": 1119, "train_info/time_within_train_step": 27.7287859916687, "step": 1119}
{"train_info/time_between_train_steps": 0.00500798225402832, "step": 1119}
{"info/global_step": 1120, "train_info/time_within_train_step": 27.713724374771118, "step": 1120}
{"train_info/time_between_train_steps": 0.005156517028808594, "step": 1120}
{"info/global_step": 1121, "train_info/time_within_train_step": 27.7301504611969, "step": 1121}
{"train_info/time_between_train_steps": 0.005213499069213867, "step": 1121}
{"info/global_step": 1122, "train_info/time_within_train_step": 27.71215009689331, "step": 1122}
{"train_info/time_between_train_steps": 0.005129575729370117, "step": 1122}
{"info/global_step": 1123, "train_info/time_within_train_step": 27.745173931121826, "step": 1123}
{"train_info/time_between_train_steps": 0.009558916091918945, "step": 1123}
{"info/global_step": 1124, "train_info/time_within_train_step": 27.7522292137146, "step": 1124}
{"train_info/time_between_train_steps": 0.005084037780761719, "step": 1124}
{"info/global_step": 1125, "train_info/time_within_train_step": 27.8046715259552, "step": 1125}
{"train_info/time_between_train_steps": 0.0050623416900634766, "step": 1125}
{"info/global_step": 1126, "train_info/time_within_train_step": 27.740708827972412, "step": 1126}
{"train_info/time_between_train_steps": 0.0052187442779541016, "step": 1126}
{"info/global_step": 1127, "train_info/time_within_train_step": 27.741695642471313, "step": 1127}
{"train_info/time_between_train_steps": 0.005240917205810547, "step": 1127}
{"info/global_step": 1128, "train_info/time_within_train_step": 27.752994298934937, "step": 1128}
{"train_info/time_between_train_steps": 0.0051479339599609375, "step": 1128}
{"info/global_step": 1129, "train_info/time_within_train_step": 27.76290225982666, "step": 1129}
{"train_info/time_between_train_steps": 0.005084037780761719, "step": 1129}
{"info/global_step": 1130, "train_info/time_within_train_step": 27.745094060897827, "step": 1130}
{"train_info/time_between_train_steps": 0.009603500366210938, "step": 1130}
{"info/global_step": 1131, "train_info/time_within_train_step": 27.838648319244385, "step": 1131}
{"train_info/time_between_train_steps": 0.005501270294189453, "step": 1131}
{"info/global_step": 1132, "train_info/time_within_train_step": 27.74559497833252, "step": 1132}
{"train_info/time_between_train_steps": 0.005270481109619141, "step": 1132}
{"info/global_step": 1133, "train_info/time_within_train_step": 27.750768423080444, "step": 1133}
{"train_info/time_between_train_steps": 0.0054721832275390625, "step": 1133}
{"info/global_step": 1134, "train_info/time_within_train_step": 27.767838716506958, "step": 1134}
{"train_info/time_between_train_steps": 0.0059680938720703125, "step": 1134}
{"train_info/time_between_train_steps": 20.676860570907593, "step": 1134}
{"info/global_step": 1135, "train_info/time_within_train_step": 27.719276666641235, "step": 1135}
{"train_info/time_between_train_steps": 0.004936695098876953, "step": 1135}
{"info/global_step": 1136, "train_info/time_within_train_step": 27.892005681991577, "step": 1136}
{"train_info/time_between_train_steps": 0.005208015441894531, "step": 1136}
{"info/global_step": 1137, "train_info/time_within_train_step": 27.739113807678223, "step": 1137}
{"train_info/time_between_train_steps": 0.005192279815673828, "step": 1137}
{"info/global_step": 1138, "train_info/time_within_train_step": 27.854159116744995, "step": 1138}
{"train_info/time_between_train_steps": 0.005142927169799805, "step": 1138}
{"info/global_step": 1139, "train_info/time_within_train_step": 27.744654178619385, "step": 1139}
{"train_info/time_between_train_steps": 0.0054340362548828125, "step": 1139}
{"info/global_step": 1140, "train_info/time_within_train_step": 27.915640592575073, "step": 1140}
{"train_info/time_between_train_steps": 0.005283355712890625, "step": 1140}
{"info/global_step": 1141, "train_info/time_within_train_step": 27.737854480743408, "step": 1141}
{"train_info/time_between_train_steps": 0.005244731903076172, "step": 1141}
{"info/global_step": 1142, "train_info/time_within_train_step": 27.882392168045044, "step": 1142}
{"train_info/time_between_train_steps": 0.014201879501342773, "step": 1142}
{"info/global_step": 1143, "train_info/time_within_train_step": 27.736708402633667, "step": 1143}
{"train_info/time_between_train_steps": 0.005250692367553711, "step": 1143}
{"info/global_step": 1144, "train_info/time_within_train_step": 27.73782253265381, "step": 1144}
{"train_info/time_between_train_steps": 0.004996776580810547, "step": 1144}
{"info/global_step": 1145, "train_info/time_within_train_step": 27.85634684562683, "step": 1145}
{"train_info/time_between_train_steps": 0.005312919616699219, "step": 1145}
{"info/global_step": 1146, "train_info/time_within_train_step": 28.08274531364441, "step": 1146}
{"train_info/time_between_train_steps": 0.005119800567626953, "step": 1146}
{"info/global_step": 1147, "train_info/time_within_train_step": 27.733407735824585, "step": 1147}
{"train_info/time_between_train_steps": 0.004985809326171875, "step": 1147}
{"info/global_step": 1148, "train_info/time_within_train_step": 27.750118255615234, "step": 1148}
{"train_info/time_between_train_steps": 0.0051517486572265625, "step": 1148}
{"info/global_step": 1149, "train_info/time_within_train_step": 27.73752737045288, "step": 1149}
{"train_info/time_between_train_steps": 0.005091190338134766, "step": 1149}
{"info/global_step": 1150, "train_info/time_within_train_step": 27.731547832489014, "step": 1150}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733725223, "_runtime": 38112}, "step": 1150}
{"logs": {"train/loss": 3.4438, "train/learning_rate": 2.7777777777777772e-05, "train/epoch": 42.01, "_timestamp": 1733725223, "_runtime": 38112}, "step": 1150}
{"train_info/time_between_train_steps": 0.012080669403076172, "step": 1150}
{"info/global_step": 1151, "train_info/time_within_train_step": 27.72833800315857, "step": 1151}
{"train_info/time_between_train_steps": 0.005068540573120117, "step": 1151}
{"info/global_step": 1152, "train_info/time_within_train_step": 27.746594667434692, "step": 1152}
{"train_info/time_between_train_steps": 0.005072116851806641, "step": 1152}
{"info/global_step": 1153, "train_info/time_within_train_step": 27.73059844970703, "step": 1153}
{"train_info/time_between_train_steps": 0.005078554153442383, "step": 1153}
{"info/global_step": 1154, "train_info/time_within_train_step": 27.742478370666504, "step": 1154}
{"train_info/time_between_train_steps": 0.005200862884521484, "step": 1154}
{"info/global_step": 1155, "train_info/time_within_train_step": 27.750205993652344, "step": 1155}
{"train_info/time_between_train_steps": 0.00504612922668457, "step": 1155}
{"info/global_step": 1156, "train_info/time_within_train_step": 27.744548797607422, "step": 1156}
{"train_info/time_between_train_steps": 0.005206108093261719, "step": 1156}
{"info/global_step": 1157, "train_info/time_within_train_step": 27.74777340888977, "step": 1157}
{"train_info/time_between_train_steps": 0.005246639251708984, "step": 1157}
{"info/global_step": 1158, "train_info/time_within_train_step": 27.740314722061157, "step": 1158}
{"train_info/time_between_train_steps": 0.005386829376220703, "step": 1158}
{"info/global_step": 1159, "train_info/time_within_train_step": 27.783123016357422, "step": 1159}
{"train_info/time_between_train_steps": 0.00528717041015625, "step": 1159}
{"info/global_step": 1160, "train_info/time_within_train_step": 27.815505743026733, "step": 1160}
{"train_info/time_between_train_steps": 0.005701780319213867, "step": 1160}
{"info/global_step": 1161, "train_info/time_within_train_step": 27.76978063583374, "step": 1161}
{"train_info/time_between_train_steps": 0.005719423294067383, "step": 1161}
{"train_info/time_between_train_steps": 20.482524633407593, "step": 1161}
{"info/global_step": 1162, "train_info/time_within_train_step": 27.756129026412964, "step": 1162}
{"train_info/time_between_train_steps": 0.005509614944458008, "step": 1162}
{"info/global_step": 1163, "train_info/time_within_train_step": 27.908124685287476, "step": 1163}
{"train_info/time_between_train_steps": 0.005292177200317383, "step": 1163}
{"info/global_step": 1164, "train_info/time_within_train_step": 27.766932010650635, "step": 1164}
{"train_info/time_between_train_steps": 0.005484104156494141, "step": 1164}
{"info/global_step": 1165, "train_info/time_within_train_step": 27.91253662109375, "step": 1165}
{"train_info/time_between_train_steps": 0.005154609680175781, "step": 1165}
{"info/global_step": 1166, "train_info/time_within_train_step": 27.763454914093018, "step": 1166}
{"train_info/time_between_train_steps": 0.005514860153198242, "step": 1166}
{"info/global_step": 1167, "train_info/time_within_train_step": 27.94444513320923, "step": 1167}
{"train_info/time_between_train_steps": 0.005471467971801758, "step": 1167}
{"info/global_step": 1168, "train_info/time_within_train_step": 27.79104471206665, "step": 1168}
{"train_info/time_between_train_steps": 0.005751609802246094, "step": 1168}
{"info/global_step": 1169, "train_info/time_within_train_step": 27.904381036758423, "step": 1169}
{"train_info/time_between_train_steps": 0.005948066711425781, "step": 1169}
{"info/global_step": 1170, "train_info/time_within_train_step": 27.78229284286499, "step": 1170}
{"train_info/time_between_train_steps": 0.0050013065338134766, "step": 1170}
{"info/global_step": 1171, "train_info/time_within_train_step": 27.79287314414978, "step": 1171}
{"train_info/time_between_train_steps": 0.009923696517944336, "step": 1171}
{"info/global_step": 1172, "train_info/time_within_train_step": 27.766432762145996, "step": 1172}
{"train_info/time_between_train_steps": 0.005154609680175781, "step": 1172}
{"info/global_step": 1173, "train_info/time_within_train_step": 27.771057844161987, "step": 1173}
{"train_info/time_between_train_steps": 0.005152463912963867, "step": 1173}
{"info/global_step": 1174, "train_info/time_within_train_step": 27.85442090034485, "step": 1174}
{"train_info/time_between_train_steps": 0.005156993865966797, "step": 1174}
{"info/global_step": 1175, "train_info/time_within_train_step": 27.808170557022095, "step": 1175}
{"train_info/time_between_train_steps": 0.009945869445800781, "step": 1175}
{"info/global_step": 1176, "train_info/time_within_train_step": 27.841625928878784, "step": 1176}
{"train_info/time_between_train_steps": 0.005191326141357422, "step": 1176}
{"info/global_step": 1177, "train_info/time_within_train_step": 27.89263415336609, "step": 1177}
{"train_info/time_between_train_steps": 0.005078792572021484, "step": 1177}
{"info/global_step": 1178, "train_info/time_within_train_step": 27.757487058639526, "step": 1178}
{"train_info/time_between_train_steps": 0.0052340030670166016, "step": 1178}
{"info/global_step": 1179, "train_info/time_within_train_step": 27.761606216430664, "step": 1179}
{"train_info/time_between_train_steps": 0.006364107131958008, "step": 1179}
{"info/global_step": 1180, "train_info/time_within_train_step": 27.7913019657135, "step": 1180}
{"train_info/time_between_train_steps": 0.005042314529418945, "step": 1180}
{"info/global_step": 1181, "train_info/time_within_train_step": 27.754710912704468, "step": 1181}
{"train_info/time_between_train_steps": 0.009563207626342773, "step": 1181}
{"info/global_step": 1182, "train_info/time_within_train_step": 27.778310537338257, "step": 1182}
{"train_info/time_between_train_steps": 0.005070686340332031, "step": 1182}
{"info/global_step": 1183, "train_info/time_within_train_step": 27.788095712661743, "step": 1183}
{"train_info/time_between_train_steps": 0.0051212310791015625, "step": 1183}
{"info/global_step": 1184, "train_info/time_within_train_step": 27.772324323654175, "step": 1184}
{"train_info/time_between_train_steps": 0.005327939987182617, "step": 1184}
{"info/global_step": 1185, "train_info/time_within_train_step": 27.77214813232422, "step": 1185}
{"train_info/time_between_train_steps": 0.005579471588134766, "step": 1185}
{"info/global_step": 1186, "train_info/time_within_train_step": 27.805439472198486, "step": 1186}
{"train_info/time_between_train_steps": 0.005265474319458008, "step": 1186}
{"info/global_step": 1187, "train_info/time_within_train_step": 27.818565368652344, "step": 1187}
{"train_info/time_between_train_steps": 0.005339384078979492, "step": 1187}
{"info/global_step": 1188, "train_info/time_within_train_step": 27.785199642181396, "step": 1188}
{"train_info/time_between_train_steps": 0.00563502311706543, "step": 1188}
{"train_info/time_between_train_steps": 20.964935779571533, "step": 1188}
{"info/global_step": 1189, "train_info/time_within_train_step": 27.7438223361969, "step": 1189}
{"train_info/time_between_train_steps": 0.004935741424560547, "step": 1189}
{"info/global_step": 1190, "train_info/time_within_train_step": 27.809679746627808, "step": 1190}
{"train_info/time_between_train_steps": 0.004979848861694336, "step": 1190}
{"info/global_step": 1191, "train_info/time_within_train_step": 27.696479558944702, "step": 1191}
{"train_info/time_between_train_steps": 0.004891395568847656, "step": 1191}
{"info/global_step": 1192, "train_info/time_within_train_step": 27.946634531021118, "step": 1192}
{"train_info/time_between_train_steps": 0.004942893981933594, "step": 1192}
{"info/global_step": 1193, "train_info/time_within_train_step": 27.767290830612183, "step": 1193}
{"train_info/time_between_train_steps": 0.005411624908447266, "step": 1193}
{"info/global_step": 1194, "train_info/time_within_train_step": 27.887458324432373, "step": 1194}
{"train_info/time_between_train_steps": 0.005109071731567383, "step": 1194}
{"info/global_step": 1195, "train_info/time_within_train_step": 27.78939652442932, "step": 1195}
{"train_info/time_between_train_steps": 0.005480051040649414, "step": 1195}
{"info/global_step": 1196, "train_info/time_within_train_step": 27.93115258216858, "step": 1196}
{"train_info/time_between_train_steps": 0.01096034049987793, "step": 1196}
{"info/global_step": 1197, "train_info/time_within_train_step": 27.75483536720276, "step": 1197}
{"train_info/time_between_train_steps": 0.005206108093261719, "step": 1197}
{"info/global_step": 1198, "train_info/time_within_train_step": 27.742254734039307, "step": 1198}
{"train_info/time_between_train_steps": 0.005267620086669922, "step": 1198}
{"info/global_step": 1199, "train_info/time_within_train_step": 27.77887797355652, "step": 1199}
{"train_info/time_between_train_steps": 0.005394458770751953, "step": 1199}
{"info/global_step": 1200, "train_info/time_within_train_step": 27.764997482299805, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733726654, "_runtime": 39543}, "step": 1200}
{"logs": {"train/loss": 3.421, "train/learning_rate": 0.0, "train/epoch": 44.01, "_timestamp": 1733726654, "_runtime": 39543}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733726658, "_runtime": 39547}, "step": 1200}
{"logs": {"train/train_runtime": 39547.528, "train/train_samples_per_second": 15.536, "train/train_steps_per_second": 0.03, "train/total_flos": 3.2843363254272e+17, "train/train_loss": 4.614480017026265, "train/epoch": 44.01, "_timestamp": 1733726658, "_runtime": 39547}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733726661, "_runtime": 39550}, "step": 1200}
{"logs": {"eval/loss": 4.472858428955078, "eval/runtime": 1.9718, "eval/samples_per_second": 50.716, "eval/steps_per_second": 3.55, "train/epoch": 44.01, "_timestamp": 1733726661, "_runtime": 39550}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1733726661, "_runtime": 39550}, "step": 1200}
{"logs": {"eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_loss": 4.472858428955078, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_ppl": 87.60678321932774, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_runtime": 1.9718, "eval//local/xiulyang/mission-impossible-language-models/training/babylm_dataset.py_samples_per_second": 50.716, "train/epoch": 44.01, "_timestamp": 1733726661, "_runtime": 39550}, "step": 1200}