DNNA_EN / metrics.json
xiulinyang's picture
Adding model checkpoints and config files
cc00969
Invalid JSON: Unexpected non-whitespace character after JSONat line 2, column 1
{"num_parameters": 124439808, "trainable_parameters": 124439808, "step": 0}
{"train_info/time_between_train_steps": 3.834409475326538, "step": 0}
{"info/global_step": 1, "train_info/time_within_train_step": 28.269936561584473, "step": 1}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 19761.71484375, "train_info/memory_reserved": 22624.0, "train_info/memory_max_reserved": 22624.0, "_timestamp": 1740824103, "_runtime": 52}, "step": 1}
{"logs": {"train/loss": 11.0211, "train/learning_rate": 4.9999999999999996e-06, "train/epoch": 0.0, "_timestamp": 1740824103, "_runtime": 52}, "step": 1}
{"train_info/time_between_train_steps": 0.026109695434570312, "step": 1}
{"info/global_step": 2, "train_info/time_within_train_step": 27.96107530593872, "step": 2}
{"train_info/time_between_train_steps": 0.0055828094482421875, "step": 2}
{"info/global_step": 3, "train_info/time_within_train_step": 27.747483015060425, "step": 3}
{"train_info/time_between_train_steps": 0.005789756774902344, "step": 3}
{"info/global_step": 4, "train_info/time_within_train_step": 27.982068300247192, "step": 4}
{"train_info/time_between_train_steps": 0.005511045455932617, "step": 4}
{"info/global_step": 5, "train_info/time_within_train_step": 27.70697832107544, "step": 5}
{"train_info/time_between_train_steps": 0.0058476924896240234, "step": 5}
{"info/global_step": 6, "train_info/time_within_train_step": 27.943527221679688, "step": 6}
{"train_info/time_between_train_steps": 0.005895137786865234, "step": 6}
{"info/global_step": 7, "train_info/time_within_train_step": 27.729538917541504, "step": 7}
{"train_info/time_between_train_steps": 0.005954265594482422, "step": 7}
{"info/global_step": 8, "train_info/time_within_train_step": 27.79095482826233, "step": 8}
{"train_info/time_between_train_steps": 0.005672931671142578, "step": 8}
{"info/global_step": 9, "train_info/time_within_train_step": 27.74953317642212, "step": 9}
{"train_info/time_between_train_steps": 0.0053288936614990234, "step": 9}
{"info/global_step": 10, "train_info/time_within_train_step": 27.73552966117859, "step": 10}
{"train_info/time_between_train_steps": 0.005738258361816406, "step": 10}
{"info/global_step": 11, "train_info/time_within_train_step": 27.72998809814453, "step": 11}
{"train_info/time_between_train_steps": 0.007455587387084961, "step": 11}
{"info/global_step": 12, "train_info/time_within_train_step": 27.686981201171875, "step": 12}
{"train_info/time_between_train_steps": 0.005208730697631836, "step": 12}
{"info/global_step": 13, "train_info/time_within_train_step": 27.74906635284424, "step": 13}
{"train_info/time_between_train_steps": 0.00558924674987793, "step": 13}
{"info/global_step": 14, "train_info/time_within_train_step": 27.70365262031555, "step": 14}
{"train_info/time_between_train_steps": 0.00506138801574707, "step": 14}
{"info/global_step": 15, "train_info/time_within_train_step": 27.75977373123169, "step": 15}
{"train_info/time_between_train_steps": 0.005500316619873047, "step": 15}
{"info/global_step": 16, "train_info/time_within_train_step": 27.805790662765503, "step": 16}
{"train_info/time_between_train_steps": 0.005455970764160156, "step": 16}
{"info/global_step": 17, "train_info/time_within_train_step": 27.748814344406128, "step": 17}
{"train_info/time_between_train_steps": 0.0054476261138916016, "step": 17}
{"info/global_step": 18, "train_info/time_within_train_step": 27.711416006088257, "step": 18}
{"train_info/time_between_train_steps": 0.0054090023040771484, "step": 18}
{"info/global_step": 19, "train_info/time_within_train_step": 27.702415943145752, "step": 19}
{"train_info/time_between_train_steps": 0.005543231964111328, "step": 19}
{"info/global_step": 20, "train_info/time_within_train_step": 27.70447540283203, "step": 20}
{"train_info/time_between_train_steps": 0.005377531051635742, "step": 20}
{"info/global_step": 21, "train_info/time_within_train_step": 27.6956524848938, "step": 21}
{"train_info/time_between_train_steps": 0.005370378494262695, "step": 21}
{"info/global_step": 22, "train_info/time_within_train_step": 27.74699091911316, "step": 22}
{"train_info/time_between_train_steps": 0.005816936492919922, "step": 22}
{"info/global_step": 23, "train_info/time_within_train_step": 27.71714425086975, "step": 23}
{"train_info/time_between_train_steps": 0.005561113357543945, "step": 23}
{"info/global_step": 24, "train_info/time_within_train_step": 27.75273299217224, "step": 24}
{"train_info/time_between_train_steps": 0.005265951156616211, "step": 24}
{"info/global_step": 25, "train_info/time_within_train_step": 27.726463317871094, "step": 25}
{"train_info/time_between_train_steps": 0.0054473876953125, "step": 25}
{"info/global_step": 26, "train_info/time_within_train_step": 27.707585334777832, "step": 26}
{"train_info/time_between_train_steps": 0.0055713653564453125, "step": 26}
{"info/global_step": 27, "train_info/time_within_train_step": 27.714736700057983, "step": 27}
{"train_info/time_between_train_steps": 0.0059299468994140625, "step": 27}
{"train_info/time_between_train_steps": 30.024338722229004, "step": 27}
{"info/global_step": 28, "train_info/time_within_train_step": 27.69981575012207, "step": 28}
{"train_info/time_between_train_steps": 0.005093574523925781, "step": 28}
{"info/global_step": 29, "train_info/time_within_train_step": 27.826509475708008, "step": 29}
{"train_info/time_between_train_steps": 0.005326032638549805, "step": 29}
{"info/global_step": 30, "train_info/time_within_train_step": 27.691741943359375, "step": 30}
{"train_info/time_between_train_steps": 0.0053708553314208984, "step": 30}
{"info/global_step": 31, "train_info/time_within_train_step": 27.92835783958435, "step": 31}
{"train_info/time_between_train_steps": 0.005341529846191406, "step": 31}
{"info/global_step": 32, "train_info/time_within_train_step": 27.70521116256714, "step": 32}
{"train_info/time_between_train_steps": 0.0056476593017578125, "step": 32}
{"info/global_step": 33, "train_info/time_within_train_step": 27.8247287273407, "step": 33}
{"train_info/time_between_train_steps": 0.0053136348724365234, "step": 33}
{"info/global_step": 34, "train_info/time_within_train_step": 27.72082543373108, "step": 34}
{"train_info/time_between_train_steps": 0.005550861358642578, "step": 34}
{"info/global_step": 35, "train_info/time_within_train_step": 27.777339935302734, "step": 35}
{"train_info/time_between_train_steps": 0.00962376594543457, "step": 35}
{"info/global_step": 36, "train_info/time_within_train_step": 27.786529779434204, "step": 36}
{"train_info/time_between_train_steps": 0.004998207092285156, "step": 36}
{"info/global_step": 37, "train_info/time_within_train_step": 27.679280996322632, "step": 37}
{"train_info/time_between_train_steps": 0.0051403045654296875, "step": 37}
{"info/global_step": 38, "train_info/time_within_train_step": 27.7331485748291, "step": 38}
{"train_info/time_between_train_steps": 0.004999876022338867, "step": 38}
{"info/global_step": 39, "train_info/time_within_train_step": 27.695358753204346, "step": 39}
{"train_info/time_between_train_steps": 0.005034446716308594, "step": 39}
{"info/global_step": 40, "train_info/time_within_train_step": 27.748251914978027, "step": 40}
{"train_info/time_between_train_steps": 0.006163835525512695, "step": 40}
{"info/global_step": 41, "train_info/time_within_train_step": 27.712142944335938, "step": 41}
{"train_info/time_between_train_steps": 0.005028486251831055, "step": 41}
{"info/global_step": 42, "train_info/time_within_train_step": 27.708196878433228, "step": 42}
{"train_info/time_between_train_steps": 0.005339860916137695, "step": 42}
{"info/global_step": 43, "train_info/time_within_train_step": 27.70981764793396, "step": 43}
{"train_info/time_between_train_steps": 0.005110502243041992, "step": 43}
{"info/global_step": 44, "train_info/time_within_train_step": 27.730726718902588, "step": 44}
{"train_info/time_between_train_steps": 0.005344867706298828, "step": 44}
{"info/global_step": 45, "train_info/time_within_train_step": 27.690407752990723, "step": 45}
{"train_info/time_between_train_steps": 0.005085468292236328, "step": 45}
{"info/global_step": 46, "train_info/time_within_train_step": 27.801880836486816, "step": 46}
{"train_info/time_between_train_steps": 0.005202293395996094, "step": 46}
{"info/global_step": 47, "train_info/time_within_train_step": 27.708892583847046, "step": 47}
{"train_info/time_between_train_steps": 0.00518798828125, "step": 47}
{"info/global_step": 48, "train_info/time_within_train_step": 27.680726051330566, "step": 48}
{"train_info/time_between_train_steps": 0.005112886428833008, "step": 48}
{"info/global_step": 49, "train_info/time_within_train_step": 27.73026704788208, "step": 49}
{"train_info/time_between_train_steps": 0.009624958038330078, "step": 49}
{"info/global_step": 50, "train_info/time_within_train_step": 27.682641744613647, "step": 50}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740825494, "_runtime": 1443}, "step": 50}
{"logs": {"train/loss": 8.0192, "train/learning_rate": 0.00025, "train/epoch": 1.02, "_timestamp": 1740825494, "_runtime": 1443}, "step": 50}
{"train_info/time_between_train_steps": 0.03618454933166504, "step": 50}
{"info/global_step": 51, "train_info/time_within_train_step": 27.749083518981934, "step": 51}
{"train_info/time_between_train_steps": 0.005368947982788086, "step": 51}
{"info/global_step": 52, "train_info/time_within_train_step": 27.716320753097534, "step": 52}
{"train_info/time_between_train_steps": 0.010048627853393555, "step": 52}
{"info/global_step": 53, "train_info/time_within_train_step": 27.750917673110962, "step": 53}
{"train_info/time_between_train_steps": 0.010403156280517578, "step": 53}
{"info/global_step": 54, "train_info/time_within_train_step": 27.738163471221924, "step": 54}
{"train_info/time_between_train_steps": 0.006113290786743164, "step": 54}
{"train_info/time_between_train_steps": 29.88112735748291, "step": 54}
{"info/global_step": 55, "train_info/time_within_train_step": 27.69020414352417, "step": 55}
{"train_info/time_between_train_steps": 0.005527019500732422, "step": 55}
{"info/global_step": 56, "train_info/time_within_train_step": 27.89532732963562, "step": 56}
{"train_info/time_between_train_steps": 0.005464076995849609, "step": 56}
{"info/global_step": 57, "train_info/time_within_train_step": 27.71349859237671, "step": 57}
{"train_info/time_between_train_steps": 0.005156755447387695, "step": 57}
{"info/global_step": 58, "train_info/time_within_train_step": 27.8750262260437, "step": 58}
{"train_info/time_between_train_steps": 0.014440536499023438, "step": 58}
{"info/global_step": 59, "train_info/time_within_train_step": 27.7750084400177, "step": 59}
{"train_info/time_between_train_steps": 0.005329608917236328, "step": 59}
{"info/global_step": 60, "train_info/time_within_train_step": 27.820770502090454, "step": 60}
{"train_info/time_between_train_steps": 0.005283832550048828, "step": 60}
{"info/global_step": 61, "train_info/time_within_train_step": 28.03778576850891, "step": 61}
{"train_info/time_between_train_steps": 0.0058863162994384766, "step": 61}
{"info/global_step": 62, "train_info/time_within_train_step": 27.815269708633423, "step": 62}
{"train_info/time_between_train_steps": 0.00543522834777832, "step": 62}
{"info/global_step": 63, "train_info/time_within_train_step": 27.96509623527527, "step": 63}
{"train_info/time_between_train_steps": 0.005144357681274414, "step": 63}
{"info/global_step": 64, "train_info/time_within_train_step": 27.69447159767151, "step": 64}
{"train_info/time_between_train_steps": 0.010020971298217773, "step": 64}
{"info/global_step": 65, "train_info/time_within_train_step": 27.747154474258423, "step": 65}
{"train_info/time_between_train_steps": 0.005051136016845703, "step": 65}
{"info/global_step": 66, "train_info/time_within_train_step": 27.697684288024902, "step": 66}
{"train_info/time_between_train_steps": 0.010128021240234375, "step": 66}
{"info/global_step": 67, "train_info/time_within_train_step": 27.74103307723999, "step": 67}
{"train_info/time_between_train_steps": 0.0053462982177734375, "step": 67}
{"info/global_step": 68, "train_info/time_within_train_step": 27.778972625732422, "step": 68}
{"train_info/time_between_train_steps": 0.005719661712646484, "step": 68}
{"info/global_step": 69, "train_info/time_within_train_step": 27.798271894454956, "step": 69}
{"train_info/time_between_train_steps": 0.006541013717651367, "step": 69}
{"info/global_step": 70, "train_info/time_within_train_step": 27.766440391540527, "step": 70}
{"train_info/time_between_train_steps": 0.006812334060668945, "step": 70}
{"info/global_step": 71, "train_info/time_within_train_step": 27.778088092803955, "step": 71}
{"train_info/time_between_train_steps": 0.006823539733886719, "step": 71}
{"info/global_step": 72, "train_info/time_within_train_step": 27.800012588500977, "step": 72}
{"train_info/time_between_train_steps": 0.006250858306884766, "step": 72}
{"info/global_step": 73, "train_info/time_within_train_step": 27.788501977920532, "step": 73}
{"train_info/time_between_train_steps": 0.0063250064849853516, "step": 73}
{"info/global_step": 74, "train_info/time_within_train_step": 27.814247369766235, "step": 74}
{"train_info/time_between_train_steps": 0.006246805191040039, "step": 74}
{"info/global_step": 75, "train_info/time_within_train_step": 27.782124042510986, "step": 75}
{"train_info/time_between_train_steps": 0.0062274932861328125, "step": 75}
{"info/global_step": 76, "train_info/time_within_train_step": 27.81791639328003, "step": 76}
{"train_info/time_between_train_steps": 0.0061016082763671875, "step": 76}
{"info/global_step": 77, "train_info/time_within_train_step": 27.87493348121643, "step": 77}
{"train_info/time_between_train_steps": 0.006658077239990234, "step": 77}
{"info/global_step": 78, "train_info/time_within_train_step": 27.7807879447937, "step": 78}
{"train_info/time_between_train_steps": 0.0063762664794921875, "step": 78}
{"info/global_step": 79, "train_info/time_within_train_step": 27.789470195770264, "step": 79}
{"train_info/time_between_train_steps": 0.006345987319946289, "step": 79}
{"info/global_step": 80, "train_info/time_within_train_step": 27.8055100440979, "step": 80}
{"train_info/time_between_train_steps": 0.0065495967864990234, "step": 80}
{"info/global_step": 81, "train_info/time_within_train_step": 27.78734803199768, "step": 81}
{"train_info/time_between_train_steps": 0.007088899612426758, "step": 81}
{"train_info/time_between_train_steps": 30.505497694015503, "step": 81}
{"info/global_step": 82, "train_info/time_within_train_step": 27.715052366256714, "step": 82}
{"train_info/time_between_train_steps": 0.0055179595947265625, "step": 82}
{"info/global_step": 83, "train_info/time_within_train_step": 27.847105026245117, "step": 83}
{"train_info/time_between_train_steps": 0.005188465118408203, "step": 83}
{"info/global_step": 84, "train_info/time_within_train_step": 27.7117862701416, "step": 84}
{"train_info/time_between_train_steps": 0.0052890777587890625, "step": 84}
{"info/global_step": 85, "train_info/time_within_train_step": 27.873642206192017, "step": 85}
{"train_info/time_between_train_steps": 0.005289316177368164, "step": 85}
{"info/global_step": 86, "train_info/time_within_train_step": 27.733330249786377, "step": 86}
{"train_info/time_between_train_steps": 0.005342721939086914, "step": 86}
{"info/global_step": 87, "train_info/time_within_train_step": 27.823381185531616, "step": 87}
{"train_info/time_between_train_steps": 0.005438804626464844, "step": 87}
{"info/global_step": 88, "train_info/time_within_train_step": 27.719430208206177, "step": 88}
{"train_info/time_between_train_steps": 0.005362749099731445, "step": 88}
{"info/global_step": 89, "train_info/time_within_train_step": 27.77023959159851, "step": 89}
{"train_info/time_between_train_steps": 0.005185604095458984, "step": 89}
{"info/global_step": 90, "train_info/time_within_train_step": 27.711486101150513, "step": 90}
{"train_info/time_between_train_steps": 0.005261659622192383, "step": 90}
{"info/global_step": 91, "train_info/time_within_train_step": 27.796611785888672, "step": 91}
{"train_info/time_between_train_steps": 0.005070686340332031, "step": 91}
{"info/global_step": 92, "train_info/time_within_train_step": 27.700639247894287, "step": 92}
{"train_info/time_between_train_steps": 0.006469249725341797, "step": 92}
{"info/global_step": 93, "train_info/time_within_train_step": 27.700782299041748, "step": 93}
{"train_info/time_between_train_steps": 0.005188465118408203, "step": 93}
{"info/global_step": 94, "train_info/time_within_train_step": 27.70881199836731, "step": 94}
{"train_info/time_between_train_steps": 0.005133867263793945, "step": 94}
{"info/global_step": 95, "train_info/time_within_train_step": 27.706984043121338, "step": 95}
{"train_info/time_between_train_steps": 0.005070924758911133, "step": 95}
{"info/global_step": 96, "train_info/time_within_train_step": 27.74240016937256, "step": 96}
{"train_info/time_between_train_steps": 0.005093574523925781, "step": 96}
{"info/global_step": 97, "train_info/time_within_train_step": 27.710091829299927, "step": 97}
{"train_info/time_between_train_steps": 0.005159616470336914, "step": 97}
{"info/global_step": 98, "train_info/time_within_train_step": 27.746789693832397, "step": 98}
{"train_info/time_between_train_steps": 0.00518488883972168, "step": 98}
{"info/global_step": 99, "train_info/time_within_train_step": 27.70639181137085, "step": 99}
{"train_info/time_between_train_steps": 0.005252838134765625, "step": 99}
{"info/global_step": 100, "train_info/time_within_train_step": 27.856878757476807, "step": 100}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740826946, "_runtime": 2895}, "step": 100}
{"logs": {"train/loss": 5.7199, "train/learning_rate": 0.0005, "train/epoch": 3.02, "_timestamp": 1740826946, "_runtime": 2895}, "step": 100}
{"train_info/time_between_train_steps": 76.01396751403809, "step": 100}
{"info/global_step": 101, "train_info/time_within_train_step": 27.72314691543579, "step": 101}
{"train_info/time_between_train_steps": 0.00503849983215332, "step": 101}
{"info/global_step": 102, "train_info/time_within_train_step": 27.7017502784729, "step": 102}
{"train_info/time_between_train_steps": 0.005120038986206055, "step": 102}
{"info/global_step": 103, "train_info/time_within_train_step": 27.705806255340576, "step": 103}
{"train_info/time_between_train_steps": 0.005287647247314453, "step": 103}
{"info/global_step": 104, "train_info/time_within_train_step": 27.69396138191223, "step": 104}
{"train_info/time_between_train_steps": 0.005209207534790039, "step": 104}
{"info/global_step": 105, "train_info/time_within_train_step": 27.692888498306274, "step": 105}
{"train_info/time_between_train_steps": 0.005640983581542969, "step": 105}
{"info/global_step": 106, "train_info/time_within_train_step": 27.74486994743347, "step": 106}
{"train_info/time_between_train_steps": 0.005143165588378906, "step": 106}
{"info/global_step": 107, "train_info/time_within_train_step": 27.789852380752563, "step": 107}
{"train_info/time_between_train_steps": 0.006172895431518555, "step": 107}
{"info/global_step": 108, "train_info/time_within_train_step": 27.713579416275024, "step": 108}
{"train_info/time_between_train_steps": 0.0057528018951416016, "step": 108}
{"train_info/time_between_train_steps": 29.935186862945557, "step": 108}
{"info/global_step": 109, "train_info/time_within_train_step": 27.69963526725769, "step": 109}
{"train_info/time_between_train_steps": 0.005365848541259766, "step": 109}
{"info/global_step": 110, "train_info/time_within_train_step": 27.874626636505127, "step": 110}
{"train_info/time_between_train_steps": 0.005317211151123047, "step": 110}
{"info/global_step": 111, "train_info/time_within_train_step": 27.700846910476685, "step": 111}
{"train_info/time_between_train_steps": 0.005157470703125, "step": 111}
{"info/global_step": 112, "train_info/time_within_train_step": 27.880887269973755, "step": 112}
{"train_info/time_between_train_steps": 0.005501985549926758, "step": 112}
{"info/global_step": 113, "train_info/time_within_train_step": 27.720590114593506, "step": 113}
{"train_info/time_between_train_steps": 0.005461215972900391, "step": 113}
{"info/global_step": 114, "train_info/time_within_train_step": 27.82923436164856, "step": 114}
{"train_info/time_between_train_steps": 0.005305051803588867, "step": 114}
{"info/global_step": 115, "train_info/time_within_train_step": 27.72627019882202, "step": 115}
{"train_info/time_between_train_steps": 0.005540370941162109, "step": 115}
{"info/global_step": 116, "train_info/time_within_train_step": 27.7889621257782, "step": 116}
{"train_info/time_between_train_steps": 0.005234241485595703, "step": 116}
{"info/global_step": 117, "train_info/time_within_train_step": 27.726036310195923, "step": 117}
{"train_info/time_between_train_steps": 0.016416072845458984, "step": 117}
{"info/global_step": 118, "train_info/time_within_train_step": 27.7428936958313, "step": 118}
{"train_info/time_between_train_steps": 0.005290985107421875, "step": 118}
{"info/global_step": 119, "train_info/time_within_train_step": 27.737021923065186, "step": 119}
{"train_info/time_between_train_steps": 0.005154609680175781, "step": 119}
{"info/global_step": 120, "train_info/time_within_train_step": 27.734756231307983, "step": 120}
{"train_info/time_between_train_steps": 0.005208730697631836, "step": 120}
{"info/global_step": 121, "train_info/time_within_train_step": 27.759555101394653, "step": 121}
{"train_info/time_between_train_steps": 0.005346536636352539, "step": 121}
{"info/global_step": 122, "train_info/time_within_train_step": 27.8026864528656, "step": 122}
{"train_info/time_between_train_steps": 0.005013227462768555, "step": 122}
{"info/global_step": 123, "train_info/time_within_train_step": 27.72345805168152, "step": 123}
{"train_info/time_between_train_steps": 0.0053064823150634766, "step": 123}
{"info/global_step": 124, "train_info/time_within_train_step": 27.712083101272583, "step": 124}
{"train_info/time_between_train_steps": 0.005263090133666992, "step": 124}
{"info/global_step": 125, "train_info/time_within_train_step": 27.7495334148407, "step": 125}
{"train_info/time_between_train_steps": 0.005507230758666992, "step": 125}
{"info/global_step": 126, "train_info/time_within_train_step": 27.735219717025757, "step": 126}
{"train_info/time_between_train_steps": 0.005164146423339844, "step": 126}
{"info/global_step": 127, "train_info/time_within_train_step": 27.696925163269043, "step": 127}
{"train_info/time_between_train_steps": 0.005079507827758789, "step": 127}
{"info/global_step": 128, "train_info/time_within_train_step": 27.732449293136597, "step": 128}
{"train_info/time_between_train_steps": 0.0052568912506103516, "step": 128}
{"info/global_step": 129, "train_info/time_within_train_step": 27.760539531707764, "step": 129}
{"train_info/time_between_train_steps": 0.0051610469818115234, "step": 129}
{"info/global_step": 130, "train_info/time_within_train_step": 27.71502685546875, "step": 130}
{"train_info/time_between_train_steps": 0.005305051803588867, "step": 130}
{"info/global_step": 131, "train_info/time_within_train_step": 27.746113300323486, "step": 131}
{"train_info/time_between_train_steps": 0.0051763057708740234, "step": 131}
{"info/global_step": 132, "train_info/time_within_train_step": 27.72984027862549, "step": 132}
{"train_info/time_between_train_steps": 0.005165815353393555, "step": 132}
{"info/global_step": 133, "train_info/time_within_train_step": 27.73590087890625, "step": 133}
{"train_info/time_between_train_steps": 0.005527973175048828, "step": 133}
{"info/global_step": 134, "train_info/time_within_train_step": 27.728922367095947, "step": 134}
{"train_info/time_between_train_steps": 0.009885072708129883, "step": 134}
{"info/global_step": 135, "train_info/time_within_train_step": 27.742867469787598, "step": 135}
{"train_info/time_between_train_steps": 0.0058705806732177734, "step": 135}
{"train_info/time_between_train_steps": 30.101130485534668, "step": 135}
{"info/global_step": 136, "train_info/time_within_train_step": 27.80540442466736, "step": 136}
{"train_info/time_between_train_steps": 0.005100250244140625, "step": 136}
{"info/global_step": 137, "train_info/time_within_train_step": 27.935384035110474, "step": 137}
{"train_info/time_between_train_steps": 0.005282878875732422, "step": 137}
{"info/global_step": 138, "train_info/time_within_train_step": 27.70681118965149, "step": 138}
{"train_info/time_between_train_steps": 0.005229473114013672, "step": 138}
{"info/global_step": 139, "train_info/time_within_train_step": 27.95735764503479, "step": 139}
{"train_info/time_between_train_steps": 0.005908012390136719, "step": 139}
{"info/global_step": 140, "train_info/time_within_train_step": 27.745168685913086, "step": 140}
{"train_info/time_between_train_steps": 0.005393028259277344, "step": 140}
{"info/global_step": 141, "train_info/time_within_train_step": 27.905131101608276, "step": 141}
{"train_info/time_between_train_steps": 0.005289554595947266, "step": 141}
{"info/global_step": 142, "train_info/time_within_train_step": 27.756346702575684, "step": 142}
{"train_info/time_between_train_steps": 0.005654335021972656, "step": 142}
{"info/global_step": 143, "train_info/time_within_train_step": 27.840092658996582, "step": 143}
{"train_info/time_between_train_steps": 0.0052356719970703125, "step": 143}
{"info/global_step": 144, "train_info/time_within_train_step": 27.727481603622437, "step": 144}
{"train_info/time_between_train_steps": 0.005444765090942383, "step": 144}
{"info/global_step": 145, "train_info/time_within_train_step": 27.730412006378174, "step": 145}
{"train_info/time_between_train_steps": 0.0051805973052978516, "step": 145}
{"info/global_step": 146, "train_info/time_within_train_step": 27.70672106742859, "step": 146}
{"train_info/time_between_train_steps": 0.005202770233154297, "step": 146}
{"info/global_step": 147, "train_info/time_within_train_step": 27.70912456512451, "step": 147}
{"train_info/time_between_train_steps": 0.005299091339111328, "step": 147}
{"info/global_step": 148, "train_info/time_within_train_step": 27.734941482543945, "step": 148}
{"train_info/time_between_train_steps": 0.005257129669189453, "step": 148}
{"info/global_step": 149, "train_info/time_within_train_step": 27.709816455841064, "step": 149}
{"train_info/time_between_train_steps": 0.006234407424926758, "step": 149}
{"info/global_step": 150, "train_info/time_within_train_step": 27.756762266159058, "step": 150}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740828471, "_runtime": 4420}, "step": 150}
{"logs": {"train/loss": 5.1463, "train/learning_rate": 0.0005833333333333333, "train/epoch": 5.01, "_timestamp": 1740828471, "_runtime": 4420}, "step": 150}
{"train_info/time_between_train_steps": 0.027353286743164062, "step": 150}
{"info/global_step": 151, "train_info/time_within_train_step": 27.711707830429077, "step": 151}
{"train_info/time_between_train_steps": 0.005456686019897461, "step": 151}
{"info/global_step": 152, "train_info/time_within_train_step": 27.7993426322937, "step": 152}
{"train_info/time_between_train_steps": 0.00511622428894043, "step": 152}
{"info/global_step": 153, "train_info/time_within_train_step": 27.714701414108276, "step": 153}
{"train_info/time_between_train_steps": 0.005254030227661133, "step": 153}
{"info/global_step": 154, "train_info/time_within_train_step": 27.72619652748108, "step": 154}
{"train_info/time_between_train_steps": 0.005378246307373047, "step": 154}
{"info/global_step": 155, "train_info/time_within_train_step": 27.701313734054565, "step": 155}
{"train_info/time_between_train_steps": 0.005336284637451172, "step": 155}
{"info/global_step": 156, "train_info/time_within_train_step": 27.74224042892456, "step": 156}
{"train_info/time_between_train_steps": 0.005190849304199219, "step": 156}
{"info/global_step": 157, "train_info/time_within_train_step": 27.75897979736328, "step": 157}
{"train_info/time_between_train_steps": 0.005376100540161133, "step": 157}
{"info/global_step": 158, "train_info/time_within_train_step": 28.85250425338745, "step": 158}
{"train_info/time_between_train_steps": 0.00537562370300293, "step": 158}
{"info/global_step": 159, "train_info/time_within_train_step": 27.72560453414917, "step": 159}
{"train_info/time_between_train_steps": 0.0052258968353271484, "step": 159}
{"info/global_step": 160, "train_info/time_within_train_step": 27.713614463806152, "step": 160}
{"train_info/time_between_train_steps": 0.005553007125854492, "step": 160}
{"info/global_step": 161, "train_info/time_within_train_step": 27.734391927719116, "step": 161}
{"train_info/time_between_train_steps": 0.005696773529052734, "step": 161}
{"info/global_step": 162, "train_info/time_within_train_step": 27.723986864089966, "step": 162}
{"train_info/time_between_train_steps": 0.00583338737487793, "step": 162}
{"train_info/time_between_train_steps": 30.243193864822388, "step": 162}
{"info/global_step": 163, "train_info/time_within_train_step": 27.71804428100586, "step": 163}
{"train_info/time_between_train_steps": 0.005509614944458008, "step": 163}
{"info/global_step": 164, "train_info/time_within_train_step": 27.90368151664734, "step": 164}
{"train_info/time_between_train_steps": 0.0053670406341552734, "step": 164}
{"info/global_step": 165, "train_info/time_within_train_step": 27.702847719192505, "step": 165}
{"train_info/time_between_train_steps": 0.00960540771484375, "step": 165}
{"info/global_step": 166, "train_info/time_within_train_step": 27.822851419448853, "step": 166}
{"train_info/time_between_train_steps": 0.005239725112915039, "step": 166}
{"info/global_step": 167, "train_info/time_within_train_step": 27.81547474861145, "step": 167}
{"train_info/time_between_train_steps": 0.0053484439849853516, "step": 167}
{"info/global_step": 168, "train_info/time_within_train_step": 27.8442120552063, "step": 168}
{"train_info/time_between_train_steps": 0.0054836273193359375, "step": 168}
{"info/global_step": 169, "train_info/time_within_train_step": 27.77888822555542, "step": 169}
{"train_info/time_between_train_steps": 0.005716562271118164, "step": 169}
{"info/global_step": 170, "train_info/time_within_train_step": 27.82560443878174, "step": 170}
{"train_info/time_between_train_steps": 0.014793872833251953, "step": 170}
{"info/global_step": 171, "train_info/time_within_train_step": 27.71638560295105, "step": 171}
{"train_info/time_between_train_steps": 0.0049784183502197266, "step": 171}
{"info/global_step": 172, "train_info/time_within_train_step": 27.734620571136475, "step": 172}
{"train_info/time_between_train_steps": 0.0051538944244384766, "step": 172}
{"info/global_step": 173, "train_info/time_within_train_step": 27.697518825531006, "step": 173}
{"train_info/time_between_train_steps": 0.005089759826660156, "step": 173}
{"info/global_step": 174, "train_info/time_within_train_step": 27.705929279327393, "step": 174}
{"train_info/time_between_train_steps": 0.0051839351654052734, "step": 174}
{"info/global_step": 175, "train_info/time_within_train_step": 27.726815223693848, "step": 175}
{"train_info/time_between_train_steps": 0.005172014236450195, "step": 175}
{"info/global_step": 176, "train_info/time_within_train_step": 27.68779993057251, "step": 176}
{"train_info/time_between_train_steps": 0.0049707889556884766, "step": 176}
{"info/global_step": 177, "train_info/time_within_train_step": 27.736475944519043, "step": 177}
{"train_info/time_between_train_steps": 0.005163669586181641, "step": 177}
{"info/global_step": 178, "train_info/time_within_train_step": 27.709714651107788, "step": 178}
{"train_info/time_between_train_steps": 0.005128383636474609, "step": 178}
{"info/global_step": 179, "train_info/time_within_train_step": 27.695388555526733, "step": 179}
{"train_info/time_between_train_steps": 0.007013082504272461, "step": 179}
{"info/global_step": 180, "train_info/time_within_train_step": 27.714560747146606, "step": 180}
{"train_info/time_between_train_steps": 0.005243539810180664, "step": 180}
{"info/global_step": 181, "train_info/time_within_train_step": 27.70488691329956, "step": 181}
{"train_info/time_between_train_steps": 0.005000591278076172, "step": 181}
{"info/global_step": 182, "train_info/time_within_train_step": 27.797266483306885, "step": 182}
{"train_info/time_between_train_steps": 0.0050733089447021484, "step": 182}
{"info/global_step": 183, "train_info/time_within_train_step": 27.6882221698761, "step": 183}
{"train_info/time_between_train_steps": 0.005113840103149414, "step": 183}
{"info/global_step": 184, "train_info/time_within_train_step": 27.712251663208008, "step": 184}
{"train_info/time_between_train_steps": 0.004985809326171875, "step": 184}
{"info/global_step": 185, "train_info/time_within_train_step": 27.707184076309204, "step": 185}
{"train_info/time_between_train_steps": 0.005373477935791016, "step": 185}
{"info/global_step": 186, "train_info/time_within_train_step": 27.71699810028076, "step": 186}
{"train_info/time_between_train_steps": 0.00521540641784668, "step": 186}
{"info/global_step": 187, "train_info/time_within_train_step": 27.7187602519989, "step": 187}
{"train_info/time_between_train_steps": 0.00516057014465332, "step": 187}
{"info/global_step": 188, "train_info/time_within_train_step": 27.712733507156372, "step": 188}
{"train_info/time_between_train_steps": 0.005243062973022461, "step": 188}
{"info/global_step": 189, "train_info/time_within_train_step": 27.716069221496582, "step": 189}
{"train_info/time_between_train_steps": 0.005950212478637695, "step": 189}
{"train_info/time_between_train_steps": 29.952954530715942, "step": 189}
{"info/global_step": 190, "train_info/time_within_train_step": 27.69579768180847, "step": 190}
{"train_info/time_between_train_steps": 0.0050737857818603516, "step": 190}
{"info/global_step": 191, "train_info/time_within_train_step": 27.79578471183777, "step": 191}
{"train_info/time_between_train_steps": 0.004968881607055664, "step": 191}
{"info/global_step": 192, "train_info/time_within_train_step": 27.737427234649658, "step": 192}
{"train_info/time_between_train_steps": 0.005366325378417969, "step": 192}
{"info/global_step": 193, "train_info/time_within_train_step": 27.889018774032593, "step": 193}
{"train_info/time_between_train_steps": 0.005480766296386719, "step": 193}
{"info/global_step": 194, "train_info/time_within_train_step": 27.76640272140503, "step": 194}
{"train_info/time_between_train_steps": 0.005473136901855469, "step": 194}
{"info/global_step": 195, "train_info/time_within_train_step": 27.937748670578003, "step": 195}
{"train_info/time_between_train_steps": 0.005475759506225586, "step": 195}
{"info/global_step": 196, "train_info/time_within_train_step": 27.741543769836426, "step": 196}
{"train_info/time_between_train_steps": 0.005231618881225586, "step": 196}
{"info/global_step": 197, "train_info/time_within_train_step": 27.903958559036255, "step": 197}
{"train_info/time_between_train_steps": 0.00535273551940918, "step": 197}
{"info/global_step": 198, "train_info/time_within_train_step": 27.741702556610107, "step": 198}
{"train_info/time_between_train_steps": 0.005177974700927734, "step": 198}
{"info/global_step": 199, "train_info/time_within_train_step": 27.694640636444092, "step": 199}
{"train_info/time_between_train_steps": 0.0051801204681396484, "step": 199}
{"info/global_step": 200, "train_info/time_within_train_step": 27.87686538696289, "step": 200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740829923, "_runtime": 5872}, "step": 200}
{"logs": {"train/loss": 4.9169, "train/learning_rate": 0.0005555555555555556, "train/epoch": 7.01, "_timestamp": 1740829923, "_runtime": 5872}, "step": 200}
{"train_info/time_between_train_steps": 71.40856099128723, "step": 200}
{"info/global_step": 201, "train_info/time_within_train_step": 27.688949823379517, "step": 201}
{"train_info/time_between_train_steps": 0.004904747009277344, "step": 201}
{"info/global_step": 202, "train_info/time_within_train_step": 27.72277045249939, "step": 202}
{"train_info/time_between_train_steps": 0.005402803421020508, "step": 202}
{"info/global_step": 203, "train_info/time_within_train_step": 27.705255270004272, "step": 203}
{"train_info/time_between_train_steps": 0.005044460296630859, "step": 203}
{"info/global_step": 204, "train_info/time_within_train_step": 27.715781927108765, "step": 204}
{"train_info/time_between_train_steps": 0.005054950714111328, "step": 204}
{"info/global_step": 205, "train_info/time_within_train_step": 27.756427526474, "step": 205}
{"train_info/time_between_train_steps": 0.005423545837402344, "step": 205}
{"info/global_step": 206, "train_info/time_within_train_step": 27.73091173171997, "step": 206}
{"train_info/time_between_train_steps": 0.0050106048583984375, "step": 206}
{"info/global_step": 207, "train_info/time_within_train_step": 27.694384336471558, "step": 207}
{"train_info/time_between_train_steps": 0.0059413909912109375, "step": 207}
{"info/global_step": 208, "train_info/time_within_train_step": 27.72783851623535, "step": 208}
{"train_info/time_between_train_steps": 0.005311727523803711, "step": 208}
{"info/global_step": 209, "train_info/time_within_train_step": 27.719402074813843, "step": 209}
{"train_info/time_between_train_steps": 0.0050928592681884766, "step": 209}
{"info/global_step": 210, "train_info/time_within_train_step": 27.69693922996521, "step": 210}
{"train_info/time_between_train_steps": 0.005269289016723633, "step": 210}
{"info/global_step": 211, "train_info/time_within_train_step": 27.715784311294556, "step": 211}
{"train_info/time_between_train_steps": 0.005045652389526367, "step": 211}
{"info/global_step": 212, "train_info/time_within_train_step": 27.87380599975586, "step": 212}
{"train_info/time_between_train_steps": 0.005231618881225586, "step": 212}
{"info/global_step": 213, "train_info/time_within_train_step": 27.85225820541382, "step": 213}
{"train_info/time_between_train_steps": 0.005368709564208984, "step": 213}
{"info/global_step": 214, "train_info/time_within_train_step": 27.778074502944946, "step": 214}
{"train_info/time_between_train_steps": 0.006146907806396484, "step": 214}
{"info/global_step": 215, "train_info/time_within_train_step": 27.72144341468811, "step": 215}
{"train_info/time_between_train_steps": 0.005540609359741211, "step": 215}
{"info/global_step": 216, "train_info/time_within_train_step": 27.72233247756958, "step": 216}
{"train_info/time_between_train_steps": 0.005738258361816406, "step": 216}
{"train_info/time_between_train_steps": 30.0035719871521, "step": 216}
{"info/global_step": 217, "train_info/time_within_train_step": 27.727752923965454, "step": 217}
{"train_info/time_between_train_steps": 0.0132904052734375, "step": 217}
{"info/global_step": 218, "train_info/time_within_train_step": 27.848336696624756, "step": 218}
{"train_info/time_between_train_steps": 0.005022287368774414, "step": 218}
{"info/global_step": 219, "train_info/time_within_train_step": 27.730770349502563, "step": 219}
{"train_info/time_between_train_steps": 0.006495237350463867, "step": 219}
{"info/global_step": 220, "train_info/time_within_train_step": 27.861899375915527, "step": 220}
{"train_info/time_between_train_steps": 0.005459308624267578, "step": 220}
{"info/global_step": 221, "train_info/time_within_train_step": 27.72015881538391, "step": 221}
{"train_info/time_between_train_steps": 0.0054569244384765625, "step": 221}
{"info/global_step": 222, "train_info/time_within_train_step": 27.880970239639282, "step": 222}
{"train_info/time_between_train_steps": 0.005377054214477539, "step": 222}
{"info/global_step": 223, "train_info/time_within_train_step": 27.719080209732056, "step": 223}
{"train_info/time_between_train_steps": 0.005482912063598633, "step": 223}
{"info/global_step": 224, "train_info/time_within_train_step": 27.80422353744507, "step": 224}
{"train_info/time_between_train_steps": 0.00543212890625, "step": 224}
{"info/global_step": 225, "train_info/time_within_train_step": 27.718651056289673, "step": 225}
{"train_info/time_between_train_steps": 0.0050525665283203125, "step": 225}
{"info/global_step": 226, "train_info/time_within_train_step": 27.696388006210327, "step": 226}
{"train_info/time_between_train_steps": 0.005218029022216797, "step": 226}
{"info/global_step": 227, "train_info/time_within_train_step": 27.81152844429016, "step": 227}
{"train_info/time_between_train_steps": 0.006003141403198242, "step": 227}
{"info/global_step": 228, "train_info/time_within_train_step": 27.76421308517456, "step": 228}
{"train_info/time_between_train_steps": 0.005090236663818359, "step": 228}
{"info/global_step": 229, "train_info/time_within_train_step": 27.70001459121704, "step": 229}
{"train_info/time_between_train_steps": 0.0051860809326171875, "step": 229}
{"info/global_step": 230, "train_info/time_within_train_step": 27.72329330444336, "step": 230}
{"train_info/time_between_train_steps": 0.005209684371948242, "step": 230}
{"info/global_step": 231, "train_info/time_within_train_step": 27.709064960479736, "step": 231}
{"train_info/time_between_train_steps": 0.005251169204711914, "step": 231}
{"info/global_step": 232, "train_info/time_within_train_step": 27.712372303009033, "step": 232}
{"train_info/time_between_train_steps": 0.005196332931518555, "step": 232}
{"info/global_step": 233, "train_info/time_within_train_step": 27.72724413871765, "step": 233}
{"train_info/time_between_train_steps": 0.005225419998168945, "step": 233}
{"info/global_step": 234, "train_info/time_within_train_step": 27.73222851753235, "step": 234}
{"train_info/time_between_train_steps": 0.0051670074462890625, "step": 234}
{"info/global_step": 235, "train_info/time_within_train_step": 27.723369598388672, "step": 235}
{"train_info/time_between_train_steps": 0.005420684814453125, "step": 235}
{"info/global_step": 236, "train_info/time_within_train_step": 27.707173109054565, "step": 236}
{"train_info/time_between_train_steps": 0.004990339279174805, "step": 236}
{"info/global_step": 237, "train_info/time_within_train_step": 27.71030616760254, "step": 237}
{"train_info/time_between_train_steps": 0.006212949752807617, "step": 237}
{"info/global_step": 238, "train_info/time_within_train_step": 27.70557737350464, "step": 238}
{"train_info/time_between_train_steps": 0.005048513412475586, "step": 238}
{"info/global_step": 239, "train_info/time_within_train_step": 27.750725507736206, "step": 239}
{"train_info/time_between_train_steps": 0.0054779052734375, "step": 239}
{"info/global_step": 240, "train_info/time_within_train_step": 27.69505286216736, "step": 240}
{"train_info/time_between_train_steps": 0.005310535430908203, "step": 240}
{"info/global_step": 241, "train_info/time_within_train_step": 27.70771098136902, "step": 241}
{"train_info/time_between_train_steps": 0.005216360092163086, "step": 241}
{"info/global_step": 242, "train_info/time_within_train_step": 27.73019790649414, "step": 242}
{"train_info/time_between_train_steps": 0.006548166275024414, "step": 242}
{"info/global_step": 243, "train_info/time_within_train_step": 27.85103678703308, "step": 243}
{"train_info/time_between_train_steps": 0.0058879852294921875, "step": 243}
{"train_info/time_between_train_steps": 30.14335298538208, "step": 243}
{"info/global_step": 244, "train_info/time_within_train_step": 27.721389770507812, "step": 244}
{"train_info/time_between_train_steps": 0.00519561767578125, "step": 244}
{"info/global_step": 245, "train_info/time_within_train_step": 27.84705901145935, "step": 245}
{"train_info/time_between_train_steps": 0.005219459533691406, "step": 245}
{"info/global_step": 246, "train_info/time_within_train_step": 27.716986894607544, "step": 246}
{"train_info/time_between_train_steps": 0.005453824996948242, "step": 246}
{"info/global_step": 247, "train_info/time_within_train_step": 27.855106115341187, "step": 247}
{"train_info/time_between_train_steps": 0.005281925201416016, "step": 247}
{"info/global_step": 248, "train_info/time_within_train_step": 27.70311999320984, "step": 248}
{"train_info/time_between_train_steps": 0.005381584167480469, "step": 248}
{"info/global_step": 249, "train_info/time_within_train_step": 27.891501903533936, "step": 249}
{"train_info/time_between_train_steps": 0.005697965621948242, "step": 249}
{"info/global_step": 250, "train_info/time_within_train_step": 27.70957350730896, "step": 250}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740831443, "_runtime": 7392}, "step": 250}
{"logs": {"train/loss": 4.7748, "train/learning_rate": 0.0005277777777777777, "train/epoch": 9.01, "_timestamp": 1740831443, "_runtime": 7392}, "step": 250}
{"train_info/time_between_train_steps": 0.02661919593811035, "step": 250}
{"info/global_step": 251, "train_info/time_within_train_step": 27.847467184066772, "step": 251}
{"train_info/time_between_train_steps": 0.005439043045043945, "step": 251}
{"info/global_step": 252, "train_info/time_within_train_step": 27.71045708656311, "step": 252}
{"train_info/time_between_train_steps": 0.005213260650634766, "step": 252}
{"info/global_step": 253, "train_info/time_within_train_step": 29.836015939712524, "step": 253}
{"train_info/time_between_train_steps": 0.005486726760864258, "step": 253}
{"info/global_step": 254, "train_info/time_within_train_step": 27.832483768463135, "step": 254}
{"train_info/time_between_train_steps": 0.005151987075805664, "step": 254}
{"info/global_step": 255, "train_info/time_within_train_step": 27.71641707420349, "step": 255}
{"train_info/time_between_train_steps": 0.005892038345336914, "step": 255}
{"info/global_step": 256, "train_info/time_within_train_step": 27.705476999282837, "step": 256}
{"train_info/time_between_train_steps": 0.005370616912841797, "step": 256}
{"info/global_step": 257, "train_info/time_within_train_step": 27.828298330307007, "step": 257}
{"train_info/time_between_train_steps": 0.004931211471557617, "step": 257}
{"info/global_step": 258, "train_info/time_within_train_step": 27.723498344421387, "step": 258}
{"train_info/time_between_train_steps": 0.005083560943603516, "step": 258}
{"info/global_step": 259, "train_info/time_within_train_step": 27.687702894210815, "step": 259}
{"train_info/time_between_train_steps": 0.005162715911865234, "step": 259}
{"info/global_step": 260, "train_info/time_within_train_step": 27.704142808914185, "step": 260}
{"train_info/time_between_train_steps": 0.00501704216003418, "step": 260}
{"info/global_step": 261, "train_info/time_within_train_step": 27.717151641845703, "step": 261}
{"train_info/time_between_train_steps": 0.0050334930419921875, "step": 261}
{"info/global_step": 262, "train_info/time_within_train_step": 27.7015438079834, "step": 262}
{"train_info/time_between_train_steps": 0.005017995834350586, "step": 262}
{"info/global_step": 263, "train_info/time_within_train_step": 27.689342975616455, "step": 263}
{"train_info/time_between_train_steps": 0.005089282989501953, "step": 263}
{"info/global_step": 264, "train_info/time_within_train_step": 27.713035345077515, "step": 264}
{"train_info/time_between_train_steps": 0.006147861480712891, "step": 264}
{"info/global_step": 265, "train_info/time_within_train_step": 27.69876527786255, "step": 265}
{"train_info/time_between_train_steps": 0.004920244216918945, "step": 265}
{"info/global_step": 266, "train_info/time_within_train_step": 27.707741498947144, "step": 266}
{"train_info/time_between_train_steps": 0.008828878402709961, "step": 266}
{"info/global_step": 267, "train_info/time_within_train_step": 27.687307596206665, "step": 267}
{"train_info/time_between_train_steps": 0.005110979080200195, "step": 267}
{"info/global_step": 268, "train_info/time_within_train_step": 27.731905698776245, "step": 268}
{"train_info/time_between_train_steps": 0.00521087646484375, "step": 268}
{"info/global_step": 269, "train_info/time_within_train_step": 27.703439235687256, "step": 269}
{"train_info/time_between_train_steps": 0.005433082580566406, "step": 269}
{"info/global_step": 270, "train_info/time_within_train_step": 27.765674591064453, "step": 270}
{"train_info/time_between_train_steps": 0.00574946403503418, "step": 270}
{"train_info/time_between_train_steps": 29.745858192443848, "step": 270}
{"info/global_step": 271, "train_info/time_within_train_step": 27.683923721313477, "step": 271}
{"train_info/time_between_train_steps": 0.004957437515258789, "step": 271}
{"info/global_step": 272, "train_info/time_within_train_step": 27.88573384284973, "step": 272}
{"train_info/time_between_train_steps": 0.004858732223510742, "step": 272}
{"info/global_step": 273, "train_info/time_within_train_step": 27.728705406188965, "step": 273}
{"train_info/time_between_train_steps": 0.0056209564208984375, "step": 273}
{"info/global_step": 274, "train_info/time_within_train_step": 27.870072603225708, "step": 274}
{"train_info/time_between_train_steps": 0.005419015884399414, "step": 274}
{"info/global_step": 275, "train_info/time_within_train_step": 27.69218134880066, "step": 275}
{"train_info/time_between_train_steps": 0.00735783576965332, "step": 275}
{"info/global_step": 276, "train_info/time_within_train_step": 27.89175772666931, "step": 276}
{"train_info/time_between_train_steps": 0.005269289016723633, "step": 276}
{"info/global_step": 277, "train_info/time_within_train_step": 27.698303699493408, "step": 277}
{"train_info/time_between_train_steps": 0.0051763057708740234, "step": 277}
{"info/global_step": 278, "train_info/time_within_train_step": 27.824692487716675, "step": 278}
{"train_info/time_between_train_steps": 0.0052318572998046875, "step": 278}
{"info/global_step": 279, "train_info/time_within_train_step": 27.711709022521973, "step": 279}
{"train_info/time_between_train_steps": 0.004962921142578125, "step": 279}
{"info/global_step": 280, "train_info/time_within_train_step": 27.71587610244751, "step": 280}
{"train_info/time_between_train_steps": 0.004960060119628906, "step": 280}
{"info/global_step": 281, "train_info/time_within_train_step": 27.697986602783203, "step": 281}
{"train_info/time_between_train_steps": 0.005327701568603516, "step": 281}
{"info/global_step": 282, "train_info/time_within_train_step": 27.679179668426514, "step": 282}
{"train_info/time_between_train_steps": 0.0048828125, "step": 282}
{"info/global_step": 283, "train_info/time_within_train_step": 27.698227405548096, "step": 283}
{"train_info/time_between_train_steps": 0.005114078521728516, "step": 283}
{"info/global_step": 284, "train_info/time_within_train_step": 27.70395064353943, "step": 284}
{"train_info/time_between_train_steps": 0.0051729679107666016, "step": 284}
{"info/global_step": 285, "train_info/time_within_train_step": 27.726306438446045, "step": 285}
{"train_info/time_between_train_steps": 0.005076169967651367, "step": 285}
{"info/global_step": 286, "train_info/time_within_train_step": 27.708518266677856, "step": 286}
{"train_info/time_between_train_steps": 0.005265235900878906, "step": 286}
{"info/global_step": 287, "train_info/time_within_train_step": 27.73025870323181, "step": 287}
{"train_info/time_between_train_steps": 0.005002737045288086, "step": 287}
{"info/global_step": 288, "train_info/time_within_train_step": 27.767294883728027, "step": 288}
{"train_info/time_between_train_steps": 0.004942893981933594, "step": 288}
{"info/global_step": 289, "train_info/time_within_train_step": 27.74757146835327, "step": 289}
{"train_info/time_between_train_steps": 0.00530552864074707, "step": 289}
{"info/global_step": 290, "train_info/time_within_train_step": 27.677445650100708, "step": 290}
{"train_info/time_between_train_steps": 0.005026578903198242, "step": 290}
{"info/global_step": 291, "train_info/time_within_train_step": 27.738504886627197, "step": 291}
{"train_info/time_between_train_steps": 0.005297422409057617, "step": 291}
{"info/global_step": 292, "train_info/time_within_train_step": 27.70669913291931, "step": 292}
{"train_info/time_between_train_steps": 0.005061149597167969, "step": 292}
{"info/global_step": 293, "train_info/time_within_train_step": 27.69928479194641, "step": 293}
{"train_info/time_between_train_steps": 0.005146980285644531, "step": 293}
{"info/global_step": 294, "train_info/time_within_train_step": 27.694706439971924, "step": 294}
{"train_info/time_between_train_steps": 0.005213022232055664, "step": 294}
{"info/global_step": 295, "train_info/time_within_train_step": 27.691195726394653, "step": 295}
{"train_info/time_between_train_steps": 0.004995822906494141, "step": 295}
{"info/global_step": 296, "train_info/time_within_train_step": 27.715235948562622, "step": 296}
{"train_info/time_between_train_steps": 0.0054247379302978516, "step": 296}
{"info/global_step": 297, "train_info/time_within_train_step": 27.718720197677612, "step": 297}
{"train_info/time_between_train_steps": 0.005729198455810547, "step": 297}
{"train_info/time_between_train_steps": 29.892987728118896, "step": 297}
{"info/global_step": 298, "train_info/time_within_train_step": 27.709092378616333, "step": 298}
{"train_info/time_between_train_steps": 0.005079030990600586, "step": 298}
{"info/global_step": 299, "train_info/time_within_train_step": 27.81121563911438, "step": 299}
{"train_info/time_between_train_steps": 0.005123138427734375, "step": 299}
{"info/global_step": 300, "train_info/time_within_train_step": 27.723816394805908, "step": 300}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740832893, "_runtime": 8842}, "step": 300}
{"logs": {"train/loss": 4.6113, "train/learning_rate": 0.0005, "train/epoch": 11.0, "_timestamp": 1740832893, "_runtime": 8842}, "step": 300}
{"train_info/time_between_train_steps": 68.72886753082275, "step": 300}
{"info/global_step": 301, "train_info/time_within_train_step": 27.944496393203735, "step": 301}
{"train_info/time_between_train_steps": 0.005503416061401367, "step": 301}
{"info/global_step": 302, "train_info/time_within_train_step": 27.813271284103394, "step": 302}
{"train_info/time_between_train_steps": 0.010621070861816406, "step": 302}
{"info/global_step": 303, "train_info/time_within_train_step": 27.879083156585693, "step": 303}
{"train_info/time_between_train_steps": 0.005305767059326172, "step": 303}
{"info/global_step": 304, "train_info/time_within_train_step": 27.70069146156311, "step": 304}
{"train_info/time_between_train_steps": 0.01583242416381836, "step": 304}
{"info/global_step": 305, "train_info/time_within_train_step": 27.783106327056885, "step": 305}
{"train_info/time_between_train_steps": 0.005769252777099609, "step": 305}
{"info/global_step": 306, "train_info/time_within_train_step": 27.71502161026001, "step": 306}
{"train_info/time_between_train_steps": 0.004978656768798828, "step": 306}
{"info/global_step": 307, "train_info/time_within_train_step": 27.74606704711914, "step": 307}
{"train_info/time_between_train_steps": 0.005297422409057617, "step": 307}
{"info/global_step": 308, "train_info/time_within_train_step": 27.677711725234985, "step": 308}
{"train_info/time_between_train_steps": 0.004990577697753906, "step": 308}
{"info/global_step": 309, "train_info/time_within_train_step": 27.717071294784546, "step": 309}
{"train_info/time_between_train_steps": 0.004876375198364258, "step": 309}
{"info/global_step": 310, "train_info/time_within_train_step": 27.719885110855103, "step": 310}
{"train_info/time_between_train_steps": 0.0050923824310302734, "step": 310}
{"info/global_step": 311, "train_info/time_within_train_step": 27.713855504989624, "step": 311}
{"train_info/time_between_train_steps": 0.004925966262817383, "step": 311}
{"info/global_step": 312, "train_info/time_within_train_step": 27.71424150466919, "step": 312}
{"train_info/time_between_train_steps": 0.005113124847412109, "step": 312}
{"info/global_step": 313, "train_info/time_within_train_step": 27.703622817993164, "step": 313}
{"train_info/time_between_train_steps": 0.005049467086791992, "step": 313}
{"info/global_step": 314, "train_info/time_within_train_step": 27.70532727241516, "step": 314}
{"train_info/time_between_train_steps": 0.00533604621887207, "step": 314}
{"info/global_step": 315, "train_info/time_within_train_step": 27.696733474731445, "step": 315}
{"train_info/time_between_train_steps": 0.005115032196044922, "step": 315}
{"info/global_step": 316, "train_info/time_within_train_step": 27.699946641921997, "step": 316}
{"train_info/time_between_train_steps": 0.005320072174072266, "step": 316}
{"info/global_step": 317, "train_info/time_within_train_step": 27.69359016418457, "step": 317}
{"train_info/time_between_train_steps": 0.004960536956787109, "step": 317}
{"info/global_step": 318, "train_info/time_within_train_step": 27.81396985054016, "step": 318}
{"train_info/time_between_train_steps": 0.0049517154693603516, "step": 318}
{"info/global_step": 319, "train_info/time_within_train_step": 27.697635889053345, "step": 319}
{"train_info/time_between_train_steps": 0.005113363265991211, "step": 319}
{"info/global_step": 320, "train_info/time_within_train_step": 27.70133948326111, "step": 320}
{"train_info/time_between_train_steps": 0.005296468734741211, "step": 320}
{"info/global_step": 321, "train_info/time_within_train_step": 27.710905075073242, "step": 321}
{"train_info/time_between_train_steps": 0.005137920379638672, "step": 321}
{"info/global_step": 322, "train_info/time_within_train_step": 27.705875873565674, "step": 322}
{"train_info/time_between_train_steps": 0.00514531135559082, "step": 322}
{"info/global_step": 323, "train_info/time_within_train_step": 27.716498613357544, "step": 323}
{"train_info/time_between_train_steps": 0.005134105682373047, "step": 323}
{"info/global_step": 324, "train_info/time_within_train_step": 27.70203924179077, "step": 324}
{"train_info/time_between_train_steps": 0.005556344985961914, "step": 324}
{"train_info/time_between_train_steps": 29.971785306930542, "step": 324}
{"info/global_step": 325, "train_info/time_within_train_step": 27.70545268058777, "step": 325}
{"train_info/time_between_train_steps": 0.004975795745849609, "step": 325}
{"info/global_step": 326, "train_info/time_within_train_step": 27.814971685409546, "step": 326}
{"train_info/time_between_train_steps": 0.004874467849731445, "step": 326}
{"info/global_step": 327, "train_info/time_within_train_step": 27.703237295150757, "step": 327}
{"train_info/time_between_train_steps": 0.004938602447509766, "step": 327}
{"info/global_step": 328, "train_info/time_within_train_step": 27.84750533103943, "step": 328}
{"train_info/time_between_train_steps": 0.00495457649230957, "step": 328}
{"info/global_step": 329, "train_info/time_within_train_step": 27.683165311813354, "step": 329}
{"train_info/time_between_train_steps": 0.005002021789550781, "step": 329}
{"info/global_step": 330, "train_info/time_within_train_step": 27.81504535675049, "step": 330}
{"train_info/time_between_train_steps": 0.004901885986328125, "step": 330}
{"info/global_step": 331, "train_info/time_within_train_step": 27.69839119911194, "step": 331}
{"train_info/time_between_train_steps": 0.005086183547973633, "step": 331}
{"info/global_step": 332, "train_info/time_within_train_step": 27.80078625679016, "step": 332}
{"train_info/time_between_train_steps": 0.005413532257080078, "step": 332}
{"info/global_step": 333, "train_info/time_within_train_step": 27.796300411224365, "step": 333}
{"train_info/time_between_train_steps": 0.004987955093383789, "step": 333}
{"info/global_step": 334, "train_info/time_within_train_step": 27.694554567337036, "step": 334}
{"train_info/time_between_train_steps": 0.0052297115325927734, "step": 334}
{"info/global_step": 335, "train_info/time_within_train_step": 27.686922788619995, "step": 335}
{"train_info/time_between_train_steps": 0.005709171295166016, "step": 335}
{"info/global_step": 336, "train_info/time_within_train_step": 27.73978614807129, "step": 336}
{"train_info/time_between_train_steps": 0.0048787593841552734, "step": 336}
{"info/global_step": 337, "train_info/time_within_train_step": 27.69904375076294, "step": 337}
{"train_info/time_between_train_steps": 0.0048007965087890625, "step": 337}
{"info/global_step": 338, "train_info/time_within_train_step": 27.742437839508057, "step": 338}
{"train_info/time_between_train_steps": 0.005023002624511719, "step": 338}
{"info/global_step": 339, "train_info/time_within_train_step": 27.69900155067444, "step": 339}
{"train_info/time_between_train_steps": 0.005210399627685547, "step": 339}
{"info/global_step": 340, "train_info/time_within_train_step": 27.696231842041016, "step": 340}
{"train_info/time_between_train_steps": 0.005199909210205078, "step": 340}
{"info/global_step": 341, "train_info/time_within_train_step": 27.692163467407227, "step": 341}
{"train_info/time_between_train_steps": 0.005689859390258789, "step": 341}
{"info/global_step": 342, "train_info/time_within_train_step": 27.700796842575073, "step": 342}
{"train_info/time_between_train_steps": 0.005124092102050781, "step": 342}
{"info/global_step": 343, "train_info/time_within_train_step": 27.699374437332153, "step": 343}
{"train_info/time_between_train_steps": 0.0051670074462890625, "step": 343}
{"info/global_step": 344, "train_info/time_within_train_step": 27.68837547302246, "step": 344}
{"train_info/time_between_train_steps": 0.00490260124206543, "step": 344}
{"info/global_step": 345, "train_info/time_within_train_step": 27.686238050460815, "step": 345}
{"train_info/time_between_train_steps": 0.00590205192565918, "step": 345}
{"info/global_step": 346, "train_info/time_within_train_step": 27.71175789833069, "step": 346}
{"train_info/time_between_train_steps": 0.005026340484619141, "step": 346}
{"info/global_step": 347, "train_info/time_within_train_step": 27.73295569419861, "step": 347}
{"train_info/time_between_train_steps": 0.004974365234375, "step": 347}
{"info/global_step": 348, "train_info/time_within_train_step": 27.833566188812256, "step": 348}
{"train_info/time_between_train_steps": 0.005349636077880859, "step": 348}
{"info/global_step": 349, "train_info/time_within_train_step": 29.259286642074585, "step": 349}
{"train_info/time_between_train_steps": 0.005425691604614258, "step": 349}
{"info/global_step": 350, "train_info/time_within_train_step": 27.82205080986023, "step": 350}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740834382, "_runtime": 10331}, "step": 350}
{"logs": {"train/loss": 4.3301, "train/learning_rate": 0.00047222222222222224, "train/epoch": 12.02, "_timestamp": 1740834382, "_runtime": 10331}, "step": 350}
{"train_info/time_between_train_steps": 0.026610851287841797, "step": 350}
{"info/global_step": 351, "train_info/time_within_train_step": 27.718280792236328, "step": 351}
{"train_info/time_between_train_steps": 0.0063915252685546875, "step": 351}
{"train_info/time_between_train_steps": 30.16409707069397, "step": 351}
{"info/global_step": 352, "train_info/time_within_train_step": 27.75032377243042, "step": 352}
{"train_info/time_between_train_steps": 0.004950761795043945, "step": 352}
{"info/global_step": 353, "train_info/time_within_train_step": 27.801109313964844, "step": 353}
{"train_info/time_between_train_steps": 0.0049304962158203125, "step": 353}
{"info/global_step": 354, "train_info/time_within_train_step": 27.696782112121582, "step": 354}
{"train_info/time_between_train_steps": 0.005049228668212891, "step": 354}
{"info/global_step": 355, "train_info/time_within_train_step": 27.79987621307373, "step": 355}
{"train_info/time_between_train_steps": 0.00496220588684082, "step": 355}
{"info/global_step": 356, "train_info/time_within_train_step": 27.69485068321228, "step": 356}
{"train_info/time_between_train_steps": 0.00516200065612793, "step": 356}
{"info/global_step": 357, "train_info/time_within_train_step": 27.89965844154358, "step": 357}
{"train_info/time_between_train_steps": 0.005285978317260742, "step": 357}
{"info/global_step": 358, "train_info/time_within_train_step": 27.718451023101807, "step": 358}
{"train_info/time_between_train_steps": 0.005517482757568359, "step": 358}
{"info/global_step": 359, "train_info/time_within_train_step": 27.808380842208862, "step": 359}
{"train_info/time_between_train_steps": 0.0053827762603759766, "step": 359}
{"info/global_step": 360, "train_info/time_within_train_step": 27.703009366989136, "step": 360}
{"train_info/time_between_train_steps": 0.004916667938232422, "step": 360}
{"info/global_step": 361, "train_info/time_within_train_step": 27.688544988632202, "step": 361}
{"train_info/time_between_train_steps": 0.005113840103149414, "step": 361}
{"info/global_step": 362, "train_info/time_within_train_step": 27.682151317596436, "step": 362}
{"train_info/time_between_train_steps": 0.005080461502075195, "step": 362}
{"info/global_step": 363, "train_info/time_within_train_step": 27.800988912582397, "step": 363}
{"train_info/time_between_train_steps": 0.005213499069213867, "step": 363}
{"info/global_step": 364, "train_info/time_within_train_step": 27.691623210906982, "step": 364}
{"train_info/time_between_train_steps": 0.005220890045166016, "step": 364}
{"info/global_step": 365, "train_info/time_within_train_step": 27.70055913925171, "step": 365}
{"train_info/time_between_train_steps": 0.00501704216003418, "step": 365}
{"info/global_step": 366, "train_info/time_within_train_step": 27.707960605621338, "step": 366}
{"train_info/time_between_train_steps": 0.005042314529418945, "step": 366}
{"info/global_step": 367, "train_info/time_within_train_step": 27.704532146453857, "step": 367}
{"train_info/time_between_train_steps": 0.005196809768676758, "step": 367}
{"info/global_step": 368, "train_info/time_within_train_step": 27.72313117980957, "step": 368}
{"train_info/time_between_train_steps": 0.00502324104309082, "step": 368}
{"info/global_step": 369, "train_info/time_within_train_step": 27.70803952217102, "step": 369}
{"train_info/time_between_train_steps": 0.004953622817993164, "step": 369}
{"info/global_step": 370, "train_info/time_within_train_step": 27.73861837387085, "step": 370}
{"train_info/time_between_train_steps": 0.006087064743041992, "step": 370}
{"info/global_step": 371, "train_info/time_within_train_step": 27.729703664779663, "step": 371}
{"train_info/time_between_train_steps": 0.005898714065551758, "step": 371}
{"info/global_step": 372, "train_info/time_within_train_step": 27.71752953529358, "step": 372}
{"train_info/time_between_train_steps": 0.005046367645263672, "step": 372}
{"info/global_step": 373, "train_info/time_within_train_step": 27.712212562561035, "step": 373}
{"train_info/time_between_train_steps": 0.005193471908569336, "step": 373}
{"info/global_step": 374, "train_info/time_within_train_step": 27.712870359420776, "step": 374}
{"train_info/time_between_train_steps": 0.005297422409057617, "step": 374}
{"info/global_step": 375, "train_info/time_within_train_step": 27.71082353591919, "step": 375}
{"train_info/time_between_train_steps": 0.0052602291107177734, "step": 375}
{"info/global_step": 376, "train_info/time_within_train_step": 27.699671030044556, "step": 376}
{"train_info/time_between_train_steps": 0.0050601959228515625, "step": 376}
{"info/global_step": 377, "train_info/time_within_train_step": 27.699132919311523, "step": 377}
{"train_info/time_between_train_steps": 0.006150484085083008, "step": 377}
{"info/global_step": 378, "train_info/time_within_train_step": 27.721951484680176, "step": 378}
{"train_info/time_between_train_steps": 0.005815267562866211, "step": 378}
{"train_info/time_between_train_steps": 29.89716386795044, "step": 378}
{"info/global_step": 379, "train_info/time_within_train_step": 27.68725824356079, "step": 379}
{"train_info/time_between_train_steps": 0.0048291683197021484, "step": 379}
{"info/global_step": 380, "train_info/time_within_train_step": 27.79752826690674, "step": 380}
{"train_info/time_between_train_steps": 0.005009889602661133, "step": 380}
{"info/global_step": 381, "train_info/time_within_train_step": 27.708723306655884, "step": 381}
{"train_info/time_between_train_steps": 0.00506281852722168, "step": 381}
{"info/global_step": 382, "train_info/time_within_train_step": 27.801533699035645, "step": 382}
{"train_info/time_between_train_steps": 0.00487828254699707, "step": 382}
{"info/global_step": 383, "train_info/time_within_train_step": 27.722710609436035, "step": 383}
{"train_info/time_between_train_steps": 0.0052335262298583984, "step": 383}
{"info/global_step": 384, "train_info/time_within_train_step": 27.891085147857666, "step": 384}
{"train_info/time_between_train_steps": 0.0052242279052734375, "step": 384}
{"info/global_step": 385, "train_info/time_within_train_step": 27.713855266571045, "step": 385}
{"train_info/time_between_train_steps": 0.005141019821166992, "step": 385}
{"info/global_step": 386, "train_info/time_within_train_step": 27.738038301467896, "step": 386}
{"train_info/time_between_train_steps": 0.00527644157409668, "step": 386}
{"info/global_step": 387, "train_info/time_within_train_step": 27.723580837249756, "step": 387}
{"train_info/time_between_train_steps": 0.004835367202758789, "step": 387}
{"info/global_step": 388, "train_info/time_within_train_step": 27.735204219818115, "step": 388}
{"train_info/time_between_train_steps": 0.004822731018066406, "step": 388}
{"info/global_step": 389, "train_info/time_within_train_step": 27.68376588821411, "step": 389}
{"train_info/time_between_train_steps": 0.004823446273803711, "step": 389}
{"info/global_step": 390, "train_info/time_within_train_step": 27.739256143569946, "step": 390}
{"train_info/time_between_train_steps": 0.004739522933959961, "step": 390}
{"info/global_step": 391, "train_info/time_within_train_step": 27.68847346305847, "step": 391}
{"train_info/time_between_train_steps": 0.004811525344848633, "step": 391}
{"info/global_step": 392, "train_info/time_within_train_step": 27.68512463569641, "step": 392}
{"train_info/time_between_train_steps": 0.005121469497680664, "step": 392}
{"info/global_step": 393, "train_info/time_within_train_step": 27.787583827972412, "step": 393}
{"train_info/time_between_train_steps": 0.005105018615722656, "step": 393}
{"info/global_step": 394, "train_info/time_within_train_step": 27.69494938850403, "step": 394}
{"train_info/time_between_train_steps": 0.005059242248535156, "step": 394}
{"info/global_step": 395, "train_info/time_within_train_step": 27.697033643722534, "step": 395}
{"train_info/time_between_train_steps": 0.005006074905395508, "step": 395}
{"info/global_step": 396, "train_info/time_within_train_step": 27.71225643157959, "step": 396}
{"train_info/time_between_train_steps": 0.004931926727294922, "step": 396}
{"info/global_step": 397, "train_info/time_within_train_step": 27.698719263076782, "step": 397}
{"train_info/time_between_train_steps": 0.004930257797241211, "step": 397}
{"info/global_step": 398, "train_info/time_within_train_step": 27.686323642730713, "step": 398}
{"train_info/time_between_train_steps": 0.005032539367675781, "step": 398}
{"info/global_step": 399, "train_info/time_within_train_step": 27.68223547935486, "step": 399}
{"train_info/time_between_train_steps": 0.0049402713775634766, "step": 399}
{"info/global_step": 400, "train_info/time_within_train_step": 27.704569101333618, "step": 400}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740835830, "_runtime": 11779}, "step": 400}
{"logs": {"train/loss": 4.2208, "train/learning_rate": 0.00044444444444444436, "train/epoch": 14.02, "_timestamp": 1740835830, "_runtime": 11779}, "step": 400}
{"train_info/time_between_train_steps": 65.49763083457947, "step": 400}
{"info/global_step": 401, "train_info/time_within_train_step": 27.777589797973633, "step": 401}
{"train_info/time_between_train_steps": 0.0053861141204833984, "step": 401}
{"info/global_step": 402, "train_info/time_within_train_step": 27.715510845184326, "step": 402}
{"train_info/time_between_train_steps": 0.0052144527435302734, "step": 402}
{"info/global_step": 403, "train_info/time_within_train_step": 27.715824604034424, "step": 403}
{"train_info/time_between_train_steps": 0.005365848541259766, "step": 403}
{"info/global_step": 404, "train_info/time_within_train_step": 27.718252897262573, "step": 404}
{"train_info/time_between_train_steps": 0.0054471492767333984, "step": 404}
{"info/global_step": 405, "train_info/time_within_train_step": 27.75610899925232, "step": 405}
{"train_info/time_between_train_steps": 0.006641864776611328, "step": 405}
{"train_info/time_between_train_steps": 30.19359016418457, "step": 405}
{"info/global_step": 406, "train_info/time_within_train_step": 27.724653482437134, "step": 406}
{"train_info/time_between_train_steps": 0.0060842037200927734, "step": 406}
{"info/global_step": 407, "train_info/time_within_train_step": 27.84691572189331, "step": 407}
{"train_info/time_between_train_steps": 0.0049779415130615234, "step": 407}
{"info/global_step": 408, "train_info/time_within_train_step": 27.826810598373413, "step": 408}
{"train_info/time_between_train_steps": 0.005158662796020508, "step": 408}
{"info/global_step": 409, "train_info/time_within_train_step": 27.82830834388733, "step": 409}
{"train_info/time_between_train_steps": 0.006407976150512695, "step": 409}
{"info/global_step": 410, "train_info/time_within_train_step": 27.71260714530945, "step": 410}
{"train_info/time_between_train_steps": 0.005293846130371094, "step": 410}
{"info/global_step": 411, "train_info/time_within_train_step": 27.847822904586792, "step": 411}
{"train_info/time_between_train_steps": 0.0050716400146484375, "step": 411}
{"info/global_step": 412, "train_info/time_within_train_step": 27.70905613899231, "step": 412}
{"train_info/time_between_train_steps": 0.0051572322845458984, "step": 412}
{"info/global_step": 413, "train_info/time_within_train_step": 27.758363723754883, "step": 413}
{"train_info/time_between_train_steps": 0.005182504653930664, "step": 413}
{"info/global_step": 414, "train_info/time_within_train_step": 27.706284999847412, "step": 414}
{"train_info/time_between_train_steps": 0.005072832107543945, "step": 414}
{"info/global_step": 415, "train_info/time_within_train_step": 27.75137162208557, "step": 415}
{"train_info/time_between_train_steps": 0.0049936771392822266, "step": 415}
{"info/global_step": 416, "train_info/time_within_train_step": 27.705172777175903, "step": 416}
{"train_info/time_between_train_steps": 0.0048673152923583984, "step": 416}
{"info/global_step": 417, "train_info/time_within_train_step": 27.67977213859558, "step": 417}
{"train_info/time_between_train_steps": 0.006400346755981445, "step": 417}
{"info/global_step": 418, "train_info/time_within_train_step": 27.70727276802063, "step": 418}
{"train_info/time_between_train_steps": 0.005223512649536133, "step": 418}
{"info/global_step": 419, "train_info/time_within_train_step": 27.700334548950195, "step": 419}
{"train_info/time_between_train_steps": 0.0051424503326416016, "step": 419}
{"info/global_step": 420, "train_info/time_within_train_step": 27.692026138305664, "step": 420}
{"train_info/time_between_train_steps": 0.004917621612548828, "step": 420}
{"info/global_step": 421, "train_info/time_within_train_step": 27.69590401649475, "step": 421}
{"train_info/time_between_train_steps": 0.0050792694091796875, "step": 421}
{"info/global_step": 422, "train_info/time_within_train_step": 27.700926065444946, "step": 422}
{"train_info/time_between_train_steps": 0.00507354736328125, "step": 422}
{"info/global_step": 423, "train_info/time_within_train_step": 27.79981303215027, "step": 423}
{"train_info/time_between_train_steps": 0.005093574523925781, "step": 423}
{"info/global_step": 424, "train_info/time_within_train_step": 27.758687257766724, "step": 424}
{"train_info/time_between_train_steps": 0.0050466060638427734, "step": 424}
{"info/global_step": 425, "train_info/time_within_train_step": 27.749645948410034, "step": 425}
{"train_info/time_between_train_steps": 0.005060911178588867, "step": 425}
{"info/global_step": 426, "train_info/time_within_train_step": 27.69817852973938, "step": 426}
{"train_info/time_between_train_steps": 0.005190134048461914, "step": 426}
{"info/global_step": 427, "train_info/time_within_train_step": 27.70855951309204, "step": 427}
{"train_info/time_between_train_steps": 0.005096912384033203, "step": 427}
{"info/global_step": 428, "train_info/time_within_train_step": 27.706968545913696, "step": 428}
{"train_info/time_between_train_steps": 0.005213737487792969, "step": 428}
{"info/global_step": 429, "train_info/time_within_train_step": 27.702224731445312, "step": 429}
{"train_info/time_between_train_steps": 0.0052144527435302734, "step": 429}
{"info/global_step": 430, "train_info/time_within_train_step": 27.693960666656494, "step": 430}
{"train_info/time_between_train_steps": 0.0050580501556396484, "step": 430}
{"info/global_step": 431, "train_info/time_within_train_step": 27.7053120136261, "step": 431}
{"train_info/time_between_train_steps": 0.005528926849365234, "step": 431}
{"info/global_step": 432, "train_info/time_within_train_step": 27.731310606002808, "step": 432}
{"train_info/time_between_train_steps": 0.005760908126831055, "step": 432}
{"train_info/time_between_train_steps": 30.011183500289917, "step": 432}
{"info/global_step": 433, "train_info/time_within_train_step": 27.687133073806763, "step": 433}
{"train_info/time_between_train_steps": 0.005784034729003906, "step": 433}
{"info/global_step": 434, "train_info/time_within_train_step": 27.78863286972046, "step": 434}
{"train_info/time_between_train_steps": 0.0049784183502197266, "step": 434}
{"info/global_step": 435, "train_info/time_within_train_step": 27.70439052581787, "step": 435}
{"train_info/time_between_train_steps": 0.0050051212310791016, "step": 435}
{"info/global_step": 436, "train_info/time_within_train_step": 27.87604570388794, "step": 436}
{"train_info/time_between_train_steps": 0.005239248275756836, "step": 436}
{"info/global_step": 437, "train_info/time_within_train_step": 27.721327304840088, "step": 437}
{"train_info/time_between_train_steps": 0.00516200065612793, "step": 437}
{"info/global_step": 438, "train_info/time_within_train_step": 27.966629028320312, "step": 438}
{"train_info/time_between_train_steps": 0.005241870880126953, "step": 438}
{"info/global_step": 439, "train_info/time_within_train_step": 27.712815284729004, "step": 439}
{"train_info/time_between_train_steps": 0.005032539367675781, "step": 439}
{"info/global_step": 440, "train_info/time_within_train_step": 27.811208486557007, "step": 440}
{"train_info/time_between_train_steps": 0.005095958709716797, "step": 440}
{"info/global_step": 441, "train_info/time_within_train_step": 27.708343982696533, "step": 441}
{"train_info/time_between_train_steps": 0.004823923110961914, "step": 441}
{"info/global_step": 442, "train_info/time_within_train_step": 27.750231981277466, "step": 442}
{"train_info/time_between_train_steps": 0.018458127975463867, "step": 442}
{"info/global_step": 443, "train_info/time_within_train_step": 27.683879375457764, "step": 443}
{"train_info/time_between_train_steps": 0.0050656795501708984, "step": 443}
{"info/global_step": 444, "train_info/time_within_train_step": 29.24922800064087, "step": 444}
{"train_info/time_between_train_steps": 0.004964113235473633, "step": 444}
{"info/global_step": 445, "train_info/time_within_train_step": 27.76553773880005, "step": 445}
{"train_info/time_between_train_steps": 0.005015373229980469, "step": 445}
{"info/global_step": 446, "train_info/time_within_train_step": 27.73563504219055, "step": 446}
{"train_info/time_between_train_steps": 0.004942655563354492, "step": 446}
{"info/global_step": 447, "train_info/time_within_train_step": 27.6950044631958, "step": 447}
{"train_info/time_between_train_steps": 0.004893302917480469, "step": 447}
{"info/global_step": 448, "train_info/time_within_train_step": 27.699372053146362, "step": 448}
{"train_info/time_between_train_steps": 0.004933357238769531, "step": 448}
{"info/global_step": 449, "train_info/time_within_train_step": 27.707264184951782, "step": 449}
{"train_info/time_between_train_steps": 0.0060825347900390625, "step": 449}
{"info/global_step": 450, "train_info/time_within_train_step": 27.698795557022095, "step": 450}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740837347, "_runtime": 13296}, "step": 450}
{"logs": {"train/loss": 4.0675, "train/learning_rate": 0.00041666666666666664, "train/epoch": 16.02, "_timestamp": 1740837347, "_runtime": 13296}, "step": 450}
{"train_info/time_between_train_steps": 0.02537989616394043, "step": 450}
{"info/global_step": 451, "train_info/time_within_train_step": 27.69651222229004, "step": 451}
{"train_info/time_between_train_steps": 0.004915714263916016, "step": 451}
{"info/global_step": 452, "train_info/time_within_train_step": 27.699123859405518, "step": 452}
{"train_info/time_between_train_steps": 0.0050487518310546875, "step": 452}
{"info/global_step": 453, "train_info/time_within_train_step": 27.716983318328857, "step": 453}
{"train_info/time_between_train_steps": 0.004937648773193359, "step": 453}
{"info/global_step": 454, "train_info/time_within_train_step": 27.78393054008484, "step": 454}
{"train_info/time_between_train_steps": 0.004942893981933594, "step": 454}
{"info/global_step": 455, "train_info/time_within_train_step": 27.7157461643219, "step": 455}
{"train_info/time_between_train_steps": 0.009691953659057617, "step": 455}
{"info/global_step": 456, "train_info/time_within_train_step": 27.7082998752594, "step": 456}
{"train_info/time_between_train_steps": 0.009653568267822266, "step": 456}
{"info/global_step": 457, "train_info/time_within_train_step": 27.686444997787476, "step": 457}
{"train_info/time_between_train_steps": 0.008860588073730469, "step": 457}
{"info/global_step": 458, "train_info/time_within_train_step": 27.70262885093689, "step": 458}
{"train_info/time_between_train_steps": 0.0054280757904052734, "step": 458}
{"info/global_step": 459, "train_info/time_within_train_step": 27.73326849937439, "step": 459}
{"train_info/time_between_train_steps": 0.0060231685638427734, "step": 459}
{"train_info/time_between_train_steps": 29.680886268615723, "step": 459}
{"info/global_step": 460, "train_info/time_within_train_step": 27.70081377029419, "step": 460}
{"train_info/time_between_train_steps": 0.004883289337158203, "step": 460}
{"info/global_step": 461, "train_info/time_within_train_step": 27.82279086112976, "step": 461}
{"train_info/time_between_train_steps": 0.004965305328369141, "step": 461}
{"info/global_step": 462, "train_info/time_within_train_step": 27.67608880996704, "step": 462}
{"train_info/time_between_train_steps": 0.0050067901611328125, "step": 462}
{"info/global_step": 463, "train_info/time_within_train_step": 27.8287250995636, "step": 463}
{"train_info/time_between_train_steps": 0.004859447479248047, "step": 463}
{"info/global_step": 464, "train_info/time_within_train_step": 27.717490196228027, "step": 464}
{"train_info/time_between_train_steps": 0.005129814147949219, "step": 464}
{"info/global_step": 465, "train_info/time_within_train_step": 27.812546968460083, "step": 465}
{"train_info/time_between_train_steps": 0.0052373409271240234, "step": 465}
{"info/global_step": 466, "train_info/time_within_train_step": 27.700138807296753, "step": 466}
{"train_info/time_between_train_steps": 0.00538325309753418, "step": 466}
{"info/global_step": 467, "train_info/time_within_train_step": 27.776431798934937, "step": 467}
{"train_info/time_between_train_steps": 0.0051174163818359375, "step": 467}
{"info/global_step": 468, "train_info/time_within_train_step": 27.813345432281494, "step": 468}
{"train_info/time_between_train_steps": 0.005002021789550781, "step": 468}
{"info/global_step": 469, "train_info/time_within_train_step": 27.678297758102417, "step": 469}
{"train_info/time_between_train_steps": 0.004813194274902344, "step": 469}
{"info/global_step": 470, "train_info/time_within_train_step": 27.696513891220093, "step": 470}
{"train_info/time_between_train_steps": 0.005072355270385742, "step": 470}
{"info/global_step": 471, "train_info/time_within_train_step": 27.67917037010193, "step": 471}
{"train_info/time_between_train_steps": 0.004827022552490234, "step": 471}
{"info/global_step": 472, "train_info/time_within_train_step": 27.681620597839355, "step": 472}
{"train_info/time_between_train_steps": 0.004870891571044922, "step": 472}
{"info/global_step": 473, "train_info/time_within_train_step": 27.683671236038208, "step": 473}
{"train_info/time_between_train_steps": 0.00515437126159668, "step": 473}
{"info/global_step": 474, "train_info/time_within_train_step": 27.71831178665161, "step": 474}
{"train_info/time_between_train_steps": 0.013263702392578125, "step": 474}
{"info/global_step": 475, "train_info/time_within_train_step": 27.70002269744873, "step": 475}
{"train_info/time_between_train_steps": 0.005238771438598633, "step": 475}
{"info/global_step": 476, "train_info/time_within_train_step": 27.71768283843994, "step": 476}
{"train_info/time_between_train_steps": 0.0050048828125, "step": 476}
{"info/global_step": 477, "train_info/time_within_train_step": 27.703116178512573, "step": 477}
{"train_info/time_between_train_steps": 0.005093574523925781, "step": 477}
{"info/global_step": 478, "train_info/time_within_train_step": 27.704834461212158, "step": 478}
{"train_info/time_between_train_steps": 0.004998922348022461, "step": 478}
{"info/global_step": 479, "train_info/time_within_train_step": 27.68981170654297, "step": 479}
{"train_info/time_between_train_steps": 0.004964351654052734, "step": 479}
{"info/global_step": 480, "train_info/time_within_train_step": 27.743243932724, "step": 480}
{"train_info/time_between_train_steps": 0.005007266998291016, "step": 480}
{"info/global_step": 481, "train_info/time_within_train_step": 27.691340684890747, "step": 481}
{"train_info/time_between_train_steps": 0.005079746246337891, "step": 481}
{"info/global_step": 482, "train_info/time_within_train_step": 27.739471673965454, "step": 482}
{"train_info/time_between_train_steps": 0.00523066520690918, "step": 482}
{"info/global_step": 483, "train_info/time_within_train_step": 27.704129219055176, "step": 483}
{"train_info/time_between_train_steps": 0.0051233768463134766, "step": 483}
{"info/global_step": 484, "train_info/time_within_train_step": 27.82376503944397, "step": 484}
{"train_info/time_between_train_steps": 0.005006313323974609, "step": 484}
{"info/global_step": 485, "train_info/time_within_train_step": 27.71829867362976, "step": 485}
{"train_info/time_between_train_steps": 0.0052585601806640625, "step": 485}
{"info/global_step": 486, "train_info/time_within_train_step": 27.73840022087097, "step": 486}
{"train_info/time_between_train_steps": 0.0056896209716796875, "step": 486}
{"train_info/time_between_train_steps": 29.915683031082153, "step": 486}
{"info/global_step": 487, "train_info/time_within_train_step": 27.691699743270874, "step": 487}
{"train_info/time_between_train_steps": 0.005095958709716797, "step": 487}
{"info/global_step": 488, "train_info/time_within_train_step": 27.855538368225098, "step": 488}
{"train_info/time_between_train_steps": 0.0050945281982421875, "step": 488}
{"info/global_step": 489, "train_info/time_within_train_step": 27.69971466064453, "step": 489}
{"train_info/time_between_train_steps": 0.005095243453979492, "step": 489}
{"info/global_step": 490, "train_info/time_within_train_step": 27.817004680633545, "step": 490}
{"train_info/time_between_train_steps": 0.005288839340209961, "step": 490}
{"info/global_step": 491, "train_info/time_within_train_step": 27.711607933044434, "step": 491}
{"train_info/time_between_train_steps": 0.005115985870361328, "step": 491}
{"info/global_step": 492, "train_info/time_within_train_step": 27.830391883850098, "step": 492}
{"train_info/time_between_train_steps": 0.005289316177368164, "step": 492}
{"info/global_step": 493, "train_info/time_within_train_step": 27.7207989692688, "step": 493}
{"train_info/time_between_train_steps": 0.005590915679931641, "step": 493}
{"info/global_step": 494, "train_info/time_within_train_step": 27.78736186027527, "step": 494}
{"train_info/time_between_train_steps": 0.005058765411376953, "step": 494}
{"info/global_step": 495, "train_info/time_within_train_step": 27.695293188095093, "step": 495}
{"train_info/time_between_train_steps": 0.004912137985229492, "step": 495}
{"info/global_step": 496, "train_info/time_within_train_step": 27.72775363922119, "step": 496}
{"train_info/time_between_train_steps": 0.004870891571044922, "step": 496}
{"info/global_step": 497, "train_info/time_within_train_step": 27.71324372291565, "step": 497}
{"train_info/time_between_train_steps": 0.004956960678100586, "step": 497}
{"info/global_step": 498, "train_info/time_within_train_step": 27.718392848968506, "step": 498}
{"train_info/time_between_train_steps": 0.0049381256103515625, "step": 498}
{"info/global_step": 499, "train_info/time_within_train_step": 27.786532163619995, "step": 499}
{"train_info/time_between_train_steps": 0.004997730255126953, "step": 499}
{"info/global_step": 500, "train_info/time_within_train_step": 28.196540355682373, "step": 500}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740838795, "_runtime": 14744}, "step": 500}
{"logs": {"train/loss": 3.936, "train/learning_rate": 0.00038888888888888887, "train/epoch": 18.01, "_timestamp": 1740838795, "_runtime": 14744}, "step": 500}
{"train_info/time_between_train_steps": 64.55442786216736, "step": 500}
{"info/global_step": 501, "train_info/time_within_train_step": 27.69785189628601, "step": 501}
{"train_info/time_between_train_steps": 0.004908323287963867, "step": 501}
{"info/global_step": 502, "train_info/time_within_train_step": 27.69355058670044, "step": 502}
{"train_info/time_between_train_steps": 0.0048902034759521484, "step": 502}
{"info/global_step": 503, "train_info/time_within_train_step": 27.72808003425598, "step": 503}
{"train_info/time_between_train_steps": 0.005031108856201172, "step": 503}
{"info/global_step": 504, "train_info/time_within_train_step": 27.694600105285645, "step": 504}
{"train_info/time_between_train_steps": 0.0051152706146240234, "step": 504}
{"info/global_step": 505, "train_info/time_within_train_step": 27.69920802116394, "step": 505}
{"train_info/time_between_train_steps": 0.005002737045288086, "step": 505}
{"info/global_step": 506, "train_info/time_within_train_step": 27.73385739326477, "step": 506}
{"train_info/time_between_train_steps": 0.0049896240234375, "step": 506}
{"info/global_step": 507, "train_info/time_within_train_step": 27.726142406463623, "step": 507}
{"train_info/time_between_train_steps": 0.004999637603759766, "step": 507}
{"info/global_step": 508, "train_info/time_within_train_step": 27.698557376861572, "step": 508}
{"train_info/time_between_train_steps": 0.009522676467895508, "step": 508}
{"info/global_step": 509, "train_info/time_within_train_step": 27.697508335113525, "step": 509}
{"train_info/time_between_train_steps": 0.005251646041870117, "step": 509}
{"info/global_step": 510, "train_info/time_within_train_step": 27.724956035614014, "step": 510}
{"train_info/time_between_train_steps": 0.00501561164855957, "step": 510}
{"info/global_step": 511, "train_info/time_within_train_step": 27.766982793807983, "step": 511}
{"train_info/time_between_train_steps": 0.005387306213378906, "step": 511}
{"info/global_step": 512, "train_info/time_within_train_step": 27.71553373336792, "step": 512}
{"train_info/time_between_train_steps": 0.005225181579589844, "step": 512}
{"info/global_step": 513, "train_info/time_within_train_step": 27.71915340423584, "step": 513}
{"train_info/time_between_train_steps": 0.005575418472290039, "step": 513}
{"train_info/time_between_train_steps": 30.185796976089478, "step": 513}
{"info/global_step": 514, "train_info/time_within_train_step": 27.700867652893066, "step": 514}
{"train_info/time_between_train_steps": 0.005086421966552734, "step": 514}
{"info/global_step": 515, "train_info/time_within_train_step": 27.80924940109253, "step": 515}
{"train_info/time_between_train_steps": 0.004841327667236328, "step": 515}
{"info/global_step": 516, "train_info/time_within_train_step": 27.684515237808228, "step": 516}
{"train_info/time_between_train_steps": 0.004948139190673828, "step": 516}
{"info/global_step": 517, "train_info/time_within_train_step": 27.853545427322388, "step": 517}
{"train_info/time_between_train_steps": 0.005072593688964844, "step": 517}
{"info/global_step": 518, "train_info/time_within_train_step": 27.71235942840576, "step": 518}
{"train_info/time_between_train_steps": 0.00508570671081543, "step": 518}
{"info/global_step": 519, "train_info/time_within_train_step": 27.85283660888672, "step": 519}
{"train_info/time_between_train_steps": 0.005338430404663086, "step": 519}
{"info/global_step": 520, "train_info/time_within_train_step": 27.710861921310425, "step": 520}
{"train_info/time_between_train_steps": 0.005052328109741211, "step": 520}
{"info/global_step": 521, "train_info/time_within_train_step": 27.763000011444092, "step": 521}
{"train_info/time_between_train_steps": 0.006014347076416016, "step": 521}
{"info/global_step": 522, "train_info/time_within_train_step": 27.696249961853027, "step": 522}
{"train_info/time_between_train_steps": 0.005732297897338867, "step": 522}
{"info/global_step": 523, "train_info/time_within_train_step": 27.700204849243164, "step": 523}
{"train_info/time_between_train_steps": 0.009996414184570312, "step": 523}
{"info/global_step": 524, "train_info/time_within_train_step": 27.69421911239624, "step": 524}
{"train_info/time_between_train_steps": 0.004848957061767578, "step": 524}
{"info/global_step": 525, "train_info/time_within_train_step": 27.737581968307495, "step": 525}
{"train_info/time_between_train_steps": 0.005200862884521484, "step": 525}
{"info/global_step": 526, "train_info/time_within_train_step": 27.71271014213562, "step": 526}
{"train_info/time_between_train_steps": 0.005055427551269531, "step": 526}
{"info/global_step": 527, "train_info/time_within_train_step": 27.711381912231445, "step": 527}
{"train_info/time_between_train_steps": 0.005002021789550781, "step": 527}
{"info/global_step": 528, "train_info/time_within_train_step": 27.71398138999939, "step": 528}
{"train_info/time_between_train_steps": 0.006079673767089844, "step": 528}
{"info/global_step": 529, "train_info/time_within_train_step": 27.789142370224, "step": 529}
{"train_info/time_between_train_steps": 0.0049517154693603516, "step": 529}
{"info/global_step": 530, "train_info/time_within_train_step": 27.68666648864746, "step": 530}
{"train_info/time_between_train_steps": 0.004893064498901367, "step": 530}
{"info/global_step": 531, "train_info/time_within_train_step": 27.688210010528564, "step": 531}
{"train_info/time_between_train_steps": 0.00621795654296875, "step": 531}
{"info/global_step": 532, "train_info/time_within_train_step": 27.689505338668823, "step": 532}
{"train_info/time_between_train_steps": 0.0049800872802734375, "step": 532}
{"info/global_step": 533, "train_info/time_within_train_step": 27.689338207244873, "step": 533}
{"train_info/time_between_train_steps": 0.006212472915649414, "step": 533}
{"info/global_step": 534, "train_info/time_within_train_step": 27.70200538635254, "step": 534}
{"train_info/time_between_train_steps": 0.005033731460571289, "step": 534}
{"info/global_step": 535, "train_info/time_within_train_step": 27.70678949356079, "step": 535}
{"train_info/time_between_train_steps": 0.0049381256103515625, "step": 535}
{"info/global_step": 536, "train_info/time_within_train_step": 27.74942111968994, "step": 536}
{"train_info/time_between_train_steps": 0.0050258636474609375, "step": 536}
{"info/global_step": 537, "train_info/time_within_train_step": 27.696080207824707, "step": 537}
{"train_info/time_between_train_steps": 0.00498199462890625, "step": 537}
{"info/global_step": 538, "train_info/time_within_train_step": 27.69432020187378, "step": 538}
{"train_info/time_between_train_steps": 0.0051441192626953125, "step": 538}
{"info/global_step": 539, "train_info/time_within_train_step": 27.725271463394165, "step": 539}
{"train_info/time_between_train_steps": 0.005257368087768555, "step": 539}
{"info/global_step": 540, "train_info/time_within_train_step": 27.71247100830078, "step": 540}
{"train_info/time_between_train_steps": 0.005945682525634766, "step": 540}
{"train_info/time_between_train_steps": 36.31485557556152, "step": 540}
{"info/global_step": 541, "train_info/time_within_train_step": 31.44718313217163, "step": 541}
{"train_info/time_between_train_steps": 0.00576329231262207, "step": 541}
{"info/global_step": 542, "train_info/time_within_train_step": 28.567880153656006, "step": 542}
{"train_info/time_between_train_steps": 0.006264448165893555, "step": 542}
{"info/global_step": 543, "train_info/time_within_train_step": 27.70960235595703, "step": 543}
{"train_info/time_between_train_steps": 0.005270481109619141, "step": 543}
{"info/global_step": 544, "train_info/time_within_train_step": 27.930503845214844, "step": 544}
{"train_info/time_between_train_steps": 0.005115985870361328, "step": 544}
{"info/global_step": 545, "train_info/time_within_train_step": 27.697705268859863, "step": 545}
{"train_info/time_between_train_steps": 0.005143404006958008, "step": 545}
{"info/global_step": 546, "train_info/time_within_train_step": 27.81600570678711, "step": 546}
{"train_info/time_between_train_steps": 0.005052804946899414, "step": 546}
{"info/global_step": 547, "train_info/time_within_train_step": 27.70984649658203, "step": 547}
{"train_info/time_between_train_steps": 0.005257844924926758, "step": 547}
{"info/global_step": 548, "train_info/time_within_train_step": 27.833492517471313, "step": 548}
{"train_info/time_between_train_steps": 0.005406379699707031, "step": 548}
{"info/global_step": 549, "train_info/time_within_train_step": 27.709967851638794, "step": 549}
{"train_info/time_between_train_steps": 0.005059957504272461, "step": 549}
{"info/global_step": 550, "train_info/time_within_train_step": 27.716723918914795, "step": 550}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740840322, "_runtime": 16271}, "step": 550}
{"logs": {"train/loss": 3.8214, "train/learning_rate": 0.0003611111111111111, "train/epoch": 20.01, "_timestamp": 1740840322, "_runtime": 16271}, "step": 550}
{"train_info/time_between_train_steps": 0.029241561889648438, "step": 550}
{"info/global_step": 551, "train_info/time_within_train_step": 27.68070387840271, "step": 551}
{"train_info/time_between_train_steps": 0.00505518913269043, "step": 551}
{"info/global_step": 552, "train_info/time_within_train_step": 27.69338059425354, "step": 552}
{"train_info/time_between_train_steps": 0.005041837692260742, "step": 552}
{"info/global_step": 553, "train_info/time_within_train_step": 27.707963943481445, "step": 553}
{"train_info/time_between_train_steps": 0.005029439926147461, "step": 553}
{"info/global_step": 554, "train_info/time_within_train_step": 27.71103072166443, "step": 554}
{"train_info/time_between_train_steps": 0.0049855709075927734, "step": 554}
{"info/global_step": 555, "train_info/time_within_train_step": 27.692758083343506, "step": 555}
{"train_info/time_between_train_steps": 0.0049703121185302734, "step": 555}
{"info/global_step": 556, "train_info/time_within_train_step": 27.69515872001648, "step": 556}
{"train_info/time_between_train_steps": 0.005334377288818359, "step": 556}
{"info/global_step": 557, "train_info/time_within_train_step": 27.68488907814026, "step": 557}
{"train_info/time_between_train_steps": 0.005007266998291016, "step": 557}
{"info/global_step": 558, "train_info/time_within_train_step": 27.690217971801758, "step": 558}
{"train_info/time_between_train_steps": 0.00502324104309082, "step": 558}
{"info/global_step": 559, "train_info/time_within_train_step": 27.813263416290283, "step": 559}
{"train_info/time_between_train_steps": 0.004905223846435547, "step": 559}
{"info/global_step": 560, "train_info/time_within_train_step": 27.685781002044678, "step": 560}
{"train_info/time_between_train_steps": 0.004985332489013672, "step": 560}
{"info/global_step": 561, "train_info/time_within_train_step": 27.75338840484619, "step": 561}
{"train_info/time_between_train_steps": 0.00590205192565918, "step": 561}
{"info/global_step": 562, "train_info/time_within_train_step": 27.699915170669556, "step": 562}
{"train_info/time_between_train_steps": 0.0050733089447021484, "step": 562}
{"info/global_step": 563, "train_info/time_within_train_step": 27.69005846977234, "step": 563}
{"train_info/time_between_train_steps": 0.00516200065612793, "step": 563}
{"info/global_step": 564, "train_info/time_within_train_step": 27.69141435623169, "step": 564}
{"train_info/time_between_train_steps": 0.005044460296630859, "step": 564}
{"info/global_step": 565, "train_info/time_within_train_step": 27.70297145843506, "step": 565}
{"train_info/time_between_train_steps": 0.005186319351196289, "step": 565}
{"info/global_step": 566, "train_info/time_within_train_step": 27.690438508987427, "step": 566}
{"train_info/time_between_train_steps": 0.005147457122802734, "step": 566}
{"info/global_step": 567, "train_info/time_within_train_step": 27.759084463119507, "step": 567}
{"train_info/time_between_train_steps": 0.005579233169555664, "step": 567}
{"train_info/time_between_train_steps": 30.04567527770996, "step": 567}
{"info/global_step": 568, "train_info/time_within_train_step": 27.692572832107544, "step": 568}
{"train_info/time_between_train_steps": 0.004819631576538086, "step": 568}
{"info/global_step": 569, "train_info/time_within_train_step": 27.807674884796143, "step": 569}
{"train_info/time_between_train_steps": 0.0050504207611083984, "step": 569}
{"info/global_step": 570, "train_info/time_within_train_step": 27.760478019714355, "step": 570}
{"train_info/time_between_train_steps": 0.005127668380737305, "step": 570}
{"info/global_step": 571, "train_info/time_within_train_step": 27.869112253189087, "step": 571}
{"train_info/time_between_train_steps": 0.005037546157836914, "step": 571}
{"info/global_step": 572, "train_info/time_within_train_step": 27.690861463546753, "step": 572}
{"train_info/time_between_train_steps": 0.004973173141479492, "step": 572}
{"info/global_step": 573, "train_info/time_within_train_step": 27.83838653564453, "step": 573}
{"train_info/time_between_train_steps": 0.005025148391723633, "step": 573}
{"info/global_step": 574, "train_info/time_within_train_step": 27.77498745918274, "step": 574}
{"train_info/time_between_train_steps": 0.004961967468261719, "step": 574}
{"info/global_step": 575, "train_info/time_within_train_step": 27.73822259902954, "step": 575}
{"train_info/time_between_train_steps": 0.0049092769622802734, "step": 575}
{"info/global_step": 576, "train_info/time_within_train_step": 27.70577049255371, "step": 576}
{"train_info/time_between_train_steps": 0.0057790279388427734, "step": 576}
{"info/global_step": 577, "train_info/time_within_train_step": 27.693512201309204, "step": 577}
{"train_info/time_between_train_steps": 0.005444765090942383, "step": 577}
{"info/global_step": 578, "train_info/time_within_train_step": 27.717949628829956, "step": 578}
{"train_info/time_between_train_steps": 0.00528717041015625, "step": 578}
{"info/global_step": 579, "train_info/time_within_train_step": 27.69823670387268, "step": 579}
{"train_info/time_between_train_steps": 0.00484919548034668, "step": 579}
{"info/global_step": 580, "train_info/time_within_train_step": 27.6811785697937, "step": 580}
{"train_info/time_between_train_steps": 0.004903316497802734, "step": 580}
{"info/global_step": 581, "train_info/time_within_train_step": 27.683958292007446, "step": 581}
{"train_info/time_between_train_steps": 0.004791736602783203, "step": 581}
{"info/global_step": 582, "train_info/time_within_train_step": 27.70455765724182, "step": 582}
{"train_info/time_between_train_steps": 0.0051152706146240234, "step": 582}
{"info/global_step": 583, "train_info/time_within_train_step": 27.727899074554443, "step": 583}
{"train_info/time_between_train_steps": 0.0048978328704833984, "step": 583}
{"info/global_step": 584, "train_info/time_within_train_step": 27.691884517669678, "step": 584}
{"train_info/time_between_train_steps": 0.0048902034759521484, "step": 584}
{"info/global_step": 585, "train_info/time_within_train_step": 27.700793266296387, "step": 585}
{"train_info/time_between_train_steps": 0.006008625030517578, "step": 585}
{"info/global_step": 586, "train_info/time_within_train_step": 27.711878776550293, "step": 586}
{"train_info/time_between_train_steps": 0.005179405212402344, "step": 586}
{"info/global_step": 587, "train_info/time_within_train_step": 27.685803651809692, "step": 587}
{"train_info/time_between_train_steps": 0.0050411224365234375, "step": 587}
{"info/global_step": 588, "train_info/time_within_train_step": 27.742922067642212, "step": 588}
{"train_info/time_between_train_steps": 0.005070209503173828, "step": 588}
{"info/global_step": 589, "train_info/time_within_train_step": 27.69490623474121, "step": 589}
{"train_info/time_between_train_steps": 0.004949092864990234, "step": 589}
{"info/global_step": 590, "train_info/time_within_train_step": 27.79101538658142, "step": 590}
{"train_info/time_between_train_steps": 0.005232095718383789, "step": 590}
{"info/global_step": 591, "train_info/time_within_train_step": 27.696873426437378, "step": 591}
{"train_info/time_between_train_steps": 0.005121946334838867, "step": 591}
{"info/global_step": 592, "train_info/time_within_train_step": 27.7044837474823, "step": 592}
{"train_info/time_between_train_steps": 0.005169868469238281, "step": 592}
{"info/global_step": 593, "train_info/time_within_train_step": 27.726821660995483, "step": 593}
{"train_info/time_between_train_steps": 0.005170345306396484, "step": 593}
{"info/global_step": 594, "train_info/time_within_train_step": 27.709304571151733, "step": 594}
{"train_info/time_between_train_steps": 0.005827903747558594, "step": 594}
{"train_info/time_between_train_steps": 30.006944179534912, "step": 594}
{"info/global_step": 595, "train_info/time_within_train_step": 27.745293617248535, "step": 595}
{"train_info/time_between_train_steps": 0.005143404006958008, "step": 595}
{"info/global_step": 596, "train_info/time_within_train_step": 27.830859661102295, "step": 596}
{"train_info/time_between_train_steps": 0.004900693893432617, "step": 596}
{"info/global_step": 597, "train_info/time_within_train_step": 27.726498126983643, "step": 597}
{"train_info/time_between_train_steps": 0.005430459976196289, "step": 597}
{"info/global_step": 598, "train_info/time_within_train_step": 27.84933829307556, "step": 598}
{"train_info/time_between_train_steps": 0.005286693572998047, "step": 598}
{"info/global_step": 599, "train_info/time_within_train_step": 27.740664958953857, "step": 599}
{"train_info/time_between_train_steps": 0.005303859710693359, "step": 599}
{"info/global_step": 600, "train_info/time_within_train_step": 28.07859230041504, "step": 600}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740841771, "_runtime": 17720}, "step": 600}
{"logs": {"train/loss": 3.723, "train/learning_rate": 0.0003333333333333333, "train/epoch": 22.0, "_timestamp": 1740841771, "_runtime": 17720}, "step": 600}
{"train_info/time_between_train_steps": 59.91651129722595, "step": 600}
{"info/global_step": 601, "train_info/time_within_train_step": 27.71948218345642, "step": 601}
{"train_info/time_between_train_steps": 0.005325794219970703, "step": 601}
{"info/global_step": 602, "train_info/time_within_train_step": 27.825542211532593, "step": 602}
{"train_info/time_between_train_steps": 0.01570272445678711, "step": 602}
{"info/global_step": 603, "train_info/time_within_train_step": 27.71902060508728, "step": 603}
{"train_info/time_between_train_steps": 0.004909992218017578, "step": 603}
{"info/global_step": 604, "train_info/time_within_train_step": 27.78294014930725, "step": 604}
{"train_info/time_between_train_steps": 0.009931802749633789, "step": 604}
{"info/global_step": 605, "train_info/time_within_train_step": 27.680620431900024, "step": 605}
{"train_info/time_between_train_steps": 0.004824399948120117, "step": 605}
{"info/global_step": 606, "train_info/time_within_train_step": 27.729180574417114, "step": 606}
{"train_info/time_between_train_steps": 0.004915952682495117, "step": 606}
{"info/global_step": 607, "train_info/time_within_train_step": 27.707778692245483, "step": 607}
{"train_info/time_between_train_steps": 0.004945039749145508, "step": 607}
{"info/global_step": 608, "train_info/time_within_train_step": 27.703047037124634, "step": 608}
{"train_info/time_between_train_steps": 0.004849433898925781, "step": 608}
{"info/global_step": 609, "train_info/time_within_train_step": 27.712072372436523, "step": 609}
{"train_info/time_between_train_steps": 0.005087614059448242, "step": 609}
{"info/global_step": 610, "train_info/time_within_train_step": 27.723695516586304, "step": 610}
{"train_info/time_between_train_steps": 0.005009174346923828, "step": 610}
{"info/global_step": 611, "train_info/time_within_train_step": 27.698099851608276, "step": 611}
{"train_info/time_between_train_steps": 0.009967803955078125, "step": 611}
{"info/global_step": 612, "train_info/time_within_train_step": 27.715684413909912, "step": 612}
{"train_info/time_between_train_steps": 0.0049762725830078125, "step": 612}
{"info/global_step": 613, "train_info/time_within_train_step": 27.716911792755127, "step": 613}
{"train_info/time_between_train_steps": 0.0049707889556884766, "step": 613}
{"info/global_step": 614, "train_info/time_within_train_step": 27.717849731445312, "step": 614}
{"train_info/time_between_train_steps": 0.0050199031829833984, "step": 614}
{"info/global_step": 615, "train_info/time_within_train_step": 27.69408941268921, "step": 615}
{"train_info/time_between_train_steps": 0.0050411224365234375, "step": 615}
{"info/global_step": 616, "train_info/time_within_train_step": 27.692881107330322, "step": 616}
{"train_info/time_between_train_steps": 0.004937648773193359, "step": 616}
{"info/global_step": 617, "train_info/time_within_train_step": 27.756505727767944, "step": 617}
{"train_info/time_between_train_steps": 0.005895137786865234, "step": 617}
{"info/global_step": 618, "train_info/time_within_train_step": 27.710872650146484, "step": 618}
{"train_info/time_between_train_steps": 0.0050487518310546875, "step": 618}
{"info/global_step": 619, "train_info/time_within_train_step": 27.691160202026367, "step": 619}
{"train_info/time_between_train_steps": 0.004869222640991211, "step": 619}
{"info/global_step": 620, "train_info/time_within_train_step": 27.7916362285614, "step": 620}
{"train_info/time_between_train_steps": 0.00526118278503418, "step": 620}
{"info/global_step": 621, "train_info/time_within_train_step": 27.762264251708984, "step": 621}
{"train_info/time_between_train_steps": 0.005701780319213867, "step": 621}
{"train_info/time_between_train_steps": 29.927477598190308, "step": 621}
{"info/global_step": 622, "train_info/time_within_train_step": 27.695526599884033, "step": 622}
{"train_info/time_between_train_steps": 0.005052328109741211, "step": 622}
{"info/global_step": 623, "train_info/time_within_train_step": 27.814733266830444, "step": 623}
{"train_info/time_between_train_steps": 0.01009511947631836, "step": 623}
{"info/global_step": 624, "train_info/time_within_train_step": 27.718855142593384, "step": 624}
{"train_info/time_between_train_steps": 0.0048787593841552734, "step": 624}
{"info/global_step": 625, "train_info/time_within_train_step": 27.79455018043518, "step": 625}
{"train_info/time_between_train_steps": 0.00490260124206543, "step": 625}
{"info/global_step": 626, "train_info/time_within_train_step": 27.679096937179565, "step": 626}
{"train_info/time_between_train_steps": 0.004887104034423828, "step": 626}
{"info/global_step": 627, "train_info/time_within_train_step": 27.786513090133667, "step": 627}
{"train_info/time_between_train_steps": 0.004891633987426758, "step": 627}
{"info/global_step": 628, "train_info/time_within_train_step": 27.689024448394775, "step": 628}
{"train_info/time_between_train_steps": 0.005063295364379883, "step": 628}
{"info/global_step": 629, "train_info/time_within_train_step": 27.804577589035034, "step": 629}
{"train_info/time_between_train_steps": 0.0050029754638671875, "step": 629}
{"info/global_step": 630, "train_info/time_within_train_step": 27.69887900352478, "step": 630}
{"train_info/time_between_train_steps": 0.005058765411376953, "step": 630}
{"info/global_step": 631, "train_info/time_within_train_step": 27.703584909439087, "step": 631}
{"train_info/time_between_train_steps": 0.0050506591796875, "step": 631}
{"info/global_step": 632, "train_info/time_within_train_step": 27.69171977043152, "step": 632}
{"train_info/time_between_train_steps": 0.0048711299896240234, "step": 632}
{"info/global_step": 633, "train_info/time_within_train_step": 27.68562960624695, "step": 633}
{"train_info/time_between_train_steps": 0.0049097537994384766, "step": 633}
{"info/global_step": 634, "train_info/time_within_train_step": 27.800650358200073, "step": 634}
{"train_info/time_between_train_steps": 0.005928993225097656, "step": 634}
{"info/global_step": 635, "train_info/time_within_train_step": 27.688570022583008, "step": 635}
{"train_info/time_between_train_steps": 0.004832267761230469, "step": 635}
{"info/global_step": 636, "train_info/time_within_train_step": 27.68016266822815, "step": 636}
{"train_info/time_between_train_steps": 0.0048296451568603516, "step": 636}
{"info/global_step": 637, "train_info/time_within_train_step": 27.682127714157104, "step": 637}
{"train_info/time_between_train_steps": 0.005084514617919922, "step": 637}
{"info/global_step": 638, "train_info/time_within_train_step": 28.049829721450806, "step": 638}
{"train_info/time_between_train_steps": 0.005068540573120117, "step": 638}
{"info/global_step": 639, "train_info/time_within_train_step": 27.907888174057007, "step": 639}
{"train_info/time_between_train_steps": 0.005096435546875, "step": 639}
{"info/global_step": 640, "train_info/time_within_train_step": 27.747770071029663, "step": 640}
{"train_info/time_between_train_steps": 0.005161285400390625, "step": 640}
{"info/global_step": 641, "train_info/time_within_train_step": 27.862735271453857, "step": 641}
{"train_info/time_between_train_steps": 0.014527320861816406, "step": 641}
{"info/global_step": 642, "train_info/time_within_train_step": 27.90514826774597, "step": 642}
{"train_info/time_between_train_steps": 0.00490117073059082, "step": 642}
{"info/global_step": 643, "train_info/time_within_train_step": 27.67620015144348, "step": 643}
{"train_info/time_between_train_steps": 0.004919767379760742, "step": 643}
{"info/global_step": 644, "train_info/time_within_train_step": 27.7186119556427, "step": 644}
{"train_info/time_between_train_steps": 0.0049016475677490234, "step": 644}
{"info/global_step": 645, "train_info/time_within_train_step": 27.67970871925354, "step": 645}
{"train_info/time_between_train_steps": 0.005181312561035156, "step": 645}
{"info/global_step": 646, "train_info/time_within_train_step": 27.702643632888794, "step": 646}
{"train_info/time_between_train_steps": 0.005243539810180664, "step": 646}
{"info/global_step": 647, "train_info/time_within_train_step": 27.716694116592407, "step": 647}
{"train_info/time_between_train_steps": 0.005157947540283203, "step": 647}
{"info/global_step": 648, "train_info/time_within_train_step": 27.70688271522522, "step": 648}
{"train_info/time_between_train_steps": 0.005456209182739258, "step": 648}
{"train_info/time_between_train_steps": 29.816805839538574, "step": 648}
{"info/global_step": 649, "train_info/time_within_train_step": 27.816304445266724, "step": 649}
{"train_info/time_between_train_steps": 0.00494837760925293, "step": 649}
{"info/global_step": 650, "train_info/time_within_train_step": 27.78134250640869, "step": 650}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740843279, "_runtime": 19228}, "step": 650}
{"logs": {"train/loss": 3.6354, "train/learning_rate": 0.00030555555555555555, "train/epoch": 24.0, "_timestamp": 1740843279, "_runtime": 19228}, "step": 650}
{"train_info/time_between_train_steps": 0.0254976749420166, "step": 650}
{"info/global_step": 651, "train_info/time_within_train_step": 27.669740915298462, "step": 651}
{"train_info/time_between_train_steps": 0.004873752593994141, "step": 651}
{"info/global_step": 652, "train_info/time_within_train_step": 27.82678723335266, "step": 652}
{"train_info/time_between_train_steps": 0.005076408386230469, "step": 652}
{"info/global_step": 653, "train_info/time_within_train_step": 27.688273429870605, "step": 653}
{"train_info/time_between_train_steps": 0.005063056945800781, "step": 653}
{"info/global_step": 654, "train_info/time_within_train_step": 27.816269874572754, "step": 654}
{"train_info/time_between_train_steps": 0.00509190559387207, "step": 654}
{"info/global_step": 655, "train_info/time_within_train_step": 27.71123957633972, "step": 655}
{"train_info/time_between_train_steps": 0.005261659622192383, "step": 655}
{"info/global_step": 656, "train_info/time_within_train_step": 27.837177991867065, "step": 656}
{"train_info/time_between_train_steps": 0.005412578582763672, "step": 656}
{"info/global_step": 657, "train_info/time_within_train_step": 27.749289512634277, "step": 657}
{"train_info/time_between_train_steps": 0.005151510238647461, "step": 657}
{"info/global_step": 658, "train_info/time_within_train_step": 27.739206790924072, "step": 658}
{"train_info/time_between_train_steps": 0.005658388137817383, "step": 658}
{"info/global_step": 659, "train_info/time_within_train_step": 27.781262159347534, "step": 659}
{"train_info/time_between_train_steps": 0.005989789962768555, "step": 659}
{"info/global_step": 660, "train_info/time_within_train_step": 27.78048014640808, "step": 660}
{"train_info/time_between_train_steps": 0.011110067367553711, "step": 660}
{"info/global_step": 661, "train_info/time_within_train_step": 27.6915602684021, "step": 661}
{"train_info/time_between_train_steps": 0.0050084590911865234, "step": 661}
{"info/global_step": 662, "train_info/time_within_train_step": 27.73012065887451, "step": 662}
{"train_info/time_between_train_steps": 0.005239963531494141, "step": 662}
{"info/global_step": 663, "train_info/time_within_train_step": 27.711363792419434, "step": 663}
{"train_info/time_between_train_steps": 0.005080223083496094, "step": 663}
{"info/global_step": 664, "train_info/time_within_train_step": 27.70581340789795, "step": 664}
{"train_info/time_between_train_steps": 0.005072116851806641, "step": 664}
{"info/global_step": 665, "train_info/time_within_train_step": 27.810693502426147, "step": 665}
{"train_info/time_between_train_steps": 0.005069255828857422, "step": 665}
{"info/global_step": 666, "train_info/time_within_train_step": 27.854423999786377, "step": 666}
{"train_info/time_between_train_steps": 0.005458354949951172, "step": 666}
{"info/global_step": 667, "train_info/time_within_train_step": 27.761021375656128, "step": 667}
{"train_info/time_between_train_steps": 0.005433559417724609, "step": 667}
{"info/global_step": 668, "train_info/time_within_train_step": 27.719167947769165, "step": 668}
{"train_info/time_between_train_steps": 0.010063409805297852, "step": 668}
{"info/global_step": 669, "train_info/time_within_train_step": 27.74881339073181, "step": 669}
{"train_info/time_between_train_steps": 0.010021209716796875, "step": 669}
{"info/global_step": 670, "train_info/time_within_train_step": 27.755228996276855, "step": 670}
{"train_info/time_between_train_steps": 0.0055239200592041016, "step": 670}
{"info/global_step": 671, "train_info/time_within_train_step": 27.716668844223022, "step": 671}
{"train_info/time_between_train_steps": 0.005781412124633789, "step": 671}
{"info/global_step": 672, "train_info/time_within_train_step": 27.730043172836304, "step": 672}
{"train_info/time_between_train_steps": 0.00614619255065918, "step": 672}
{"info/global_step": 673, "train_info/time_within_train_step": 27.73808741569519, "step": 673}
{"train_info/time_between_train_steps": 0.006433010101318359, "step": 673}
{"info/global_step": 674, "train_info/time_within_train_step": 27.717840433120728, "step": 674}
{"train_info/time_between_train_steps": 0.005638599395751953, "step": 674}
{"info/global_step": 675, "train_info/time_within_train_step": 27.72583317756653, "step": 675}
{"train_info/time_between_train_steps": 0.007586479187011719, "step": 675}
{"train_info/time_between_train_steps": 30.315802574157715, "step": 675}
{"info/global_step": 676, "train_info/time_within_train_step": 27.711756944656372, "step": 676}
{"train_info/time_between_train_steps": 0.00566554069519043, "step": 676}
{"info/global_step": 677, "train_info/time_within_train_step": 27.88424015045166, "step": 677}
{"train_info/time_between_train_steps": 0.005429983139038086, "step": 677}
{"info/global_step": 678, "train_info/time_within_train_step": 27.725080966949463, "step": 678}
{"train_info/time_between_train_steps": 0.005316257476806641, "step": 678}
{"info/global_step": 679, "train_info/time_within_train_step": 27.953651666641235, "step": 679}
{"train_info/time_between_train_steps": 0.00548553466796875, "step": 679}
{"info/global_step": 680, "train_info/time_within_train_step": 27.70855474472046, "step": 680}
{"train_info/time_between_train_steps": 0.005279541015625, "step": 680}
{"info/global_step": 681, "train_info/time_within_train_step": 27.881622791290283, "step": 681}
{"train_info/time_between_train_steps": 0.0055027008056640625, "step": 681}
{"info/global_step": 682, "train_info/time_within_train_step": 27.704180479049683, "step": 682}
{"train_info/time_between_train_steps": 0.005196809768676758, "step": 682}
{"info/global_step": 683, "train_info/time_within_train_step": 27.837424516677856, "step": 683}
{"train_info/time_between_train_steps": 0.009970664978027344, "step": 683}
{"info/global_step": 684, "train_info/time_within_train_step": 27.703913688659668, "step": 684}
{"train_info/time_between_train_steps": 0.004930973052978516, "step": 684}
{"info/global_step": 685, "train_info/time_within_train_step": 27.676082372665405, "step": 685}
{"train_info/time_between_train_steps": 0.0050923824310302734, "step": 685}
{"info/global_step": 686, "train_info/time_within_train_step": 27.676323890686035, "step": 686}
{"train_info/time_between_train_steps": 0.004973411560058594, "step": 686}
{"info/global_step": 687, "train_info/time_within_train_step": 27.67393946647644, "step": 687}
{"train_info/time_between_train_steps": 0.005110263824462891, "step": 687}
{"info/global_step": 688, "train_info/time_within_train_step": 27.684831380844116, "step": 688}
{"train_info/time_between_train_steps": 0.005018949508666992, "step": 688}
{"info/global_step": 689, "train_info/time_within_train_step": 27.675782203674316, "step": 689}
{"train_info/time_between_train_steps": 0.0049669742584228516, "step": 689}
{"info/global_step": 690, "train_info/time_within_train_step": 27.680647373199463, "step": 690}
{"train_info/time_between_train_steps": 0.0051119327545166016, "step": 690}
{"info/global_step": 691, "train_info/time_within_train_step": 27.67592215538025, "step": 691}
{"train_info/time_between_train_steps": 0.0050356388092041016, "step": 691}
{"info/global_step": 692, "train_info/time_within_train_step": 27.69999861717224, "step": 692}
{"train_info/time_between_train_steps": 0.00520777702331543, "step": 692}
{"info/global_step": 693, "train_info/time_within_train_step": 27.71281623840332, "step": 693}
{"train_info/time_between_train_steps": 0.005997419357299805, "step": 693}
{"info/global_step": 694, "train_info/time_within_train_step": 27.84760284423828, "step": 694}
{"train_info/time_between_train_steps": 0.00611567497253418, "step": 694}
{"info/global_step": 695, "train_info/time_within_train_step": 27.909284353256226, "step": 695}
{"train_info/time_between_train_steps": 0.006217479705810547, "step": 695}
{"info/global_step": 696, "train_info/time_within_train_step": 27.845138549804688, "step": 696}
{"train_info/time_between_train_steps": 0.0060842037200927734, "step": 696}
{"info/global_step": 697, "train_info/time_within_train_step": 27.81016445159912, "step": 697}
{"train_info/time_between_train_steps": 0.005791902542114258, "step": 697}
{"info/global_step": 698, "train_info/time_within_train_step": 27.774031162261963, "step": 698}
{"train_info/time_between_train_steps": 0.00583958625793457, "step": 698}
{"info/global_step": 699, "train_info/time_within_train_step": 27.792640686035156, "step": 699}
{"train_info/time_between_train_steps": 0.006005764007568359, "step": 699}
{"info/global_step": 700, "train_info/time_within_train_step": 33.67160105705261, "step": 700}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740844706, "_runtime": 20655}, "step": 700}
{"logs": {"train/loss": 3.4857, "train/learning_rate": 0.0002777777777777778, "train/epoch": 25.02, "_timestamp": 1740844706, "_runtime": 20655}, "step": 700}
{"train_info/time_between_train_steps": 206.83106207847595, "step": 700}
{"info/global_step": 701, "train_info/time_within_train_step": 27.74384117126465, "step": 701}
{"train_info/time_between_train_steps": 0.0055615901947021484, "step": 701}
{"info/global_step": 702, "train_info/time_within_train_step": 27.77969193458557, "step": 702}
{"train_info/time_between_train_steps": 0.0064182281494140625, "step": 702}
{"train_info/time_between_train_steps": 30.54557156562805, "step": 702}
{"info/global_step": 703, "train_info/time_within_train_step": 27.71657419204712, "step": 703}
{"train_info/time_between_train_steps": 0.00524449348449707, "step": 703}
{"info/global_step": 704, "train_info/time_within_train_step": 27.796988010406494, "step": 704}
{"train_info/time_between_train_steps": 0.0049016475677490234, "step": 704}
{"info/global_step": 705, "train_info/time_within_train_step": 27.69405460357666, "step": 705}
{"train_info/time_between_train_steps": 0.00541996955871582, "step": 705}
{"info/global_step": 706, "train_info/time_within_train_step": 27.812695503234863, "step": 706}
{"train_info/time_between_train_steps": 0.005300283432006836, "step": 706}
{"info/global_step": 707, "train_info/time_within_train_step": 27.70946168899536, "step": 707}
{"train_info/time_between_train_steps": 0.005086183547973633, "step": 707}
{"info/global_step": 708, "train_info/time_within_train_step": 27.83755898475647, "step": 708}
{"train_info/time_between_train_steps": 0.014818906784057617, "step": 708}
{"info/global_step": 709, "train_info/time_within_train_step": 27.9216947555542, "step": 709}
{"train_info/time_between_train_steps": 0.005433797836303711, "step": 709}
{"info/global_step": 710, "train_info/time_within_train_step": 27.90178418159485, "step": 710}
{"train_info/time_between_train_steps": 0.005206108093261719, "step": 710}
{"info/global_step": 711, "train_info/time_within_train_step": 27.72823476791382, "step": 711}
{"train_info/time_between_train_steps": 0.005189180374145508, "step": 711}
{"info/global_step": 712, "train_info/time_within_train_step": 27.75936007499695, "step": 712}
{"train_info/time_between_train_steps": 0.014758825302124023, "step": 712}
{"info/global_step": 713, "train_info/time_within_train_step": 28.13560152053833, "step": 713}
{"train_info/time_between_train_steps": 0.0075531005859375, "step": 713}
{"info/global_step": 714, "train_info/time_within_train_step": 27.677961111068726, "step": 714}
{"train_info/time_between_train_steps": 0.014613628387451172, "step": 714}
{"info/global_step": 715, "train_info/time_within_train_step": 28.046892404556274, "step": 715}
{"train_info/time_between_train_steps": 0.005028963088989258, "step": 715}
{"info/global_step": 716, "train_info/time_within_train_step": 27.680304765701294, "step": 716}
{"train_info/time_between_train_steps": 0.005101680755615234, "step": 716}
{"info/global_step": 717, "train_info/time_within_train_step": 27.683669805526733, "step": 717}
{"train_info/time_between_train_steps": 0.005057811737060547, "step": 717}
{"info/global_step": 718, "train_info/time_within_train_step": 27.674943208694458, "step": 718}
{"train_info/time_between_train_steps": 0.005045652389526367, "step": 718}
{"info/global_step": 719, "train_info/time_within_train_step": 27.678584337234497, "step": 719}
{"train_info/time_between_train_steps": 0.004988193511962891, "step": 719}
{"info/global_step": 720, "train_info/time_within_train_step": 27.69148278236389, "step": 720}
{"train_info/time_between_train_steps": 0.005110979080200195, "step": 720}
{"info/global_step": 721, "train_info/time_within_train_step": 27.683693647384644, "step": 721}
{"train_info/time_between_train_steps": 0.005024433135986328, "step": 721}
{"info/global_step": 722, "train_info/time_within_train_step": 27.688849210739136, "step": 722}
{"train_info/time_between_train_steps": 0.005109071731567383, "step": 722}
{"info/global_step": 723, "train_info/time_within_train_step": 27.69204878807068, "step": 723}
{"train_info/time_between_train_steps": 0.005203723907470703, "step": 723}
{"info/global_step": 724, "train_info/time_within_train_step": 27.69172954559326, "step": 724}
{"train_info/time_between_train_steps": 0.005031585693359375, "step": 724}
{"info/global_step": 725, "train_info/time_within_train_step": 27.775407075881958, "step": 725}
{"train_info/time_between_train_steps": 0.005133867263793945, "step": 725}
{"info/global_step": 726, "train_info/time_within_train_step": 27.702449321746826, "step": 726}
{"train_info/time_between_train_steps": 0.005081892013549805, "step": 726}
{"info/global_step": 727, "train_info/time_within_train_step": 27.717079401016235, "step": 727}
{"train_info/time_between_train_steps": 0.005192279815673828, "step": 727}
{"info/global_step": 728, "train_info/time_within_train_step": 27.740185737609863, "step": 728}
{"train_info/time_between_train_steps": 0.0052754878997802734, "step": 728}
{"info/global_step": 729, "train_info/time_within_train_step": 27.71349334716797, "step": 729}
{"train_info/time_between_train_steps": 0.005593776702880859, "step": 729}
{"train_info/time_between_train_steps": 37.03710627555847, "step": 729}
{"info/global_step": 730, "train_info/time_within_train_step": 28.456470727920532, "step": 730}
{"train_info/time_between_train_steps": 0.005145549774169922, "step": 730}
{"info/global_step": 731, "train_info/time_within_train_step": 31.001458883285522, "step": 731}
{"train_info/time_between_train_steps": 0.00502324104309082, "step": 731}
{"info/global_step": 732, "train_info/time_within_train_step": 28.084529161453247, "step": 732}
{"train_info/time_between_train_steps": 0.005625486373901367, "step": 732}
{"info/global_step": 733, "train_info/time_within_train_step": 27.79112982749939, "step": 733}
{"train_info/time_between_train_steps": 0.004885435104370117, "step": 733}
{"info/global_step": 734, "train_info/time_within_train_step": 27.682578563690186, "step": 734}
{"train_info/time_between_train_steps": 0.004922151565551758, "step": 734}
{"info/global_step": 735, "train_info/time_within_train_step": 27.789616584777832, "step": 735}
{"train_info/time_between_train_steps": 0.0053522586822509766, "step": 735}
{"info/global_step": 736, "train_info/time_within_train_step": 27.67343544960022, "step": 736}
{"train_info/time_between_train_steps": 0.005559444427490234, "step": 736}
{"info/global_step": 737, "train_info/time_within_train_step": 27.784698963165283, "step": 737}
{"train_info/time_between_train_steps": 0.005016803741455078, "step": 737}
{"info/global_step": 738, "train_info/time_within_train_step": 27.70726728439331, "step": 738}
{"train_info/time_between_train_steps": 0.004850864410400391, "step": 738}
{"info/global_step": 739, "train_info/time_within_train_step": 27.677554845809937, "step": 739}
{"train_info/time_between_train_steps": 0.00502467155456543, "step": 739}
{"info/global_step": 740, "train_info/time_within_train_step": 27.785966873168945, "step": 740}
{"train_info/time_between_train_steps": 0.004889249801635742, "step": 740}
{"info/global_step": 741, "train_info/time_within_train_step": 27.673385620117188, "step": 741}
{"train_info/time_between_train_steps": 0.004769563674926758, "step": 741}
{"info/global_step": 742, "train_info/time_within_train_step": 27.661123991012573, "step": 742}
{"train_info/time_between_train_steps": 0.004848957061767578, "step": 742}
{"info/global_step": 743, "train_info/time_within_train_step": 27.662720918655396, "step": 743}
{"train_info/time_between_train_steps": 0.004853725433349609, "step": 743}
{"info/global_step": 744, "train_info/time_within_train_step": 27.66813635826111, "step": 744}
{"train_info/time_between_train_steps": 0.004850864410400391, "step": 744}
{"info/global_step": 745, "train_info/time_within_train_step": 27.67000436782837, "step": 745}
{"train_info/time_between_train_steps": 0.0048449039459228516, "step": 745}
{"info/global_step": 746, "train_info/time_within_train_step": 27.67826819419861, "step": 746}
{"train_info/time_between_train_steps": 0.004978656768798828, "step": 746}
{"info/global_step": 747, "train_info/time_within_train_step": 27.689675331115723, "step": 747}
{"train_info/time_between_train_steps": 0.005036354064941406, "step": 747}
{"info/global_step": 748, "train_info/time_within_train_step": 27.730032682418823, "step": 748}
{"train_info/time_between_train_steps": 0.005134105682373047, "step": 748}
{"info/global_step": 749, "train_info/time_within_train_step": 27.69027042388916, "step": 749}
{"train_info/time_between_train_steps": 0.004926919937133789, "step": 749}
{"info/global_step": 750, "train_info/time_within_train_step": 27.67449688911438, "step": 750}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740846376, "_runtime": 22325}, "step": 750}
{"logs": {"train/loss": 3.4873, "train/learning_rate": 0.00025, "train/epoch": 27.02, "_timestamp": 1740846376, "_runtime": 22325}, "step": 750}
{"train_info/time_between_train_steps": 0.026235580444335938, "step": 750}
{"info/global_step": 751, "train_info/time_within_train_step": 27.66990613937378, "step": 751}
{"train_info/time_between_train_steps": 0.004987239837646484, "step": 751}
{"info/global_step": 752, "train_info/time_within_train_step": 27.678941249847412, "step": 752}
{"train_info/time_between_train_steps": 0.0050542354583740234, "step": 752}
{"info/global_step": 753, "train_info/time_within_train_step": 27.687677145004272, "step": 753}
{"train_info/time_between_train_steps": 0.005120515823364258, "step": 753}
{"info/global_step": 754, "train_info/time_within_train_step": 27.688232898712158, "step": 754}
{"train_info/time_between_train_steps": 0.0049724578857421875, "step": 754}
{"info/global_step": 755, "train_info/time_within_train_step": 27.72896909713745, "step": 755}
{"train_info/time_between_train_steps": 0.005682945251464844, "step": 755}
{"info/global_step": 756, "train_info/time_within_train_step": 27.786107301712036, "step": 756}
{"train_info/time_between_train_steps": 0.005536079406738281, "step": 756}
{"train_info/time_between_train_steps": 30.098906755447388, "step": 756}
{"info/global_step": 757, "train_info/time_within_train_step": 27.687285661697388, "step": 757}
{"train_info/time_between_train_steps": 0.004949331283569336, "step": 757}
{"info/global_step": 758, "train_info/time_within_train_step": 27.771246910095215, "step": 758}
{"train_info/time_between_train_steps": 0.00491786003112793, "step": 758}
{"info/global_step": 759, "train_info/time_within_train_step": 27.673028469085693, "step": 759}
{"train_info/time_between_train_steps": 0.0048809051513671875, "step": 759}
{"info/global_step": 760, "train_info/time_within_train_step": 27.792242765426636, "step": 760}
{"train_info/time_between_train_steps": 0.00485682487487793, "step": 760}
{"info/global_step": 761, "train_info/time_within_train_step": 27.688682556152344, "step": 761}
{"train_info/time_between_train_steps": 0.004906415939331055, "step": 761}
{"info/global_step": 762, "train_info/time_within_train_step": 27.789018154144287, "step": 762}
{"train_info/time_between_train_steps": 0.004868268966674805, "step": 762}
{"info/global_step": 763, "train_info/time_within_train_step": 27.666141510009766, "step": 763}
{"train_info/time_between_train_steps": 0.0049626827239990234, "step": 763}
{"info/global_step": 764, "train_info/time_within_train_step": 27.7238347530365, "step": 764}
{"train_info/time_between_train_steps": 0.004948854446411133, "step": 764}
{"info/global_step": 765, "train_info/time_within_train_step": 27.692870616912842, "step": 765}
{"train_info/time_between_train_steps": 0.004865884780883789, "step": 765}
{"info/global_step": 766, "train_info/time_within_train_step": 27.687604665756226, "step": 766}
{"train_info/time_between_train_steps": 0.0048367977142333984, "step": 766}
{"info/global_step": 767, "train_info/time_within_train_step": 27.668979167938232, "step": 767}
{"train_info/time_between_train_steps": 0.0049648284912109375, "step": 767}
{"info/global_step": 768, "train_info/time_within_train_step": 27.667807579040527, "step": 768}
{"train_info/time_between_train_steps": 0.0049953460693359375, "step": 768}
{"info/global_step": 769, "train_info/time_within_train_step": 27.67560839653015, "step": 769}
{"train_info/time_between_train_steps": 0.005052328109741211, "step": 769}
{"info/global_step": 770, "train_info/time_within_train_step": 27.77580690383911, "step": 770}
{"train_info/time_between_train_steps": 0.0048673152923583984, "step": 770}
{"info/global_step": 771, "train_info/time_within_train_step": 27.685364246368408, "step": 771}
{"train_info/time_between_train_steps": 0.004854679107666016, "step": 771}
{"info/global_step": 772, "train_info/time_within_train_step": 27.665890216827393, "step": 772}
{"train_info/time_between_train_steps": 0.009523153305053711, "step": 772}
{"info/global_step": 773, "train_info/time_within_train_step": 27.708261489868164, "step": 773}
{"train_info/time_between_train_steps": 0.004906415939331055, "step": 773}
{"info/global_step": 774, "train_info/time_within_train_step": 27.684916019439697, "step": 774}
{"train_info/time_between_train_steps": 0.004843235015869141, "step": 774}
{"info/global_step": 775, "train_info/time_within_train_step": 27.678362607955933, "step": 775}
{"train_info/time_between_train_steps": 0.0049130916595458984, "step": 775}
{"info/global_step": 776, "train_info/time_within_train_step": 27.67090630531311, "step": 776}
{"train_info/time_between_train_steps": 0.004918575286865234, "step": 776}
{"info/global_step": 777, "train_info/time_within_train_step": 27.686808824539185, "step": 777}
{"train_info/time_between_train_steps": 0.0051653385162353516, "step": 777}
{"info/global_step": 778, "train_info/time_within_train_step": 27.674484729766846, "step": 778}
{"train_info/time_between_train_steps": 0.004946231842041016, "step": 778}
{"info/global_step": 779, "train_info/time_within_train_step": 27.684953212738037, "step": 779}
{"train_info/time_between_train_steps": 0.0051991939544677734, "step": 779}
{"info/global_step": 780, "train_info/time_within_train_step": 27.708922863006592, "step": 780}
{"train_info/time_between_train_steps": 0.005036592483520508, "step": 780}
{"info/global_step": 781, "train_info/time_within_train_step": 27.6800274848938, "step": 781}
{"train_info/time_between_train_steps": 0.0049266815185546875, "step": 781}
{"info/global_step": 782, "train_info/time_within_train_step": 27.724701166152954, "step": 782}
{"train_info/time_between_train_steps": 0.0052928924560546875, "step": 782}
{"info/global_step": 783, "train_info/time_within_train_step": 27.72376275062561, "step": 783}
{"train_info/time_between_train_steps": 0.005519866943359375, "step": 783}
{"train_info/time_between_train_steps": 29.77666711807251, "step": 783}
{"info/global_step": 784, "train_info/time_within_train_step": 27.693456411361694, "step": 784}
{"train_info/time_between_train_steps": 0.009436368942260742, "step": 784}
{"info/global_step": 785, "train_info/time_within_train_step": 27.87903618812561, "step": 785}
{"train_info/time_between_train_steps": 0.0048983097076416016, "step": 785}
{"info/global_step": 786, "train_info/time_within_train_step": 27.66324734687805, "step": 786}
{"train_info/time_between_train_steps": 0.005010128021240234, "step": 786}
{"info/global_step": 787, "train_info/time_within_train_step": 27.835694313049316, "step": 787}
{"train_info/time_between_train_steps": 0.005179882049560547, "step": 787}
{"info/global_step": 788, "train_info/time_within_train_step": 27.700854778289795, "step": 788}
{"train_info/time_between_train_steps": 0.0050983428955078125, "step": 788}
{"info/global_step": 789, "train_info/time_within_train_step": 27.829336166381836, "step": 789}
{"train_info/time_between_train_steps": 0.00987696647644043, "step": 789}
{"info/global_step": 790, "train_info/time_within_train_step": 27.680597066879272, "step": 790}
{"train_info/time_between_train_steps": 0.0051267147064208984, "step": 790}
{"info/global_step": 791, "train_info/time_within_train_step": 27.734810829162598, "step": 791}
{"train_info/time_between_train_steps": 0.005182027816772461, "step": 791}
{"info/global_step": 792, "train_info/time_within_train_step": 27.68208599090576, "step": 792}
{"train_info/time_between_train_steps": 0.004829883575439453, "step": 792}
{"info/global_step": 793, "train_info/time_within_train_step": 27.66411781311035, "step": 793}
{"train_info/time_between_train_steps": 0.00481414794921875, "step": 793}
{"info/global_step": 794, "train_info/time_within_train_step": 27.66429829597473, "step": 794}
{"train_info/time_between_train_steps": 0.004828929901123047, "step": 794}
{"info/global_step": 795, "train_info/time_within_train_step": 27.6657292842865, "step": 795}
{"train_info/time_between_train_steps": 0.004831075668334961, "step": 795}
{"info/global_step": 796, "train_info/time_within_train_step": 27.714486598968506, "step": 796}
{"train_info/time_between_train_steps": 0.0048100948333740234, "step": 796}
{"info/global_step": 797, "train_info/time_within_train_step": 27.68399667739868, "step": 797}
{"train_info/time_between_train_steps": 0.004889249801635742, "step": 797}
{"info/global_step": 798, "train_info/time_within_train_step": 27.71822500228882, "step": 798}
{"train_info/time_between_train_steps": 0.004775047302246094, "step": 798}
{"info/global_step": 799, "train_info/time_within_train_step": 27.691266536712646, "step": 799}
{"train_info/time_between_train_steps": 0.0050466060638427734, "step": 799}
{"info/global_step": 800, "train_info/time_within_train_step": 28.760324239730835, "step": 800}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740847825, "_runtime": 23774}, "step": 800}
{"logs": {"train/loss": 3.4192, "train/learning_rate": 0.00022222222222222218, "train/epoch": 29.01, "_timestamp": 1740847825, "_runtime": 23774}, "step": 800}
{"train_info/time_between_train_steps": 47.205350399017334, "step": 800}
{"info/global_step": 801, "train_info/time_within_train_step": 27.783620357513428, "step": 801}
{"train_info/time_between_train_steps": 0.004789829254150391, "step": 801}
{"info/global_step": 802, "train_info/time_within_train_step": 27.66414165496826, "step": 802}
{"train_info/time_between_train_steps": 0.009442567825317383, "step": 802}
{"info/global_step": 803, "train_info/time_within_train_step": 27.68747043609619, "step": 803}
{"train_info/time_between_train_steps": 0.004793405532836914, "step": 803}
{"info/global_step": 804, "train_info/time_within_train_step": 27.673717260360718, "step": 804}
{"train_info/time_between_train_steps": 0.0047931671142578125, "step": 804}
{"info/global_step": 805, "train_info/time_within_train_step": 27.70438051223755, "step": 805}
{"train_info/time_between_train_steps": 0.0047931671142578125, "step": 805}
{"info/global_step": 806, "train_info/time_within_train_step": 27.678099870681763, "step": 806}
{"train_info/time_between_train_steps": 0.004972219467163086, "step": 806}
{"info/global_step": 807, "train_info/time_within_train_step": 27.679516077041626, "step": 807}
{"train_info/time_between_train_steps": 0.004879951477050781, "step": 807}
{"info/global_step": 808, "train_info/time_within_train_step": 27.683780670166016, "step": 808}
{"train_info/time_between_train_steps": 0.004923582077026367, "step": 808}
{"info/global_step": 809, "train_info/time_within_train_step": 27.666471242904663, "step": 809}
{"train_info/time_between_train_steps": 0.005055665969848633, "step": 809}
{"info/global_step": 810, "train_info/time_within_train_step": 27.703022003173828, "step": 810}
{"train_info/time_between_train_steps": 0.005709648132324219, "step": 810}
{"train_info/time_between_train_steps": 29.764092206954956, "step": 810}
{"info/global_step": 811, "train_info/time_within_train_step": 27.69265651702881, "step": 811}
{"train_info/time_between_train_steps": 0.005024909973144531, "step": 811}
{"info/global_step": 812, "train_info/time_within_train_step": 27.770199060440063, "step": 812}
{"train_info/time_between_train_steps": 0.005019426345825195, "step": 812}
{"info/global_step": 813, "train_info/time_within_train_step": 27.66638493537903, "step": 813}
{"train_info/time_between_train_steps": 0.004874229431152344, "step": 813}
{"info/global_step": 814, "train_info/time_within_train_step": 27.779430866241455, "step": 814}
{"train_info/time_between_train_steps": 0.004888057708740234, "step": 814}
{"info/global_step": 815, "train_info/time_within_train_step": 27.81258201599121, "step": 815}
{"train_info/time_between_train_steps": 0.004875659942626953, "step": 815}
{"info/global_step": 816, "train_info/time_within_train_step": 27.773365020751953, "step": 816}
{"train_info/time_between_train_steps": 0.004875659942626953, "step": 816}
{"info/global_step": 817, "train_info/time_within_train_step": 27.67487120628357, "step": 817}
{"train_info/time_between_train_steps": 0.00487971305847168, "step": 817}
{"info/global_step": 818, "train_info/time_within_train_step": 27.715709686279297, "step": 818}
{"train_info/time_between_train_steps": 0.0048487186431884766, "step": 818}
{"info/global_step": 819, "train_info/time_within_train_step": 27.700871467590332, "step": 819}
{"train_info/time_between_train_steps": 0.0047681331634521484, "step": 819}
{"info/global_step": 820, "train_info/time_within_train_step": 27.6862211227417, "step": 820}
{"train_info/time_between_train_steps": 0.004822969436645508, "step": 820}
{"info/global_step": 821, "train_info/time_within_train_step": 27.718676567077637, "step": 821}
{"train_info/time_between_train_steps": 0.0049860477447509766, "step": 821}
{"info/global_step": 822, "train_info/time_within_train_step": 27.69129776954651, "step": 822}
{"train_info/time_between_train_steps": 0.004958152770996094, "step": 822}
{"info/global_step": 823, "train_info/time_within_train_step": 27.703024864196777, "step": 823}
{"train_info/time_between_train_steps": 0.005072116851806641, "step": 823}
{"info/global_step": 824, "train_info/time_within_train_step": 27.727746725082397, "step": 824}
{"train_info/time_between_train_steps": 0.004908084869384766, "step": 824}
{"info/global_step": 825, "train_info/time_within_train_step": 27.706406831741333, "step": 825}
{"train_info/time_between_train_steps": 0.009533166885375977, "step": 825}
{"info/global_step": 826, "train_info/time_within_train_step": 27.724584817886353, "step": 826}
{"train_info/time_between_train_steps": 0.0049741268157958984, "step": 826}
{"info/global_step": 827, "train_info/time_within_train_step": 27.68110418319702, "step": 827}
{"train_info/time_between_train_steps": 0.004975557327270508, "step": 827}
{"info/global_step": 828, "train_info/time_within_train_step": 29.191751956939697, "step": 828}
{"train_info/time_between_train_steps": 0.005174398422241211, "step": 828}
{"info/global_step": 829, "train_info/time_within_train_step": 27.686218738555908, "step": 829}
{"train_info/time_between_train_steps": 0.005042314529418945, "step": 829}
{"info/global_step": 830, "train_info/time_within_train_step": 27.712808847427368, "step": 830}
{"train_info/time_between_train_steps": 0.005039215087890625, "step": 830}
{"info/global_step": 831, "train_info/time_within_train_step": 27.775639057159424, "step": 831}
{"train_info/time_between_train_steps": 0.005159616470336914, "step": 831}
{"info/global_step": 832, "train_info/time_within_train_step": 27.682536125183105, "step": 832}
{"train_info/time_between_train_steps": 0.004995584487915039, "step": 832}
{"info/global_step": 833, "train_info/time_within_train_step": 27.676775217056274, "step": 833}
{"train_info/time_between_train_steps": 0.005083799362182617, "step": 833}
{"info/global_step": 834, "train_info/time_within_train_step": 27.684953689575195, "step": 834}
{"train_info/time_between_train_steps": 0.005028724670410156, "step": 834}
{"info/global_step": 835, "train_info/time_within_train_step": 27.68022322654724, "step": 835}
{"train_info/time_between_train_steps": 0.005133390426635742, "step": 835}
{"info/global_step": 836, "train_info/time_within_train_step": 27.70702838897705, "step": 836}
{"train_info/time_between_train_steps": 0.005124092102050781, "step": 836}
{"info/global_step": 837, "train_info/time_within_train_step": 27.722740650177002, "step": 837}
{"train_info/time_between_train_steps": 0.005530357360839844, "step": 837}
{"train_info/time_between_train_steps": 29.98409914970398, "step": 837}
{"info/global_step": 838, "train_info/time_within_train_step": 27.699995040893555, "step": 838}
{"train_info/time_between_train_steps": 0.004848957061767578, "step": 838}
{"info/global_step": 839, "train_info/time_within_train_step": 27.80113697052002, "step": 839}
{"train_info/time_between_train_steps": 0.009358882904052734, "step": 839}
{"info/global_step": 840, "train_info/time_within_train_step": 27.73231601715088, "step": 840}
{"train_info/time_between_train_steps": 0.009874105453491211, "step": 840}
{"info/global_step": 841, "train_info/time_within_train_step": 27.799561977386475, "step": 841}
{"train_info/time_between_train_steps": 0.00975179672241211, "step": 841}
{"info/global_step": 842, "train_info/time_within_train_step": 27.686108350753784, "step": 842}
{"train_info/time_between_train_steps": 0.009713172912597656, "step": 842}
{"info/global_step": 843, "train_info/time_within_train_step": 27.812929153442383, "step": 843}
{"train_info/time_between_train_steps": 0.005160331726074219, "step": 843}
{"info/global_step": 844, "train_info/time_within_train_step": 27.70095992088318, "step": 844}
{"train_info/time_between_train_steps": 0.005116939544677734, "step": 844}
{"info/global_step": 845, "train_info/time_within_train_step": 27.82533884048462, "step": 845}
{"train_info/time_between_train_steps": 0.005056619644165039, "step": 845}
{"info/global_step": 846, "train_info/time_within_train_step": 27.692238330841064, "step": 846}
{"train_info/time_between_train_steps": 0.0048410892486572266, "step": 846}
{"info/global_step": 847, "train_info/time_within_train_step": 27.661797046661377, "step": 847}
{"train_info/time_between_train_steps": 0.004889726638793945, "step": 847}
{"info/global_step": 848, "train_info/time_within_train_step": 27.723478078842163, "step": 848}
{"train_info/time_between_train_steps": 0.004887580871582031, "step": 848}
{"info/global_step": 849, "train_info/time_within_train_step": 27.803511381149292, "step": 849}
{"train_info/time_between_train_steps": 0.014331817626953125, "step": 849}
{"info/global_step": 850, "train_info/time_within_train_step": 27.972411155700684, "step": 850}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740849321, "_runtime": 25270}, "step": 850}
{"logs": {"train/loss": 3.3588, "train/learning_rate": 0.00019444444444444443, "train/epoch": 31.01, "_timestamp": 1740849321, "_runtime": 25270}, "step": 850}
{"train_info/time_between_train_steps": 0.02624368667602539, "step": 850}
{"info/global_step": 851, "train_info/time_within_train_step": 27.729284286499023, "step": 851}
{"train_info/time_between_train_steps": 0.009176254272460938, "step": 851}
{"info/global_step": 852, "train_info/time_within_train_step": 27.684555768966675, "step": 852}
{"train_info/time_between_train_steps": 0.009459495544433594, "step": 852}
{"info/global_step": 853, "train_info/time_within_train_step": 27.675358772277832, "step": 853}
{"train_info/time_between_train_steps": 0.005049943923950195, "step": 853}
{"info/global_step": 854, "train_info/time_within_train_step": 27.678413152694702, "step": 854}
{"train_info/time_between_train_steps": 0.00616455078125, "step": 854}
{"info/global_step": 855, "train_info/time_within_train_step": 27.942291736602783, "step": 855}
{"train_info/time_between_train_steps": 0.009419679641723633, "step": 855}
{"info/global_step": 856, "train_info/time_within_train_step": 27.693035125732422, "step": 856}
{"train_info/time_between_train_steps": 0.009519577026367188, "step": 856}
{"info/global_step": 857, "train_info/time_within_train_step": 27.729402780532837, "step": 857}
{"train_info/time_between_train_steps": 0.009224891662597656, "step": 857}
{"info/global_step": 858, "train_info/time_within_train_step": 27.682048797607422, "step": 858}
{"train_info/time_between_train_steps": 0.005026102066040039, "step": 858}
{"info/global_step": 859, "train_info/time_within_train_step": 27.67737603187561, "step": 859}
{"train_info/time_between_train_steps": 0.0048828125, "step": 859}
{"info/global_step": 860, "train_info/time_within_train_step": 27.69451403617859, "step": 860}
{"train_info/time_between_train_steps": 0.0050106048583984375, "step": 860}
{"info/global_step": 861, "train_info/time_within_train_step": 27.759641647338867, "step": 861}
{"train_info/time_between_train_steps": 0.005048990249633789, "step": 861}
{"info/global_step": 862, "train_info/time_within_train_step": 27.680718660354614, "step": 862}
{"train_info/time_between_train_steps": 0.005243062973022461, "step": 862}
{"info/global_step": 863, "train_info/time_within_train_step": 27.689197301864624, "step": 863}
{"train_info/time_between_train_steps": 0.00516819953918457, "step": 863}
{"info/global_step": 864, "train_info/time_within_train_step": 27.714664697647095, "step": 864}
{"train_info/time_between_train_steps": 0.010147809982299805, "step": 864}
{"train_info/time_between_train_steps": 30.143633604049683, "step": 864}
{"info/global_step": 865, "train_info/time_within_train_step": 27.724799156188965, "step": 865}
{"train_info/time_between_train_steps": 0.0048220157623291016, "step": 865}
{"info/global_step": 866, "train_info/time_within_train_step": 27.79680371284485, "step": 866}
{"train_info/time_between_train_steps": 0.004859447479248047, "step": 866}
{"info/global_step": 867, "train_info/time_within_train_step": 27.67693281173706, "step": 867}
{"train_info/time_between_train_steps": 0.0048677921295166016, "step": 867}
{"info/global_step": 868, "train_info/time_within_train_step": 27.784663438796997, "step": 868}
{"train_info/time_between_train_steps": 0.004867076873779297, "step": 868}
{"info/global_step": 869, "train_info/time_within_train_step": 27.710551977157593, "step": 869}
{"train_info/time_between_train_steps": 0.0048253536224365234, "step": 869}
{"info/global_step": 870, "train_info/time_within_train_step": 27.8006010055542, "step": 870}
{"train_info/time_between_train_steps": 0.005091428756713867, "step": 870}
{"info/global_step": 871, "train_info/time_within_train_step": 27.69104528427124, "step": 871}
{"train_info/time_between_train_steps": 0.005070924758911133, "step": 871}
{"info/global_step": 872, "train_info/time_within_train_step": 27.734634160995483, "step": 872}
{"train_info/time_between_train_steps": 0.005060434341430664, "step": 872}
{"info/global_step": 873, "train_info/time_within_train_step": 27.687848329544067, "step": 873}
{"train_info/time_between_train_steps": 0.005029439926147461, "step": 873}
{"info/global_step": 874, "train_info/time_within_train_step": 27.678471326828003, "step": 874}
{"train_info/time_between_train_steps": 0.004931211471557617, "step": 874}
{"info/global_step": 875, "train_info/time_within_train_step": 27.69746470451355, "step": 875}
{"train_info/time_between_train_steps": 0.004852294921875, "step": 875}
{"info/global_step": 876, "train_info/time_within_train_step": 27.811804056167603, "step": 876}
{"train_info/time_between_train_steps": 0.004873514175415039, "step": 876}
{"info/global_step": 877, "train_info/time_within_train_step": 27.673725366592407, "step": 877}
{"train_info/time_between_train_steps": 0.0048313140869140625, "step": 877}
{"info/global_step": 878, "train_info/time_within_train_step": 27.686044454574585, "step": 878}
{"train_info/time_between_train_steps": 0.004877567291259766, "step": 878}
{"info/global_step": 879, "train_info/time_within_train_step": 27.677005767822266, "step": 879}
{"train_info/time_between_train_steps": 0.004914283752441406, "step": 879}
{"info/global_step": 880, "train_info/time_within_train_step": 27.67187213897705, "step": 880}
{"train_info/time_between_train_steps": 0.004900693893432617, "step": 880}
{"info/global_step": 881, "train_info/time_within_train_step": 27.678098917007446, "step": 881}
{"train_info/time_between_train_steps": 0.0049326419830322266, "step": 881}
{"info/global_step": 882, "train_info/time_within_train_step": 27.709429025650024, "step": 882}
{"train_info/time_between_train_steps": 0.005080699920654297, "step": 882}
{"info/global_step": 883, "train_info/time_within_train_step": 27.685009241104126, "step": 883}
{"train_info/time_between_train_steps": 0.005266666412353516, "step": 883}
{"info/global_step": 884, "train_info/time_within_train_step": 27.67283296585083, "step": 884}
{"train_info/time_between_train_steps": 0.004992246627807617, "step": 884}
{"info/global_step": 885, "train_info/time_within_train_step": 27.676812887191772, "step": 885}
{"train_info/time_between_train_steps": 0.005077838897705078, "step": 885}
{"info/global_step": 886, "train_info/time_within_train_step": 27.67237091064453, "step": 886}
{"train_info/time_between_train_steps": 0.005023002624511719, "step": 886}
{"info/global_step": 887, "train_info/time_within_train_step": 27.685868978500366, "step": 887}
{"train_info/time_between_train_steps": 0.005026817321777344, "step": 887}
{"info/global_step": 888, "train_info/time_within_train_step": 27.7054226398468, "step": 888}
{"train_info/time_between_train_steps": 0.005001544952392578, "step": 888}
{"info/global_step": 889, "train_info/time_within_train_step": 27.702757596969604, "step": 889}
{"train_info/time_between_train_steps": 0.004946231842041016, "step": 889}
{"info/global_step": 890, "train_info/time_within_train_step": 27.683587789535522, "step": 890}
{"train_info/time_between_train_steps": 0.009494304656982422, "step": 890}
{"info/global_step": 891, "train_info/time_within_train_step": 27.783833265304565, "step": 891}
{"train_info/time_between_train_steps": 0.0054552555084228516, "step": 891}
{"train_info/time_between_train_steps": 29.804793119430542, "step": 891}
{"info/global_step": 892, "train_info/time_within_train_step": 27.674879789352417, "step": 892}
{"train_info/time_between_train_steps": 0.0049591064453125, "step": 892}
{"info/global_step": 893, "train_info/time_within_train_step": 27.795053958892822, "step": 893}
{"train_info/time_between_train_steps": 0.004885435104370117, "step": 893}
{"info/global_step": 894, "train_info/time_within_train_step": 27.730618238449097, "step": 894}
{"train_info/time_between_train_steps": 0.005022525787353516, "step": 894}
{"info/global_step": 895, "train_info/time_within_train_step": 27.795719146728516, "step": 895}
{"train_info/time_between_train_steps": 0.005055665969848633, "step": 895}
{"info/global_step": 896, "train_info/time_within_train_step": 27.678985595703125, "step": 896}
{"train_info/time_between_train_steps": 0.004889726638793945, "step": 896}
{"info/global_step": 897, "train_info/time_within_train_step": 27.79135251045227, "step": 897}
{"train_info/time_between_train_steps": 0.007337331771850586, "step": 897}
{"info/global_step": 898, "train_info/time_within_train_step": 27.724390745162964, "step": 898}
{"train_info/time_between_train_steps": 0.00716400146484375, "step": 898}
{"info/global_step": 899, "train_info/time_within_train_step": 27.74332880973816, "step": 899}
{"train_info/time_between_train_steps": 0.005120992660522461, "step": 899}
{"info/global_step": 900, "train_info/time_within_train_step": 28.89875078201294, "step": 900}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740850770, "_runtime": 26719}, "step": 900}
{"logs": {"train/loss": 3.3039, "train/learning_rate": 0.00016666666666666666, "train/epoch": 33.01, "_timestamp": 1740850770, "_runtime": 26719}, "step": 900}
{"train_info/time_between_train_steps": 45.26551580429077, "step": 900}
{"info/global_step": 901, "train_info/time_within_train_step": 27.70385217666626, "step": 901}
{"train_info/time_between_train_steps": 0.004641056060791016, "step": 901}
{"info/global_step": 902, "train_info/time_within_train_step": 27.68757462501526, "step": 902}
{"train_info/time_between_train_steps": 0.004954814910888672, "step": 902}
{"info/global_step": 903, "train_info/time_within_train_step": 27.716274738311768, "step": 903}
{"train_info/time_between_train_steps": 0.004925966262817383, "step": 903}
{"info/global_step": 904, "train_info/time_within_train_step": 27.697364568710327, "step": 904}
{"train_info/time_between_train_steps": 0.005096912384033203, "step": 904}
{"info/global_step": 905, "train_info/time_within_train_step": 27.67770767211914, "step": 905}
{"train_info/time_between_train_steps": 0.005036354064941406, "step": 905}
{"info/global_step": 906, "train_info/time_within_train_step": 27.761990308761597, "step": 906}
{"train_info/time_between_train_steps": 0.00489044189453125, "step": 906}
{"info/global_step": 907, "train_info/time_within_train_step": 27.66882038116455, "step": 907}
{"train_info/time_between_train_steps": 0.00492405891418457, "step": 907}
{"info/global_step": 908, "train_info/time_within_train_step": 27.666944980621338, "step": 908}
{"train_info/time_between_train_steps": 0.005099058151245117, "step": 908}
{"info/global_step": 909, "train_info/time_within_train_step": 27.67121148109436, "step": 909}
{"train_info/time_between_train_steps": 0.004846334457397461, "step": 909}
{"info/global_step": 910, "train_info/time_within_train_step": 27.6857008934021, "step": 910}
{"train_info/time_between_train_steps": 0.0049326419830322266, "step": 910}
{"info/global_step": 911, "train_info/time_within_train_step": 27.678569078445435, "step": 911}
{"train_info/time_between_train_steps": 0.0049097537994384766, "step": 911}
{"info/global_step": 912, "train_info/time_within_train_step": 27.719058990478516, "step": 912}
{"train_info/time_between_train_steps": 0.004888296127319336, "step": 912}
{"info/global_step": 913, "train_info/time_within_train_step": 27.687885761260986, "step": 913}
{"train_info/time_between_train_steps": 0.005017280578613281, "step": 913}
{"info/global_step": 914, "train_info/time_within_train_step": 27.719244718551636, "step": 914}
{"train_info/time_between_train_steps": 0.0050296783447265625, "step": 914}
{"info/global_step": 915, "train_info/time_within_train_step": 27.70354700088501, "step": 915}
{"train_info/time_between_train_steps": 0.0051937103271484375, "step": 915}
{"info/global_step": 916, "train_info/time_within_train_step": 27.72683310508728, "step": 916}
{"train_info/time_between_train_steps": 0.005121469497680664, "step": 916}
{"info/global_step": 917, "train_info/time_within_train_step": 27.704691886901855, "step": 917}
{"train_info/time_between_train_steps": 0.005083560943603516, "step": 917}
{"info/global_step": 918, "train_info/time_within_train_step": 27.730708122253418, "step": 918}
{"train_info/time_between_train_steps": 0.00565791130065918, "step": 918}
{"train_info/time_between_train_steps": 30.122909545898438, "step": 918}
{"info/global_step": 919, "train_info/time_within_train_step": 27.72745943069458, "step": 919}
{"train_info/time_between_train_steps": 0.012470722198486328, "step": 919}
{"info/global_step": 920, "train_info/time_within_train_step": 28.007152318954468, "step": 920}
{"train_info/time_between_train_steps": 0.005845069885253906, "step": 920}
{"info/global_step": 921, "train_info/time_within_train_step": 27.767570972442627, "step": 921}
{"train_info/time_between_train_steps": 0.0048906803131103516, "step": 921}
{"info/global_step": 922, "train_info/time_within_train_step": 27.785916328430176, "step": 922}
{"train_info/time_between_train_steps": 0.0049114227294921875, "step": 922}
{"info/global_step": 923, "train_info/time_within_train_step": 27.696243286132812, "step": 923}
{"train_info/time_between_train_steps": 0.00534510612487793, "step": 923}
{"info/global_step": 924, "train_info/time_within_train_step": 29.475159168243408, "step": 924}
{"train_info/time_between_train_steps": 0.005399227142333984, "step": 924}
{"info/global_step": 925, "train_info/time_within_train_step": 27.709466218948364, "step": 925}
{"train_info/time_between_train_steps": 0.005091428756713867, "step": 925}
{"info/global_step": 926, "train_info/time_within_train_step": 27.75891661643982, "step": 926}
{"train_info/time_between_train_steps": 0.0051190853118896484, "step": 926}
{"info/global_step": 927, "train_info/time_within_train_step": 27.696956634521484, "step": 927}
{"train_info/time_between_train_steps": 0.004891395568847656, "step": 927}
{"info/global_step": 928, "train_info/time_within_train_step": 27.718759536743164, "step": 928}
{"train_info/time_between_train_steps": 0.004932880401611328, "step": 928}
{"info/global_step": 929, "train_info/time_within_train_step": 27.68552827835083, "step": 929}
{"train_info/time_between_train_steps": 0.004800558090209961, "step": 929}
{"info/global_step": 930, "train_info/time_within_train_step": 27.713728666305542, "step": 930}
{"train_info/time_between_train_steps": 0.00484156608581543, "step": 930}
{"info/global_step": 931, "train_info/time_within_train_step": 27.684489727020264, "step": 931}
{"train_info/time_between_train_steps": 0.00475311279296875, "step": 931}
{"info/global_step": 932, "train_info/time_within_train_step": 27.72183656692505, "step": 932}
{"train_info/time_between_train_steps": 0.0048503875732421875, "step": 932}
{"info/global_step": 933, "train_info/time_within_train_step": 27.677327871322632, "step": 933}
{"train_info/time_between_train_steps": 0.010462522506713867, "step": 933}
{"info/global_step": 934, "train_info/time_within_train_step": 27.690778493881226, "step": 934}
{"train_info/time_between_train_steps": 0.004829883575439453, "step": 934}
{"info/global_step": 935, "train_info/time_within_train_step": 27.691473245620728, "step": 935}
{"train_info/time_between_train_steps": 0.004842042922973633, "step": 935}
{"info/global_step": 936, "train_info/time_within_train_step": 27.77688980102539, "step": 936}
{"train_info/time_between_train_steps": 0.004910945892333984, "step": 936}
{"info/global_step": 937, "train_info/time_within_train_step": 27.684531450271606, "step": 937}
{"train_info/time_between_train_steps": 0.005032539367675781, "step": 937}
{"info/global_step": 938, "train_info/time_within_train_step": 27.68385887145996, "step": 938}
{"train_info/time_between_train_steps": 0.00955820083618164, "step": 938}
{"info/global_step": 939, "train_info/time_within_train_step": 27.770795583724976, "step": 939}
{"train_info/time_between_train_steps": 0.009311914443969727, "step": 939}
{"info/global_step": 940, "train_info/time_within_train_step": 27.677662134170532, "step": 940}
{"train_info/time_between_train_steps": 0.0048961639404296875, "step": 940}
{"info/global_step": 941, "train_info/time_within_train_step": 27.684374570846558, "step": 941}
{"train_info/time_between_train_steps": 0.00504612922668457, "step": 941}
{"info/global_step": 942, "train_info/time_within_train_step": 27.698890924453735, "step": 942}
{"train_info/time_between_train_steps": 0.004955291748046875, "step": 942}
{"info/global_step": 943, "train_info/time_within_train_step": 27.732757091522217, "step": 943}
{"train_info/time_between_train_steps": 0.009642601013183594, "step": 943}
{"info/global_step": 944, "train_info/time_within_train_step": 27.70550560951233, "step": 944}
{"train_info/time_between_train_steps": 0.005131244659423828, "step": 944}
{"info/global_step": 945, "train_info/time_within_train_step": 27.746062517166138, "step": 945}
{"train_info/time_between_train_steps": 0.005440473556518555, "step": 945}
{"train_info/time_between_train_steps": 30.173041582107544, "step": 945}
{"info/global_step": 946, "train_info/time_within_train_step": 27.72544836997986, "step": 946}
{"train_info/time_between_train_steps": 0.005124092102050781, "step": 946}
{"info/global_step": 947, "train_info/time_within_train_step": 27.832210063934326, "step": 947}
{"train_info/time_between_train_steps": 0.005255222320556641, "step": 947}
{"info/global_step": 948, "train_info/time_within_train_step": 27.694816827774048, "step": 948}
{"train_info/time_between_train_steps": 0.005127906799316406, "step": 948}
{"info/global_step": 949, "train_info/time_within_train_step": 27.808695077896118, "step": 949}
{"train_info/time_between_train_steps": 0.005349874496459961, "step": 949}
{"info/global_step": 950, "train_info/time_within_train_step": 27.70198702812195, "step": 950}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740852266, "_runtime": 28215}, "step": 950}
{"logs": {"train/loss": 3.2517, "train/learning_rate": 0.0001388888888888889, "train/epoch": 35.0, "_timestamp": 1740852266, "_runtime": 28215}, "step": 950}
{"train_info/time_between_train_steps": 0.02563619613647461, "step": 950}
{"info/global_step": 951, "train_info/time_within_train_step": 27.938244581222534, "step": 951}
{"train_info/time_between_train_steps": 0.005014181137084961, "step": 951}
{"info/global_step": 952, "train_info/time_within_train_step": 27.682576417922974, "step": 952}
{"train_info/time_between_train_steps": 0.0050809383392333984, "step": 952}
{"info/global_step": 953, "train_info/time_within_train_step": 27.774165630340576, "step": 953}
{"train_info/time_between_train_steps": 0.0050776004791259766, "step": 953}
{"info/global_step": 954, "train_info/time_within_train_step": 27.706505060195923, "step": 954}
{"train_info/time_between_train_steps": 0.0047762393951416016, "step": 954}
{"info/global_step": 955, "train_info/time_within_train_step": 27.668495416641235, "step": 955}
{"train_info/time_between_train_steps": 0.004809379577636719, "step": 955}
{"info/global_step": 956, "train_info/time_within_train_step": 27.67198133468628, "step": 956}
{"train_info/time_between_train_steps": 0.004809856414794922, "step": 956}
{"info/global_step": 957, "train_info/time_within_train_step": 27.71132516860962, "step": 957}
{"train_info/time_between_train_steps": 0.004769563674926758, "step": 957}
{"info/global_step": 958, "train_info/time_within_train_step": 27.68324041366577, "step": 958}
{"train_info/time_between_train_steps": 0.0048258304595947266, "step": 958}
{"info/global_step": 959, "train_info/time_within_train_step": 27.741595029830933, "step": 959}
{"train_info/time_between_train_steps": 0.00492548942565918, "step": 959}
{"info/global_step": 960, "train_info/time_within_train_step": 27.69749116897583, "step": 960}
{"train_info/time_between_train_steps": 0.0050241947174072266, "step": 960}
{"info/global_step": 961, "train_info/time_within_train_step": 27.73287081718445, "step": 961}
{"train_info/time_between_train_steps": 0.005017757415771484, "step": 961}
{"info/global_step": 962, "train_info/time_within_train_step": 27.684839248657227, "step": 962}
{"train_info/time_between_train_steps": 0.005012035369873047, "step": 962}
{"info/global_step": 963, "train_info/time_within_train_step": 27.6839337348938, "step": 963}
{"train_info/time_between_train_steps": 0.004934787750244141, "step": 963}
{"info/global_step": 964, "train_info/time_within_train_step": 27.73786187171936, "step": 964}
{"train_info/time_between_train_steps": 0.004908323287963867, "step": 964}
{"info/global_step": 965, "train_info/time_within_train_step": 27.695863962173462, "step": 965}
{"train_info/time_between_train_steps": 0.004930734634399414, "step": 965}
{"info/global_step": 966, "train_info/time_within_train_step": 27.72150731086731, "step": 966}
{"train_info/time_between_train_steps": 0.00490570068359375, "step": 966}
{"info/global_step": 967, "train_info/time_within_train_step": 27.77740454673767, "step": 967}
{"train_info/time_between_train_steps": 0.0048770904541015625, "step": 967}
{"info/global_step": 968, "train_info/time_within_train_step": 27.677809238433838, "step": 968}
{"train_info/time_between_train_steps": 0.004970550537109375, "step": 968}
{"info/global_step": 969, "train_info/time_within_train_step": 27.689607620239258, "step": 969}
{"train_info/time_between_train_steps": 0.0050160884857177734, "step": 969}
{"info/global_step": 970, "train_info/time_within_train_step": 27.721258640289307, "step": 970}
{"train_info/time_between_train_steps": 0.005247831344604492, "step": 970}
{"info/global_step": 971, "train_info/time_within_train_step": 27.69359016418457, "step": 971}
{"train_info/time_between_train_steps": 0.005462646484375, "step": 971}
{"info/global_step": 972, "train_info/time_within_train_step": 27.70785093307495, "step": 972}
{"train_info/time_between_train_steps": 0.005631923675537109, "step": 972}
{"train_info/time_between_train_steps": 29.86201548576355, "step": 972}
{"info/global_step": 973, "train_info/time_within_train_step": 27.67912745475769, "step": 973}
{"train_info/time_between_train_steps": 0.004904985427856445, "step": 973}
{"info/global_step": 974, "train_info/time_within_train_step": 27.78260898590088, "step": 974}
{"train_info/time_between_train_steps": 0.0048999786376953125, "step": 974}
{"info/global_step": 975, "train_info/time_within_train_step": 27.674346685409546, "step": 975}
{"train_info/time_between_train_steps": 0.004889249801635742, "step": 975}
{"info/global_step": 976, "train_info/time_within_train_step": 27.808800220489502, "step": 976}
{"train_info/time_between_train_steps": 0.004987001419067383, "step": 976}
{"info/global_step": 977, "train_info/time_within_train_step": 27.68191123008728, "step": 977}
{"train_info/time_between_train_steps": 0.0049169063568115234, "step": 977}
{"info/global_step": 978, "train_info/time_within_train_step": 27.79277276992798, "step": 978}
{"train_info/time_between_train_steps": 0.004929542541503906, "step": 978}
{"info/global_step": 979, "train_info/time_within_train_step": 27.681364059448242, "step": 979}
{"train_info/time_between_train_steps": 0.004934549331665039, "step": 979}
{"info/global_step": 980, "train_info/time_within_train_step": 27.77244257926941, "step": 980}
{"train_info/time_between_train_steps": 0.005151271820068359, "step": 980}
{"info/global_step": 981, "train_info/time_within_train_step": 27.827749252319336, "step": 981}
{"train_info/time_between_train_steps": 0.005184650421142578, "step": 981}
{"info/global_step": 982, "train_info/time_within_train_step": 27.70582342147827, "step": 982}
{"train_info/time_between_train_steps": 0.005141735076904297, "step": 982}
{"info/global_step": 983, "train_info/time_within_train_step": 27.68125629425049, "step": 983}
{"train_info/time_between_train_steps": 0.005137443542480469, "step": 983}
{"info/global_step": 984, "train_info/time_within_train_step": 27.709975719451904, "step": 984}
{"train_info/time_between_train_steps": 0.004925966262817383, "step": 984}
{"info/global_step": 985, "train_info/time_within_train_step": 27.693689823150635, "step": 985}
{"train_info/time_between_train_steps": 0.0056285858154296875, "step": 985}
{"info/global_step": 986, "train_info/time_within_train_step": 27.679486751556396, "step": 986}
{"train_info/time_between_train_steps": 0.005175352096557617, "step": 986}
{"info/global_step": 987, "train_info/time_within_train_step": 27.684715747833252, "step": 987}
{"train_info/time_between_train_steps": 0.005450248718261719, "step": 987}
{"info/global_step": 988, "train_info/time_within_train_step": 27.675952434539795, "step": 988}
{"train_info/time_between_train_steps": 0.005146503448486328, "step": 988}
{"info/global_step": 989, "train_info/time_within_train_step": 27.669283866882324, "step": 989}
{"train_info/time_between_train_steps": 0.0048334598541259766, "step": 989}
{"info/global_step": 990, "train_info/time_within_train_step": 27.66947603225708, "step": 990}
{"train_info/time_between_train_steps": 0.004849910736083984, "step": 990}
{"info/global_step": 991, "train_info/time_within_train_step": 27.669990301132202, "step": 991}
{"train_info/time_between_train_steps": 0.0051174163818359375, "step": 991}
{"info/global_step": 992, "train_info/time_within_train_step": 27.70541548728943, "step": 992}
{"train_info/time_between_train_steps": 0.004925727844238281, "step": 992}
{"info/global_step": 993, "train_info/time_within_train_step": 27.684295654296875, "step": 993}
{"train_info/time_between_train_steps": 0.006127119064331055, "step": 993}
{"info/global_step": 994, "train_info/time_within_train_step": 27.68722915649414, "step": 994}
{"train_info/time_between_train_steps": 0.005240201950073242, "step": 994}
{"info/global_step": 995, "train_info/time_within_train_step": 27.70956826210022, "step": 995}
{"train_info/time_between_train_steps": 0.004973888397216797, "step": 995}
{"info/global_step": 996, "train_info/time_within_train_step": 27.70260238647461, "step": 996}
{"train_info/time_between_train_steps": 0.005582094192504883, "step": 996}
{"info/global_step": 997, "train_info/time_within_train_step": 27.799703359603882, "step": 997}
{"train_info/time_between_train_steps": 0.005698680877685547, "step": 997}
{"info/global_step": 998, "train_info/time_within_train_step": 27.686805963516235, "step": 998}
{"train_info/time_between_train_steps": 0.0054209232330322266, "step": 998}
{"info/global_step": 999, "train_info/time_within_train_step": 27.731101751327515, "step": 999}
{"train_info/time_between_train_steps": 0.005412578582763672, "step": 999}
{"train_info/time_between_train_steps": 31.865500688552856, "step": 999}
{"info/global_step": 1000, "train_info/time_within_train_step": 28.28204655647278, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 22626.0, "train_info/memory_max_reserved": 22626.0, "_timestamp": 1740853716, "_runtime": 29665}, "step": 1000}
{"logs": {"train/loss": 3.2036, "train/learning_rate": 0.00011111111111111109, "train/epoch": 37.0, "_timestamp": 1740853716, "_runtime": 29665}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740853721, "_runtime": 29670}, "step": 1000}
{"logs": {"eval/loss": 4.179767608642578, "eval/runtime": 5.1227, "eval/samples_per_second": 39.628, "eval/steps_per_second": 2.538, "train/epoch": 37.0, "_timestamp": 1740853721, "_runtime": 29670}, "step": 1000}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740853721, "_runtime": 29670}, "step": 1000}
{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.179767608642578, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 65.35066451958149, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1227, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 39.628, "train/epoch": 37.0, "_timestamp": 1740853721, "_runtime": 29670}, "step": 1000}
{"train_info/time_between_train_steps": 45.9484076499939, "step": 1000}
{"info/global_step": 1001, "train_info/time_within_train_step": 27.837408781051636, "step": 1001}
{"train_info/time_between_train_steps": 0.00507664680480957, "step": 1001}
{"info/global_step": 1002, "train_info/time_within_train_step": 27.69816517829895, "step": 1002}
{"train_info/time_between_train_steps": 0.005040645599365234, "step": 1002}
{"info/global_step": 1003, "train_info/time_within_train_step": 27.81215238571167, "step": 1003}
{"train_info/time_between_train_steps": 0.005277156829833984, "step": 1003}
{"info/global_step": 1004, "train_info/time_within_train_step": 27.694470643997192, "step": 1004}
{"train_info/time_between_train_steps": 0.0050203800201416016, "step": 1004}
{"info/global_step": 1005, "train_info/time_within_train_step": 27.80090045928955, "step": 1005}
{"train_info/time_between_train_steps": 0.005087137222290039, "step": 1005}
{"info/global_step": 1006, "train_info/time_within_train_step": 27.69578719139099, "step": 1006}
{"train_info/time_between_train_steps": 0.005076169967651367, "step": 1006}
{"info/global_step": 1007, "train_info/time_within_train_step": 27.76434874534607, "step": 1007}
{"train_info/time_between_train_steps": 0.00501561164855957, "step": 1007}
{"info/global_step": 1008, "train_info/time_within_train_step": 27.687906980514526, "step": 1008}
{"train_info/time_between_train_steps": 0.00561976432800293, "step": 1008}
{"info/global_step": 1009, "train_info/time_within_train_step": 27.67438244819641, "step": 1009}
{"train_info/time_between_train_steps": 0.004801750183105469, "step": 1009}
{"info/global_step": 1010, "train_info/time_within_train_step": 27.683626651763916, "step": 1010}
{"train_info/time_between_train_steps": 0.0047855377197265625, "step": 1010}
{"info/global_step": 1011, "train_info/time_within_train_step": 27.670052766799927, "step": 1011}
{"train_info/time_between_train_steps": 0.004802227020263672, "step": 1011}
{"info/global_step": 1012, "train_info/time_within_train_step": 27.803303003311157, "step": 1012}
{"train_info/time_between_train_steps": 0.004975795745849609, "step": 1012}
{"info/global_step": 1013, "train_info/time_within_train_step": 27.694621801376343, "step": 1013}
{"train_info/time_between_train_steps": 0.004976987838745117, "step": 1013}
{"info/global_step": 1014, "train_info/time_within_train_step": 27.69673466682434, "step": 1014}
{"train_info/time_between_train_steps": 0.004991769790649414, "step": 1014}
{"info/global_step": 1015, "train_info/time_within_train_step": 27.673216581344604, "step": 1015}
{"train_info/time_between_train_steps": 0.004970073699951172, "step": 1015}
{"info/global_step": 1016, "train_info/time_within_train_step": 27.689252853393555, "step": 1016}
{"train_info/time_between_train_steps": 0.00968480110168457, "step": 1016}
{"info/global_step": 1017, "train_info/time_within_train_step": 27.76191020011902, "step": 1017}
{"train_info/time_between_train_steps": 0.0048961639404296875, "step": 1017}
{"info/global_step": 1018, "train_info/time_within_train_step": 27.715384244918823, "step": 1018}
{"train_info/time_between_train_steps": 0.009560823440551758, "step": 1018}
{"info/global_step": 1019, "train_info/time_within_train_step": 27.67725896835327, "step": 1019}
{"train_info/time_between_train_steps": 0.009600400924682617, "step": 1019}
{"info/global_step": 1020, "train_info/time_within_train_step": 27.671130180358887, "step": 1020}
{"train_info/time_between_train_steps": 0.009505987167358398, "step": 1020}
{"info/global_step": 1021, "train_info/time_within_train_step": 28.24190354347229, "step": 1021}
{"train_info/time_between_train_steps": 0.0053958892822265625, "step": 1021}
{"info/global_step": 1022, "train_info/time_within_train_step": 28.01408362388611, "step": 1022}
{"train_info/time_between_train_steps": 0.009936809539794922, "step": 1022}
{"info/global_step": 1023, "train_info/time_within_train_step": 27.698705196380615, "step": 1023}
{"train_info/time_between_train_steps": 0.005206108093261719, "step": 1023}
{"info/global_step": 1024, "train_info/time_within_train_step": 27.699064254760742, "step": 1024}
{"train_info/time_between_train_steps": 0.005106687545776367, "step": 1024}
{"info/global_step": 1025, "train_info/time_within_train_step": 27.740069150924683, "step": 1025}
{"train_info/time_between_train_steps": 0.005167961120605469, "step": 1025}
{"info/global_step": 1026, "train_info/time_within_train_step": 27.718387842178345, "step": 1026}
{"train_info/time_between_train_steps": 0.005465030670166016, "step": 1026}
{"train_info/time_between_train_steps": 30.292476892471313, "step": 1026}
{"info/global_step": 1027, "train_info/time_within_train_step": 27.689913988113403, "step": 1027}
{"train_info/time_between_train_steps": 0.0049135684967041016, "step": 1027}
{"info/global_step": 1028, "train_info/time_within_train_step": 27.828578233718872, "step": 1028}
{"train_info/time_between_train_steps": 0.004880666732788086, "step": 1028}
{"info/global_step": 1029, "train_info/time_within_train_step": 27.674129962921143, "step": 1029}
{"train_info/time_between_train_steps": 0.0049588680267333984, "step": 1029}
{"info/global_step": 1030, "train_info/time_within_train_step": 27.794133186340332, "step": 1030}
{"train_info/time_between_train_steps": 0.00517725944519043, "step": 1030}
{"info/global_step": 1031, "train_info/time_within_train_step": 27.681121349334717, "step": 1031}
{"train_info/time_between_train_steps": 0.005063533782958984, "step": 1031}
{"info/global_step": 1032, "train_info/time_within_train_step": 27.843863010406494, "step": 1032}
{"train_info/time_between_train_steps": 0.0051422119140625, "step": 1032}
{"info/global_step": 1033, "train_info/time_within_train_step": 27.70227289199829, "step": 1033}
{"train_info/time_between_train_steps": 0.005079746246337891, "step": 1033}
{"info/global_step": 1034, "train_info/time_within_train_step": 27.745685338974, "step": 1034}
{"train_info/time_between_train_steps": 0.005156517028808594, "step": 1034}
{"info/global_step": 1035, "train_info/time_within_train_step": 27.68821144104004, "step": 1035}
{"train_info/time_between_train_steps": 0.004775047302246094, "step": 1035}
{"info/global_step": 1036, "train_info/time_within_train_step": 27.667786598205566, "step": 1036}
{"train_info/time_between_train_steps": 0.004781007766723633, "step": 1036}
{"info/global_step": 1037, "train_info/time_within_train_step": 27.709097862243652, "step": 1037}
{"train_info/time_between_train_steps": 0.004791259765625, "step": 1037}
{"info/global_step": 1038, "train_info/time_within_train_step": 27.667290210723877, "step": 1038}
{"train_info/time_between_train_steps": 0.0047605037689208984, "step": 1038}
{"info/global_step": 1039, "train_info/time_within_train_step": 27.66750192642212, "step": 1039}
{"train_info/time_between_train_steps": 0.00472712516784668, "step": 1039}
{"info/global_step": 1040, "train_info/time_within_train_step": 27.665059566497803, "step": 1040}
{"train_info/time_between_train_steps": 0.0048427581787109375, "step": 1040}
{"info/global_step": 1041, "train_info/time_within_train_step": 27.679503679275513, "step": 1041}
{"train_info/time_between_train_steps": 0.0047838687896728516, "step": 1041}
{"info/global_step": 1042, "train_info/time_within_train_step": 27.776715755462646, "step": 1042}
{"train_info/time_between_train_steps": 0.004834413528442383, "step": 1042}
{"info/global_step": 1043, "train_info/time_within_train_step": 27.673070669174194, "step": 1043}
{"train_info/time_between_train_steps": 0.004947185516357422, "step": 1043}
{"info/global_step": 1044, "train_info/time_within_train_step": 27.684876203536987, "step": 1044}
{"train_info/time_between_train_steps": 0.004996061325073242, "step": 1044}
{"info/global_step": 1045, "train_info/time_within_train_step": 27.7279531955719, "step": 1045}
{"train_info/time_between_train_steps": 0.009791374206542969, "step": 1045}
{"info/global_step": 1046, "train_info/time_within_train_step": 27.686697721481323, "step": 1046}
{"train_info/time_between_train_steps": 0.004957437515258789, "step": 1046}
{"info/global_step": 1047, "train_info/time_within_train_step": 27.675090551376343, "step": 1047}
{"train_info/time_between_train_steps": 0.004918813705444336, "step": 1047}
{"info/global_step": 1048, "train_info/time_within_train_step": 27.673603773117065, "step": 1048}
{"train_info/time_between_train_steps": 0.004923820495605469, "step": 1048}
{"info/global_step": 1049, "train_info/time_within_train_step": 27.684213876724243, "step": 1049}
{"train_info/time_between_train_steps": 0.005010128021240234, "step": 1049}
{"info/global_step": 1050, "train_info/time_within_train_step": 27.67605233192444, "step": 1050}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740855181, "_runtime": 31130}, "step": 1050}
{"logs": {"train/loss": 3.1032, "train/learning_rate": 8.333333333333333e-05, "train/epoch": 38.02, "_timestamp": 1740855181, "_runtime": 31130}, "step": 1050}
{"train_info/time_between_train_steps": 0.02540874481201172, "step": 1050}
{"info/global_step": 1051, "train_info/time_within_train_step": 27.676450490951538, "step": 1051}
{"train_info/time_between_train_steps": 0.004914760589599609, "step": 1051}
{"info/global_step": 1052, "train_info/time_within_train_step": 27.68729066848755, "step": 1052}
{"train_info/time_between_train_steps": 0.005120754241943359, "step": 1052}
{"info/global_step": 1053, "train_info/time_within_train_step": 27.69151282310486, "step": 1053}
{"train_info/time_between_train_steps": 0.005424976348876953, "step": 1053}
{"train_info/time_between_train_steps": 29.80830216407776, "step": 1053}
{"info/global_step": 1054, "train_info/time_within_train_step": 27.695092916488647, "step": 1054}
{"train_info/time_between_train_steps": 0.005778789520263672, "step": 1054}
{"info/global_step": 1055, "train_info/time_within_train_step": 27.806375980377197, "step": 1055}
{"train_info/time_between_train_steps": 0.004920482635498047, "step": 1055}
{"info/global_step": 1056, "train_info/time_within_train_step": 27.775171041488647, "step": 1056}
{"train_info/time_between_train_steps": 0.004980802536010742, "step": 1056}
{"info/global_step": 1057, "train_info/time_within_train_step": 27.784335374832153, "step": 1057}
{"train_info/time_between_train_steps": 0.009524345397949219, "step": 1057}
{"info/global_step": 1058, "train_info/time_within_train_step": 27.676077604293823, "step": 1058}
{"train_info/time_between_train_steps": 0.009401082992553711, "step": 1058}
{"info/global_step": 1059, "train_info/time_within_train_step": 27.803493976593018, "step": 1059}
{"train_info/time_between_train_steps": 0.008848905563354492, "step": 1059}
{"info/global_step": 1060, "train_info/time_within_train_step": 27.689388036727905, "step": 1060}
{"train_info/time_between_train_steps": 0.004886627197265625, "step": 1060}
{"info/global_step": 1061, "train_info/time_within_train_step": 27.730841875076294, "step": 1061}
{"train_info/time_between_train_steps": 0.004877328872680664, "step": 1061}
{"info/global_step": 1062, "train_info/time_within_train_step": 27.693867206573486, "step": 1062}
{"train_info/time_between_train_steps": 0.004689455032348633, "step": 1062}
{"info/global_step": 1063, "train_info/time_within_train_step": 27.65892004966736, "step": 1063}
{"train_info/time_between_train_steps": 0.004697322845458984, "step": 1063}
{"info/global_step": 1064, "train_info/time_within_train_step": 27.66943907737732, "step": 1064}
{"train_info/time_between_train_steps": 0.0047149658203125, "step": 1064}
{"info/global_step": 1065, "train_info/time_within_train_step": 27.66978693008423, "step": 1065}
{"train_info/time_between_train_steps": 0.004691362380981445, "step": 1065}
{"info/global_step": 1066, "train_info/time_within_train_step": 27.708312511444092, "step": 1066}
{"train_info/time_between_train_steps": 0.0048067569732666016, "step": 1066}
{"info/global_step": 1067, "train_info/time_within_train_step": 27.68553876876831, "step": 1067}
{"train_info/time_between_train_steps": 0.004884958267211914, "step": 1067}
{"info/global_step": 1068, "train_info/time_within_train_step": 27.689347982406616, "step": 1068}
{"train_info/time_between_train_steps": 0.005012035369873047, "step": 1068}
{"info/global_step": 1069, "train_info/time_within_train_step": 27.683759689331055, "step": 1069}
{"train_info/time_between_train_steps": 0.004987478256225586, "step": 1069}
{"info/global_step": 1070, "train_info/time_within_train_step": 27.705440998077393, "step": 1070}
{"train_info/time_between_train_steps": 0.0049974918365478516, "step": 1070}
{"info/global_step": 1071, "train_info/time_within_train_step": 27.675816297531128, "step": 1071}
{"train_info/time_between_train_steps": 0.0049114227294921875, "step": 1071}
{"info/global_step": 1072, "train_info/time_within_train_step": 27.804784059524536, "step": 1072}
{"train_info/time_between_train_steps": 0.004919290542602539, "step": 1072}
{"info/global_step": 1073, "train_info/time_within_train_step": 27.701993703842163, "step": 1073}
{"train_info/time_between_train_steps": 0.005866050720214844, "step": 1073}
{"info/global_step": 1074, "train_info/time_within_train_step": 27.694175004959106, "step": 1074}
{"train_info/time_between_train_steps": 0.004905223846435547, "step": 1074}
{"info/global_step": 1075, "train_info/time_within_train_step": 27.679261445999146, "step": 1075}
{"train_info/time_between_train_steps": 0.005095005035400391, "step": 1075}
{"info/global_step": 1076, "train_info/time_within_train_step": 27.68309712409973, "step": 1076}
{"train_info/time_between_train_steps": 0.005004167556762695, "step": 1076}
{"info/global_step": 1077, "train_info/time_within_train_step": 27.688883304595947, "step": 1077}
{"train_info/time_between_train_steps": 0.005163431167602539, "step": 1077}
{"info/global_step": 1078, "train_info/time_within_train_step": 27.702832221984863, "step": 1078}
{"train_info/time_between_train_steps": 0.005207061767578125, "step": 1078}
{"info/global_step": 1079, "train_info/time_within_train_step": 27.728931665420532, "step": 1079}
{"train_info/time_between_train_steps": 0.005362510681152344, "step": 1079}
{"info/global_step": 1080, "train_info/time_within_train_step": 27.72173500061035, "step": 1080}
{"train_info/time_between_train_steps": 0.005534648895263672, "step": 1080}
{"train_info/time_between_train_steps": 30.02582597732544, "step": 1080}
{"info/global_step": 1081, "train_info/time_within_train_step": 27.67504334449768, "step": 1081}
{"train_info/time_between_train_steps": 0.00487828254699707, "step": 1081}
{"info/global_step": 1082, "train_info/time_within_train_step": 27.796360969543457, "step": 1082}
{"train_info/time_between_train_steps": 0.004873991012573242, "step": 1082}
{"info/global_step": 1083, "train_info/time_within_train_step": 27.721129417419434, "step": 1083}
{"train_info/time_between_train_steps": 0.004914283752441406, "step": 1083}
{"info/global_step": 1084, "train_info/time_within_train_step": 27.773406505584717, "step": 1084}
{"train_info/time_between_train_steps": 0.00483250617980957, "step": 1084}
{"info/global_step": 1085, "train_info/time_within_train_step": 27.67207169532776, "step": 1085}
{"train_info/time_between_train_steps": 0.004860877990722656, "step": 1085}
{"info/global_step": 1086, "train_info/time_within_train_step": 27.80374813079834, "step": 1086}
{"train_info/time_between_train_steps": 0.0048944950103759766, "step": 1086}
{"info/global_step": 1087, "train_info/time_within_train_step": 27.786004304885864, "step": 1087}
{"train_info/time_between_train_steps": 0.004897117614746094, "step": 1087}
{"info/global_step": 1088, "train_info/time_within_train_step": 27.746264219284058, "step": 1088}
{"train_info/time_between_train_steps": 0.005034685134887695, "step": 1088}
{"info/global_step": 1089, "train_info/time_within_train_step": 27.691611766815186, "step": 1089}
{"train_info/time_between_train_steps": 0.004956722259521484, "step": 1089}
{"info/global_step": 1090, "train_info/time_within_train_step": 27.67954707145691, "step": 1090}
{"train_info/time_between_train_steps": 0.005037784576416016, "step": 1090}
{"info/global_step": 1091, "train_info/time_within_train_step": 27.676440715789795, "step": 1091}
{"train_info/time_between_train_steps": 0.004950046539306641, "step": 1091}
{"info/global_step": 1092, "train_info/time_within_train_step": 27.678266286849976, "step": 1092}
{"train_info/time_between_train_steps": 0.004917621612548828, "step": 1092}
{"info/global_step": 1093, "train_info/time_within_train_step": 27.672656297683716, "step": 1093}
{"train_info/time_between_train_steps": 0.004774808883666992, "step": 1093}
{"info/global_step": 1094, "train_info/time_within_train_step": 27.684431552886963, "step": 1094}
{"train_info/time_between_train_steps": 0.004815578460693359, "step": 1094}
{"info/global_step": 1095, "train_info/time_within_train_step": 27.699134588241577, "step": 1095}
{"train_info/time_between_train_steps": 0.004881143569946289, "step": 1095}
{"info/global_step": 1096, "train_info/time_within_train_step": 27.677995443344116, "step": 1096}
{"train_info/time_between_train_steps": 0.004858970642089844, "step": 1096}
{"info/global_step": 1097, "train_info/time_within_train_step": 27.690423011779785, "step": 1097}
{"train_info/time_between_train_steps": 0.004859447479248047, "step": 1097}
{"info/global_step": 1098, "train_info/time_within_train_step": 27.66803812980652, "step": 1098}
{"train_info/time_between_train_steps": 0.004816770553588867, "step": 1098}
{"info/global_step": 1099, "train_info/time_within_train_step": 28.182527542114258, "step": 1099}
{"train_info/time_between_train_steps": 0.004991769790649414, "step": 1099}
{"info/global_step": 1100, "train_info/time_within_train_step": 28.494115829467773, "step": 1100}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740856629, "_runtime": 32578}, "step": 1100}
{"logs": {"train/loss": 3.1282, "train/learning_rate": 5.5555555555555545e-05, "train/epoch": 40.02, "_timestamp": 1740856629, "_runtime": 32578}, "step": 1100}
{"train_info/time_between_train_steps": 42.37265753746033, "step": 1100}
{"info/global_step": 1101, "train_info/time_within_train_step": 27.692761659622192, "step": 1101}
{"train_info/time_between_train_steps": 0.004929542541503906, "step": 1101}
{"info/global_step": 1102, "train_info/time_within_train_step": 27.789745092391968, "step": 1102}
{"train_info/time_between_train_steps": 0.00485992431640625, "step": 1102}
{"info/global_step": 1103, "train_info/time_within_train_step": 27.676003456115723, "step": 1103}
{"train_info/time_between_train_steps": 0.005030632019042969, "step": 1103}
{"info/global_step": 1104, "train_info/time_within_train_step": 27.680352449417114, "step": 1104}
{"train_info/time_between_train_steps": 0.004987239837646484, "step": 1104}
{"info/global_step": 1105, "train_info/time_within_train_step": 27.678697109222412, "step": 1105}
{"train_info/time_between_train_steps": 0.005013704299926758, "step": 1105}
{"info/global_step": 1106, "train_info/time_within_train_step": 27.67962884902954, "step": 1106}
{"train_info/time_between_train_steps": 0.005142927169799805, "step": 1106}
{"info/global_step": 1107, "train_info/time_within_train_step": 27.691576957702637, "step": 1107}
{"train_info/time_between_train_steps": 0.005461692810058594, "step": 1107}
{"train_info/time_between_train_steps": 30.07877230644226, "step": 1107}
{"info/global_step": 1108, "train_info/time_within_train_step": 27.692732572555542, "step": 1108}
{"train_info/time_between_train_steps": 0.005208492279052734, "step": 1108}
{"info/global_step": 1109, "train_info/time_within_train_step": 27.829736709594727, "step": 1109}
{"train_info/time_between_train_steps": 0.0050890445709228516, "step": 1109}
{"info/global_step": 1110, "train_info/time_within_train_step": 27.730689764022827, "step": 1110}
{"train_info/time_between_train_steps": 0.00506591796875, "step": 1110}
{"info/global_step": 1111, "train_info/time_within_train_step": 27.80470323562622, "step": 1111}
{"train_info/time_between_train_steps": 0.005137443542480469, "step": 1111}
{"info/global_step": 1112, "train_info/time_within_train_step": 27.687325954437256, "step": 1112}
{"train_info/time_between_train_steps": 0.0051364898681640625, "step": 1112}
{"info/global_step": 1113, "train_info/time_within_train_step": 27.799099683761597, "step": 1113}
{"train_info/time_between_train_steps": 0.005001544952392578, "step": 1113}
{"info/global_step": 1114, "train_info/time_within_train_step": 27.725959300994873, "step": 1114}
{"train_info/time_between_train_steps": 0.0050542354583740234, "step": 1114}
{"info/global_step": 1115, "train_info/time_within_train_step": 27.731789588928223, "step": 1115}
{"train_info/time_between_train_steps": 0.005156040191650391, "step": 1115}
{"info/global_step": 1116, "train_info/time_within_train_step": 27.686558961868286, "step": 1116}
{"train_info/time_between_train_steps": 0.0047550201416015625, "step": 1116}
{"info/global_step": 1117, "train_info/time_within_train_step": 27.992826223373413, "step": 1117}
{"train_info/time_between_train_steps": 0.005074262619018555, "step": 1117}
{"info/global_step": 1118, "train_info/time_within_train_step": 28.333396673202515, "step": 1118}
{"train_info/time_between_train_steps": 0.00502324104309082, "step": 1118}
{"info/global_step": 1119, "train_info/time_within_train_step": 28.143287420272827, "step": 1119}
{"train_info/time_between_train_steps": 0.004838466644287109, "step": 1119}
{"info/global_step": 1120, "train_info/time_within_train_step": 27.69369864463806, "step": 1120}
{"train_info/time_between_train_steps": 0.004889011383056641, "step": 1120}
{"info/global_step": 1121, "train_info/time_within_train_step": 27.71147608757019, "step": 1121}
{"train_info/time_between_train_steps": 0.005092144012451172, "step": 1121}
{"info/global_step": 1122, "train_info/time_within_train_step": 27.687582969665527, "step": 1122}
{"train_info/time_between_train_steps": 0.004998922348022461, "step": 1122}
{"info/global_step": 1123, "train_info/time_within_train_step": 27.70512318611145, "step": 1123}
{"train_info/time_between_train_steps": 0.0051801204681396484, "step": 1123}
{"info/global_step": 1124, "train_info/time_within_train_step": 27.681578397750854, "step": 1124}
{"train_info/time_between_train_steps": 0.0049626827239990234, "step": 1124}
{"info/global_step": 1125, "train_info/time_within_train_step": 27.851972341537476, "step": 1125}
{"train_info/time_between_train_steps": 0.010074615478515625, "step": 1125}
{"info/global_step": 1126, "train_info/time_within_train_step": 28.030656576156616, "step": 1126}
{"train_info/time_between_train_steps": 0.0094146728515625, "step": 1126}
{"info/global_step": 1127, "train_info/time_within_train_step": 27.735562801361084, "step": 1127}
{"train_info/time_between_train_steps": 0.004916667938232422, "step": 1127}
{"info/global_step": 1128, "train_info/time_within_train_step": 27.68979787826538, "step": 1128}
{"train_info/time_between_train_steps": 0.004988431930541992, "step": 1128}
{"info/global_step": 1129, "train_info/time_within_train_step": 27.72968077659607, "step": 1129}
{"train_info/time_between_train_steps": 0.0048639774322509766, "step": 1129}
{"info/global_step": 1130, "train_info/time_within_train_step": 27.71677303314209, "step": 1130}
{"train_info/time_between_train_steps": 0.0050466060638427734, "step": 1130}
{"info/global_step": 1131, "train_info/time_within_train_step": 27.70972776412964, "step": 1131}
{"train_info/time_between_train_steps": 0.005130290985107422, "step": 1131}
{"info/global_step": 1132, "train_info/time_within_train_step": 27.70779514312744, "step": 1132}
{"train_info/time_between_train_steps": 0.005143880844116211, "step": 1132}
{"info/global_step": 1133, "train_info/time_within_train_step": 27.778823852539062, "step": 1133}
{"train_info/time_between_train_steps": 0.005446434020996094, "step": 1133}
{"info/global_step": 1134, "train_info/time_within_train_step": 27.72339105606079, "step": 1134}
{"train_info/time_between_train_steps": 0.005533456802368164, "step": 1134}
{"train_info/time_between_train_steps": 29.957901000976562, "step": 1134}
{"info/global_step": 1135, "train_info/time_within_train_step": 27.73313570022583, "step": 1135}
{"train_info/time_between_train_steps": 0.005877494812011719, "step": 1135}
{"info/global_step": 1136, "train_info/time_within_train_step": 27.80004596710205, "step": 1136}
{"train_info/time_between_train_steps": 0.00487208366394043, "step": 1136}
{"info/global_step": 1137, "train_info/time_within_train_step": 27.699987649917603, "step": 1137}
{"train_info/time_between_train_steps": 0.004783153533935547, "step": 1137}
{"info/global_step": 1138, "train_info/time_within_train_step": 27.8054461479187, "step": 1138}
{"train_info/time_between_train_steps": 0.004898548126220703, "step": 1138}
{"info/global_step": 1139, "train_info/time_within_train_step": 27.7035653591156, "step": 1139}
{"train_info/time_between_train_steps": 0.006071329116821289, "step": 1139}
{"info/global_step": 1140, "train_info/time_within_train_step": 28.05338764190674, "step": 1140}
{"train_info/time_between_train_steps": 0.005099058151245117, "step": 1140}
{"info/global_step": 1141, "train_info/time_within_train_step": 27.75528383255005, "step": 1141}
{"train_info/time_between_train_steps": 0.005220174789428711, "step": 1141}
{"info/global_step": 1142, "train_info/time_within_train_step": 27.77657389640808, "step": 1142}
{"train_info/time_between_train_steps": 0.0050160884857177734, "step": 1142}
{"info/global_step": 1143, "train_info/time_within_train_step": 27.726791858673096, "step": 1143}
{"train_info/time_between_train_steps": 0.004811763763427734, "step": 1143}
{"info/global_step": 1144, "train_info/time_within_train_step": 27.695000410079956, "step": 1144}
{"train_info/time_between_train_steps": 0.005006074905395508, "step": 1144}
{"info/global_step": 1145, "train_info/time_within_train_step": 27.68716835975647, "step": 1145}
{"train_info/time_between_train_steps": 0.0047719478607177734, "step": 1145}
{"info/global_step": 1146, "train_info/time_within_train_step": 27.691530466079712, "step": 1146}
{"train_info/time_between_train_steps": 0.004807472229003906, "step": 1146}
{"info/global_step": 1147, "train_info/time_within_train_step": 27.77796220779419, "step": 1147}
{"train_info/time_between_train_steps": 0.009932518005371094, "step": 1147}
{"info/global_step": 1148, "train_info/time_within_train_step": 27.69778060913086, "step": 1148}
{"train_info/time_between_train_steps": 0.004953622817993164, "step": 1148}
{"info/global_step": 1149, "train_info/time_within_train_step": 27.677943229675293, "step": 1149}
{"train_info/time_between_train_steps": 0.004799604415893555, "step": 1149}
{"info/global_step": 1150, "train_info/time_within_train_step": 27.726304054260254, "step": 1150}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740858121, "_runtime": 34070}, "step": 1150}
{"logs": {"train/loss": 3.0965, "train/learning_rate": 2.7777777777777772e-05, "train/epoch": 42.01, "_timestamp": 1740858121, "_runtime": 34070}, "step": 1150}
{"train_info/time_between_train_steps": 0.02528548240661621, "step": 1150}
{"info/global_step": 1151, "train_info/time_within_train_step": 27.67268466949463, "step": 1151}
{"train_info/time_between_train_steps": 0.00493311882019043, "step": 1151}
{"info/global_step": 1152, "train_info/time_within_train_step": 27.71139168739319, "step": 1152}
{"train_info/time_between_train_steps": 0.005100727081298828, "step": 1152}
{"info/global_step": 1153, "train_info/time_within_train_step": 27.692034244537354, "step": 1153}
{"train_info/time_between_train_steps": 0.009293317794799805, "step": 1153}
{"info/global_step": 1154, "train_info/time_within_train_step": 27.723060369491577, "step": 1154}
{"train_info/time_between_train_steps": 0.0049190521240234375, "step": 1154}
{"info/global_step": 1155, "train_info/time_within_train_step": 27.688494443893433, "step": 1155}
{"train_info/time_between_train_steps": 0.0050122737884521484, "step": 1155}
{"info/global_step": 1156, "train_info/time_within_train_step": 27.73175311088562, "step": 1156}
{"train_info/time_between_train_steps": 0.0048830509185791016, "step": 1156}
{"info/global_step": 1157, "train_info/time_within_train_step": 27.6952166557312, "step": 1157}
{"train_info/time_between_train_steps": 0.0050506591796875, "step": 1157}
{"info/global_step": 1158, "train_info/time_within_train_step": 27.704674005508423, "step": 1158}
{"train_info/time_between_train_steps": 0.004937171936035156, "step": 1158}
{"info/global_step": 1159, "train_info/time_within_train_step": 27.697640419006348, "step": 1159}
{"train_info/time_between_train_steps": 0.004979610443115234, "step": 1159}
{"info/global_step": 1160, "train_info/time_within_train_step": 27.6982901096344, "step": 1160}
{"train_info/time_between_train_steps": 0.005146026611328125, "step": 1160}
{"info/global_step": 1161, "train_info/time_within_train_step": 27.744900703430176, "step": 1161}
{"train_info/time_between_train_steps": 0.005276679992675781, "step": 1161}
{"train_info/time_between_train_steps": 29.92055368423462, "step": 1161}
{"info/global_step": 1162, "train_info/time_within_train_step": 27.783670663833618, "step": 1162}
{"train_info/time_between_train_steps": 0.004852294921875, "step": 1162}
{"info/global_step": 1163, "train_info/time_within_train_step": 27.823227643966675, "step": 1163}
{"train_info/time_between_train_steps": 0.005086660385131836, "step": 1163}
{"info/global_step": 1164, "train_info/time_within_train_step": 27.737992525100708, "step": 1164}
{"train_info/time_between_train_steps": 0.010019779205322266, "step": 1164}
{"info/global_step": 1165, "train_info/time_within_train_step": 27.833585500717163, "step": 1165}
{"train_info/time_between_train_steps": 0.005137920379638672, "step": 1165}
{"info/global_step": 1166, "train_info/time_within_train_step": 27.77501368522644, "step": 1166}
{"train_info/time_between_train_steps": 0.009694337844848633, "step": 1166}
{"info/global_step": 1167, "train_info/time_within_train_step": 27.826500177383423, "step": 1167}
{"train_info/time_between_train_steps": 0.0051343441009521484, "step": 1167}
{"info/global_step": 1168, "train_info/time_within_train_step": 27.7075674533844, "step": 1168}
{"train_info/time_between_train_steps": 0.0049855709075927734, "step": 1168}
{"info/global_step": 1169, "train_info/time_within_train_step": 27.73738741874695, "step": 1169}
{"train_info/time_between_train_steps": 0.005007743835449219, "step": 1169}
{"info/global_step": 1170, "train_info/time_within_train_step": 27.692854404449463, "step": 1170}
{"train_info/time_between_train_steps": 0.004728794097900391, "step": 1170}
{"info/global_step": 1171, "train_info/time_within_train_step": 27.695501804351807, "step": 1171}
{"train_info/time_between_train_steps": 0.0048062801361083984, "step": 1171}
{"info/global_step": 1172, "train_info/time_within_train_step": 27.69487714767456, "step": 1172}
{"train_info/time_between_train_steps": 0.0048007965087890625, "step": 1172}
{"info/global_step": 1173, "train_info/time_within_train_step": 27.675931453704834, "step": 1173}
{"train_info/time_between_train_steps": 0.004728794097900391, "step": 1173}
{"info/global_step": 1174, "train_info/time_within_train_step": 27.685073137283325, "step": 1174}
{"train_info/time_between_train_steps": 0.004676103591918945, "step": 1174}
{"info/global_step": 1175, "train_info/time_within_train_step": 27.716898441314697, "step": 1175}
{"train_info/time_between_train_steps": 0.004889011383056641, "step": 1175}
{"info/global_step": 1176, "train_info/time_within_train_step": 27.69726014137268, "step": 1176}
{"train_info/time_between_train_steps": 0.005027055740356445, "step": 1176}
{"info/global_step": 1177, "train_info/time_within_train_step": 27.729109048843384, "step": 1177}
{"train_info/time_between_train_steps": 0.004983425140380859, "step": 1177}
{"info/global_step": 1178, "train_info/time_within_train_step": 27.78203320503235, "step": 1178}
{"train_info/time_between_train_steps": 0.00502324104309082, "step": 1178}
{"info/global_step": 1179, "train_info/time_within_train_step": 27.731884002685547, "step": 1179}
{"train_info/time_between_train_steps": 0.004941701889038086, "step": 1179}
{"info/global_step": 1180, "train_info/time_within_train_step": 27.73948884010315, "step": 1180}
{"train_info/time_between_train_steps": 0.005121707916259766, "step": 1180}
{"info/global_step": 1181, "train_info/time_within_train_step": 27.68657946586609, "step": 1181}
{"train_info/time_between_train_steps": 0.004862546920776367, "step": 1181}
{"info/global_step": 1182, "train_info/time_within_train_step": 27.697163343429565, "step": 1182}
{"train_info/time_between_train_steps": 0.004860877990722656, "step": 1182}
{"info/global_step": 1183, "train_info/time_within_train_step": 27.708019495010376, "step": 1183}
{"train_info/time_between_train_steps": 0.005054473876953125, "step": 1183}
{"info/global_step": 1184, "train_info/time_within_train_step": 27.69333004951477, "step": 1184}
{"train_info/time_between_train_steps": 0.00952911376953125, "step": 1184}
{"info/global_step": 1185, "train_info/time_within_train_step": 27.684035301208496, "step": 1185}
{"train_info/time_between_train_steps": 0.0050318241119384766, "step": 1185}
{"info/global_step": 1186, "train_info/time_within_train_step": 27.728570461273193, "step": 1186}
{"train_info/time_between_train_steps": 0.004942655563354492, "step": 1186}
{"info/global_step": 1187, "train_info/time_within_train_step": 27.69552493095398, "step": 1187}
{"train_info/time_between_train_steps": 0.00515437126159668, "step": 1187}
{"info/global_step": 1188, "train_info/time_within_train_step": 27.767336130142212, "step": 1188}
{"train_info/time_between_train_steps": 0.005585670471191406, "step": 1188}
{"train_info/time_between_train_steps": 30.154910802841187, "step": 1188}
{"info/global_step": 1189, "train_info/time_within_train_step": 27.717191457748413, "step": 1189}
{"train_info/time_between_train_steps": 0.004914999008178711, "step": 1189}
{"info/global_step": 1190, "train_info/time_within_train_step": 27.80989098548889, "step": 1190}
{"train_info/time_between_train_steps": 0.004873037338256836, "step": 1190}
{"info/global_step": 1191, "train_info/time_within_train_step": 27.67591691017151, "step": 1191}
{"train_info/time_between_train_steps": 0.0050237178802490234, "step": 1191}
{"info/global_step": 1192, "train_info/time_within_train_step": 27.894358158111572, "step": 1192}
{"train_info/time_between_train_steps": 0.004902362823486328, "step": 1192}
{"info/global_step": 1193, "train_info/time_within_train_step": 27.673638582229614, "step": 1193}
{"train_info/time_between_train_steps": 0.004803180694580078, "step": 1193}
{"info/global_step": 1194, "train_info/time_within_train_step": 27.79937481880188, "step": 1194}
{"train_info/time_between_train_steps": 0.0048983097076416016, "step": 1194}
{"info/global_step": 1195, "train_info/time_within_train_step": 27.70522928237915, "step": 1195}
{"train_info/time_between_train_steps": 0.004971504211425781, "step": 1195}
{"info/global_step": 1196, "train_info/time_within_train_step": 27.77164316177368, "step": 1196}
{"train_info/time_between_train_steps": 0.005106687545776367, "step": 1196}
{"info/global_step": 1197, "train_info/time_within_train_step": 27.682453870773315, "step": 1197}
{"train_info/time_between_train_steps": 0.004803895950317383, "step": 1197}
{"info/global_step": 1198, "train_info/time_within_train_step": 27.68337607383728, "step": 1198}
{"train_info/time_between_train_steps": 0.004686832427978516, "step": 1198}
{"info/global_step": 1199, "train_info/time_within_train_step": 27.7890305519104, "step": 1199}
{"train_info/time_between_train_steps": 0.0051767826080322266, "step": 1199}
{"info/global_step": 1200, "train_info/time_within_train_step": 29.19957208633423, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740859572, "_runtime": 35521}, "step": 1200}
{"logs": {"train/loss": 3.072, "train/learning_rate": 0.0, "train/epoch": 44.01, "_timestamp": 1740859572, "_runtime": 35521}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4462890625, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740859642, "_runtime": 35591}, "step": 1200}
{"logs": {"train/train_runtime": 35592.1699, "train/train_samples_per_second": 17.262, "train/train_steps_per_second": 0.034, "train/total_flos": 3.32388548739072e+17, "train/train_loss": 4.037196648915609, "train/epoch": 44.01, "_timestamp": 1740859642, "_runtime": 35591}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740859661, "_runtime": 35610}, "step": 1200}
{"logs": {"eval/loss": 4.2008867263793945, "eval/runtime": 4.0215, "eval/samples_per_second": 50.479, "eval/steps_per_second": 3.233, "train/epoch": 44.01, "_timestamp": 1740859661, "_runtime": 35610}, "step": 1200}
{"train_info": {"train_info/memory_allocated": 1922.4453125, "train_info/memory_max_allocated": 20713.490234375, "train_info/memory_reserved": 27336.0, "train_info/memory_max_reserved": 27336.0, "_timestamp": 1740859661, "_runtime": 35610}, "step": 1200}
{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.2008867263793945, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 66.74548979474166, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 4.0215, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 50.479, "train/epoch": 44.01, "_timestamp": 1740859661, "_runtime": 35610}, "step": 1200}