{"num_parameters": 108882432, "trainable_parameters": 108882432, "step": 0} {"train_info/time_between_train_steps": 2.3392982482910156, "step": 0} {"info/global_step": 1, "train_info/time_within_train_step": 4.471024990081787, "step": 1} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 4412.87744140625, "train_info/memory_reserved": 4642.0, "train_info/memory_max_reserved": 4642.0, "_timestamp": 1746566009, "_runtime": 18}, "step": 1} {"logs": {"train/loss": 10.3518, "train/learning_rate": 6e-07, "train/epoch": 0.0, "_timestamp": 1746566009, "_runtime": 18}, "step": 1} {"train_info/time_between_train_steps": 0.01431417465209961, "step": 1} {"info/global_step": 2, "train_info/time_within_train_step": 2.5028202533721924, "step": 2} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 2} {"info/global_step": 3, "train_info/time_within_train_step": 2.6146469116210938, "step": 3} {"train_info/time_between_train_steps": 0.0033111572265625, "step": 3} {"info/global_step": 4, "train_info/time_within_train_step": 2.6430411338806152, "step": 4} {"train_info/time_between_train_steps": 0.0032224655151367188, "step": 4} {"info/global_step": 5, "train_info/time_within_train_step": 2.6450512409210205, "step": 5} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 5} {"info/global_step": 6, "train_info/time_within_train_step": 2.650383710861206, "step": 6} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 6} {"info/global_step": 7, "train_info/time_within_train_step": 2.6612892150878906, "step": 7} {"train_info/time_between_train_steps": 0.0033240318298339844, "step": 7} {"info/global_step": 8, "train_info/time_within_train_step": 2.677560567855835, "step": 8} {"train_info/time_between_train_steps": 0.0032422542572021484, "step": 8} {"info/global_step": 9, "train_info/time_within_train_step": 2.7523460388183594, "step": 9} {"train_info/time_between_train_steps": 0.0034415721893310547, "step": 9} {"info/global_step": 10, "train_info/time_within_train_step": 2.7513928413391113, "step": 10} {"train_info/time_between_train_steps": 0.003448486328125, "step": 10} {"info/global_step": 11, "train_info/time_within_train_step": 2.7526707649230957, "step": 11} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 11} {"info/global_step": 12, "train_info/time_within_train_step": 2.7525265216827393, "step": 12} {"train_info/time_between_train_steps": 0.003309488296508789, "step": 12} {"info/global_step": 13, "train_info/time_within_train_step": 2.7522308826446533, "step": 13} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 13} {"info/global_step": 14, "train_info/time_within_train_step": 2.75183367729187, "step": 14} {"train_info/time_between_train_steps": 0.003148794174194336, "step": 14} {"info/global_step": 15, "train_info/time_within_train_step": 2.751687526702881, "step": 15} {"train_info/time_between_train_steps": 0.0033698081970214844, "step": 15} {"info/global_step": 16, "train_info/time_within_train_step": 2.753061294555664, "step": 16} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 16} {"info/global_step": 17, "train_info/time_within_train_step": 2.7528767585754395, "step": 17} {"train_info/time_between_train_steps": 0.0033125877380371094, "step": 17} {"info/global_step": 18, "train_info/time_within_train_step": 2.755141258239746, "step": 18} {"train_info/time_between_train_steps": 0.0031304359436035156, "step": 18} {"info/global_step": 19, "train_info/time_within_train_step": 2.755034923553467, "step": 19} {"train_info/time_between_train_steps": 0.0033643245697021484, "step": 19} {"info/global_step": 20, "train_info/time_within_train_step": 2.7555792331695557, "step": 20} {"train_info/time_between_train_steps": 0.0032629966735839844, "step": 20} {"info/global_step": 21, "train_info/time_within_train_step": 2.7553980350494385, "step": 21} {"train_info/time_between_train_steps": 0.003255605697631836, "step": 21} {"info/global_step": 22, "train_info/time_within_train_step": 2.9891512393951416, "step": 22} {"train_info/time_between_train_steps": 0.0031561851501464844, "step": 22} {"info/global_step": 23, "train_info/time_within_train_step": 2.7533938884735107, "step": 23} {"train_info/time_between_train_steps": 0.003280162811279297, "step": 23} {"info/global_step": 24, "train_info/time_within_train_step": 2.755012035369873, "step": 24} {"train_info/time_between_train_steps": 0.003206014633178711, "step": 24} {"info/global_step": 25, "train_info/time_within_train_step": 2.755319356918335, "step": 25} {"train_info/time_between_train_steps": 0.003336191177368164, "step": 25} {"info/global_step": 26, "train_info/time_within_train_step": 2.754765272140503, "step": 26} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 26} {"info/global_step": 27, "train_info/time_within_train_step": 2.7550148963928223, "step": 27} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 27} {"info/global_step": 28, "train_info/time_within_train_step": 2.754521369934082, "step": 28} {"train_info/time_between_train_steps": 0.0033354759216308594, "step": 28} {"info/global_step": 29, "train_info/time_within_train_step": 2.754826545715332, "step": 29} {"train_info/time_between_train_steps": 0.003383159637451172, "step": 29} {"info/global_step": 30, "train_info/time_within_train_step": 2.7547667026519775, "step": 30} {"train_info/time_between_train_steps": 0.003274679183959961, "step": 30} {"info/global_step": 31, "train_info/time_within_train_step": 2.754694700241089, "step": 31} {"train_info/time_between_train_steps": 0.0030748844146728516, "step": 31} {"info/global_step": 32, "train_info/time_within_train_step": 2.7548623085021973, "step": 32} {"train_info/time_between_train_steps": 0.0030956268310546875, "step": 32} {"info/global_step": 33, "train_info/time_within_train_step": 2.7546567916870117, "step": 33} {"train_info/time_between_train_steps": 0.0032753944396972656, "step": 33} {"info/global_step": 34, "train_info/time_within_train_step": 2.7539350986480713, "step": 34} {"train_info/time_between_train_steps": 0.0033652782440185547, "step": 34} {"info/global_step": 35, "train_info/time_within_train_step": 2.7539801597595215, "step": 35} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 35} {"info/global_step": 36, "train_info/time_within_train_step": 2.7549948692321777, "step": 36} {"train_info/time_between_train_steps": 0.0031142234802246094, "step": 36} {"info/global_step": 37, "train_info/time_within_train_step": 2.7564241886138916, "step": 37} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 37} {"info/global_step": 38, "train_info/time_within_train_step": 2.754756450653076, "step": 38} {"train_info/time_between_train_steps": 0.003289937973022461, "step": 38} {"info/global_step": 39, "train_info/time_within_train_step": 2.756704092025757, "step": 39} {"train_info/time_between_train_steps": 0.003261566162109375, "step": 39} {"info/global_step": 40, "train_info/time_within_train_step": 2.7541587352752686, "step": 40} {"train_info/time_between_train_steps": 0.0030853748321533203, "step": 40} {"info/global_step": 41, "train_info/time_within_train_step": 2.754969358444214, "step": 41} {"train_info/time_between_train_steps": 0.003117084503173828, "step": 41} {"info/global_step": 42, "train_info/time_within_train_step": 2.755427360534668, "step": 42} {"train_info/time_between_train_steps": 0.003093719482421875, "step": 42} {"info/global_step": 43, "train_info/time_within_train_step": 2.7549641132354736, "step": 43} {"train_info/time_between_train_steps": 0.0030879974365234375, "step": 43} {"info/global_step": 44, "train_info/time_within_train_step": 2.7553746700286865, "step": 44} {"train_info/time_between_train_steps": 0.003251314163208008, "step": 44} {"info/global_step": 45, "train_info/time_within_train_step": 2.754159927368164, "step": 45} {"train_info/time_between_train_steps": 0.0031499862670898438, "step": 45} {"info/global_step": 46, "train_info/time_within_train_step": 2.753244400024414, "step": 46} {"train_info/time_between_train_steps": 0.0031070709228515625, "step": 46} {"info/global_step": 47, "train_info/time_within_train_step": 2.7543482780456543, "step": 47} {"train_info/time_between_train_steps": 0.0030968189239501953, "step": 47} {"info/global_step": 48, "train_info/time_within_train_step": 2.754479169845581, "step": 48} {"train_info/time_between_train_steps": 0.003123760223388672, "step": 48} {"info/global_step": 49, "train_info/time_within_train_step": 2.754836320877075, "step": 49} {"train_info/time_between_train_steps": 0.003257274627685547, "step": 49} {"info/global_step": 50, "train_info/time_within_train_step": 2.7548701763153076, "step": 50} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746566144, "_runtime": 153}, "step": 50} {"logs": {"train/loss": 8.788, "train/learning_rate": 2.9999999999999997e-05, "train/epoch": 0.01, "_timestamp": 1746566144, "_runtime": 153}, "step": 50} {"train_info/time_between_train_steps": 0.0071337223052978516, "step": 50} {"info/global_step": 51, "train_info/time_within_train_step": 2.7555201053619385, "step": 51} {"train_info/time_between_train_steps": 0.003220796585083008, "step": 51} {"info/global_step": 52, "train_info/time_within_train_step": 2.755286693572998, "step": 52} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 52} {"info/global_step": 53, "train_info/time_within_train_step": 2.7549564838409424, "step": 53} {"train_info/time_between_train_steps": 0.0031325817108154297, "step": 53} {"info/global_step": 54, "train_info/time_within_train_step": 2.7546043395996094, "step": 54} {"train_info/time_between_train_steps": 0.0032415390014648438, "step": 54} {"info/global_step": 55, "train_info/time_within_train_step": 2.7545204162597656, "step": 55} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 55} {"info/global_step": 56, "train_info/time_within_train_step": 2.754415988922119, "step": 56} {"train_info/time_between_train_steps": 0.0032868385314941406, "step": 56} {"info/global_step": 57, "train_info/time_within_train_step": 2.7546684741973877, "step": 57} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 57} {"info/global_step": 58, "train_info/time_within_train_step": 2.7540996074676514, "step": 58} {"train_info/time_between_train_steps": 0.003308534622192383, "step": 58} {"info/global_step": 59, "train_info/time_within_train_step": 2.7552623748779297, "step": 59} {"train_info/time_between_train_steps": 0.0033495426177978516, "step": 59} {"info/global_step": 60, "train_info/time_within_train_step": 2.754812479019165, "step": 60} {"train_info/time_between_train_steps": 0.003279447555541992, "step": 60} {"info/global_step": 61, "train_info/time_within_train_step": 2.7535786628723145, "step": 61} {"train_info/time_between_train_steps": 0.0034415721893310547, "step": 61} {"info/global_step": 62, "train_info/time_within_train_step": 2.7558770179748535, "step": 62} {"train_info/time_between_train_steps": 0.0032393932342529297, "step": 62} {"info/global_step": 63, "train_info/time_within_train_step": 2.891343593597412, "step": 63} {"train_info/time_between_train_steps": 0.0033278465270996094, "step": 63} {"info/global_step": 64, "train_info/time_within_train_step": 2.7568089962005615, "step": 64} {"train_info/time_between_train_steps": 0.003404855728149414, "step": 64} {"info/global_step": 65, "train_info/time_within_train_step": 2.755826950073242, "step": 65} {"train_info/time_between_train_steps": 0.0031790733337402344, "step": 65} {"info/global_step": 66, "train_info/time_within_train_step": 2.7554702758789062, "step": 66} {"train_info/time_between_train_steps": 0.0032546520233154297, "step": 66} {"info/global_step": 67, "train_info/time_within_train_step": 2.7551069259643555, "step": 67} {"train_info/time_between_train_steps": 0.0033817291259765625, "step": 67} {"info/global_step": 68, "train_info/time_within_train_step": 2.754805326461792, "step": 68} {"train_info/time_between_train_steps": 0.0035331249237060547, "step": 68} {"info/global_step": 69, "train_info/time_within_train_step": 2.755836248397827, "step": 69} {"train_info/time_between_train_steps": 0.003404378890991211, "step": 69} {"info/global_step": 70, "train_info/time_within_train_step": 2.7552285194396973, "step": 70} {"train_info/time_between_train_steps": 0.0032126903533935547, "step": 70} {"info/global_step": 71, "train_info/time_within_train_step": 2.7541463375091553, "step": 71} {"train_info/time_between_train_steps": 0.0032460689544677734, "step": 71} {"info/global_step": 72, "train_info/time_within_train_step": 2.755110740661621, "step": 72} {"train_info/time_between_train_steps": 0.0034520626068115234, "step": 72} {"info/global_step": 73, "train_info/time_within_train_step": 2.754164695739746, "step": 73} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 73} {"info/global_step": 74, "train_info/time_within_train_step": 2.754664897918701, "step": 74} {"train_info/time_between_train_steps": 0.003414154052734375, "step": 74} {"info/global_step": 75, "train_info/time_within_train_step": 2.7533257007598877, "step": 75} {"train_info/time_between_train_steps": 0.0033245086669921875, "step": 75} {"info/global_step": 76, "train_info/time_within_train_step": 2.7544755935668945, "step": 76} {"train_info/time_between_train_steps": 0.0033257007598876953, "step": 76} {"info/global_step": 77, "train_info/time_within_train_step": 2.7544169425964355, "step": 77} {"train_info/time_between_train_steps": 0.0032105445861816406, "step": 77} {"info/global_step": 78, "train_info/time_within_train_step": 2.7541773319244385, "step": 78} {"train_info/time_between_train_steps": 0.003306150436401367, "step": 78} {"info/global_step": 79, "train_info/time_within_train_step": 2.754261016845703, "step": 79} {"train_info/time_between_train_steps": 0.003242969512939453, "step": 79} {"info/global_step": 80, "train_info/time_within_train_step": 2.75534987449646, "step": 80} {"train_info/time_between_train_steps": 0.0034122467041015625, "step": 80} {"info/global_step": 81, "train_info/time_within_train_step": 2.754329204559326, "step": 81} {"train_info/time_between_train_steps": 0.0033495426177978516, "step": 81} {"info/global_step": 82, "train_info/time_within_train_step": 2.7560648918151855, "step": 82} {"train_info/time_between_train_steps": 0.0034608840942382812, "step": 82} {"info/global_step": 83, "train_info/time_within_train_step": 2.756174087524414, "step": 83} {"train_info/time_between_train_steps": 0.0033180713653564453, "step": 83} {"info/global_step": 84, "train_info/time_within_train_step": 2.755115032196045, "step": 84} {"train_info/time_between_train_steps": 0.0032939910888671875, "step": 84} {"info/global_step": 85, "train_info/time_within_train_step": 2.7548775672912598, "step": 85} {"train_info/time_between_train_steps": 0.003656625747680664, "step": 85} {"info/global_step": 86, "train_info/time_within_train_step": 2.7555153369903564, "step": 86} {"train_info/time_between_train_steps": 0.0034842491149902344, "step": 86} {"info/global_step": 87, "train_info/time_within_train_step": 2.754899501800537, "step": 87} {"train_info/time_between_train_steps": 0.0036368370056152344, "step": 87} {"info/global_step": 88, "train_info/time_within_train_step": 2.754084348678589, "step": 88} {"train_info/time_between_train_steps": 0.003539562225341797, "step": 88} {"info/global_step": 89, "train_info/time_within_train_step": 2.757103204727173, "step": 89} {"train_info/time_between_train_steps": 0.003653287887573242, "step": 89} {"info/global_step": 90, "train_info/time_within_train_step": 2.755711793899536, "step": 90} {"train_info/time_between_train_steps": 0.003615140914916992, "step": 90} {"info/global_step": 91, "train_info/time_within_train_step": 2.7534375190734863, "step": 91} {"train_info/time_between_train_steps": 0.0036242008209228516, "step": 91} {"info/global_step": 92, "train_info/time_within_train_step": 2.7536091804504395, "step": 92} {"train_info/time_between_train_steps": 0.0036003589630126953, "step": 92} {"info/global_step": 93, "train_info/time_within_train_step": 2.755341053009033, "step": 93} {"train_info/time_between_train_steps": 0.003651142120361328, "step": 93} {"info/global_step": 94, "train_info/time_within_train_step": 2.753891944885254, "step": 94} {"train_info/time_between_train_steps": 0.0035064220428466797, "step": 94} {"info/global_step": 95, "train_info/time_within_train_step": 2.755432367324829, "step": 95} {"train_info/time_between_train_steps": 0.003696918487548828, "step": 95} {"info/global_step": 96, "train_info/time_within_train_step": 2.754350423812866, "step": 96} {"train_info/time_between_train_steps": 0.003550291061401367, "step": 96} {"info/global_step": 97, "train_info/time_within_train_step": 2.7537026405334473, "step": 97} {"train_info/time_between_train_steps": 0.004030466079711914, "step": 97} {"info/global_step": 98, "train_info/time_within_train_step": 2.753965377807617, "step": 98} {"train_info/time_between_train_steps": 0.0035696029663085938, "step": 98} {"info/global_step": 99, "train_info/time_within_train_step": 2.754188299179077, "step": 99} {"train_info/time_between_train_steps": 0.0035674571990966797, "step": 99} {"info/global_step": 100, "train_info/time_within_train_step": 2.7547247409820557, "step": 100} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746566282, "_runtime": 291}, "step": 100} {"logs": {"train/loss": 7.577, "train/learning_rate": 5.9999999999999995e-05, "train/epoch": 0.01, "_timestamp": 1746566282, "_runtime": 291}, "step": 100} {"train_info/time_between_train_steps": 0.013339042663574219, "step": 100} {"info/global_step": 101, "train_info/time_within_train_step": 2.754871129989624, "step": 101} {"train_info/time_between_train_steps": 0.003730297088623047, "step": 101} {"info/global_step": 102, "train_info/time_within_train_step": 2.753568649291992, "step": 102} {"train_info/time_between_train_steps": 0.0035240650177001953, "step": 102} {"info/global_step": 103, "train_info/time_within_train_step": 2.755476951599121, "step": 103} {"train_info/time_between_train_steps": 0.003522634506225586, "step": 103} {"info/global_step": 104, "train_info/time_within_train_step": 2.7549657821655273, "step": 104} {"train_info/time_between_train_steps": 0.0037240982055664062, "step": 104} {"info/global_step": 105, "train_info/time_within_train_step": 2.754276752471924, "step": 105} {"train_info/time_between_train_steps": 0.003747224807739258, "step": 105} {"info/global_step": 106, "train_info/time_within_train_step": 2.7538838386535645, "step": 106} {"train_info/time_between_train_steps": 0.003463268280029297, "step": 106} {"info/global_step": 107, "train_info/time_within_train_step": 2.753957748413086, "step": 107} {"train_info/time_between_train_steps": 0.003494739532470703, "step": 107} {"info/global_step": 108, "train_info/time_within_train_step": 3.1201415061950684, "step": 108} {"train_info/time_between_train_steps": 0.003427743911743164, "step": 108} {"info/global_step": 109, "train_info/time_within_train_step": 2.754420757293701, "step": 109} {"train_info/time_between_train_steps": 0.003336191177368164, "step": 109} {"info/global_step": 110, "train_info/time_within_train_step": 2.7528886795043945, "step": 110} {"train_info/time_between_train_steps": 0.0032460689544677734, "step": 110} {"info/global_step": 111, "train_info/time_within_train_step": 2.753432512283325, "step": 111} {"train_info/time_between_train_steps": 0.003427743911743164, "step": 111} {"info/global_step": 112, "train_info/time_within_train_step": 2.7538745403289795, "step": 112} {"train_info/time_between_train_steps": 0.0032105445861816406, "step": 112} {"info/global_step": 113, "train_info/time_within_train_step": 2.753770112991333, "step": 113} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 113} {"info/global_step": 114, "train_info/time_within_train_step": 2.750358819961548, "step": 114} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 114} {"info/global_step": 115, "train_info/time_within_train_step": 2.7532567977905273, "step": 115} {"train_info/time_between_train_steps": 0.0033843517303466797, "step": 115} {"info/global_step": 116, "train_info/time_within_train_step": 2.754854917526245, "step": 116} {"train_info/time_between_train_steps": 0.0033576488494873047, "step": 116} {"info/global_step": 117, "train_info/time_within_train_step": 2.7525992393493652, "step": 117} {"train_info/time_between_train_steps": 0.003396272659301758, "step": 117} {"info/global_step": 118, "train_info/time_within_train_step": 2.753410816192627, "step": 118} {"train_info/time_between_train_steps": 0.003297090530395508, "step": 118} {"info/global_step": 119, "train_info/time_within_train_step": 2.7527964115142822, "step": 119} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 119} {"info/global_step": 120, "train_info/time_within_train_step": 2.752531051635742, "step": 120} {"train_info/time_between_train_steps": 0.003265380859375, "step": 120} {"info/global_step": 121, "train_info/time_within_train_step": 2.752432107925415, "step": 121} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 121} {"info/global_step": 122, "train_info/time_within_train_step": 2.754225015640259, "step": 122} {"train_info/time_between_train_steps": 0.0031385421752929688, "step": 122} {"info/global_step": 123, "train_info/time_within_train_step": 2.7527167797088623, "step": 123} {"train_info/time_between_train_steps": 0.0031316280364990234, "step": 123} {"info/global_step": 124, "train_info/time_within_train_step": 2.7530431747436523, "step": 124} {"train_info/time_between_train_steps": 0.0032804012298583984, "step": 124} {"info/global_step": 125, "train_info/time_within_train_step": 2.754290819168091, "step": 125} {"train_info/time_between_train_steps": 0.13553285598754883, "step": 125} {"info/global_step": 126, "train_info/time_within_train_step": 2.7560641765594482, "step": 126} {"train_info/time_between_train_steps": 0.0032012462615966797, "step": 126} {"info/global_step": 127, "train_info/time_within_train_step": 2.7545218467712402, "step": 127} {"train_info/time_between_train_steps": 0.0032591819763183594, "step": 127} {"info/global_step": 128, "train_info/time_within_train_step": 2.7530553340911865, "step": 128} {"train_info/time_between_train_steps": 0.003478527069091797, "step": 128} {"info/global_step": 129, "train_info/time_within_train_step": 2.753472089767456, "step": 129} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 129} {"info/global_step": 130, "train_info/time_within_train_step": 2.754774808883667, "step": 130} {"train_info/time_between_train_steps": 0.0033631324768066406, "step": 130} {"info/global_step": 131, "train_info/time_within_train_step": 2.755448341369629, "step": 131} {"train_info/time_between_train_steps": 0.003284454345703125, "step": 131} {"info/global_step": 132, "train_info/time_within_train_step": 2.7529942989349365, "step": 132} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 132} {"info/global_step": 133, "train_info/time_within_train_step": 2.754163980484009, "step": 133} {"train_info/time_between_train_steps": 0.003214120864868164, "step": 133} {"info/global_step": 134, "train_info/time_within_train_step": 2.753666639328003, "step": 134} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 134} {"info/global_step": 135, "train_info/time_within_train_step": 2.753340721130371, "step": 135} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 135} {"info/global_step": 136, "train_info/time_within_train_step": 2.7532827854156494, "step": 136} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 136} {"info/global_step": 137, "train_info/time_within_train_step": 2.753754138946533, "step": 137} {"train_info/time_between_train_steps": 0.003154277801513672, "step": 137} {"info/global_step": 138, "train_info/time_within_train_step": 2.755516529083252, "step": 138} {"train_info/time_between_train_steps": 0.003541231155395508, "step": 138} {"info/global_step": 139, "train_info/time_within_train_step": 2.756082534790039, "step": 139} {"train_info/time_between_train_steps": 0.003461122512817383, "step": 139} {"info/global_step": 140, "train_info/time_within_train_step": 2.754770040512085, "step": 140} {"train_info/time_between_train_steps": 0.003403186798095703, "step": 140} {"info/global_step": 141, "train_info/time_within_train_step": 2.7540292739868164, "step": 141} {"train_info/time_between_train_steps": 0.0036296844482421875, "step": 141} {"info/global_step": 142, "train_info/time_within_train_step": 2.755143880844116, "step": 142} {"train_info/time_between_train_steps": 0.003390789031982422, "step": 142} {"info/global_step": 143, "train_info/time_within_train_step": 2.754504680633545, "step": 143} {"train_info/time_between_train_steps": 0.0034110546112060547, "step": 143} {"info/global_step": 144, "train_info/time_within_train_step": 2.7557337284088135, "step": 144} {"train_info/time_between_train_steps": 0.0034215450286865234, "step": 144} {"info/global_step": 145, "train_info/time_within_train_step": 2.7553727626800537, "step": 145} {"train_info/time_between_train_steps": 0.003495454788208008, "step": 145} {"info/global_step": 146, "train_info/time_within_train_step": 2.756120204925537, "step": 146} {"train_info/time_between_train_steps": 0.0034685134887695312, "step": 146} {"info/global_step": 147, "train_info/time_within_train_step": 2.756063938140869, "step": 147} {"train_info/time_between_train_steps": 0.0035905838012695312, "step": 147} {"info/global_step": 148, "train_info/time_within_train_step": 2.7557220458984375, "step": 148} {"train_info/time_between_train_steps": 0.003607511520385742, "step": 148} {"info/global_step": 149, "train_info/time_within_train_step": 2.7545113563537598, "step": 149} {"train_info/time_between_train_steps": 0.0037240982055664062, "step": 149} {"info/global_step": 150, "train_info/time_within_train_step": 2.7539241313934326, "step": 150} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746566421, "_runtime": 430}, "step": 150} {"logs": {"train/loss": 6.914, "train/learning_rate": 8.999999999999999e-05, "train/epoch": 0.01, "_timestamp": 1746566421, "_runtime": 430}, "step": 150} {"train_info/time_between_train_steps": 0.007609367370605469, "step": 150} {"info/global_step": 151, "train_info/time_within_train_step": 2.7567765712738037, "step": 151} {"train_info/time_between_train_steps": 0.0038683414459228516, "step": 151} {"info/global_step": 152, "train_info/time_within_train_step": 2.7564175128936768, "step": 152} {"train_info/time_between_train_steps": 0.003716707229614258, "step": 152} {"info/global_step": 153, "train_info/time_within_train_step": 2.756751775741577, "step": 153} {"train_info/time_between_train_steps": 0.0037789344787597656, "step": 153} {"info/global_step": 154, "train_info/time_within_train_step": 2.7570669651031494, "step": 154} {"train_info/time_between_train_steps": 0.003719806671142578, "step": 154} {"info/global_step": 155, "train_info/time_within_train_step": 2.75583815574646, "step": 155} {"train_info/time_between_train_steps": 0.0037043094635009766, "step": 155} {"info/global_step": 156, "train_info/time_within_train_step": 2.7543067932128906, "step": 156} {"train_info/time_between_train_steps": 0.0035886764526367188, "step": 156} {"info/global_step": 157, "train_info/time_within_train_step": 2.7535455226898193, "step": 157} {"train_info/time_between_train_steps": 0.0035469532012939453, "step": 157} {"info/global_step": 158, "train_info/time_within_train_step": 2.7548458576202393, "step": 158} {"train_info/time_between_train_steps": 0.0035381317138671875, "step": 158} {"info/global_step": 159, "train_info/time_within_train_step": 2.7542965412139893, "step": 159} {"train_info/time_between_train_steps": 0.003754854202270508, "step": 159} {"info/global_step": 160, "train_info/time_within_train_step": 2.7541351318359375, "step": 160} {"train_info/time_between_train_steps": 0.0036301612854003906, "step": 160} {"info/global_step": 161, "train_info/time_within_train_step": 3.1170687675476074, "step": 161} {"train_info/time_between_train_steps": 0.0036156177520751953, "step": 161} {"info/global_step": 162, "train_info/time_within_train_step": 2.7547547817230225, "step": 162} {"train_info/time_between_train_steps": 0.003356456756591797, "step": 162} {"info/global_step": 163, "train_info/time_within_train_step": 2.7552146911621094, "step": 163} {"train_info/time_between_train_steps": 0.0034859180450439453, "step": 163} {"info/global_step": 164, "train_info/time_within_train_step": 2.7554216384887695, "step": 164} {"train_info/time_between_train_steps": 0.0034210681915283203, "step": 164} {"info/global_step": 165, "train_info/time_within_train_step": 2.754901170730591, "step": 165} {"train_info/time_between_train_steps": 0.0033445358276367188, "step": 165} {"info/global_step": 166, "train_info/time_within_train_step": 2.755131959915161, "step": 166} {"train_info/time_between_train_steps": 0.0033462047576904297, "step": 166} {"info/global_step": 167, "train_info/time_within_train_step": 2.755638599395752, "step": 167} {"train_info/time_between_train_steps": 0.0033304691314697266, "step": 167} {"info/global_step": 168, "train_info/time_within_train_step": 2.753835439682007, "step": 168} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 168} {"info/global_step": 169, "train_info/time_within_train_step": 2.7552342414855957, "step": 169} {"train_info/time_between_train_steps": 0.0035707950592041016, "step": 169} {"info/global_step": 170, "train_info/time_within_train_step": 2.755732536315918, "step": 170} {"train_info/time_between_train_steps": 0.0033969879150390625, "step": 170} {"info/global_step": 171, "train_info/time_within_train_step": 2.7523818016052246, "step": 171} {"train_info/time_between_train_steps": 0.0032672882080078125, "step": 171} {"info/global_step": 172, "train_info/time_within_train_step": 2.7567412853240967, "step": 172} {"train_info/time_between_train_steps": 0.0061757564544677734, "step": 172} {"info/global_step": 173, "train_info/time_within_train_step": 2.757720470428467, "step": 173} {"train_info/time_between_train_steps": 0.0034084320068359375, "step": 173} {"info/global_step": 174, "train_info/time_within_train_step": 2.7614340782165527, "step": 174} {"train_info/time_between_train_steps": 0.003337860107421875, "step": 174} {"info/global_step": 175, "train_info/time_within_train_step": 2.7558960914611816, "step": 175} {"train_info/time_between_train_steps": 0.0035529136657714844, "step": 175} {"info/global_step": 176, "train_info/time_within_train_step": 2.7536587715148926, "step": 176} {"train_info/time_between_train_steps": 0.003381967544555664, "step": 176} {"info/global_step": 177, "train_info/time_within_train_step": 2.7536540031433105, "step": 177} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 177} {"info/global_step": 178, "train_info/time_within_train_step": 2.754702568054199, "step": 178} {"train_info/time_between_train_steps": 0.0033659934997558594, "step": 178} {"info/global_step": 179, "train_info/time_within_train_step": 2.7535102367401123, "step": 179} {"train_info/time_between_train_steps": 0.0031528472900390625, "step": 179} {"info/global_step": 180, "train_info/time_within_train_step": 2.753718137741089, "step": 180} {"train_info/time_between_train_steps": 0.0033876895904541016, "step": 180} {"info/global_step": 181, "train_info/time_within_train_step": 2.7547523975372314, "step": 181} {"train_info/time_between_train_steps": 0.0034754276275634766, "step": 181} {"info/global_step": 182, "train_info/time_within_train_step": 2.7548668384552, "step": 182} {"train_info/time_between_train_steps": 0.003376483917236328, "step": 182} {"info/global_step": 183, "train_info/time_within_train_step": 2.7561681270599365, "step": 183} {"train_info/time_between_train_steps": 0.003512144088745117, "step": 183} {"info/global_step": 184, "train_info/time_within_train_step": 2.755354642868042, "step": 184} {"train_info/time_between_train_steps": 0.003462076187133789, "step": 184} {"info/global_step": 185, "train_info/time_within_train_step": 2.7562716007232666, "step": 185} {"train_info/time_between_train_steps": 0.0033447742462158203, "step": 185} {"info/global_step": 186, "train_info/time_within_train_step": 2.7564964294433594, "step": 186} {"train_info/time_between_train_steps": 0.0033843517303466797, "step": 186} {"info/global_step": 187, "train_info/time_within_train_step": 2.7559361457824707, "step": 187} {"train_info/time_between_train_steps": 0.003376483917236328, "step": 187} {"info/global_step": 188, "train_info/time_within_train_step": 2.8857617378234863, "step": 188} {"train_info/time_between_train_steps": 0.0036444664001464844, "step": 188} {"info/global_step": 189, "train_info/time_within_train_step": 2.7556746006011963, "step": 189} {"train_info/time_between_train_steps": 0.003549337387084961, "step": 189} {"info/global_step": 190, "train_info/time_within_train_step": 2.7556698322296143, "step": 190} {"train_info/time_between_train_steps": 0.0035028457641601562, "step": 190} {"info/global_step": 191, "train_info/time_within_train_step": 2.754194974899292, "step": 191} {"train_info/time_between_train_steps": 0.0034284591674804688, "step": 191} {"info/global_step": 192, "train_info/time_within_train_step": 2.7548625469207764, "step": 192} {"train_info/time_between_train_steps": 0.003557920455932617, "step": 192} {"info/global_step": 193, "train_info/time_within_train_step": 2.7535347938537598, "step": 193} {"train_info/time_between_train_steps": 0.003385782241821289, "step": 193} {"info/global_step": 194, "train_info/time_within_train_step": 2.7547483444213867, "step": 194} {"train_info/time_between_train_steps": 0.0034847259521484375, "step": 194} {"info/global_step": 195, "train_info/time_within_train_step": 2.7560477256774902, "step": 195} {"train_info/time_between_train_steps": 0.0034837722778320312, "step": 195} {"info/global_step": 196, "train_info/time_within_train_step": 2.7557473182678223, "step": 196} {"train_info/time_between_train_steps": 0.0035974979400634766, "step": 196} {"info/global_step": 197, "train_info/time_within_train_step": 2.7572734355926514, "step": 197} {"train_info/time_between_train_steps": 0.0037772655487060547, "step": 197} {"info/global_step": 198, "train_info/time_within_train_step": 2.7571089267730713, "step": 198} {"train_info/time_between_train_steps": 0.0034461021423339844, "step": 198} {"info/global_step": 199, "train_info/time_within_train_step": 2.75567364692688, "step": 199} {"train_info/time_between_train_steps": 0.0037119388580322266, "step": 199} {"info/global_step": 200, "train_info/time_within_train_step": 3.0286948680877686, "step": 200} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746566560, "_runtime": 569}, "step": 200} {"logs": {"train/loss": 6.6399, "train/learning_rate": 0.00011999999999999999, "train/epoch": 0.02, "_timestamp": 1746566560, "_runtime": 569}, "step": 200} {"train_info/time_between_train_steps": 52.54655408859253, "step": 200} {"info/global_step": 201, "train_info/time_within_train_step": 2.525697708129883, "step": 201} {"train_info/time_between_train_steps": 0.0037965774536132812, "step": 201} {"info/global_step": 202, "train_info/time_within_train_step": 2.563741445541382, "step": 202} {"train_info/time_between_train_steps": 0.0036470890045166016, "step": 202} {"info/global_step": 203, "train_info/time_within_train_step": 2.6810526847839355, "step": 203} {"train_info/time_between_train_steps": 0.004266977310180664, "step": 203} {"info/global_step": 204, "train_info/time_within_train_step": 2.707659959793091, "step": 204} {"train_info/time_between_train_steps": 0.003777027130126953, "step": 204} {"info/global_step": 205, "train_info/time_within_train_step": 2.693135976791382, "step": 205} {"train_info/time_between_train_steps": 0.003780841827392578, "step": 205} {"info/global_step": 206, "train_info/time_within_train_step": 2.677165985107422, "step": 206} {"train_info/time_between_train_steps": 0.0038864612579345703, "step": 206} {"info/global_step": 207, "train_info/time_within_train_step": 2.7023911476135254, "step": 207} {"train_info/time_between_train_steps": 0.003674745559692383, "step": 207} {"info/global_step": 208, "train_info/time_within_train_step": 2.7489194869995117, "step": 208} {"train_info/time_between_train_steps": 0.0038237571716308594, "step": 208} {"info/global_step": 209, "train_info/time_within_train_step": 2.753080368041992, "step": 209} {"train_info/time_between_train_steps": 0.003681659698486328, "step": 209} {"info/global_step": 210, "train_info/time_within_train_step": 2.7561025619506836, "step": 210} {"train_info/time_between_train_steps": 0.0036957263946533203, "step": 210} {"info/global_step": 211, "train_info/time_within_train_step": 2.7573184967041016, "step": 211} {"train_info/time_between_train_steps": 0.003807544708251953, "step": 211} {"info/global_step": 212, "train_info/time_within_train_step": 2.758401870727539, "step": 212} {"train_info/time_between_train_steps": 0.0037064552307128906, "step": 212} {"info/global_step": 213, "train_info/time_within_train_step": 2.7578301429748535, "step": 213} {"train_info/time_between_train_steps": 0.003537893295288086, "step": 213} {"info/global_step": 214, "train_info/time_within_train_step": 2.7569377422332764, "step": 214} {"train_info/time_between_train_steps": 0.003690481185913086, "step": 214} {"info/global_step": 215, "train_info/time_within_train_step": 2.7581074237823486, "step": 215} {"train_info/time_between_train_steps": 0.003827333450317383, "step": 215} {"info/global_step": 216, "train_info/time_within_train_step": 2.7568705081939697, "step": 216} {"train_info/time_between_train_steps": 0.003618478775024414, "step": 216} {"info/global_step": 217, "train_info/time_within_train_step": 2.756873607635498, "step": 217} {"train_info/time_between_train_steps": 0.0035347938537597656, "step": 217} {"info/global_step": 218, "train_info/time_within_train_step": 2.756398916244507, "step": 218} {"train_info/time_between_train_steps": 0.003637552261352539, "step": 218} {"info/global_step": 219, "train_info/time_within_train_step": 2.756458282470703, "step": 219} {"train_info/time_between_train_steps": 0.0034651756286621094, "step": 219} {"info/global_step": 220, "train_info/time_within_train_step": 2.756244421005249, "step": 220} {"train_info/time_between_train_steps": 0.0035614967346191406, "step": 220} {"info/global_step": 221, "train_info/time_within_train_step": 2.754997968673706, "step": 221} {"train_info/time_between_train_steps": 0.0035104751586914062, "step": 221} {"info/global_step": 222, "train_info/time_within_train_step": 2.7879750728607178, "step": 222} {"train_info/time_between_train_steps": 0.003621816635131836, "step": 222} {"info/global_step": 223, "train_info/time_within_train_step": 2.756970167160034, "step": 223} {"train_info/time_between_train_steps": 0.0035161972045898438, "step": 223} {"info/global_step": 224, "train_info/time_within_train_step": 2.7572154998779297, "step": 224} {"train_info/time_between_train_steps": 0.00341796875, "step": 224} {"info/global_step": 225, "train_info/time_within_train_step": 2.7557389736175537, "step": 225} {"train_info/time_between_train_steps": 0.0035140514373779297, "step": 225} {"info/global_step": 226, "train_info/time_within_train_step": 2.758244752883911, "step": 226} {"train_info/time_between_train_steps": 0.003704547882080078, "step": 226} {"info/global_step": 227, "train_info/time_within_train_step": 2.756768226623535, "step": 227} {"train_info/time_between_train_steps": 0.003453969955444336, "step": 227} {"info/global_step": 228, "train_info/time_within_train_step": 2.757150411605835, "step": 228} {"train_info/time_between_train_steps": 0.003493070602416992, "step": 228} {"info/global_step": 229, "train_info/time_within_train_step": 2.7566933631896973, "step": 229} {"train_info/time_between_train_steps": 0.0036554336547851562, "step": 229} {"info/global_step": 230, "train_info/time_within_train_step": 2.756890296936035, "step": 230} {"train_info/time_between_train_steps": 0.0033998489379882812, "step": 230} {"info/global_step": 231, "train_info/time_within_train_step": 2.757312297821045, "step": 231} {"train_info/time_between_train_steps": 0.003504037857055664, "step": 231} {"info/global_step": 232, "train_info/time_within_train_step": 2.7568342685699463, "step": 232} {"train_info/time_between_train_steps": 0.0036928653717041016, "step": 232} {"info/global_step": 233, "train_info/time_within_train_step": 2.757422924041748, "step": 233} {"train_info/time_between_train_steps": 0.0037162303924560547, "step": 233} {"info/global_step": 234, "train_info/time_within_train_step": 2.7582013607025146, "step": 234} {"train_info/time_between_train_steps": 0.0038022994995117188, "step": 234} {"info/global_step": 235, "train_info/time_within_train_step": 2.756315231323242, "step": 235} {"train_info/time_between_train_steps": 0.0037717819213867188, "step": 235} {"info/global_step": 236, "train_info/time_within_train_step": 2.755995035171509, "step": 236} {"train_info/time_between_train_steps": 0.0036957263946533203, "step": 236} {"info/global_step": 237, "train_info/time_within_train_step": 3.1472063064575195, "step": 237} {"train_info/time_between_train_steps": 0.0034198760986328125, "step": 237} {"info/global_step": 238, "train_info/time_within_train_step": 2.754739999771118, "step": 238} {"train_info/time_between_train_steps": 0.003347158432006836, "step": 238} {"info/global_step": 239, "train_info/time_within_train_step": 2.7562031745910645, "step": 239} {"train_info/time_between_train_steps": 0.0033931732177734375, "step": 239} {"info/global_step": 240, "train_info/time_within_train_step": 2.757312536239624, "step": 240} {"train_info/time_between_train_steps": 0.0034394264221191406, "step": 240} {"info/global_step": 241, "train_info/time_within_train_step": 2.7568461894989014, "step": 241} {"train_info/time_between_train_steps": 0.003498554229736328, "step": 241} {"info/global_step": 242, "train_info/time_within_train_step": 2.7576873302459717, "step": 242} {"train_info/time_between_train_steps": 0.0038080215454101562, "step": 242} {"info/global_step": 243, "train_info/time_within_train_step": 2.7570509910583496, "step": 243} {"train_info/time_between_train_steps": 0.004008293151855469, "step": 243} {"info/global_step": 244, "train_info/time_within_train_step": 2.7573139667510986, "step": 244} {"train_info/time_between_train_steps": 0.0035614967346191406, "step": 244} {"info/global_step": 245, "train_info/time_within_train_step": 2.756495237350464, "step": 245} {"train_info/time_between_train_steps": 0.004083871841430664, "step": 245} {"info/global_step": 246, "train_info/time_within_train_step": 2.7567005157470703, "step": 246} {"train_info/time_between_train_steps": 0.0036725997924804688, "step": 246} {"info/global_step": 247, "train_info/time_within_train_step": 2.7581427097320557, "step": 247} {"train_info/time_between_train_steps": 0.003703594207763672, "step": 247} {"info/global_step": 248, "train_info/time_within_train_step": 2.7568230628967285, "step": 248} {"train_info/time_between_train_steps": 0.003787994384765625, "step": 248} {"info/global_step": 249, "train_info/time_within_train_step": 2.7577385902404785, "step": 249} {"train_info/time_between_train_steps": 0.003740072250366211, "step": 249} {"info/global_step": 250, "train_info/time_within_train_step": 3.5089755058288574, "step": 250} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746566751, "_runtime": 760}, "step": 250} {"logs": {"train/loss": 6.3893, "train/learning_rate": 0.00015, "train/epoch": 0.03, "_timestamp": 1746566751, "_runtime": 760}, "step": 250} {"train_info/time_between_train_steps": 0.20528030395507812, "step": 250} {"info/global_step": 251, "train_info/time_within_train_step": 2.7545762062072754, "step": 251} {"train_info/time_between_train_steps": 0.006742238998413086, "step": 251} {"info/global_step": 252, "train_info/time_within_train_step": 2.7562575340270996, "step": 252} {"train_info/time_between_train_steps": 0.006528139114379883, "step": 252} {"info/global_step": 253, "train_info/time_within_train_step": 2.7562787532806396, "step": 253} {"train_info/time_between_train_steps": 0.007029533386230469, "step": 253} {"info/global_step": 254, "train_info/time_within_train_step": 2.7572176456451416, "step": 254} {"train_info/time_between_train_steps": 0.006956577301025391, "step": 254} {"info/global_step": 255, "train_info/time_within_train_step": 2.756415605545044, "step": 255} {"train_info/time_between_train_steps": 0.007088184356689453, "step": 255} {"info/global_step": 256, "train_info/time_within_train_step": 2.7589213848114014, "step": 256} {"train_info/time_between_train_steps": 0.005082130432128906, "step": 256} {"info/global_step": 257, "train_info/time_within_train_step": 2.7572720050811768, "step": 257} {"train_info/time_between_train_steps": 0.00710606575012207, "step": 257} {"info/global_step": 258, "train_info/time_within_train_step": 2.7570314407348633, "step": 258} {"train_info/time_between_train_steps": 0.006852388381958008, "step": 258} {"info/global_step": 259, "train_info/time_within_train_step": 2.7567572593688965, "step": 259} {"train_info/time_between_train_steps": 0.006905555725097656, "step": 259} {"info/global_step": 260, "train_info/time_within_train_step": 2.7575485706329346, "step": 260} {"train_info/time_between_train_steps": 0.006960153579711914, "step": 260} {"info/global_step": 261, "train_info/time_within_train_step": 2.757061004638672, "step": 261} {"train_info/time_between_train_steps": 0.0067901611328125, "step": 261} {"info/global_step": 262, "train_info/time_within_train_step": 2.756603240966797, "step": 262} {"train_info/time_between_train_steps": 0.007009029388427734, "step": 262} {"info/global_step": 263, "train_info/time_within_train_step": 2.7566213607788086, "step": 263} {"train_info/time_between_train_steps": 0.006974935531616211, "step": 263} {"info/global_step": 264, "train_info/time_within_train_step": 2.757439374923706, "step": 264} {"train_info/time_between_train_steps": 0.007044076919555664, "step": 264} {"info/global_step": 265, "train_info/time_within_train_step": 2.7857303619384766, "step": 265} {"train_info/time_between_train_steps": 0.006911277770996094, "step": 265} {"info/global_step": 266, "train_info/time_within_train_step": 2.7561607360839844, "step": 266} {"train_info/time_between_train_steps": 0.006843090057373047, "step": 266} {"info/global_step": 267, "train_info/time_within_train_step": 2.7555010318756104, "step": 267} {"train_info/time_between_train_steps": 0.006895542144775391, "step": 267} {"info/global_step": 268, "train_info/time_within_train_step": 2.7583770751953125, "step": 268} {"train_info/time_between_train_steps": 0.006910562515258789, "step": 268} {"info/global_step": 269, "train_info/time_within_train_step": 2.7569832801818848, "step": 269} {"train_info/time_between_train_steps": 0.006875514984130859, "step": 269} {"info/global_step": 270, "train_info/time_within_train_step": 2.756553888320923, "step": 270} {"train_info/time_between_train_steps": 0.003724813461303711, "step": 270} {"info/global_step": 271, "train_info/time_within_train_step": 2.757255792617798, "step": 271} {"train_info/time_between_train_steps": 0.007012367248535156, "step": 271} {"info/global_step": 272, "train_info/time_within_train_step": 2.7559192180633545, "step": 272} {"train_info/time_between_train_steps": 0.0069942474365234375, "step": 272} {"info/global_step": 273, "train_info/time_within_train_step": 2.7565855979919434, "step": 273} {"train_info/time_between_train_steps": 0.006920576095581055, "step": 273} {"info/global_step": 274, "train_info/time_within_train_step": 2.7579102516174316, "step": 274} {"train_info/time_between_train_steps": 0.00693821907043457, "step": 274} {"info/global_step": 275, "train_info/time_within_train_step": 2.7564992904663086, "step": 275} {"train_info/time_between_train_steps": 0.0035910606384277344, "step": 275} {"info/global_step": 276, "train_info/time_within_train_step": 2.7561497688293457, "step": 276} {"train_info/time_between_train_steps": 0.003679990768432617, "step": 276} {"info/global_step": 277, "train_info/time_within_train_step": 2.757500648498535, "step": 277} {"train_info/time_between_train_steps": 0.0036516189575195312, "step": 277} {"info/global_step": 278, "train_info/time_within_train_step": 2.7577099800109863, "step": 278} {"train_info/time_between_train_steps": 0.0036525726318359375, "step": 278} {"info/global_step": 279, "train_info/time_within_train_step": 2.7558062076568604, "step": 279} {"train_info/time_between_train_steps": 0.003608226776123047, "step": 279} {"info/global_step": 280, "train_info/time_within_train_step": 2.7560911178588867, "step": 280} {"train_info/time_between_train_steps": 0.003638744354248047, "step": 280} {"info/global_step": 281, "train_info/time_within_train_step": 2.7566206455230713, "step": 281} {"train_info/time_between_train_steps": 0.0036773681640625, "step": 281} {"info/global_step": 282, "train_info/time_within_train_step": 2.7571120262145996, "step": 282} {"train_info/time_between_train_steps": 0.0037016868591308594, "step": 282} {"info/global_step": 283, "train_info/time_within_train_step": 2.7567389011383057, "step": 283} {"train_info/time_between_train_steps": 0.0036656856536865234, "step": 283} {"info/global_step": 284, "train_info/time_within_train_step": 2.7573812007904053, "step": 284} {"train_info/time_between_train_steps": 0.003554105758666992, "step": 284} {"info/global_step": 285, "train_info/time_within_train_step": 2.755549430847168, "step": 285} {"train_info/time_between_train_steps": 0.0036232471466064453, "step": 285} {"info/global_step": 286, "train_info/time_within_train_step": 2.756152391433716, "step": 286} {"train_info/time_between_train_steps": 0.0069506168365478516, "step": 286} {"info/global_step": 287, "train_info/time_within_train_step": 2.752166748046875, "step": 287} {"train_info/time_between_train_steps": 0.006928920745849609, "step": 287} {"info/global_step": 288, "train_info/time_within_train_step": 2.757556438446045, "step": 288} {"train_info/time_between_train_steps": 0.006874799728393555, "step": 288} {"info/global_step": 289, "train_info/time_within_train_step": 2.7577316761016846, "step": 289} {"train_info/time_between_train_steps": 0.006996870040893555, "step": 289} {"info/global_step": 290, "train_info/time_within_train_step": 2.756605625152588, "step": 290} {"train_info/time_between_train_steps": 0.005954265594482422, "step": 290} {"info/global_step": 291, "train_info/time_within_train_step": 2.757295846939087, "step": 291} {"train_info/time_between_train_steps": 0.00680851936340332, "step": 291} {"info/global_step": 292, "train_info/time_within_train_step": 2.758507490158081, "step": 292} {"train_info/time_between_train_steps": 0.006921291351318359, "step": 292} {"info/global_step": 293, "train_info/time_within_train_step": 2.757215738296509, "step": 293} {"train_info/time_between_train_steps": 0.006845951080322266, "step": 293} {"info/global_step": 294, "train_info/time_within_train_step": 2.7577733993530273, "step": 294} {"train_info/time_between_train_steps": 0.006810665130615234, "step": 294} {"info/global_step": 295, "train_info/time_within_train_step": 2.75667667388916, "step": 295} {"train_info/time_between_train_steps": 0.006854057312011719, "step": 295} {"info/global_step": 296, "train_info/time_within_train_step": 2.7570371627807617, "step": 296} {"train_info/time_between_train_steps": 0.00501561164855957, "step": 296} {"info/global_step": 297, "train_info/time_within_train_step": 2.754927635192871, "step": 297} {"train_info/time_between_train_steps": 0.00356292724609375, "step": 297} {"info/global_step": 298, "train_info/time_within_train_step": 2.7558374404907227, "step": 298} {"train_info/time_between_train_steps": 0.005421161651611328, "step": 298} {"info/global_step": 299, "train_info/time_within_train_step": 2.7554104328155518, "step": 299} {"train_info/time_between_train_steps": 0.0036132335662841797, "step": 299} {"info/global_step": 300, "train_info/time_within_train_step": 2.756120204925537, "step": 300} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746566890, "_runtime": 899}, "step": 300} {"logs": {"train/loss": 6.2035, "train/learning_rate": 0.00017999999999999998, "train/epoch": 0.03, "_timestamp": 1746566890, "_runtime": 899}, "step": 300} {"train_info/time_between_train_steps": 0.022199630737304688, "step": 300} {"info/global_step": 301, "train_info/time_within_train_step": 2.7565927505493164, "step": 301} {"train_info/time_between_train_steps": 0.0036034584045410156, "step": 301} {"info/global_step": 302, "train_info/time_within_train_step": 2.756585121154785, "step": 302} {"train_info/time_between_train_steps": 0.0036079883575439453, "step": 302} {"info/global_step": 303, "train_info/time_within_train_step": 2.7563681602478027, "step": 303} {"train_info/time_between_train_steps": 0.006419181823730469, "step": 303} {"info/global_step": 304, "train_info/time_within_train_step": 2.7552881240844727, "step": 304} {"train_info/time_between_train_steps": 0.00351715087890625, "step": 304} {"info/global_step": 305, "train_info/time_within_train_step": 2.755901336669922, "step": 305} {"train_info/time_between_train_steps": 0.006842136383056641, "step": 305} {"info/global_step": 306, "train_info/time_within_train_step": 2.7571237087249756, "step": 306} {"train_info/time_between_train_steps": 0.0068128108978271484, "step": 306} {"info/global_step": 307, "train_info/time_within_train_step": 2.7581112384796143, "step": 307} {"train_info/time_between_train_steps": 0.0068683624267578125, "step": 307} {"info/global_step": 308, "train_info/time_within_train_step": 2.756648540496826, "step": 308} {"train_info/time_between_train_steps": 0.006805896759033203, "step": 308} {"info/global_step": 309, "train_info/time_within_train_step": 2.757107973098755, "step": 309} {"train_info/time_between_train_steps": 0.0067331790924072266, "step": 309} {"info/global_step": 310, "train_info/time_within_train_step": 2.756072759628296, "step": 310} {"train_info/time_between_train_steps": 0.006984710693359375, "step": 310} {"info/global_step": 311, "train_info/time_within_train_step": 2.7553718090057373, "step": 311} {"train_info/time_between_train_steps": 0.006834506988525391, "step": 311} {"info/global_step": 312, "train_info/time_within_train_step": 2.7557239532470703, "step": 312} {"train_info/time_between_train_steps": 0.006796836853027344, "step": 312} {"info/global_step": 313, "train_info/time_within_train_step": 2.9033803939819336, "step": 313} {"train_info/time_between_train_steps": 0.006640911102294922, "step": 313} {"info/global_step": 314, "train_info/time_within_train_step": 2.7584726810455322, "step": 314} {"train_info/time_between_train_steps": 0.006567478179931641, "step": 314} {"info/global_step": 315, "train_info/time_within_train_step": 2.755215644836426, "step": 315} {"train_info/time_between_train_steps": 0.0065457820892333984, "step": 315} {"info/global_step": 316, "train_info/time_within_train_step": 2.756795883178711, "step": 316} {"train_info/time_between_train_steps": 0.006627798080444336, "step": 316} {"info/global_step": 317, "train_info/time_within_train_step": 2.7573657035827637, "step": 317} {"train_info/time_between_train_steps": 0.006616830825805664, "step": 317} {"info/global_step": 318, "train_info/time_within_train_step": 2.756479024887085, "step": 318} {"train_info/time_between_train_steps": 0.00334930419921875, "step": 318} {"info/global_step": 319, "train_info/time_within_train_step": 2.75677227973938, "step": 319} {"train_info/time_between_train_steps": 0.0033655166625976562, "step": 319} {"info/global_step": 320, "train_info/time_within_train_step": 2.7552754878997803, "step": 320} {"train_info/time_between_train_steps": 0.003484964370727539, "step": 320} {"info/global_step": 321, "train_info/time_within_train_step": 2.7558867931365967, "step": 321} {"train_info/time_between_train_steps": 0.0034759044647216797, "step": 321} {"info/global_step": 322, "train_info/time_within_train_step": 2.7565391063690186, "step": 322} {"train_info/time_between_train_steps": 0.0036020278930664062, "step": 322} {"info/global_step": 323, "train_info/time_within_train_step": 2.757241725921631, "step": 323} {"train_info/time_between_train_steps": 0.0036339759826660156, "step": 323} {"info/global_step": 324, "train_info/time_within_train_step": 3.150437831878662, "step": 324} {"train_info/time_between_train_steps": 0.0064067840576171875, "step": 324} {"info/global_step": 325, "train_info/time_within_train_step": 2.7554028034210205, "step": 325} {"train_info/time_between_train_steps": 0.006504535675048828, "step": 325} {"info/global_step": 326, "train_info/time_within_train_step": 2.7547686100006104, "step": 326} {"train_info/time_between_train_steps": 0.004708766937255859, "step": 326} {"info/global_step": 327, "train_info/time_within_train_step": 2.7555603981018066, "step": 327} {"train_info/time_between_train_steps": 0.0066754817962646484, "step": 327} {"info/global_step": 328, "train_info/time_within_train_step": 2.755711793899536, "step": 328} {"train_info/time_between_train_steps": 0.006551980972290039, "step": 328} {"info/global_step": 329, "train_info/time_within_train_step": 2.7548060417175293, "step": 329} {"train_info/time_between_train_steps": 0.00648188591003418, "step": 329} {"info/global_step": 330, "train_info/time_within_train_step": 2.756047248840332, "step": 330} {"train_info/time_between_train_steps": 0.0065228939056396484, "step": 330} {"info/global_step": 331, "train_info/time_within_train_step": 2.7560184001922607, "step": 331} {"train_info/time_between_train_steps": 0.006574392318725586, "step": 331} {"info/global_step": 332, "train_info/time_within_train_step": 2.756572723388672, "step": 332} {"train_info/time_between_train_steps": 0.006508350372314453, "step": 332} {"info/global_step": 333, "train_info/time_within_train_step": 2.755293130874634, "step": 333} {"train_info/time_between_train_steps": 0.006468772888183594, "step": 333} {"info/global_step": 334, "train_info/time_within_train_step": 2.753873348236084, "step": 334} {"train_info/time_between_train_steps": 0.006471872329711914, "step": 334} {"info/global_step": 335, "train_info/time_within_train_step": 2.7574968338012695, "step": 335} {"train_info/time_between_train_steps": 0.0065765380859375, "step": 335} {"info/global_step": 336, "train_info/time_within_train_step": 2.7546122074127197, "step": 336} {"train_info/time_between_train_steps": 0.006492137908935547, "step": 336} {"info/global_step": 337, "train_info/time_within_train_step": 2.755208730697632, "step": 337} {"train_info/time_between_train_steps": 0.00652623176574707, "step": 337} {"info/global_step": 338, "train_info/time_within_train_step": 2.7546041011810303, "step": 338} {"train_info/time_between_train_steps": 0.006505727767944336, "step": 338} {"info/global_step": 339, "train_info/time_within_train_step": 2.7563467025756836, "step": 339} {"train_info/time_between_train_steps": 0.006718635559082031, "step": 339} {"info/global_step": 340, "train_info/time_within_train_step": 2.7538702487945557, "step": 340} {"train_info/time_between_train_steps": 0.006559848785400391, "step": 340} {"info/global_step": 341, "train_info/time_within_train_step": 2.7555902004241943, "step": 341} {"train_info/time_between_train_steps": 0.006541252136230469, "step": 341} {"info/global_step": 342, "train_info/time_within_train_step": 2.7552270889282227, "step": 342} {"train_info/time_between_train_steps": 0.00672149658203125, "step": 342} {"info/global_step": 343, "train_info/time_within_train_step": 2.7565548419952393, "step": 343} {"train_info/time_between_train_steps": 0.006523609161376953, "step": 343} {"info/global_step": 344, "train_info/time_within_train_step": 2.757408380508423, "step": 344} {"train_info/time_between_train_steps": 0.006543397903442383, "step": 344} {"info/global_step": 345, "train_info/time_within_train_step": 2.755452871322632, "step": 345} {"train_info/time_between_train_steps": 0.006528139114379883, "step": 345} {"info/global_step": 346, "train_info/time_within_train_step": 2.758849859237671, "step": 346} {"train_info/time_between_train_steps": 0.0064809322357177734, "step": 346} {"info/global_step": 347, "train_info/time_within_train_step": 2.7533059120178223, "step": 347} {"train_info/time_between_train_steps": 0.006501197814941406, "step": 347} {"info/global_step": 348, "train_info/time_within_train_step": 2.755563735961914, "step": 348} {"train_info/time_between_train_steps": 0.006432294845581055, "step": 348} {"info/global_step": 349, "train_info/time_within_train_step": 2.7548372745513916, "step": 349} {"train_info/time_between_train_steps": 0.006880760192871094, "step": 349} {"info/global_step": 350, "train_info/time_within_train_step": 2.755117654800415, "step": 350} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746567029, "_runtime": 1038}, "step": 350} {"logs": {"train/loss": 6.0459, "train/learning_rate": 0.00020999999999999998, "train/epoch": 0.04, "_timestamp": 1746567029, "_runtime": 1038}, "step": 350} {"train_info/time_between_train_steps": 0.013231515884399414, "step": 350} {"info/global_step": 351, "train_info/time_within_train_step": 2.756117105484009, "step": 351} {"train_info/time_between_train_steps": 0.006530046463012695, "step": 351} {"info/global_step": 352, "train_info/time_within_train_step": 2.7568039894104004, "step": 352} {"train_info/time_between_train_steps": 0.003318309783935547, "step": 352} {"info/global_step": 353, "train_info/time_within_train_step": 2.755018711090088, "step": 353} {"train_info/time_between_train_steps": 0.006537437438964844, "step": 353} {"info/global_step": 354, "train_info/time_within_train_step": 2.7550134658813477, "step": 354} {"train_info/time_between_train_steps": 0.0064067840576171875, "step": 354} {"info/global_step": 355, "train_info/time_within_train_step": 2.754664659500122, "step": 355} {"train_info/time_between_train_steps": 0.006532907485961914, "step": 355} {"info/global_step": 356, "train_info/time_within_train_step": 2.756146192550659, "step": 356} {"train_info/time_between_train_steps": 0.006510257720947266, "step": 356} {"info/global_step": 357, "train_info/time_within_train_step": 2.7558321952819824, "step": 357} {"train_info/time_between_train_steps": 0.006690263748168945, "step": 357} {"info/global_step": 358, "train_info/time_within_train_step": 2.756488800048828, "step": 358} {"train_info/time_between_train_steps": 0.006663322448730469, "step": 358} {"info/global_step": 359, "train_info/time_within_train_step": 2.756439685821533, "step": 359} {"train_info/time_between_train_steps": 0.0065724849700927734, "step": 359} {"info/global_step": 360, "train_info/time_within_train_step": 2.7559564113616943, "step": 360} {"train_info/time_between_train_steps": 0.006653785705566406, "step": 360} {"info/global_step": 361, "train_info/time_within_train_step": 2.7576451301574707, "step": 361} {"train_info/time_between_train_steps": 0.006600141525268555, "step": 361} {"info/global_step": 362, "train_info/time_within_train_step": 2.7550501823425293, "step": 362} {"train_info/time_between_train_steps": 0.0066165924072265625, "step": 362} {"info/global_step": 363, "train_info/time_within_train_step": 2.7566709518432617, "step": 363} {"train_info/time_between_train_steps": 0.006775617599487305, "step": 363} {"info/global_step": 364, "train_info/time_within_train_step": 2.7583274841308594, "step": 364} {"train_info/time_between_train_steps": 0.007024526596069336, "step": 364} {"info/global_step": 365, "train_info/time_within_train_step": 2.7562384605407715, "step": 365} {"train_info/time_between_train_steps": 0.0069730281829833984, "step": 365} {"info/global_step": 366, "train_info/time_within_train_step": 2.7576582431793213, "step": 366} {"train_info/time_between_train_steps": 0.006888866424560547, "step": 366} {"info/global_step": 367, "train_info/time_within_train_step": 2.7553622722625732, "step": 367} {"train_info/time_between_train_steps": 0.006903648376464844, "step": 367} {"info/global_step": 368, "train_info/time_within_train_step": 2.757862091064453, "step": 368} {"train_info/time_between_train_steps": 0.006982564926147461, "step": 368} {"info/global_step": 369, "train_info/time_within_train_step": 2.755796194076538, "step": 369} {"train_info/time_between_train_steps": 0.00690150260925293, "step": 369} {"info/global_step": 370, "train_info/time_within_train_step": 2.7550556659698486, "step": 370} {"train_info/time_between_train_steps": 0.006877422332763672, "step": 370} {"info/global_step": 371, "train_info/time_within_train_step": 2.75822114944458, "step": 371} {"train_info/time_between_train_steps": 0.006829261779785156, "step": 371} {"info/global_step": 372, "train_info/time_within_train_step": 2.756720542907715, "step": 372} {"train_info/time_between_train_steps": 0.006816864013671875, "step": 372} {"info/global_step": 373, "train_info/time_within_train_step": 2.7561278343200684, "step": 373} {"train_info/time_between_train_steps": 0.006894588470458984, "step": 373} {"info/global_step": 374, "train_info/time_within_train_step": 2.7558653354644775, "step": 374} {"train_info/time_between_train_steps": 0.006817817687988281, "step": 374} {"info/global_step": 375, "train_info/time_within_train_step": 2.757398843765259, "step": 375} {"train_info/time_between_train_steps": 0.18230772018432617, "step": 375} {"info/global_step": 376, "train_info/time_within_train_step": 2.7556633949279785, "step": 376} {"train_info/time_between_train_steps": 0.006633281707763672, "step": 376} {"info/global_step": 377, "train_info/time_within_train_step": 3.070917844772339, "step": 377} {"train_info/time_between_train_steps": 0.006314992904663086, "step": 377} {"info/global_step": 378, "train_info/time_within_train_step": 2.7551026344299316, "step": 378} {"train_info/time_between_train_steps": 0.0064029693603515625, "step": 378} {"info/global_step": 379, "train_info/time_within_train_step": 2.754091739654541, "step": 379} {"train_info/time_between_train_steps": 0.0063953399658203125, "step": 379} {"info/global_step": 380, "train_info/time_within_train_step": 2.755791425704956, "step": 380} {"train_info/time_between_train_steps": 0.0066106319427490234, "step": 380} {"info/global_step": 381, "train_info/time_within_train_step": 2.7545502185821533, "step": 381} {"train_info/time_between_train_steps": 0.006417274475097656, "step": 381} {"info/global_step": 382, "train_info/time_within_train_step": 2.754547357559204, "step": 382} {"train_info/time_between_train_steps": 0.0065212249755859375, "step": 382} {"info/global_step": 383, "train_info/time_within_train_step": 2.7535717487335205, "step": 383} {"train_info/time_between_train_steps": 0.0033159255981445312, "step": 383} {"info/global_step": 384, "train_info/time_within_train_step": 2.7543206214904785, "step": 384} {"train_info/time_between_train_steps": 0.0032875537872314453, "step": 384} {"info/global_step": 385, "train_info/time_within_train_step": 2.7534892559051514, "step": 385} {"train_info/time_between_train_steps": 0.006468057632446289, "step": 385} {"info/global_step": 386, "train_info/time_within_train_step": 2.7573788166046143, "step": 386} {"train_info/time_between_train_steps": 0.006477832794189453, "step": 386} {"info/global_step": 387, "train_info/time_within_train_step": 2.754770040512085, "step": 387} {"train_info/time_between_train_steps": 0.00647735595703125, "step": 387} {"info/global_step": 388, "train_info/time_within_train_step": 2.7557179927825928, "step": 388} {"train_info/time_between_train_steps": 0.006799459457397461, "step": 388} {"info/global_step": 389, "train_info/time_within_train_step": 2.7556991577148438, "step": 389} {"train_info/time_between_train_steps": 0.006827592849731445, "step": 389} {"info/global_step": 390, "train_info/time_within_train_step": 2.758110761642456, "step": 390} {"train_info/time_between_train_steps": 0.007002353668212891, "step": 390} {"info/global_step": 391, "train_info/time_within_train_step": 2.7558705806732178, "step": 391} {"train_info/time_between_train_steps": 0.006810188293457031, "step": 391} {"info/global_step": 392, "train_info/time_within_train_step": 2.756199359893799, "step": 392} {"train_info/time_between_train_steps": 0.006949186325073242, "step": 392} {"info/global_step": 393, "train_info/time_within_train_step": 2.756930351257324, "step": 393} {"train_info/time_between_train_steps": 0.006971836090087891, "step": 393} {"info/global_step": 394, "train_info/time_within_train_step": 2.7570905685424805, "step": 394} {"train_info/time_between_train_steps": 0.00706934928894043, "step": 394} {"info/global_step": 395, "train_info/time_within_train_step": 2.7556653022766113, "step": 395} {"train_info/time_between_train_steps": 0.006441593170166016, "step": 395} {"info/global_step": 396, "train_info/time_within_train_step": 2.755197048187256, "step": 396} {"train_info/time_between_train_steps": 0.0069468021392822266, "step": 396} {"info/global_step": 397, "train_info/time_within_train_step": 2.7558765411376953, "step": 397} {"train_info/time_between_train_steps": 0.006895780563354492, "step": 397} {"info/global_step": 398, "train_info/time_within_train_step": 2.7555105686187744, "step": 398} {"train_info/time_between_train_steps": 0.00689697265625, "step": 398} {"info/global_step": 399, "train_info/time_within_train_step": 2.755678415298462, "step": 399} {"train_info/time_between_train_steps": 0.00683140754699707, "step": 399} {"info/global_step": 400, "train_info/time_within_train_step": 2.7551722526550293, "step": 400} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746567168, "_runtime": 1177}, "step": 400} {"logs": {"train/loss": 5.9165, "train/learning_rate": 0.00023999999999999998, "train/epoch": 0.04, "_timestamp": 1746567168, "_runtime": 1177}, "step": 400} {"train_info/time_between_train_steps": 26.89666485786438, "step": 400} {"info/global_step": 401, "train_info/time_within_train_step": 2.5381059646606445, "step": 401} {"train_info/time_between_train_steps": 0.006943702697753906, "step": 401} {"info/global_step": 402, "train_info/time_within_train_step": 2.580063819885254, "step": 402} {"train_info/time_between_train_steps": 0.003640890121459961, "step": 402} {"info/global_step": 403, "train_info/time_within_train_step": 2.717163562774658, "step": 403} {"train_info/time_between_train_steps": 0.003733396530151367, "step": 403} {"info/global_step": 404, "train_info/time_within_train_step": 2.7447245121002197, "step": 404} {"train_info/time_between_train_steps": 0.004073381423950195, "step": 404} {"info/global_step": 405, "train_info/time_within_train_step": 2.7544376850128174, "step": 405} {"train_info/time_between_train_steps": 0.003623485565185547, "step": 405} {"info/global_step": 406, "train_info/time_within_train_step": 2.7559919357299805, "step": 406} {"train_info/time_between_train_steps": 0.003489255905151367, "step": 406} {"info/global_step": 407, "train_info/time_within_train_step": 2.7555902004241943, "step": 407} {"train_info/time_between_train_steps": 0.003620147705078125, "step": 407} {"info/global_step": 408, "train_info/time_within_train_step": 2.7572712898254395, "step": 408} {"train_info/time_between_train_steps": 0.0035638809204101562, "step": 408} {"info/global_step": 409, "train_info/time_within_train_step": 2.7568440437316895, "step": 409} {"train_info/time_between_train_steps": 0.003648519515991211, "step": 409} {"info/global_step": 410, "train_info/time_within_train_step": 2.756610631942749, "step": 410} {"train_info/time_between_train_steps": 0.003597259521484375, "step": 410} {"info/global_step": 411, "train_info/time_within_train_step": 2.7562923431396484, "step": 411} {"train_info/time_between_train_steps": 0.0036056041717529297, "step": 411} {"info/global_step": 412, "train_info/time_within_train_step": 2.756925106048584, "step": 412} {"train_info/time_between_train_steps": 0.003589153289794922, "step": 412} {"info/global_step": 413, "train_info/time_within_train_step": 2.7543833255767822, "step": 413} {"train_info/time_between_train_steps": 0.0035915374755859375, "step": 413} {"info/global_step": 414, "train_info/time_within_train_step": 2.756105422973633, "step": 414} {"train_info/time_between_train_steps": 0.0035293102264404297, "step": 414} {"info/global_step": 415, "train_info/time_within_train_step": 2.755723476409912, "step": 415} {"train_info/time_between_train_steps": 0.0035376548767089844, "step": 415} {"info/global_step": 416, "train_info/time_within_train_step": 2.7558062076568604, "step": 416} {"train_info/time_between_train_steps": 0.003507852554321289, "step": 416} {"info/global_step": 417, "train_info/time_within_train_step": 2.7563915252685547, "step": 417} {"train_info/time_between_train_steps": 0.0035278797149658203, "step": 417} {"info/global_step": 418, "train_info/time_within_train_step": 2.7565460205078125, "step": 418} {"train_info/time_between_train_steps": 0.0035195350646972656, "step": 418} {"info/global_step": 419, "train_info/time_within_train_step": 2.756296157836914, "step": 419} {"train_info/time_between_train_steps": 0.0034601688385009766, "step": 419} {"info/global_step": 420, "train_info/time_within_train_step": 2.7549991607666016, "step": 420} {"train_info/time_between_train_steps": 0.0035271644592285156, "step": 420} {"info/global_step": 421, "train_info/time_within_train_step": 2.7554569244384766, "step": 421} {"train_info/time_between_train_steps": 0.0035042762756347656, "step": 421} {"info/global_step": 422, "train_info/time_within_train_step": 2.756035327911377, "step": 422} {"train_info/time_between_train_steps": 0.0035250186920166016, "step": 422} {"info/global_step": 423, "train_info/time_within_train_step": 2.7559969425201416, "step": 423} {"train_info/time_between_train_steps": 0.0034639835357666016, "step": 423} {"info/global_step": 424, "train_info/time_within_train_step": 2.7567074298858643, "step": 424} {"train_info/time_between_train_steps": 0.006833076477050781, "step": 424} {"info/global_step": 425, "train_info/time_within_train_step": 2.755713939666748, "step": 425} {"train_info/time_between_train_steps": 0.006861209869384766, "step": 425} {"info/global_step": 426, "train_info/time_within_train_step": 2.7552742958068848, "step": 426} {"train_info/time_between_train_steps": 0.0034723281860351562, "step": 426} {"info/global_step": 427, "train_info/time_within_train_step": 2.756054401397705, "step": 427} {"train_info/time_between_train_steps": 0.003451108932495117, "step": 427} {"info/global_step": 428, "train_info/time_within_train_step": 2.75630784034729, "step": 428} {"train_info/time_between_train_steps": 0.003527402877807617, "step": 428} {"info/global_step": 429, "train_info/time_within_train_step": 2.755251169204712, "step": 429} {"train_info/time_between_train_steps": 0.003481626510620117, "step": 429} {"info/global_step": 430, "train_info/time_within_train_step": 2.754946708679199, "step": 430} {"train_info/time_between_train_steps": 0.003531217575073242, "step": 430} {"info/global_step": 431, "train_info/time_within_train_step": 2.756577968597412, "step": 431} {"train_info/time_between_train_steps": 0.0035953521728515625, "step": 431} {"info/global_step": 432, "train_info/time_within_train_step": 2.756622791290283, "step": 432} {"train_info/time_between_train_steps": 0.0035505294799804688, "step": 432} {"info/global_step": 433, "train_info/time_within_train_step": 2.7550485134124756, "step": 433} {"train_info/time_between_train_steps": 0.003500223159790039, "step": 433} {"info/global_step": 434, "train_info/time_within_train_step": 3.0964107513427734, "step": 434} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 434} {"info/global_step": 435, "train_info/time_within_train_step": 2.754720687866211, "step": 435} {"train_info/time_between_train_steps": 0.0032896995544433594, "step": 435} {"info/global_step": 436, "train_info/time_within_train_step": 2.755697250366211, "step": 436} {"train_info/time_between_train_steps": 0.0032973289489746094, "step": 436} {"info/global_step": 437, "train_info/time_within_train_step": 2.7548723220825195, "step": 437} {"train_info/time_between_train_steps": 0.003295421600341797, "step": 437} {"info/global_step": 438, "train_info/time_within_train_step": 2.8980624675750732, "step": 438} {"train_info/time_between_train_steps": 0.0032453536987304688, "step": 438} {"info/global_step": 439, "train_info/time_within_train_step": 2.754754066467285, "step": 439} {"train_info/time_between_train_steps": 0.003706216812133789, "step": 439} {"info/global_step": 440, "train_info/time_within_train_step": 2.7558271884918213, "step": 440} {"train_info/time_between_train_steps": 0.0032918453216552734, "step": 440} {"info/global_step": 441, "train_info/time_within_train_step": 2.755056142807007, "step": 441} {"train_info/time_between_train_steps": 0.0032758712768554688, "step": 441} {"info/global_step": 442, "train_info/time_within_train_step": 2.7544634342193604, "step": 442} {"train_info/time_between_train_steps": 0.0032796859741210938, "step": 442} {"info/global_step": 443, "train_info/time_within_train_step": 2.754471778869629, "step": 443} {"train_info/time_between_train_steps": 0.003306150436401367, "step": 443} {"info/global_step": 444, "train_info/time_within_train_step": 2.7551815509796143, "step": 444} {"train_info/time_between_train_steps": 0.003304719924926758, "step": 444} {"info/global_step": 445, "train_info/time_within_train_step": 2.755068778991699, "step": 445} {"train_info/time_between_train_steps": 0.0032694339752197266, "step": 445} {"info/global_step": 446, "train_info/time_within_train_step": 2.755089282989502, "step": 446} {"train_info/time_between_train_steps": 0.003264904022216797, "step": 446} {"info/global_step": 447, "train_info/time_within_train_step": 2.75523042678833, "step": 447} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 447} {"info/global_step": 448, "train_info/time_within_train_step": 2.7552871704101562, "step": 448} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 448} {"info/global_step": 449, "train_info/time_within_train_step": 2.755725622177124, "step": 449} {"train_info/time_between_train_steps": 0.0032062530517578125, "step": 449} {"info/global_step": 450, "train_info/time_within_train_step": 2.7559735774993896, "step": 450} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746567333, "_runtime": 1342}, "step": 450} {"logs": {"train/loss": 5.8008, "train/learning_rate": 0.00027, "train/epoch": 0.04, "_timestamp": 1746567333, "_runtime": 1342}, "step": 450} {"train_info/time_between_train_steps": 0.013142824172973633, "step": 450} {"info/global_step": 451, "train_info/time_within_train_step": 2.754199504852295, "step": 451} {"train_info/time_between_train_steps": 0.0031728744506835938, "step": 451} {"info/global_step": 452, "train_info/time_within_train_step": 2.753736972808838, "step": 452} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 452} {"info/global_step": 453, "train_info/time_within_train_step": 2.7558133602142334, "step": 453} {"train_info/time_between_train_steps": 0.0032405853271484375, "step": 453} {"info/global_step": 454, "train_info/time_within_train_step": 2.753986120223999, "step": 454} {"train_info/time_between_train_steps": 0.0032694339752197266, "step": 454} {"info/global_step": 455, "train_info/time_within_train_step": 2.7551400661468506, "step": 455} {"train_info/time_between_train_steps": 0.003477334976196289, "step": 455} {"info/global_step": 456, "train_info/time_within_train_step": 2.7545166015625, "step": 456} {"train_info/time_between_train_steps": 0.003538846969604492, "step": 456} {"info/global_step": 457, "train_info/time_within_train_step": 2.754082441329956, "step": 457} {"train_info/time_between_train_steps": 0.0034685134887695312, "step": 457} {"info/global_step": 458, "train_info/time_within_train_step": 2.756470203399658, "step": 458} {"train_info/time_between_train_steps": 0.0036118030548095703, "step": 458} {"info/global_step": 459, "train_info/time_within_train_step": 2.755276679992676, "step": 459} {"train_info/time_between_train_steps": 0.0035991668701171875, "step": 459} {"info/global_step": 460, "train_info/time_within_train_step": 2.7552852630615234, "step": 460} {"train_info/time_between_train_steps": 0.00354766845703125, "step": 460} {"info/global_step": 461, "train_info/time_within_train_step": 2.7561495304107666, "step": 461} {"train_info/time_between_train_steps": 0.0035657882690429688, "step": 461} {"info/global_step": 462, "train_info/time_within_train_step": 2.7578072547912598, "step": 462} {"train_info/time_between_train_steps": 0.0037038326263427734, "step": 462} {"info/global_step": 463, "train_info/time_within_train_step": 2.756706476211548, "step": 463} {"train_info/time_between_train_steps": 0.0034952163696289062, "step": 463} {"info/global_step": 464, "train_info/time_within_train_step": 2.7562665939331055, "step": 464} {"train_info/time_between_train_steps": 0.0035576820373535156, "step": 464} {"info/global_step": 465, "train_info/time_within_train_step": 2.754955530166626, "step": 465} {"train_info/time_between_train_steps": 0.003480672836303711, "step": 465} {"info/global_step": 466, "train_info/time_within_train_step": 2.7545883655548096, "step": 466} {"train_info/time_between_train_steps": 0.003631591796875, "step": 466} {"info/global_step": 467, "train_info/time_within_train_step": 2.7538373470306396, "step": 467} {"train_info/time_between_train_steps": 0.0035696029663085938, "step": 467} {"info/global_step": 468, "train_info/time_within_train_step": 2.7559683322906494, "step": 468} {"train_info/time_between_train_steps": 0.0035207271575927734, "step": 468} {"info/global_step": 469, "train_info/time_within_train_step": 2.755034923553467, "step": 469} {"train_info/time_between_train_steps": 0.0035524368286132812, "step": 469} {"info/global_step": 470, "train_info/time_within_train_step": 2.7548131942749023, "step": 470} {"train_info/time_between_train_steps": 0.0035276412963867188, "step": 470} {"info/global_step": 471, "train_info/time_within_train_step": 2.755490779876709, "step": 471} {"train_info/time_between_train_steps": 0.0034961700439453125, "step": 471} {"info/global_step": 472, "train_info/time_within_train_step": 2.756089925765991, "step": 472} {"train_info/time_between_train_steps": 0.003537416458129883, "step": 472} {"info/global_step": 473, "train_info/time_within_train_step": 2.7561967372894287, "step": 473} {"train_info/time_between_train_steps": 0.0035245418548583984, "step": 473} {"info/global_step": 474, "train_info/time_within_train_step": 2.755155324935913, "step": 474} {"train_info/time_between_train_steps": 0.003576993942260742, "step": 474} {"info/global_step": 475, "train_info/time_within_train_step": 2.755096912384033, "step": 475} {"train_info/time_between_train_steps": 0.003576517105102539, "step": 475} {"info/global_step": 476, "train_info/time_within_train_step": 2.755613327026367, "step": 476} {"train_info/time_between_train_steps": 0.0035212039947509766, "step": 476} {"info/global_step": 477, "train_info/time_within_train_step": 2.75691819190979, "step": 477} {"train_info/time_between_train_steps": 0.003530263900756836, "step": 477} {"info/global_step": 478, "train_info/time_within_train_step": 2.756580352783203, "step": 478} {"train_info/time_between_train_steps": 0.003600597381591797, "step": 478} {"info/global_step": 479, "train_info/time_within_train_step": 2.755474328994751, "step": 479} {"train_info/time_between_train_steps": 0.003481626510620117, "step": 479} {"info/global_step": 480, "train_info/time_within_train_step": 2.7549240589141846, "step": 480} {"train_info/time_between_train_steps": 0.0035393238067626953, "step": 480} {"info/global_step": 481, "train_info/time_within_train_step": 2.755810022354126, "step": 481} {"train_info/time_between_train_steps": 0.0036478042602539062, "step": 481} {"info/global_step": 482, "train_info/time_within_train_step": 2.75469708442688, "step": 482} {"train_info/time_between_train_steps": 0.003537416458129883, "step": 482} {"info/global_step": 483, "train_info/time_within_train_step": 2.754783868789673, "step": 483} {"train_info/time_between_train_steps": 0.0035169124603271484, "step": 483} {"info/global_step": 484, "train_info/time_within_train_step": 2.7553510665893555, "step": 484} {"train_info/time_between_train_steps": 0.003674745559692383, "step": 484} {"info/global_step": 485, "train_info/time_within_train_step": 2.7542197704315186, "step": 485} {"train_info/time_between_train_steps": 0.003614187240600586, "step": 485} {"info/global_step": 486, "train_info/time_within_train_step": 2.755560874938965, "step": 486} {"train_info/time_between_train_steps": 0.003493070602416992, "step": 486} {"info/global_step": 487, "train_info/time_within_train_step": 3.0851757526397705, "step": 487} {"train_info/time_between_train_steps": 0.003321409225463867, "step": 487} {"info/global_step": 488, "train_info/time_within_train_step": 2.7558014392852783, "step": 488} {"train_info/time_between_train_steps": 0.0032129287719726562, "step": 488} {"info/global_step": 489, "train_info/time_within_train_step": 2.754556655883789, "step": 489} {"train_info/time_between_train_steps": 0.003264188766479492, "step": 489} {"info/global_step": 490, "train_info/time_within_train_step": 2.754652500152588, "step": 490} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 490} {"info/global_step": 491, "train_info/time_within_train_step": 2.754805088043213, "step": 491} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 491} {"info/global_step": 492, "train_info/time_within_train_step": 2.753934383392334, "step": 492} {"train_info/time_between_train_steps": 0.003250598907470703, "step": 492} {"info/global_step": 493, "train_info/time_within_train_step": 2.754725933074951, "step": 493} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 493} {"info/global_step": 494, "train_info/time_within_train_step": 2.7547807693481445, "step": 494} {"train_info/time_between_train_steps": 0.0032126903533935547, "step": 494} {"info/global_step": 495, "train_info/time_within_train_step": 2.7546355724334717, "step": 495} {"train_info/time_between_train_steps": 0.0035245418548583984, "step": 495} {"info/global_step": 496, "train_info/time_within_train_step": 2.7548575401306152, "step": 496} {"train_info/time_between_train_steps": 0.0032317638397216797, "step": 496} {"info/global_step": 497, "train_info/time_within_train_step": 2.753934144973755, "step": 497} {"train_info/time_between_train_steps": 0.0032470226287841797, "step": 497} {"info/global_step": 498, "train_info/time_within_train_step": 2.754208564758301, "step": 498} {"train_info/time_between_train_steps": 0.0032176971435546875, "step": 498} {"info/global_step": 499, "train_info/time_within_train_step": 2.754908323287964, "step": 499} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 499} {"info/global_step": 500, "train_info/time_within_train_step": 3.2689990997314453, "step": 500} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746567473, "_runtime": 1482}, "step": 500} {"logs": {"train/loss": 5.722, "train/learning_rate": 0.0003, "train/epoch": 0.05, "_timestamp": 1746567473, "_runtime": 1482}, "step": 500} {"train_info/time_between_train_steps": 0.10655021667480469, "step": 500} {"info/global_step": 501, "train_info/time_within_train_step": 2.751579523086548, "step": 501} {"train_info/time_between_train_steps": 0.003196239471435547, "step": 501} {"info/global_step": 502, "train_info/time_within_train_step": 2.753319263458252, "step": 502} {"train_info/time_between_train_steps": 0.0032262802124023438, "step": 502} {"info/global_step": 503, "train_info/time_within_train_step": 2.755645513534546, "step": 503} {"train_info/time_between_train_steps": 0.0031659603118896484, "step": 503} {"info/global_step": 504, "train_info/time_within_train_step": 2.75388240814209, "step": 504} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 504} {"info/global_step": 505, "train_info/time_within_train_step": 2.7538902759552, "step": 505} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 505} {"info/global_step": 506, "train_info/time_within_train_step": 2.754459857940674, "step": 506} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 506} {"info/global_step": 507, "train_info/time_within_train_step": 2.753838300704956, "step": 507} {"train_info/time_between_train_steps": 0.0032105445861816406, "step": 507} {"info/global_step": 508, "train_info/time_within_train_step": 2.7535548210144043, "step": 508} {"train_info/time_between_train_steps": 0.003195524215698242, "step": 508} {"info/global_step": 509, "train_info/time_within_train_step": 2.754814863204956, "step": 509} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 509} {"info/global_step": 510, "train_info/time_within_train_step": 2.7536351680755615, "step": 510} {"train_info/time_between_train_steps": 0.0031702518463134766, "step": 510} {"info/global_step": 511, "train_info/time_within_train_step": 2.753450393676758, "step": 511} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 511} {"info/global_step": 512, "train_info/time_within_train_step": 2.754305601119995, "step": 512} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 512} {"info/global_step": 513, "train_info/time_within_train_step": 2.7548584938049316, "step": 513} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 513} {"info/global_step": 514, "train_info/time_within_train_step": 2.7546331882476807, "step": 514} {"train_info/time_between_train_steps": 0.003195524215698242, "step": 514} {"info/global_step": 515, "train_info/time_within_train_step": 2.755434274673462, "step": 515} {"train_info/time_between_train_steps": 0.003242969512939453, "step": 515} {"info/global_step": 516, "train_info/time_within_train_step": 2.7549455165863037, "step": 516} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 516} {"info/global_step": 517, "train_info/time_within_train_step": 2.7554867267608643, "step": 517} {"train_info/time_between_train_steps": 0.003328561782836914, "step": 517} {"info/global_step": 518, "train_info/time_within_train_step": 2.752960205078125, "step": 518} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 518} {"info/global_step": 519, "train_info/time_within_train_step": 2.7537834644317627, "step": 519} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 519} {"info/global_step": 520, "train_info/time_within_train_step": 2.755308151245117, "step": 520} {"train_info/time_between_train_steps": 0.003226757049560547, "step": 520} {"info/global_step": 521, "train_info/time_within_train_step": 2.7557930946350098, "step": 521} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 521} {"info/global_step": 522, "train_info/time_within_train_step": 2.753434658050537, "step": 522} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 522} {"info/global_step": 523, "train_info/time_within_train_step": 2.7542672157287598, "step": 523} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 523} {"info/global_step": 524, "train_info/time_within_train_step": 2.7551071643829346, "step": 524} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 524} {"info/global_step": 525, "train_info/time_within_train_step": 2.984112024307251, "step": 525} {"train_info/time_between_train_steps": 0.003184795379638672, "step": 525} {"info/global_step": 526, "train_info/time_within_train_step": 2.7540454864501953, "step": 526} {"train_info/time_between_train_steps": 0.0032012462615966797, "step": 526} {"info/global_step": 527, "train_info/time_within_train_step": 2.754345655441284, "step": 527} {"train_info/time_between_train_steps": 0.0031807422637939453, "step": 527} {"info/global_step": 528, "train_info/time_within_train_step": 2.7540111541748047, "step": 528} {"train_info/time_between_train_steps": 0.003274679183959961, "step": 528} {"info/global_step": 529, "train_info/time_within_train_step": 2.754143476486206, "step": 529} {"train_info/time_between_train_steps": 0.0032088756561279297, "step": 529} {"info/global_step": 530, "train_info/time_within_train_step": 2.7539267539978027, "step": 530} {"train_info/time_between_train_steps": 0.0031676292419433594, "step": 530} {"info/global_step": 531, "train_info/time_within_train_step": 2.754754066467285, "step": 531} {"train_info/time_between_train_steps": 0.0032567977905273438, "step": 531} {"info/global_step": 532, "train_info/time_within_train_step": 2.7528669834136963, "step": 532} {"train_info/time_between_train_steps": 0.003190755844116211, "step": 532} {"info/global_step": 533, "train_info/time_within_train_step": 2.7528021335601807, "step": 533} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 533} {"info/global_step": 534, "train_info/time_within_train_step": 2.7540745735168457, "step": 534} {"train_info/time_between_train_steps": 0.0032324790954589844, "step": 534} {"info/global_step": 535, "train_info/time_within_train_step": 2.753507614135742, "step": 535} {"train_info/time_between_train_steps": 0.003181934356689453, "step": 535} {"info/global_step": 536, "train_info/time_within_train_step": 2.753842830657959, "step": 536} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 536} {"info/global_step": 537, "train_info/time_within_train_step": 2.753586530685425, "step": 537} {"train_info/time_between_train_steps": 0.0032052993774414062, "step": 537} {"info/global_step": 538, "train_info/time_within_train_step": 2.754318952560425, "step": 538} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 538} {"info/global_step": 539, "train_info/time_within_train_step": 2.753549575805664, "step": 539} {"train_info/time_between_train_steps": 0.003245115280151367, "step": 539} {"info/global_step": 540, "train_info/time_within_train_step": 2.754173994064331, "step": 540} {"train_info/time_between_train_steps": 0.003200054168701172, "step": 540} {"info/global_step": 541, "train_info/time_within_train_step": 2.75464129447937, "step": 541} {"train_info/time_between_train_steps": 0.018674612045288086, "step": 541} {"info/global_step": 542, "train_info/time_within_train_step": 2.7551157474517822, "step": 542} {"train_info/time_between_train_steps": 0.002907276153564453, "step": 542} {"info/global_step": 543, "train_info/time_within_train_step": 2.7537200450897217, "step": 543} {"train_info/time_between_train_steps": 0.0029036998748779297, "step": 543} {"info/global_step": 544, "train_info/time_within_train_step": 2.7535107135772705, "step": 544} {"train_info/time_between_train_steps": 0.002874612808227539, "step": 544} {"info/global_step": 545, "train_info/time_within_train_step": 2.753779649734497, "step": 545} {"train_info/time_between_train_steps": 0.0028858184814453125, "step": 545} {"info/global_step": 546, "train_info/time_within_train_step": 2.753331184387207, "step": 546} {"train_info/time_between_train_steps": 0.00287628173828125, "step": 546} {"info/global_step": 547, "train_info/time_within_train_step": 2.7535784244537354, "step": 547} {"train_info/time_between_train_steps": 0.0028743743896484375, "step": 547} {"info/global_step": 548, "train_info/time_within_train_step": 2.7531180381774902, "step": 548} {"train_info/time_between_train_steps": 0.002879619598388672, "step": 548} {"info/global_step": 549, "train_info/time_within_train_step": 2.7535276412963867, "step": 549} {"train_info/time_between_train_steps": 0.0028734207153320312, "step": 549} {"info/global_step": 550, "train_info/time_within_train_step": 2.7533035278320312, "step": 550} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746567611, "_runtime": 1620}, "step": 550} {"logs": {"train/loss": 5.6412, "train/learning_rate": 0.00033, "train/epoch": 0.06, "_timestamp": 1746567611, "_runtime": 1620}, "step": 550} {"train_info/time_between_train_steps": 0.0071163177490234375, "step": 550} {"info/global_step": 551, "train_info/time_within_train_step": 2.7533187866210938, "step": 551} {"train_info/time_between_train_steps": 0.0028831958770751953, "step": 551} {"info/global_step": 552, "train_info/time_within_train_step": 2.753539562225342, "step": 552} {"train_info/time_between_train_steps": 0.0028760433197021484, "step": 552} {"info/global_step": 553, "train_info/time_within_train_step": 2.7517507076263428, "step": 553} {"train_info/time_between_train_steps": 0.0028731822967529297, "step": 553} {"info/global_step": 554, "train_info/time_within_train_step": 2.7526705265045166, "step": 554} {"train_info/time_between_train_steps": 0.002961397171020508, "step": 554} {"info/global_step": 555, "train_info/time_within_train_step": 2.7527763843536377, "step": 555} {"train_info/time_between_train_steps": 0.002871990203857422, "step": 555} {"info/global_step": 556, "train_info/time_within_train_step": 2.752562999725342, "step": 556} {"train_info/time_between_train_steps": 0.0028657913208007812, "step": 556} {"info/global_step": 557, "train_info/time_within_train_step": 2.752898931503296, "step": 557} {"train_info/time_between_train_steps": 0.0028884410858154297, "step": 557} {"info/global_step": 558, "train_info/time_within_train_step": 2.7529287338256836, "step": 558} {"train_info/time_between_train_steps": 0.0028955936431884766, "step": 558} {"info/global_step": 559, "train_info/time_within_train_step": 2.753394603729248, "step": 559} {"train_info/time_between_train_steps": 0.0029337406158447266, "step": 559} {"info/global_step": 560, "train_info/time_within_train_step": 2.7537574768066406, "step": 560} {"train_info/time_between_train_steps": 0.002909421920776367, "step": 560} {"info/global_step": 561, "train_info/time_within_train_step": 2.751965045928955, "step": 561} {"train_info/time_between_train_steps": 0.0029211044311523438, "step": 561} {"info/global_step": 562, "train_info/time_within_train_step": 2.7534451484680176, "step": 562} {"train_info/time_between_train_steps": 0.0028772354125976562, "step": 562} {"info/global_step": 563, "train_info/time_within_train_step": 2.7528321743011475, "step": 563} {"train_info/time_between_train_steps": 0.002877473831176758, "step": 563} {"info/global_step": 564, "train_info/time_within_train_step": 2.7528023719787598, "step": 564} {"train_info/time_between_train_steps": 0.002903461456298828, "step": 564} {"info/global_step": 565, "train_info/time_within_train_step": 2.752861261367798, "step": 565} {"train_info/time_between_train_steps": 0.002934694290161133, "step": 565} {"info/global_step": 566, "train_info/time_within_train_step": 2.7528610229492188, "step": 566} {"train_info/time_between_train_steps": 0.002911090850830078, "step": 566} {"info/global_step": 567, "train_info/time_within_train_step": 2.75248384475708, "step": 567} {"train_info/time_between_train_steps": 0.0029392242431640625, "step": 567} {"info/global_step": 568, "train_info/time_within_train_step": 2.7526285648345947, "step": 568} {"train_info/time_between_train_steps": 0.0029973983764648438, "step": 568} {"info/global_step": 569, "train_info/time_within_train_step": 2.7527835369110107, "step": 569} {"train_info/time_between_train_steps": 0.003055095672607422, "step": 569} {"info/global_step": 570, "train_info/time_within_train_step": 2.75150465965271, "step": 570} {"train_info/time_between_train_steps": 0.0029265880584716797, "step": 570} {"info/global_step": 571, "train_info/time_within_train_step": 2.7531981468200684, "step": 571} {"train_info/time_between_train_steps": 0.002981901168823242, "step": 571} {"info/global_step": 572, "train_info/time_within_train_step": 2.7519471645355225, "step": 572} {"train_info/time_between_train_steps": 0.0030105113983154297, "step": 572} {"info/global_step": 573, "train_info/time_within_train_step": 2.7538633346557617, "step": 573} {"train_info/time_between_train_steps": 0.002988576889038086, "step": 573} {"info/global_step": 574, "train_info/time_within_train_step": 2.754026412963867, "step": 574} {"train_info/time_between_train_steps": 0.002912759780883789, "step": 574} {"info/global_step": 575, "train_info/time_within_train_step": 2.7519407272338867, "step": 575} {"train_info/time_between_train_steps": 0.002899169921875, "step": 575} {"info/global_step": 576, "train_info/time_within_train_step": 2.754154920578003, "step": 576} {"train_info/time_between_train_steps": 0.0029087066650390625, "step": 576} {"info/global_step": 577, "train_info/time_within_train_step": 2.755023717880249, "step": 577} {"train_info/time_between_train_steps": 0.002888917922973633, "step": 577} {"info/global_step": 578, "train_info/time_within_train_step": 2.753976821899414, "step": 578} {"train_info/time_between_train_steps": 0.002875804901123047, "step": 578} {"info/global_step": 579, "train_info/time_within_train_step": 2.7536697387695312, "step": 579} {"train_info/time_between_train_steps": 0.0029058456420898438, "step": 579} {"info/global_step": 580, "train_info/time_within_train_step": 2.7538270950317383, "step": 580} {"train_info/time_between_train_steps": 0.002935647964477539, "step": 580} {"info/global_step": 581, "train_info/time_within_train_step": 2.7523484230041504, "step": 581} {"train_info/time_between_train_steps": 0.0028667449951171875, "step": 581} {"info/global_step": 582, "train_info/time_within_train_step": 2.7528579235076904, "step": 582} {"train_info/time_between_train_steps": 0.0028858184814453125, "step": 582} {"info/global_step": 583, "train_info/time_within_train_step": 2.751774549484253, "step": 583} {"train_info/time_between_train_steps": 0.0029211044311523438, "step": 583} {"info/global_step": 584, "train_info/time_within_train_step": 2.7521347999572754, "step": 584} {"train_info/time_between_train_steps": 0.002870798110961914, "step": 584} {"info/global_step": 585, "train_info/time_within_train_step": 2.752129316329956, "step": 585} {"train_info/time_between_train_steps": 0.0028657913208007812, "step": 585} {"info/global_step": 586, "train_info/time_within_train_step": 2.752241849899292, "step": 586} {"train_info/time_between_train_steps": 0.0029010772705078125, "step": 586} {"info/global_step": 587, "train_info/time_within_train_step": 2.7533648014068604, "step": 587} {"train_info/time_between_train_steps": 0.0028798580169677734, "step": 587} {"info/global_step": 588, "train_info/time_within_train_step": 2.7543907165527344, "step": 588} {"train_info/time_between_train_steps": 0.0029511451721191406, "step": 588} {"info/global_step": 589, "train_info/time_within_train_step": 2.7535152435302734, "step": 589} {"train_info/time_between_train_steps": 0.002949953079223633, "step": 589} {"info/global_step": 590, "train_info/time_within_train_step": 2.7541708946228027, "step": 590} {"train_info/time_between_train_steps": 0.0029404163360595703, "step": 590} {"info/global_step": 591, "train_info/time_within_train_step": 2.7527894973754883, "step": 591} {"train_info/time_between_train_steps": 0.0030434131622314453, "step": 591} {"info/global_step": 592, "train_info/time_within_train_step": 2.7552437782287598, "step": 592} {"train_info/time_between_train_steps": 0.0029850006103515625, "step": 592} {"info/global_step": 593, "train_info/time_within_train_step": 2.7545535564422607, "step": 593} {"train_info/time_between_train_steps": 0.002891063690185547, "step": 593} {"info/global_step": 594, "train_info/time_within_train_step": 2.754875659942627, "step": 594} {"train_info/time_between_train_steps": 0.0029408931732177734, "step": 594} {"info/global_step": 595, "train_info/time_within_train_step": 2.7544288635253906, "step": 595} {"train_info/time_between_train_steps": 0.0029897689819335938, "step": 595} {"info/global_step": 596, "train_info/time_within_train_step": 2.75349760055542, "step": 596} {"train_info/time_between_train_steps": 0.0029075145721435547, "step": 596} {"info/global_step": 597, "train_info/time_within_train_step": 2.7535312175750732, "step": 597} {"train_info/time_between_train_steps": 0.003022909164428711, "step": 597} {"info/global_step": 598, "train_info/time_within_train_step": 2.753056526184082, "step": 598} {"train_info/time_between_train_steps": 0.0029621124267578125, "step": 598} {"info/global_step": 599, "train_info/time_within_train_step": 2.7539920806884766, "step": 599} {"train_info/time_between_train_steps": 0.002892732620239258, "step": 599} {"info/global_step": 600, "train_info/time_within_train_step": 2.7529144287109375, "step": 600} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746567750, "_runtime": 1759}, "step": 600} {"logs": {"train/loss": 5.5771, "train/learning_rate": 0.00035999999999999997, "train/epoch": 0.06, "_timestamp": 1746567750, "_runtime": 1759}, "step": 600} {"train_info/time_between_train_steps": 26.589051246643066, "step": 600} {"info/global_step": 601, "train_info/time_within_train_step": 2.5370187759399414, "step": 601} {"train_info/time_between_train_steps": 0.0029757022857666016, "step": 601} {"info/global_step": 602, "train_info/time_within_train_step": 2.587589740753174, "step": 602} {"train_info/time_between_train_steps": 0.002960681915283203, "step": 602} {"info/global_step": 603, "train_info/time_within_train_step": 2.7150344848632812, "step": 603} {"train_info/time_between_train_steps": 0.0029747486114501953, "step": 603} {"info/global_step": 604, "train_info/time_within_train_step": 2.7224550247192383, "step": 604} {"train_info/time_between_train_steps": 0.0030999183654785156, "step": 604} {"info/global_step": 605, "train_info/time_within_train_step": 2.7407422065734863, "step": 605} {"train_info/time_between_train_steps": 0.0029752254486083984, "step": 605} {"info/global_step": 606, "train_info/time_within_train_step": 2.7531442642211914, "step": 606} {"train_info/time_between_train_steps": 0.0029075145721435547, "step": 606} {"info/global_step": 607, "train_info/time_within_train_step": 2.7536330223083496, "step": 607} {"train_info/time_between_train_steps": 0.0028777122497558594, "step": 607} {"info/global_step": 608, "train_info/time_within_train_step": 2.755295753479004, "step": 608} {"train_info/time_between_train_steps": 0.0029973983764648438, "step": 608} {"info/global_step": 609, "train_info/time_within_train_step": 2.7583460807800293, "step": 609} {"train_info/time_between_train_steps": 0.003025531768798828, "step": 609} {"info/global_step": 610, "train_info/time_within_train_step": 2.7540571689605713, "step": 610} {"train_info/time_between_train_steps": 0.00299835205078125, "step": 610} {"info/global_step": 611, "train_info/time_within_train_step": 2.933279275894165, "step": 611} {"train_info/time_between_train_steps": 0.0031037330627441406, "step": 611} {"info/global_step": 612, "train_info/time_within_train_step": 2.756662130355835, "step": 612} {"train_info/time_between_train_steps": 0.003001689910888672, "step": 612} {"info/global_step": 613, "train_info/time_within_train_step": 2.7566771507263184, "step": 613} {"train_info/time_between_train_steps": 0.003384828567504883, "step": 613} {"info/global_step": 614, "train_info/time_within_train_step": 2.7568652629852295, "step": 614} {"train_info/time_between_train_steps": 0.0031099319458007812, "step": 614} {"info/global_step": 615, "train_info/time_within_train_step": 2.7555110454559326, "step": 615} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 615} {"info/global_step": 616, "train_info/time_within_train_step": 2.7561004161834717, "step": 616} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 616} {"info/global_step": 617, "train_info/time_within_train_step": 2.7559146881103516, "step": 617} {"train_info/time_between_train_steps": 0.003077268600463867, "step": 617} {"info/global_step": 618, "train_info/time_within_train_step": 2.755601644515991, "step": 618} {"train_info/time_between_train_steps": 0.003123760223388672, "step": 618} {"info/global_step": 619, "train_info/time_within_train_step": 2.7559192180633545, "step": 619} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 619} {"info/global_step": 620, "train_info/time_within_train_step": 2.7563891410827637, "step": 620} {"train_info/time_between_train_steps": 0.003037691116333008, "step": 620} {"info/global_step": 621, "train_info/time_within_train_step": 2.7567708492279053, "step": 621} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 621} {"info/global_step": 622, "train_info/time_within_train_step": 2.7562081813812256, "step": 622} {"train_info/time_between_train_steps": 0.003130674362182617, "step": 622} {"info/global_step": 623, "train_info/time_within_train_step": 2.7568936347961426, "step": 623} {"train_info/time_between_train_steps": 0.0030803680419921875, "step": 623} {"info/global_step": 624, "train_info/time_within_train_step": 2.755784511566162, "step": 624} {"train_info/time_between_train_steps": 0.0031135082244873047, "step": 624} {"info/global_step": 625, "train_info/time_within_train_step": 2.757056713104248, "step": 625} {"train_info/time_between_train_steps": 0.003057241439819336, "step": 625} {"info/global_step": 626, "train_info/time_within_train_step": 2.7561471462249756, "step": 626} {"train_info/time_between_train_steps": 0.0030357837677001953, "step": 626} {"info/global_step": 627, "train_info/time_within_train_step": 2.7551047801971436, "step": 627} {"train_info/time_between_train_steps": 0.0030469894409179688, "step": 627} {"info/global_step": 628, "train_info/time_within_train_step": 2.754692316055298, "step": 628} {"train_info/time_between_train_steps": 0.0030782222747802734, "step": 628} {"info/global_step": 629, "train_info/time_within_train_step": 2.75614333152771, "step": 629} {"train_info/time_between_train_steps": 0.0030379295349121094, "step": 629} {"info/global_step": 630, "train_info/time_within_train_step": 2.755906581878662, "step": 630} {"train_info/time_between_train_steps": 0.0031309127807617188, "step": 630} {"info/global_step": 631, "train_info/time_within_train_step": 2.7542364597320557, "step": 631} {"train_info/time_between_train_steps": 0.003033876419067383, "step": 631} {"info/global_step": 632, "train_info/time_within_train_step": 2.7571957111358643, "step": 632} {"train_info/time_between_train_steps": 0.003086566925048828, "step": 632} {"info/global_step": 633, "train_info/time_within_train_step": 2.756740093231201, "step": 633} {"train_info/time_between_train_steps": 0.002970457077026367, "step": 633} {"info/global_step": 634, "train_info/time_within_train_step": 2.75704026222229, "step": 634} {"train_info/time_between_train_steps": 0.0030024051666259766, "step": 634} {"info/global_step": 635, "train_info/time_within_train_step": 2.7547075748443604, "step": 635} {"train_info/time_between_train_steps": 0.003051280975341797, "step": 635} {"info/global_step": 636, "train_info/time_within_train_step": 2.754096746444702, "step": 636} {"train_info/time_between_train_steps": 0.002953052520751953, "step": 636} {"info/global_step": 637, "train_info/time_within_train_step": 2.7540619373321533, "step": 637} {"train_info/time_between_train_steps": 0.0030426979064941406, "step": 637} {"info/global_step": 638, "train_info/time_within_train_step": 2.7559919357299805, "step": 638} {"train_info/time_between_train_steps": 0.002995014190673828, "step": 638} {"info/global_step": 639, "train_info/time_within_train_step": 2.754645824432373, "step": 639} {"train_info/time_between_train_steps": 0.0029790401458740234, "step": 639} {"info/global_step": 640, "train_info/time_within_train_step": 2.7550787925720215, "step": 640} {"train_info/time_between_train_steps": 0.0029518604278564453, "step": 640} {"info/global_step": 641, "train_info/time_within_train_step": 2.754903793334961, "step": 641} {"train_info/time_between_train_steps": 0.003016233444213867, "step": 641} {"info/global_step": 642, "train_info/time_within_train_step": 2.755782127380371, "step": 642} {"train_info/time_between_train_steps": 0.0029861927032470703, "step": 642} {"info/global_step": 643, "train_info/time_within_train_step": 2.7550549507141113, "step": 643} {"train_info/time_between_train_steps": 0.0030078887939453125, "step": 643} {"info/global_step": 644, "train_info/time_within_train_step": 2.755868911743164, "step": 644} {"train_info/time_between_train_steps": 0.003007173538208008, "step": 644} {"info/global_step": 645, "train_info/time_within_train_step": 2.7543318271636963, "step": 645} {"train_info/time_between_train_steps": 0.0030074119567871094, "step": 645} {"info/global_step": 646, "train_info/time_within_train_step": 2.7551681995391846, "step": 646} {"train_info/time_between_train_steps": 0.0029654502868652344, "step": 646} {"info/global_step": 647, "train_info/time_within_train_step": 2.754063367843628, "step": 647} {"train_info/time_between_train_steps": 0.0029921531677246094, "step": 647} {"info/global_step": 648, "train_info/time_within_train_step": 2.7535557746887207, "step": 648} {"train_info/time_between_train_steps": 0.0029926300048828125, "step": 648} {"info/global_step": 649, "train_info/time_within_train_step": 2.7555904388427734, "step": 649} {"train_info/time_between_train_steps": 0.002950906753540039, "step": 649} {"info/global_step": 650, "train_info/time_within_train_step": 2.7544798851013184, "step": 650} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746567914, "_runtime": 1923}, "step": 650} {"logs": {"train/loss": 5.4924, "train/learning_rate": 0.00039, "train/epoch": 0.07, "_timestamp": 1746567914, "_runtime": 1923}, "step": 650} {"train_info/time_between_train_steps": 0.014690637588500977, "step": 650} {"info/global_step": 651, "train_info/time_within_train_step": 2.7549076080322266, "step": 651} {"train_info/time_between_train_steps": 0.0030167102813720703, "step": 651} {"info/global_step": 652, "train_info/time_within_train_step": 2.7554638385772705, "step": 652} {"train_info/time_between_train_steps": 0.0030295848846435547, "step": 652} {"info/global_step": 653, "train_info/time_within_train_step": 2.7545664310455322, "step": 653} {"train_info/time_between_train_steps": 0.0030040740966796875, "step": 653} {"info/global_step": 654, "train_info/time_within_train_step": 2.7538974285125732, "step": 654} {"train_info/time_between_train_steps": 0.0029883384704589844, "step": 654} {"info/global_step": 655, "train_info/time_within_train_step": 2.7541232109069824, "step": 655} {"train_info/time_between_train_steps": 0.0030362606048583984, "step": 655} {"info/global_step": 656, "train_info/time_within_train_step": 2.7553787231445312, "step": 656} {"train_info/time_between_train_steps": 0.002985715866088867, "step": 656} {"info/global_step": 657, "train_info/time_within_train_step": 2.7539680004119873, "step": 657} {"train_info/time_between_train_steps": 0.002992391586303711, "step": 657} {"info/global_step": 658, "train_info/time_within_train_step": 2.754408121109009, "step": 658} {"train_info/time_between_train_steps": 0.0029990673065185547, "step": 658} {"info/global_step": 659, "train_info/time_within_train_step": 2.7539548873901367, "step": 659} {"train_info/time_between_train_steps": 0.0030324459075927734, "step": 659} {"info/global_step": 660, "train_info/time_within_train_step": 2.7530291080474854, "step": 660} {"train_info/time_between_train_steps": 0.003015756607055664, "step": 660} {"info/global_step": 661, "train_info/time_within_train_step": 2.7537519931793213, "step": 661} {"train_info/time_between_train_steps": 0.002966165542602539, "step": 661} {"info/global_step": 662, "train_info/time_within_train_step": 2.7545769214630127, "step": 662} {"train_info/time_between_train_steps": 0.0029954910278320312, "step": 662} {"info/global_step": 663, "train_info/time_within_train_step": 2.7543365955352783, "step": 663} {"train_info/time_between_train_steps": 0.0029344558715820312, "step": 663} {"info/global_step": 664, "train_info/time_within_train_step": 2.754371166229248, "step": 664} {"train_info/time_between_train_steps": 0.0029380321502685547, "step": 664} {"info/global_step": 665, "train_info/time_within_train_step": 2.7534029483795166, "step": 665} {"train_info/time_between_train_steps": 0.0029172897338867188, "step": 665} {"info/global_step": 666, "train_info/time_within_train_step": 2.7556705474853516, "step": 666} {"train_info/time_between_train_steps": 0.0030164718627929688, "step": 666} {"info/global_step": 667, "train_info/time_within_train_step": 2.754643440246582, "step": 667} {"train_info/time_between_train_steps": 0.0029888153076171875, "step": 667} {"info/global_step": 668, "train_info/time_within_train_step": 2.754767417907715, "step": 668} {"train_info/time_between_train_steps": 0.002997875213623047, "step": 668} {"info/global_step": 669, "train_info/time_within_train_step": 2.755812644958496, "step": 669} {"train_info/time_between_train_steps": 0.0029990673065185547, "step": 669} {"info/global_step": 670, "train_info/time_within_train_step": 2.7535064220428467, "step": 670} {"train_info/time_between_train_steps": 0.002985239028930664, "step": 670} {"info/global_step": 671, "train_info/time_within_train_step": 2.754150867462158, "step": 671} {"train_info/time_between_train_steps": 0.0029189586639404297, "step": 671} {"info/global_step": 672, "train_info/time_within_train_step": 2.754124402999878, "step": 672} {"train_info/time_between_train_steps": 0.0029153823852539062, "step": 672} {"info/global_step": 673, "train_info/time_within_train_step": 2.7549333572387695, "step": 673} {"train_info/time_between_train_steps": 0.0030410289764404297, "step": 673} {"info/global_step": 674, "train_info/time_within_train_step": 2.753399610519409, "step": 674} {"train_info/time_between_train_steps": 0.0029637813568115234, "step": 674} {"info/global_step": 675, "train_info/time_within_train_step": 2.7535109519958496, "step": 675} {"train_info/time_between_train_steps": 0.003027677536010742, "step": 675} {"info/global_step": 676, "train_info/time_within_train_step": 2.752979040145874, "step": 676} {"train_info/time_between_train_steps": 0.0030341148376464844, "step": 676} {"info/global_step": 677, "train_info/time_within_train_step": 2.7534172534942627, "step": 677} {"train_info/time_between_train_steps": 0.0029997825622558594, "step": 677} {"info/global_step": 678, "train_info/time_within_train_step": 2.75348162651062, "step": 678} {"train_info/time_between_train_steps": 0.0030145645141601562, "step": 678} {"info/global_step": 679, "train_info/time_within_train_step": 2.7545955181121826, "step": 679} {"train_info/time_between_train_steps": 0.003038167953491211, "step": 679} {"info/global_step": 680, "train_info/time_within_train_step": 2.7546563148498535, "step": 680} {"train_info/time_between_train_steps": 0.003014802932739258, "step": 680} {"info/global_step": 681, "train_info/time_within_train_step": 2.7542524337768555, "step": 681} {"train_info/time_between_train_steps": 0.002989053726196289, "step": 681} {"info/global_step": 682, "train_info/time_within_train_step": 2.7546417713165283, "step": 682} {"train_info/time_between_train_steps": 0.002971172332763672, "step": 682} {"info/global_step": 683, "train_info/time_within_train_step": 2.754328489303589, "step": 683} {"train_info/time_between_train_steps": 0.002936840057373047, "step": 683} {"info/global_step": 684, "train_info/time_within_train_step": 2.7540626525878906, "step": 684} {"train_info/time_between_train_steps": 0.0029876232147216797, "step": 684} {"info/global_step": 685, "train_info/time_within_train_step": 2.753798723220825, "step": 685} {"train_info/time_between_train_steps": 0.0029807090759277344, "step": 685} {"info/global_step": 686, "train_info/time_within_train_step": 2.753831386566162, "step": 686} {"train_info/time_between_train_steps": 0.0029480457305908203, "step": 686} {"info/global_step": 687, "train_info/time_within_train_step": 2.752527952194214, "step": 687} {"train_info/time_between_train_steps": 0.0030221939086914062, "step": 687} {"info/global_step": 688, "train_info/time_within_train_step": 2.753143787384033, "step": 688} {"train_info/time_between_train_steps": 0.0029687881469726562, "step": 688} {"info/global_step": 689, "train_info/time_within_train_step": 2.753406524658203, "step": 689} {"train_info/time_between_train_steps": 0.002978801727294922, "step": 689} {"info/global_step": 690, "train_info/time_within_train_step": 2.7542529106140137, "step": 690} {"train_info/time_between_train_steps": 0.0029294490814208984, "step": 690} {"info/global_step": 691, "train_info/time_within_train_step": 2.7533557415008545, "step": 691} {"train_info/time_between_train_steps": 0.0029213428497314453, "step": 691} {"info/global_step": 692, "train_info/time_within_train_step": 2.7535817623138428, "step": 692} {"train_info/time_between_train_steps": 0.0029828548431396484, "step": 692} {"info/global_step": 693, "train_info/time_within_train_step": 2.7532756328582764, "step": 693} {"train_info/time_between_train_steps": 0.0029723644256591797, "step": 693} {"info/global_step": 694, "train_info/time_within_train_step": 2.7535457611083984, "step": 694} {"train_info/time_between_train_steps": 0.0029723644256591797, "step": 694} {"info/global_step": 695, "train_info/time_within_train_step": 2.7537455558776855, "step": 695} {"train_info/time_between_train_steps": 0.002986431121826172, "step": 695} {"info/global_step": 696, "train_info/time_within_train_step": 2.755561113357544, "step": 696} {"train_info/time_between_train_steps": 0.0030074119567871094, "step": 696} {"info/global_step": 697, "train_info/time_within_train_step": 2.7545320987701416, "step": 697} {"train_info/time_between_train_steps": 0.0029349327087402344, "step": 697} {"info/global_step": 698, "train_info/time_within_train_step": 2.7535603046417236, "step": 698} {"train_info/time_between_train_steps": 0.002935171127319336, "step": 698} {"info/global_step": 699, "train_info/time_within_train_step": 2.753990411758423, "step": 699} {"train_info/time_between_train_steps": 0.002992868423461914, "step": 699} {"info/global_step": 700, "train_info/time_within_train_step": 2.7548837661743164, "step": 700} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746568053, "_runtime": 2062}, "step": 700} {"logs": {"train/loss": 5.4257, "train/learning_rate": 0.00041999999999999996, "train/epoch": 0.07, "_timestamp": 1746568053, "_runtime": 2062}, "step": 700} {"train_info/time_between_train_steps": 0.013451099395751953, "step": 700} {"info/global_step": 701, "train_info/time_within_train_step": 2.7545387744903564, "step": 701} {"train_info/time_between_train_steps": 0.0029816627502441406, "step": 701} {"info/global_step": 702, "train_info/time_within_train_step": 2.75430965423584, "step": 702} {"train_info/time_between_train_steps": 0.0029807090759277344, "step": 702} {"info/global_step": 703, "train_info/time_within_train_step": 2.7537217140197754, "step": 703} {"train_info/time_between_train_steps": 0.0030138492584228516, "step": 703} {"info/global_step": 704, "train_info/time_within_train_step": 2.752671480178833, "step": 704} {"train_info/time_between_train_steps": 0.0029582977294921875, "step": 704} {"info/global_step": 705, "train_info/time_within_train_step": 2.7534282207489014, "step": 705} {"train_info/time_between_train_steps": 0.002973794937133789, "step": 705} {"info/global_step": 706, "train_info/time_within_train_step": 2.7530462741851807, "step": 706} {"train_info/time_between_train_steps": 0.0029888153076171875, "step": 706} {"info/global_step": 707, "train_info/time_within_train_step": 2.7548515796661377, "step": 707} {"train_info/time_between_train_steps": 0.0029850006103515625, "step": 707} {"info/global_step": 708, "train_info/time_within_train_step": 2.753079414367676, "step": 708} {"train_info/time_between_train_steps": 0.0029900074005126953, "step": 708} {"info/global_step": 709, "train_info/time_within_train_step": 2.7547364234924316, "step": 709} {"train_info/time_between_train_steps": 0.0028786659240722656, "step": 709} {"info/global_step": 710, "train_info/time_within_train_step": 2.75447678565979, "step": 710} {"train_info/time_between_train_steps": 0.002965211868286133, "step": 710} {"info/global_step": 711, "train_info/time_within_train_step": 2.754319667816162, "step": 711} {"train_info/time_between_train_steps": 0.0029478073120117188, "step": 711} {"info/global_step": 712, "train_info/time_within_train_step": 2.754142999649048, "step": 712} {"train_info/time_between_train_steps": 0.0029480457305908203, "step": 712} {"info/global_step": 713, "train_info/time_within_train_step": 2.872467517852783, "step": 713} {"train_info/time_between_train_steps": 0.0029871463775634766, "step": 713} {"info/global_step": 714, "train_info/time_within_train_step": 2.7539751529693604, "step": 714} {"train_info/time_between_train_steps": 0.002890348434448242, "step": 714} {"info/global_step": 715, "train_info/time_within_train_step": 2.7554707527160645, "step": 715} {"train_info/time_between_train_steps": 0.002949237823486328, "step": 715} {"info/global_step": 716, "train_info/time_within_train_step": 2.755340576171875, "step": 716} {"train_info/time_between_train_steps": 0.0030035972595214844, "step": 716} {"info/global_step": 717, "train_info/time_within_train_step": 2.754603862762451, "step": 717} {"train_info/time_between_train_steps": 0.0029866695404052734, "step": 717} {"info/global_step": 718, "train_info/time_within_train_step": 2.753514289855957, "step": 718} {"train_info/time_between_train_steps": 0.002947092056274414, "step": 718} {"info/global_step": 719, "train_info/time_within_train_step": 2.7562289237976074, "step": 719} {"train_info/time_between_train_steps": 0.002953052520751953, "step": 719} {"info/global_step": 720, "train_info/time_within_train_step": 2.7546768188476562, "step": 720} {"train_info/time_between_train_steps": 0.0029785633087158203, "step": 720} {"info/global_step": 721, "train_info/time_within_train_step": 2.7590906620025635, "step": 721} {"train_info/time_between_train_steps": 0.003036022186279297, "step": 721} {"info/global_step": 722, "train_info/time_within_train_step": 2.754772663116455, "step": 722} {"train_info/time_between_train_steps": 0.002925872802734375, "step": 722} {"info/global_step": 723, "train_info/time_within_train_step": 2.7536816596984863, "step": 723} {"train_info/time_between_train_steps": 0.0029845237731933594, "step": 723} {"info/global_step": 724, "train_info/time_within_train_step": 2.7552742958068848, "step": 724} {"train_info/time_between_train_steps": 0.002989053726196289, "step": 724} {"info/global_step": 725, "train_info/time_within_train_step": 2.7551369667053223, "step": 725} {"train_info/time_between_train_steps": 0.0029592514038085938, "step": 725} {"info/global_step": 726, "train_info/time_within_train_step": 2.7547874450683594, "step": 726} {"train_info/time_between_train_steps": 0.002946615219116211, "step": 726} {"info/global_step": 727, "train_info/time_within_train_step": 2.755119562149048, "step": 727} {"train_info/time_between_train_steps": 0.0029516220092773438, "step": 727} {"info/global_step": 728, "train_info/time_within_train_step": 2.753774404525757, "step": 728} {"train_info/time_between_train_steps": 0.002943754196166992, "step": 728} {"info/global_step": 729, "train_info/time_within_train_step": 2.753852605819702, "step": 729} {"train_info/time_between_train_steps": 0.003001689910888672, "step": 729} {"info/global_step": 730, "train_info/time_within_train_step": 2.7534096240997314, "step": 730} {"train_info/time_between_train_steps": 0.002889394760131836, "step": 730} {"info/global_step": 731, "train_info/time_within_train_step": 2.7538723945617676, "step": 731} {"train_info/time_between_train_steps": 0.003010988235473633, "step": 731} {"info/global_step": 732, "train_info/time_within_train_step": 2.7546045780181885, "step": 732} {"train_info/time_between_train_steps": 0.00296783447265625, "step": 732} {"info/global_step": 733, "train_info/time_within_train_step": 2.7532577514648438, "step": 733} {"train_info/time_between_train_steps": 0.0029909610748291016, "step": 733} {"info/global_step": 734, "train_info/time_within_train_step": 2.75264048576355, "step": 734} {"train_info/time_between_train_steps": 0.0029234886169433594, "step": 734} {"info/global_step": 735, "train_info/time_within_train_step": 2.754861354827881, "step": 735} {"train_info/time_between_train_steps": 0.002937793731689453, "step": 735} {"info/global_step": 736, "train_info/time_within_train_step": 2.7550721168518066, "step": 736} {"train_info/time_between_train_steps": 0.0029468536376953125, "step": 736} {"info/global_step": 737, "train_info/time_within_train_step": 2.755603075027466, "step": 737} {"train_info/time_between_train_steps": 0.0030188560485839844, "step": 737} {"info/global_step": 738, "train_info/time_within_train_step": 2.755695343017578, "step": 738} {"train_info/time_between_train_steps": 0.0029778480529785156, "step": 738} {"info/global_step": 739, "train_info/time_within_train_step": 2.7551820278167725, "step": 739} {"train_info/time_between_train_steps": 0.002975940704345703, "step": 739} {"info/global_step": 740, "train_info/time_within_train_step": 2.754880428314209, "step": 740} {"train_info/time_between_train_steps": 0.00295257568359375, "step": 740} {"info/global_step": 741, "train_info/time_within_train_step": 2.75618839263916, "step": 741} {"train_info/time_between_train_steps": 0.0029747486114501953, "step": 741} {"info/global_step": 742, "train_info/time_within_train_step": 2.7562875747680664, "step": 742} {"train_info/time_between_train_steps": 0.003009319305419922, "step": 742} {"info/global_step": 743, "train_info/time_within_train_step": 2.7556521892547607, "step": 743} {"train_info/time_between_train_steps": 0.0029692649841308594, "step": 743} {"info/global_step": 744, "train_info/time_within_train_step": 2.754120349884033, "step": 744} {"train_info/time_between_train_steps": 0.0029447078704833984, "step": 744} {"info/global_step": 745, "train_info/time_within_train_step": 2.7535693645477295, "step": 745} {"train_info/time_between_train_steps": 0.0029757022857666016, "step": 745} {"info/global_step": 746, "train_info/time_within_train_step": 2.753542900085449, "step": 746} {"train_info/time_between_train_steps": 0.0029878616333007812, "step": 746} {"info/global_step": 747, "train_info/time_within_train_step": 2.753143310546875, "step": 747} {"train_info/time_between_train_steps": 0.0029773712158203125, "step": 747} {"info/global_step": 748, "train_info/time_within_train_step": 2.7541415691375732, "step": 748} {"train_info/time_between_train_steps": 0.002985239028930664, "step": 748} {"info/global_step": 749, "train_info/time_within_train_step": 2.7530338764190674, "step": 749} {"train_info/time_between_train_steps": 0.0029654502868652344, "step": 749} {"info/global_step": 750, "train_info/time_within_train_step": 3.252732515335083, "step": 750} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746568192, "_runtime": 2201}, "step": 750} {"logs": {"train/loss": 5.3565, "train/learning_rate": 0.00045, "train/epoch": 0.07, "_timestamp": 1746568192, "_runtime": 2201}, "step": 750} {"train_info/time_between_train_steps": 0.01610708236694336, "step": 750} {"info/global_step": 751, "train_info/time_within_train_step": 2.753025770187378, "step": 751} {"train_info/time_between_train_steps": 0.002988576889038086, "step": 751} {"info/global_step": 752, "train_info/time_within_train_step": 2.7534782886505127, "step": 752} {"train_info/time_between_train_steps": 0.002887725830078125, "step": 752} {"info/global_step": 753, "train_info/time_within_train_step": 2.7524235248565674, "step": 753} {"train_info/time_between_train_steps": 0.0030472278594970703, "step": 753} {"info/global_step": 754, "train_info/time_within_train_step": 2.7522099018096924, "step": 754} {"train_info/time_between_train_steps": 0.002975940704345703, "step": 754} {"info/global_step": 755, "train_info/time_within_train_step": 2.755549907684326, "step": 755} {"train_info/time_between_train_steps": 0.002981424331665039, "step": 755} {"info/global_step": 756, "train_info/time_within_train_step": 2.754664659500122, "step": 756} {"train_info/time_between_train_steps": 0.002909421920776367, "step": 756} {"info/global_step": 757, "train_info/time_within_train_step": 2.752653121948242, "step": 757} {"train_info/time_between_train_steps": 0.0029363632202148438, "step": 757} {"info/global_step": 758, "train_info/time_within_train_step": 2.753413438796997, "step": 758} {"train_info/time_between_train_steps": 0.0029532909393310547, "step": 758} {"info/global_step": 759, "train_info/time_within_train_step": 2.7531933784484863, "step": 759} {"train_info/time_between_train_steps": 0.002967357635498047, "step": 759} {"info/global_step": 760, "train_info/time_within_train_step": 2.7529985904693604, "step": 760} {"train_info/time_between_train_steps": 0.002938508987426758, "step": 760} {"info/global_step": 761, "train_info/time_within_train_step": 2.75315523147583, "step": 761} {"train_info/time_between_train_steps": 0.0029916763305664062, "step": 761} {"info/global_step": 762, "train_info/time_within_train_step": 2.75417423248291, "step": 762} {"train_info/time_between_train_steps": 0.00298309326171875, "step": 762} {"info/global_step": 763, "train_info/time_within_train_step": 2.7542788982391357, "step": 763} {"train_info/time_between_train_steps": 0.0029790401458740234, "step": 763} {"info/global_step": 764, "train_info/time_within_train_step": 2.754606246948242, "step": 764} {"train_info/time_between_train_steps": 0.0030362606048583984, "step": 764} {"info/global_step": 765, "train_info/time_within_train_step": 2.7556798458099365, "step": 765} {"train_info/time_between_train_steps": 0.0030531883239746094, "step": 765} {"info/global_step": 766, "train_info/time_within_train_step": 2.7552742958068848, "step": 766} {"train_info/time_between_train_steps": 0.002953052520751953, "step": 766} {"info/global_step": 767, "train_info/time_within_train_step": 2.8314812183380127, "step": 767} {"train_info/time_between_train_steps": 0.0029854774475097656, "step": 767} {"info/global_step": 768, "train_info/time_within_train_step": 2.7566027641296387, "step": 768} {"train_info/time_between_train_steps": 0.0029897689819335938, "step": 768} {"info/global_step": 769, "train_info/time_within_train_step": 2.7546024322509766, "step": 769} {"train_info/time_between_train_steps": 0.002879619598388672, "step": 769} {"info/global_step": 770, "train_info/time_within_train_step": 2.7543461322784424, "step": 770} {"train_info/time_between_train_steps": 0.0029141902923583984, "step": 770} {"info/global_step": 771, "train_info/time_within_train_step": 2.754258632659912, "step": 771} {"train_info/time_between_train_steps": 0.0028824806213378906, "step": 771} {"info/global_step": 772, "train_info/time_within_train_step": 2.7548885345458984, "step": 772} {"train_info/time_between_train_steps": 0.0028963088989257812, "step": 772} {"info/global_step": 773, "train_info/time_within_train_step": 2.753434896469116, "step": 773} {"train_info/time_between_train_steps": 0.0028924942016601562, "step": 773} {"info/global_step": 774, "train_info/time_within_train_step": 2.754359006881714, "step": 774} {"train_info/time_between_train_steps": 0.002933502197265625, "step": 774} {"info/global_step": 775, "train_info/time_within_train_step": 2.753891706466675, "step": 775} {"train_info/time_between_train_steps": 0.0029304027557373047, "step": 775} {"info/global_step": 776, "train_info/time_within_train_step": 2.753035068511963, "step": 776} {"train_info/time_between_train_steps": 0.0028836727142333984, "step": 776} {"info/global_step": 777, "train_info/time_within_train_step": 2.75384783744812, "step": 777} {"train_info/time_between_train_steps": 0.0028717517852783203, "step": 777} {"info/global_step": 778, "train_info/time_within_train_step": 2.7549657821655273, "step": 778} {"train_info/time_between_train_steps": 0.0030748844146728516, "step": 778} {"info/global_step": 779, "train_info/time_within_train_step": 2.753732204437256, "step": 779} {"train_info/time_between_train_steps": 0.0029692649841308594, "step": 779} {"info/global_step": 780, "train_info/time_within_train_step": 2.7542808055877686, "step": 780} {"train_info/time_between_train_steps": 0.002967357635498047, "step": 780} {"info/global_step": 781, "train_info/time_within_train_step": 2.7545108795166016, "step": 781} {"train_info/time_between_train_steps": 0.002993345260620117, "step": 781} {"info/global_step": 782, "train_info/time_within_train_step": 2.7529661655426025, "step": 782} {"train_info/time_between_train_steps": 0.0029439926147460938, "step": 782} {"info/global_step": 783, "train_info/time_within_train_step": 2.753309488296509, "step": 783} {"train_info/time_between_train_steps": 0.0029325485229492188, "step": 783} {"info/global_step": 784, "train_info/time_within_train_step": 2.7540464401245117, "step": 784} {"train_info/time_between_train_steps": 0.0029077529907226562, "step": 784} {"info/global_step": 785, "train_info/time_within_train_step": 2.7549593448638916, "step": 785} {"train_info/time_between_train_steps": 0.0029692649841308594, "step": 785} {"info/global_step": 786, "train_info/time_within_train_step": 2.754136323928833, "step": 786} {"train_info/time_between_train_steps": 0.0029494762420654297, "step": 786} {"info/global_step": 787, "train_info/time_within_train_step": 2.7546911239624023, "step": 787} {"train_info/time_between_train_steps": 0.0029349327087402344, "step": 787} {"info/global_step": 788, "train_info/time_within_train_step": 2.7549548149108887, "step": 788} {"train_info/time_between_train_steps": 0.0029506683349609375, "step": 788} {"info/global_step": 789, "train_info/time_within_train_step": 2.7552802562713623, "step": 789} {"train_info/time_between_train_steps": 0.0029718875885009766, "step": 789} {"info/global_step": 790, "train_info/time_within_train_step": 2.7555458545684814, "step": 790} {"train_info/time_between_train_steps": 0.0030095577239990234, "step": 790} {"info/global_step": 791, "train_info/time_within_train_step": 2.755587339401245, "step": 791} {"train_info/time_between_train_steps": 0.0029296875, "step": 791} {"info/global_step": 792, "train_info/time_within_train_step": 2.7554359436035156, "step": 792} {"train_info/time_between_train_steps": 0.0029420852661132812, "step": 792} {"info/global_step": 793, "train_info/time_within_train_step": 2.7560720443725586, "step": 793} {"train_info/time_between_train_steps": 0.002950906753540039, "step": 793} {"info/global_step": 794, "train_info/time_within_train_step": 2.7562034130096436, "step": 794} {"train_info/time_between_train_steps": 0.002951383590698242, "step": 794} {"info/global_step": 795, "train_info/time_within_train_step": 2.755453586578369, "step": 795} {"train_info/time_between_train_steps": 0.0029344558715820312, "step": 795} {"info/global_step": 796, "train_info/time_within_train_step": 2.756059408187866, "step": 796} {"train_info/time_between_train_steps": 0.0030007362365722656, "step": 796} {"info/global_step": 797, "train_info/time_within_train_step": 2.753873825073242, "step": 797} {"train_info/time_between_train_steps": 0.00298309326171875, "step": 797} {"info/global_step": 798, "train_info/time_within_train_step": 2.755882978439331, "step": 798} {"train_info/time_between_train_steps": 0.003050088882446289, "step": 798} {"info/global_step": 799, "train_info/time_within_train_step": 2.754915952682495, "step": 799} {"train_info/time_between_train_steps": 0.0029859542846679688, "step": 799} {"info/global_step": 800, "train_info/time_within_train_step": 2.755270004272461, "step": 800} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746568330, "_runtime": 2339}, "step": 800} {"logs": {"train/loss": 5.2938, "train/learning_rate": 0.00047999999999999996, "train/epoch": 0.08, "_timestamp": 1746568330, "_runtime": 2339}, "step": 800} {"train_info/time_between_train_steps": 19.613572359085083, "step": 800} {"info/global_step": 801, "train_info/time_within_train_step": 2.5338850021362305, "step": 801} {"train_info/time_between_train_steps": 0.0029909610748291016, "step": 801} {"info/global_step": 802, "train_info/time_within_train_step": 2.5714588165283203, "step": 802} {"train_info/time_between_train_steps": 0.0029494762420654297, "step": 802} {"info/global_step": 803, "train_info/time_within_train_step": 2.7031283378601074, "step": 803} {"train_info/time_between_train_steps": 0.0029637813568115234, "step": 803} {"info/global_step": 804, "train_info/time_within_train_step": 2.7468769550323486, "step": 804} {"train_info/time_between_train_steps": 0.002897024154663086, "step": 804} {"info/global_step": 805, "train_info/time_within_train_step": 2.8061258792877197, "step": 805} {"train_info/time_between_train_steps": 0.0029501914978027344, "step": 805} {"info/global_step": 806, "train_info/time_within_train_step": 2.7542927265167236, "step": 806} {"train_info/time_between_train_steps": 0.0029304027557373047, "step": 806} {"info/global_step": 807, "train_info/time_within_train_step": 2.7549617290496826, "step": 807} {"train_info/time_between_train_steps": 0.0029845237731933594, "step": 807} {"info/global_step": 808, "train_info/time_within_train_step": 2.7534778118133545, "step": 808} {"train_info/time_between_train_steps": 0.002955198287963867, "step": 808} {"info/global_step": 809, "train_info/time_within_train_step": 2.7547712326049805, "step": 809} {"train_info/time_between_train_steps": 0.0029518604278564453, "step": 809} {"info/global_step": 810, "train_info/time_within_train_step": 2.7545595169067383, "step": 810} {"train_info/time_between_train_steps": 0.002952098846435547, "step": 810} {"info/global_step": 811, "train_info/time_within_train_step": 2.755182981491089, "step": 811} {"train_info/time_between_train_steps": 0.0028951168060302734, "step": 811} {"info/global_step": 812, "train_info/time_within_train_step": 2.753795623779297, "step": 812} {"train_info/time_between_train_steps": 0.0029630661010742188, "step": 812} {"info/global_step": 813, "train_info/time_within_train_step": 2.754566192626953, "step": 813} {"train_info/time_between_train_steps": 0.0029778480529785156, "step": 813} {"info/global_step": 814, "train_info/time_within_train_step": 2.7550106048583984, "step": 814} {"train_info/time_between_train_steps": 0.0028705596923828125, "step": 814} {"info/global_step": 815, "train_info/time_within_train_step": 2.754871368408203, "step": 815} {"train_info/time_between_train_steps": 0.0029850006103515625, "step": 815} {"info/global_step": 816, "train_info/time_within_train_step": 2.7556612491607666, "step": 816} {"train_info/time_between_train_steps": 0.0030050277709960938, "step": 816} {"info/global_step": 817, "train_info/time_within_train_step": 2.7540855407714844, "step": 817} {"train_info/time_between_train_steps": 0.003036022186279297, "step": 817} {"info/global_step": 818, "train_info/time_within_train_step": 2.7556331157684326, "step": 818} {"train_info/time_between_train_steps": 0.003009796142578125, "step": 818} {"info/global_step": 819, "train_info/time_within_train_step": 2.755704164505005, "step": 819} {"train_info/time_between_train_steps": 0.0028603076934814453, "step": 819} {"info/global_step": 820, "train_info/time_within_train_step": 2.753683090209961, "step": 820} {"train_info/time_between_train_steps": 0.0029959678649902344, "step": 820} {"info/global_step": 821, "train_info/time_within_train_step": 2.7545857429504395, "step": 821} {"train_info/time_between_train_steps": 0.002973794937133789, "step": 821} {"info/global_step": 822, "train_info/time_within_train_step": 2.7540781497955322, "step": 822} {"train_info/time_between_train_steps": 0.002961397171020508, "step": 822} {"info/global_step": 823, "train_info/time_within_train_step": 2.7552056312561035, "step": 823} {"train_info/time_between_train_steps": 0.0029599666595458984, "step": 823} {"info/global_step": 824, "train_info/time_within_train_step": 2.755250930786133, "step": 824} {"train_info/time_between_train_steps": 0.003031492233276367, "step": 824} {"info/global_step": 825, "train_info/time_within_train_step": 2.755580425262451, "step": 825} {"train_info/time_between_train_steps": 0.0029566287994384766, "step": 825} {"info/global_step": 826, "train_info/time_within_train_step": 2.756941080093384, "step": 826} {"train_info/time_between_train_steps": 0.003049612045288086, "step": 826} {"info/global_step": 827, "train_info/time_within_train_step": 2.754791021347046, "step": 827} {"train_info/time_between_train_steps": 0.0030226707458496094, "step": 827} {"info/global_step": 828, "train_info/time_within_train_step": 2.7545011043548584, "step": 828} {"train_info/time_between_train_steps": 0.002853870391845703, "step": 828} {"info/global_step": 829, "train_info/time_within_train_step": 2.7555503845214844, "step": 829} {"train_info/time_between_train_steps": 0.0030241012573242188, "step": 829} {"info/global_step": 830, "train_info/time_within_train_step": 2.7545793056488037, "step": 830} {"train_info/time_between_train_steps": 0.0028867721557617188, "step": 830} {"info/global_step": 831, "train_info/time_within_train_step": 2.754863977432251, "step": 831} {"train_info/time_between_train_steps": 0.0031003952026367188, "step": 831} {"info/global_step": 832, "train_info/time_within_train_step": 2.755769729614258, "step": 832} {"train_info/time_between_train_steps": 0.002974987030029297, "step": 832} {"info/global_step": 833, "train_info/time_within_train_step": 2.7560977935791016, "step": 833} {"train_info/time_between_train_steps": 0.003284454345703125, "step": 833} {"info/global_step": 834, "train_info/time_within_train_step": 2.7556188106536865, "step": 834} {"train_info/time_between_train_steps": 0.003022909164428711, "step": 834} {"info/global_step": 835, "train_info/time_within_train_step": 2.7534422874450684, "step": 835} {"train_info/time_between_train_steps": 0.0031571388244628906, "step": 835} {"info/global_step": 836, "train_info/time_within_train_step": 2.7547452449798584, "step": 836} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 836} {"info/global_step": 837, "train_info/time_within_train_step": 2.75358510017395, "step": 837} {"train_info/time_between_train_steps": 0.0032777786254882812, "step": 837} {"info/global_step": 838, "train_info/time_within_train_step": 2.7554657459259033, "step": 838} {"train_info/time_between_train_steps": 0.003381490707397461, "step": 838} {"info/global_step": 839, "train_info/time_within_train_step": 2.7555389404296875, "step": 839} {"train_info/time_between_train_steps": 0.003237009048461914, "step": 839} {"info/global_step": 840, "train_info/time_within_train_step": 2.7551872730255127, "step": 840} {"train_info/time_between_train_steps": 0.003063678741455078, "step": 840} {"info/global_step": 841, "train_info/time_within_train_step": 2.791233777999878, "step": 841} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 841} {"info/global_step": 842, "train_info/time_within_train_step": 2.7549829483032227, "step": 842} {"train_info/time_between_train_steps": 0.0030469894409179688, "step": 842} {"info/global_step": 843, "train_info/time_within_train_step": 2.7548818588256836, "step": 843} {"train_info/time_between_train_steps": 0.0032296180725097656, "step": 843} {"info/global_step": 844, "train_info/time_within_train_step": 2.7551002502441406, "step": 844} {"train_info/time_between_train_steps": 0.003564119338989258, "step": 844} {"info/global_step": 845, "train_info/time_within_train_step": 2.756063222885132, "step": 845} {"train_info/time_between_train_steps": 0.0032689571380615234, "step": 845} {"info/global_step": 846, "train_info/time_within_train_step": 2.755194902420044, "step": 846} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 846} {"info/global_step": 847, "train_info/time_within_train_step": 2.7562177181243896, "step": 847} {"train_info/time_between_train_steps": 0.0035271644592285156, "step": 847} {"info/global_step": 848, "train_info/time_within_train_step": 2.755216121673584, "step": 848} {"train_info/time_between_train_steps": 0.003477334976196289, "step": 848} {"info/global_step": 849, "train_info/time_within_train_step": 2.75424861907959, "step": 849} {"train_info/time_between_train_steps": 0.003325223922729492, "step": 849} {"info/global_step": 850, "train_info/time_within_train_step": 2.7552082538604736, "step": 850} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746568488, "_runtime": 2497}, "step": 850} {"logs": {"train/loss": 5.2217, "train/learning_rate": 0.0005099999999999999, "train/epoch": 0.09, "_timestamp": 1746568488, "_runtime": 2497}, "step": 850} {"train_info/time_between_train_steps": 0.01819300651550293, "step": 850} {"info/global_step": 851, "train_info/time_within_train_step": 2.7552976608276367, "step": 851} {"train_info/time_between_train_steps": 0.0035500526428222656, "step": 851} {"info/global_step": 852, "train_info/time_within_train_step": 2.756152391433716, "step": 852} {"train_info/time_between_train_steps": 0.0035126209259033203, "step": 852} {"info/global_step": 853, "train_info/time_within_train_step": 2.7560524940490723, "step": 853} {"train_info/time_between_train_steps": 0.0036840438842773438, "step": 853} {"train_info/time_between_train_steps": 3.3663291931152344, "step": 853} {"info/global_step": 854, "train_info/time_within_train_step": 2.6804442405700684, "step": 854} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 854} {"info/global_step": 855, "train_info/time_within_train_step": 2.7544782161712646, "step": 855} {"train_info/time_between_train_steps": 0.0031943321228027344, "step": 855} {"info/global_step": 856, "train_info/time_within_train_step": 2.7545166015625, "step": 856} {"train_info/time_between_train_steps": 0.003158092498779297, "step": 856} {"info/global_step": 857, "train_info/time_within_train_step": 2.754519462585449, "step": 857} {"train_info/time_between_train_steps": 0.0032660961151123047, "step": 857} {"info/global_step": 858, "train_info/time_within_train_step": 2.959425210952759, "step": 858} {"train_info/time_between_train_steps": 0.003240823745727539, "step": 858} {"info/global_step": 859, "train_info/time_within_train_step": 2.7542357444763184, "step": 859} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 859} {"info/global_step": 860, "train_info/time_within_train_step": 2.7541675567626953, "step": 860} {"train_info/time_between_train_steps": 0.0032379627227783203, "step": 860} {"info/global_step": 861, "train_info/time_within_train_step": 2.7559821605682373, "step": 861} {"train_info/time_between_train_steps": 0.0033807754516601562, "step": 861} {"info/global_step": 862, "train_info/time_within_train_step": 2.7555088996887207, "step": 862} {"train_info/time_between_train_steps": 0.003347158432006836, "step": 862} {"info/global_step": 863, "train_info/time_within_train_step": 2.755951166152954, "step": 863} {"train_info/time_between_train_steps": 0.003287076950073242, "step": 863} {"info/global_step": 864, "train_info/time_within_train_step": 2.755908966064453, "step": 864} {"train_info/time_between_train_steps": 0.003511667251586914, "step": 864} {"info/global_step": 865, "train_info/time_within_train_step": 2.756209135055542, "step": 865} {"train_info/time_between_train_steps": 0.0034461021423339844, "step": 865} {"info/global_step": 866, "train_info/time_within_train_step": 2.756352424621582, "step": 866} {"train_info/time_between_train_steps": 0.0034546852111816406, "step": 866} {"info/global_step": 867, "train_info/time_within_train_step": 2.759423017501831, "step": 867} {"train_info/time_between_train_steps": 0.003931283950805664, "step": 867} {"info/global_step": 868, "train_info/time_within_train_step": 2.758331537246704, "step": 868} {"train_info/time_between_train_steps": 0.003870248794555664, "step": 868} {"info/global_step": 869, "train_info/time_within_train_step": 2.75689697265625, "step": 869} {"train_info/time_between_train_steps": 0.0036666393280029297, "step": 869} {"info/global_step": 870, "train_info/time_within_train_step": 2.756488561630249, "step": 870} {"train_info/time_between_train_steps": 0.003593921661376953, "step": 870} {"info/global_step": 871, "train_info/time_within_train_step": 2.757444381713867, "step": 871} {"train_info/time_between_train_steps": 0.00370025634765625, "step": 871} {"info/global_step": 872, "train_info/time_within_train_step": 2.757725715637207, "step": 872} {"train_info/time_between_train_steps": 0.003596782684326172, "step": 872} {"info/global_step": 873, "train_info/time_within_train_step": 2.7566897869110107, "step": 873} {"train_info/time_between_train_steps": 0.0037310123443603516, "step": 873} {"info/global_step": 874, "train_info/time_within_train_step": 2.757481575012207, "step": 874} {"train_info/time_between_train_steps": 0.0035533905029296875, "step": 874} {"info/global_step": 875, "train_info/time_within_train_step": 2.7565765380859375, "step": 875} {"train_info/time_between_train_steps": 0.003515481948852539, "step": 875} {"info/global_step": 876, "train_info/time_within_train_step": 2.756373882293701, "step": 876} {"train_info/time_between_train_steps": 0.003550291061401367, "step": 876} {"info/global_step": 877, "train_info/time_within_train_step": 2.7565598487854004, "step": 877} {"train_info/time_between_train_steps": 0.003522157669067383, "step": 877} {"info/global_step": 878, "train_info/time_within_train_step": 2.7560954093933105, "step": 878} {"train_info/time_between_train_steps": 0.003537416458129883, "step": 878} {"info/global_step": 879, "train_info/time_within_train_step": 2.755998373031616, "step": 879} {"train_info/time_between_train_steps": 0.0034439563751220703, "step": 879} {"info/global_step": 880, "train_info/time_within_train_step": 2.755924940109253, "step": 880} {"train_info/time_between_train_steps": 0.003487110137939453, "step": 880} {"info/global_step": 881, "train_info/time_within_train_step": 2.754669427871704, "step": 881} {"train_info/time_between_train_steps": 0.003568410873413086, "step": 881} {"info/global_step": 882, "train_info/time_within_train_step": 2.755784749984741, "step": 882} {"train_info/time_between_train_steps": 0.003558635711669922, "step": 882} {"info/global_step": 883, "train_info/time_within_train_step": 2.7559986114501953, "step": 883} {"train_info/time_between_train_steps": 0.0034410953521728516, "step": 883} {"info/global_step": 884, "train_info/time_within_train_step": 2.7551777362823486, "step": 884} {"train_info/time_between_train_steps": 0.003492593765258789, "step": 884} {"info/global_step": 885, "train_info/time_within_train_step": 2.7536797523498535, "step": 885} {"train_info/time_between_train_steps": 0.0034415721893310547, "step": 885} {"info/global_step": 886, "train_info/time_within_train_step": 2.755281686782837, "step": 886} {"train_info/time_between_train_steps": 0.003437519073486328, "step": 886} {"info/global_step": 887, "train_info/time_within_train_step": 2.7554657459259033, "step": 887} {"train_info/time_between_train_steps": 0.003464937210083008, "step": 887} {"info/global_step": 888, "train_info/time_within_train_step": 2.7556445598602295, "step": 888} {"train_info/time_between_train_steps": 0.0035300254821777344, "step": 888} {"info/global_step": 889, "train_info/time_within_train_step": 2.7558770179748535, "step": 889} {"train_info/time_between_train_steps": 0.003432750701904297, "step": 889} {"info/global_step": 890, "train_info/time_within_train_step": 2.756051540374756, "step": 890} {"train_info/time_between_train_steps": 0.0034966468811035156, "step": 890} {"info/global_step": 891, "train_info/time_within_train_step": 2.75606107711792, "step": 891} {"train_info/time_between_train_steps": 0.003458261489868164, "step": 891} {"info/global_step": 892, "train_info/time_within_train_step": 2.756206512451172, "step": 892} {"train_info/time_between_train_steps": 0.00345611572265625, "step": 892} {"info/global_step": 893, "train_info/time_within_train_step": 2.7561419010162354, "step": 893} {"train_info/time_between_train_steps": 0.003626108169555664, "step": 893} {"info/global_step": 894, "train_info/time_within_train_step": 2.7538678646087646, "step": 894} {"train_info/time_between_train_steps": 0.0034856796264648438, "step": 894} {"info/global_step": 895, "train_info/time_within_train_step": 2.7561306953430176, "step": 895} {"train_info/time_between_train_steps": 0.0035448074340820312, "step": 895} {"info/global_step": 896, "train_info/time_within_train_step": 2.7556607723236084, "step": 896} {"train_info/time_between_train_steps": 0.0035355091094970703, "step": 896} {"info/global_step": 897, "train_info/time_within_train_step": 3.059102773666382, "step": 897} {"train_info/time_between_train_steps": 0.0033330917358398438, "step": 897} {"info/global_step": 898, "train_info/time_within_train_step": 2.7546608448028564, "step": 898} {"train_info/time_between_train_steps": 0.003400087356567383, "step": 898} {"info/global_step": 899, "train_info/time_within_train_step": 2.7534494400024414, "step": 899} {"train_info/time_between_train_steps": 0.003358602523803711, "step": 899} {"info/global_step": 900, "train_info/time_within_train_step": 2.754509449005127, "step": 900} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746568630, "_runtime": 2639}, "step": 900} {"logs": {"train/loss": 5.2085, "train/learning_rate": 0.00054, "train/epoch": 1.0, "_timestamp": 1746568630, "_runtime": 2639}, "step": 900} {"train_info/time_between_train_steps": 0.013520479202270508, "step": 900} {"info/global_step": 901, "train_info/time_within_train_step": 2.7559595108032227, "step": 901} {"train_info/time_between_train_steps": 0.003469228744506836, "step": 901} {"info/global_step": 902, "train_info/time_within_train_step": 2.754303455352783, "step": 902} {"train_info/time_between_train_steps": 0.0033342838287353516, "step": 902} {"info/global_step": 903, "train_info/time_within_train_step": 2.7543962001800537, "step": 903} {"train_info/time_between_train_steps": 0.003271818161010742, "step": 903} {"info/global_step": 904, "train_info/time_within_train_step": 2.75463604927063, "step": 904} {"train_info/time_between_train_steps": 0.003317594528198242, "step": 904} {"info/global_step": 905, "train_info/time_within_train_step": 2.7552971839904785, "step": 905} {"train_info/time_between_train_steps": 0.0033555030822753906, "step": 905} {"info/global_step": 906, "train_info/time_within_train_step": 2.7553298473358154, "step": 906} {"train_info/time_between_train_steps": 0.0033943653106689453, "step": 906} {"info/global_step": 907, "train_info/time_within_train_step": 2.7545886039733887, "step": 907} {"train_info/time_between_train_steps": 0.0033669471740722656, "step": 907} {"info/global_step": 908, "train_info/time_within_train_step": 2.7552151679992676, "step": 908} {"train_info/time_between_train_steps": 0.003367185592651367, "step": 908} {"info/global_step": 909, "train_info/time_within_train_step": 2.754624128341675, "step": 909} {"train_info/time_between_train_steps": 0.0033502578735351562, "step": 909} {"info/global_step": 910, "train_info/time_within_train_step": 2.755352020263672, "step": 910} {"train_info/time_between_train_steps": 0.003315448760986328, "step": 910} {"info/global_step": 911, "train_info/time_within_train_step": 2.75520396232605, "step": 911} {"train_info/time_between_train_steps": 0.0033311843872070312, "step": 911} {"info/global_step": 912, "train_info/time_within_train_step": 2.755105495452881, "step": 912} {"train_info/time_between_train_steps": 0.0033500194549560547, "step": 912} {"info/global_step": 913, "train_info/time_within_train_step": 2.7544188499450684, "step": 913} {"train_info/time_between_train_steps": 0.0032935142517089844, "step": 913} {"info/global_step": 914, "train_info/time_within_train_step": 2.753923177719116, "step": 914} {"train_info/time_between_train_steps": 0.003385305404663086, "step": 914} {"info/global_step": 915, "train_info/time_within_train_step": 2.754635810852051, "step": 915} {"train_info/time_between_train_steps": 0.003401041030883789, "step": 915} {"info/global_step": 916, "train_info/time_within_train_step": 2.88247013092041, "step": 916} {"train_info/time_between_train_steps": 0.003262042999267578, "step": 916} {"info/global_step": 917, "train_info/time_within_train_step": 2.7535839080810547, "step": 917} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 917} {"info/global_step": 918, "train_info/time_within_train_step": 2.7545340061187744, "step": 918} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 918} {"info/global_step": 919, "train_info/time_within_train_step": 2.755251884460449, "step": 919} {"train_info/time_between_train_steps": 0.003294229507446289, "step": 919} {"info/global_step": 920, "train_info/time_within_train_step": 2.754642963409424, "step": 920} {"train_info/time_between_train_steps": 0.003286600112915039, "step": 920} {"info/global_step": 921, "train_info/time_within_train_step": 2.7551145553588867, "step": 921} {"train_info/time_between_train_steps": 0.0032036304473876953, "step": 921} {"info/global_step": 922, "train_info/time_within_train_step": 2.7551515102386475, "step": 922} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 922} {"info/global_step": 923, "train_info/time_within_train_step": 2.755030393600464, "step": 923} {"train_info/time_between_train_steps": 0.0032036304473876953, "step": 923} {"info/global_step": 924, "train_info/time_within_train_step": 2.7530720233917236, "step": 924} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 924} {"info/global_step": 925, "train_info/time_within_train_step": 2.7556493282318115, "step": 925} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 925} {"info/global_step": 926, "train_info/time_within_train_step": 2.7550106048583984, "step": 926} {"train_info/time_between_train_steps": 0.003212451934814453, "step": 926} {"info/global_step": 927, "train_info/time_within_train_step": 2.7540884017944336, "step": 927} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 927} {"info/global_step": 928, "train_info/time_within_train_step": 2.7545599937438965, "step": 928} {"train_info/time_between_train_steps": 0.0032510757446289062, "step": 928} {"info/global_step": 929, "train_info/time_within_train_step": 2.7538485527038574, "step": 929} {"train_info/time_between_train_steps": 0.0032126903533935547, "step": 929} {"info/global_step": 930, "train_info/time_within_train_step": 2.754948854446411, "step": 930} {"train_info/time_between_train_steps": 0.0032339096069335938, "step": 930} {"info/global_step": 931, "train_info/time_within_train_step": 2.755221366882324, "step": 931} {"train_info/time_between_train_steps": 0.0032165050506591797, "step": 931} {"info/global_step": 932, "train_info/time_within_train_step": 2.7539801597595215, "step": 932} {"train_info/time_between_train_steps": 0.0032355785369873047, "step": 932} {"info/global_step": 933, "train_info/time_within_train_step": 2.7540833950042725, "step": 933} {"train_info/time_between_train_steps": 0.0032765865325927734, "step": 933} {"info/global_step": 934, "train_info/time_within_train_step": 2.7538506984710693, "step": 934} {"train_info/time_between_train_steps": 0.0032646656036376953, "step": 934} {"info/global_step": 935, "train_info/time_within_train_step": 2.754387855529785, "step": 935} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 935} {"info/global_step": 936, "train_info/time_within_train_step": 2.7551023960113525, "step": 936} {"train_info/time_between_train_steps": 0.003276824951171875, "step": 936} {"info/global_step": 937, "train_info/time_within_train_step": 2.754357099533081, "step": 937} {"train_info/time_between_train_steps": 0.0032379627227783203, "step": 937} {"info/global_step": 938, "train_info/time_within_train_step": 2.754910469055176, "step": 938} {"train_info/time_between_train_steps": 0.003210783004760742, "step": 938} {"info/global_step": 939, "train_info/time_within_train_step": 2.755699872970581, "step": 939} {"train_info/time_between_train_steps": 0.0032846927642822266, "step": 939} {"info/global_step": 940, "train_info/time_within_train_step": 2.755463123321533, "step": 940} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 940} {"info/global_step": 941, "train_info/time_within_train_step": 2.756566286087036, "step": 941} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 941} {"info/global_step": 942, "train_info/time_within_train_step": 2.755505323410034, "step": 942} {"train_info/time_between_train_steps": 0.003233194351196289, "step": 942} {"info/global_step": 943, "train_info/time_within_train_step": 2.7555699348449707, "step": 943} {"train_info/time_between_train_steps": 0.003233194351196289, "step": 943} {"info/global_step": 944, "train_info/time_within_train_step": 2.7537708282470703, "step": 944} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 944} {"info/global_step": 945, "train_info/time_within_train_step": 2.7550549507141113, "step": 945} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 945} {"info/global_step": 946, "train_info/time_within_train_step": 2.7547338008880615, "step": 946} {"train_info/time_between_train_steps": 0.0032012462615966797, "step": 946} {"info/global_step": 947, "train_info/time_within_train_step": 2.7541637420654297, "step": 947} {"train_info/time_between_train_steps": 0.0032129287719726562, "step": 947} {"info/global_step": 948, "train_info/time_within_train_step": 2.7556447982788086, "step": 948} {"train_info/time_between_train_steps": 0.0032312870025634766, "step": 948} {"info/global_step": 949, "train_info/time_within_train_step": 2.756160259246826, "step": 949} {"train_info/time_between_train_steps": 0.0031898021697998047, "step": 949} {"info/global_step": 950, "train_info/time_within_train_step": 2.755546808242798, "step": 950} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746568769, "_runtime": 2778}, "step": 950} {"logs": {"train/loss": 5.084, "train/learning_rate": 0.00057, "train/epoch": 1.01, "_timestamp": 1746568769, "_runtime": 2778}, "step": 950} {"train_info/time_between_train_steps": 0.013336658477783203, "step": 950} {"info/global_step": 951, "train_info/time_within_train_step": 2.7543036937713623, "step": 951} {"train_info/time_between_train_steps": 0.0031690597534179688, "step": 951} {"info/global_step": 952, "train_info/time_within_train_step": 2.754957914352417, "step": 952} {"train_info/time_between_train_steps": 0.0031430721282958984, "step": 952} {"info/global_step": 953, "train_info/time_within_train_step": 2.7519466876983643, "step": 953} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 953} {"info/global_step": 954, "train_info/time_within_train_step": 2.755516290664673, "step": 954} {"train_info/time_between_train_steps": 0.003196239471435547, "step": 954} {"info/global_step": 955, "train_info/time_within_train_step": 2.755553722381592, "step": 955} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 955} {"info/global_step": 956, "train_info/time_within_train_step": 2.7543976306915283, "step": 956} {"train_info/time_between_train_steps": 0.0031888484954833984, "step": 956} {"info/global_step": 957, "train_info/time_within_train_step": 2.7549636363983154, "step": 957} {"train_info/time_between_train_steps": 0.003177165985107422, "step": 957} {"info/global_step": 958, "train_info/time_within_train_step": 2.7530834674835205, "step": 958} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 958} {"info/global_step": 959, "train_info/time_within_train_step": 2.7551074028015137, "step": 959} {"train_info/time_between_train_steps": 0.0032341480255126953, "step": 959} {"info/global_step": 960, "train_info/time_within_train_step": 2.753566026687622, "step": 960} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 960} {"info/global_step": 961, "train_info/time_within_train_step": 2.754391670227051, "step": 961} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 961} {"info/global_step": 962, "train_info/time_within_train_step": 2.7555837631225586, "step": 962} {"train_info/time_between_train_steps": 0.003210306167602539, "step": 962} {"info/global_step": 963, "train_info/time_within_train_step": 2.7552969455718994, "step": 963} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 963} {"info/global_step": 964, "train_info/time_within_train_step": 2.7548668384552, "step": 964} {"train_info/time_between_train_steps": 0.0031981468200683594, "step": 964} {"info/global_step": 965, "train_info/time_within_train_step": 2.7541329860687256, "step": 965} {"train_info/time_between_train_steps": 0.0032613277435302734, "step": 965} {"info/global_step": 966, "train_info/time_within_train_step": 2.7549800872802734, "step": 966} {"train_info/time_between_train_steps": 0.003184795379638672, "step": 966} {"info/global_step": 967, "train_info/time_within_train_step": 2.7552714347839355, "step": 967} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 967} {"info/global_step": 968, "train_info/time_within_train_step": 2.752793788909912, "step": 968} {"train_info/time_between_train_steps": 0.0032291412353515625, "step": 968} {"info/global_step": 969, "train_info/time_within_train_step": 2.752336263656616, "step": 969} {"train_info/time_between_train_steps": 0.0032472610473632812, "step": 969} {"info/global_step": 970, "train_info/time_within_train_step": 2.753777027130127, "step": 970} {"train_info/time_between_train_steps": 0.0032052993774414062, "step": 970} {"info/global_step": 971, "train_info/time_within_train_step": 2.7536232471466064, "step": 971} {"train_info/time_between_train_steps": 0.0032269954681396484, "step": 971} {"info/global_step": 972, "train_info/time_within_train_step": 2.7529289722442627, "step": 972} {"train_info/time_between_train_steps": 0.0032339096069335938, "step": 972} {"info/global_step": 973, "train_info/time_within_train_step": 2.7534825801849365, "step": 973} {"train_info/time_between_train_steps": 0.0032417774200439453, "step": 973} {"info/global_step": 974, "train_info/time_within_train_step": 2.7535629272460938, "step": 974} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 974} {"info/global_step": 975, "train_info/time_within_train_step": 2.7516603469848633, "step": 975} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 975} {"info/global_step": 976, "train_info/time_within_train_step": 2.754199743270874, "step": 976} {"train_info/time_between_train_steps": 0.003245830535888672, "step": 976} {"info/global_step": 977, "train_info/time_within_train_step": 2.7543203830718994, "step": 977} {"train_info/time_between_train_steps": 0.0032181739807128906, "step": 977} {"info/global_step": 978, "train_info/time_within_train_step": 2.75138783454895, "step": 978} {"train_info/time_between_train_steps": 0.12281990051269531, "step": 978} {"info/global_step": 979, "train_info/time_within_train_step": 2.755410671234131, "step": 979} {"train_info/time_between_train_steps": 0.0032961368560791016, "step": 979} {"info/global_step": 980, "train_info/time_within_train_step": 2.753570556640625, "step": 980} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 980} {"info/global_step": 981, "train_info/time_within_train_step": 2.752735137939453, "step": 981} {"train_info/time_between_train_steps": 0.0032715797424316406, "step": 981} {"info/global_step": 982, "train_info/time_within_train_step": 2.75378680229187, "step": 982} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 982} {"info/global_step": 983, "train_info/time_within_train_step": 2.75313138961792, "step": 983} {"train_info/time_between_train_steps": 0.0032625198364257812, "step": 983} {"info/global_step": 984, "train_info/time_within_train_step": 2.9746055603027344, "step": 984} {"train_info/time_between_train_steps": 0.003298521041870117, "step": 984} {"info/global_step": 985, "train_info/time_within_train_step": 2.752936601638794, "step": 985} {"train_info/time_between_train_steps": 0.003228902816772461, "step": 985} {"info/global_step": 986, "train_info/time_within_train_step": 2.7537291049957275, "step": 986} {"train_info/time_between_train_steps": 0.0036859512329101562, "step": 986} {"info/global_step": 987, "train_info/time_within_train_step": 2.7546074390411377, "step": 987} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 987} {"info/global_step": 988, "train_info/time_within_train_step": 2.752354383468628, "step": 988} {"train_info/time_between_train_steps": 0.0032885074615478516, "step": 988} {"info/global_step": 989, "train_info/time_within_train_step": 2.7550432682037354, "step": 989} {"train_info/time_between_train_steps": 0.0032548904418945312, "step": 989} {"info/global_step": 990, "train_info/time_within_train_step": 2.754272937774658, "step": 990} {"train_info/time_between_train_steps": 0.0031824111938476562, "step": 990} {"info/global_step": 991, "train_info/time_within_train_step": 2.754581928253174, "step": 991} {"train_info/time_between_train_steps": 0.0032727718353271484, "step": 991} {"info/global_step": 992, "train_info/time_within_train_step": 2.754232406616211, "step": 992} {"train_info/time_between_train_steps": 0.003223419189453125, "step": 992} {"info/global_step": 993, "train_info/time_within_train_step": 2.7551448345184326, "step": 993} {"train_info/time_between_train_steps": 0.0034117698669433594, "step": 993} {"info/global_step": 994, "train_info/time_within_train_step": 2.7542691230773926, "step": 994} {"train_info/time_between_train_steps": 0.0032722949981689453, "step": 994} {"info/global_step": 995, "train_info/time_within_train_step": 2.7554807662963867, "step": 995} {"train_info/time_between_train_steps": 0.0032215118408203125, "step": 995} {"info/global_step": 996, "train_info/time_within_train_step": 2.7533140182495117, "step": 996} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 996} {"info/global_step": 997, "train_info/time_within_train_step": 2.752920150756836, "step": 997} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 997} {"info/global_step": 998, "train_info/time_within_train_step": 2.755711793899536, "step": 998} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 998} {"info/global_step": 999, "train_info/time_within_train_step": 2.755138635635376, "step": 999} {"train_info/time_between_train_steps": 0.0032939910888671875, "step": 999} {"info/global_step": 1000, "train_info/time_within_train_step": 3.2526190280914307, "step": 1000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746568908, "_runtime": 2917}, "step": 1000} {"logs": {"train/loss": 5.0256, "train/learning_rate": 0.0006, "train/epoch": 1.01, "_timestamp": 1746568908, "_runtime": 2917}, "step": 1000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746568913, "_runtime": 2922}, "step": 1000} {"logs": {"eval/loss": 5.386143207550049, "eval/runtime": 5.1826, "eval/samples_per_second": 36.661, "eval/steps_per_second": 1.158, "train/epoch": 1.01, "_timestamp": 1746568913, "_runtime": 2922}, "step": 1000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746568913, "_runtime": 2922}, "step": 1000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 5.386143207550049, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 218.35959180616592, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1826, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 36.661, "train/epoch": 1.01, "_timestamp": 1746568913, "_runtime": 2922}, "step": 1000} {"train_info/time_between_train_steps": 52.9630765914917, "step": 1000} {"info/global_step": 1001, "train_info/time_within_train_step": 2.5285189151763916, "step": 1001} {"train_info/time_between_train_steps": 0.0032563209533691406, "step": 1001} {"info/global_step": 1002, "train_info/time_within_train_step": 2.543952703475952, "step": 1002} {"train_info/time_between_train_steps": 0.0032765865325927734, "step": 1002} {"info/global_step": 1003, "train_info/time_within_train_step": 2.6825520992279053, "step": 1003} {"train_info/time_between_train_steps": 0.003719329833984375, "step": 1003} {"info/global_step": 1004, "train_info/time_within_train_step": 2.6947977542877197, "step": 1004} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 1004} {"info/global_step": 1005, "train_info/time_within_train_step": 2.6935508251190186, "step": 1005} {"train_info/time_between_train_steps": 0.0036220550537109375, "step": 1005} {"info/global_step": 1006, "train_info/time_within_train_step": 2.6835522651672363, "step": 1006} {"train_info/time_between_train_steps": 0.0036497116088867188, "step": 1006} {"info/global_step": 1007, "train_info/time_within_train_step": 2.691126585006714, "step": 1007} {"train_info/time_between_train_steps": 0.0035948753356933594, "step": 1007} {"info/global_step": 1008, "train_info/time_within_train_step": 2.751970052719116, "step": 1008} {"train_info/time_between_train_steps": 0.004010200500488281, "step": 1008} {"info/global_step": 1009, "train_info/time_within_train_step": 2.754242420196533, "step": 1009} {"train_info/time_between_train_steps": 0.004084348678588867, "step": 1009} {"info/global_step": 1010, "train_info/time_within_train_step": 2.75608491897583, "step": 1010} {"train_info/time_between_train_steps": 0.0037534236907958984, "step": 1010} {"info/global_step": 1011, "train_info/time_within_train_step": 2.7532129287719727, "step": 1011} {"train_info/time_between_train_steps": 0.0035867691040039062, "step": 1011} {"info/global_step": 1012, "train_info/time_within_train_step": 2.7582528591156006, "step": 1012} {"train_info/time_between_train_steps": 0.0036840438842773438, "step": 1012} {"info/global_step": 1013, "train_info/time_within_train_step": 2.755253791809082, "step": 1013} {"train_info/time_between_train_steps": 0.00360107421875, "step": 1013} {"info/global_step": 1014, "train_info/time_within_train_step": 2.7566652297973633, "step": 1014} {"train_info/time_between_train_steps": 0.003676176071166992, "step": 1014} {"info/global_step": 1015, "train_info/time_within_train_step": 2.7558114528656006, "step": 1015} {"train_info/time_between_train_steps": 0.003579378128051758, "step": 1015} {"info/global_step": 1016, "train_info/time_within_train_step": 2.7567923069000244, "step": 1016} {"train_info/time_between_train_steps": 0.0036416053771972656, "step": 1016} {"info/global_step": 1017, "train_info/time_within_train_step": 2.7558047771453857, "step": 1017} {"train_info/time_between_train_steps": 0.0037059783935546875, "step": 1017} {"info/global_step": 1018, "train_info/time_within_train_step": 2.757009744644165, "step": 1018} {"train_info/time_between_train_steps": 0.0035715103149414062, "step": 1018} {"info/global_step": 1019, "train_info/time_within_train_step": 2.755457878112793, "step": 1019} {"train_info/time_between_train_steps": 0.0037162303924560547, "step": 1019} {"info/global_step": 1020, "train_info/time_within_train_step": 2.7546467781066895, "step": 1020} {"train_info/time_between_train_steps": 0.0035674571990966797, "step": 1020} {"info/global_step": 1021, "train_info/time_within_train_step": 2.7569968700408936, "step": 1021} {"train_info/time_between_train_steps": 0.0035254955291748047, "step": 1021} {"info/global_step": 1022, "train_info/time_within_train_step": 2.7580726146698, "step": 1022} {"train_info/time_between_train_steps": 0.003465414047241211, "step": 1022} {"info/global_step": 1023, "train_info/time_within_train_step": 2.782357931137085, "step": 1023} {"train_info/time_between_train_steps": 0.003873109817504883, "step": 1023} {"info/global_step": 1024, "train_info/time_within_train_step": 2.7589752674102783, "step": 1024} {"train_info/time_between_train_steps": 0.004083395004272461, "step": 1024} {"info/global_step": 1025, "train_info/time_within_train_step": 2.7594993114471436, "step": 1025} {"train_info/time_between_train_steps": 0.0041201114654541016, "step": 1025} {"info/global_step": 1026, "train_info/time_within_train_step": 3.1073708534240723, "step": 1026} {"train_info/time_between_train_steps": 0.003327608108520508, "step": 1026} {"info/global_step": 1027, "train_info/time_within_train_step": 2.756491184234619, "step": 1027} {"train_info/time_between_train_steps": 0.003349781036376953, "step": 1027} {"info/global_step": 1028, "train_info/time_within_train_step": 2.754934549331665, "step": 1028} {"train_info/time_between_train_steps": 0.0033800601959228516, "step": 1028} {"info/global_step": 1029, "train_info/time_within_train_step": 2.753781795501709, "step": 1029} {"train_info/time_between_train_steps": 0.0033087730407714844, "step": 1029} {"info/global_step": 1030, "train_info/time_within_train_step": 2.755951404571533, "step": 1030} {"train_info/time_between_train_steps": 0.0033261775970458984, "step": 1030} {"info/global_step": 1031, "train_info/time_within_train_step": 2.757171154022217, "step": 1031} {"train_info/time_between_train_steps": 0.0033965110778808594, "step": 1031} {"info/global_step": 1032, "train_info/time_within_train_step": 2.755791664123535, "step": 1032} {"train_info/time_between_train_steps": 0.003351926803588867, "step": 1032} {"info/global_step": 1033, "train_info/time_within_train_step": 2.7542240619659424, "step": 1033} {"train_info/time_between_train_steps": 0.0033533573150634766, "step": 1033} {"info/global_step": 1034, "train_info/time_within_train_step": 2.755793809890747, "step": 1034} {"train_info/time_between_train_steps": 0.0033745765686035156, "step": 1034} {"info/global_step": 1035, "train_info/time_within_train_step": 2.7554190158843994, "step": 1035} {"train_info/time_between_train_steps": 0.003383159637451172, "step": 1035} {"info/global_step": 1036, "train_info/time_within_train_step": 2.7564666271209717, "step": 1036} {"train_info/time_between_train_steps": 0.003360271453857422, "step": 1036} {"info/global_step": 1037, "train_info/time_within_train_step": 2.7556397914886475, "step": 1037} {"train_info/time_between_train_steps": 0.0033326148986816406, "step": 1037} {"info/global_step": 1038, "train_info/time_within_train_step": 2.755375385284424, "step": 1038} {"train_info/time_between_train_steps": 0.0033049583435058594, "step": 1038} {"info/global_step": 1039, "train_info/time_within_train_step": 2.755581855773926, "step": 1039} {"train_info/time_between_train_steps": 0.0034368038177490234, "step": 1039} {"info/global_step": 1040, "train_info/time_within_train_step": 2.7572083473205566, "step": 1040} {"train_info/time_between_train_steps": 0.003310680389404297, "step": 1040} {"info/global_step": 1041, "train_info/time_within_train_step": 2.917001485824585, "step": 1041} {"train_info/time_between_train_steps": 0.0034308433532714844, "step": 1041} {"info/global_step": 1042, "train_info/time_within_train_step": 2.761127471923828, "step": 1042} {"train_info/time_between_train_steps": 0.0033512115478515625, "step": 1042} {"info/global_step": 1043, "train_info/time_within_train_step": 2.7578208446502686, "step": 1043} {"train_info/time_between_train_steps": 0.0036046504974365234, "step": 1043} {"info/global_step": 1044, "train_info/time_within_train_step": 2.7561960220336914, "step": 1044} {"train_info/time_between_train_steps": 0.0035750865936279297, "step": 1044} {"info/global_step": 1045, "train_info/time_within_train_step": 2.7563486099243164, "step": 1045} {"train_info/time_between_train_steps": 0.0034689903259277344, "step": 1045} {"info/global_step": 1046, "train_info/time_within_train_step": 2.756014108657837, "step": 1046} {"train_info/time_between_train_steps": 0.003482818603515625, "step": 1046} {"info/global_step": 1047, "train_info/time_within_train_step": 2.757154703140259, "step": 1047} {"train_info/time_between_train_steps": 0.003503561019897461, "step": 1047} {"info/global_step": 1048, "train_info/time_within_train_step": 2.757420301437378, "step": 1048} {"train_info/time_between_train_steps": 0.0036478042602539062, "step": 1048} {"info/global_step": 1049, "train_info/time_within_train_step": 2.758274555206299, "step": 1049} {"train_info/time_between_train_steps": 0.0036149024963378906, "step": 1049} {"info/global_step": 1050, "train_info/time_within_train_step": 2.759038209915161, "step": 1050} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746569099, "_runtime": 3108}, "step": 1050} {"logs": {"train/loss": 4.9755, "train/learning_rate": 0.0005966666666666667, "train/epoch": 1.02, "_timestamp": 1746569099, "_runtime": 3108}, "step": 1050} {"train_info/time_between_train_steps": 0.018025636672973633, "step": 1050} {"info/global_step": 1051, "train_info/time_within_train_step": 2.757939100265503, "step": 1051} {"train_info/time_between_train_steps": 0.0035839080810546875, "step": 1051} {"info/global_step": 1052, "train_info/time_within_train_step": 2.7569069862365723, "step": 1052} {"train_info/time_between_train_steps": 0.00368499755859375, "step": 1052} {"info/global_step": 1053, "train_info/time_within_train_step": 2.757439613342285, "step": 1053} {"train_info/time_between_train_steps": 0.0036139488220214844, "step": 1053} {"info/global_step": 1054, "train_info/time_within_train_step": 2.7575912475585938, "step": 1054} {"train_info/time_between_train_steps": 0.003637552261352539, "step": 1054} {"info/global_step": 1055, "train_info/time_within_train_step": 2.755969285964966, "step": 1055} {"train_info/time_between_train_steps": 0.0036270618438720703, "step": 1055} {"info/global_step": 1056, "train_info/time_within_train_step": 2.7607851028442383, "step": 1056} {"train_info/time_between_train_steps": 0.003596067428588867, "step": 1056} {"info/global_step": 1057, "train_info/time_within_train_step": 2.755801200866699, "step": 1057} {"train_info/time_between_train_steps": 0.006800651550292969, "step": 1057} {"info/global_step": 1058, "train_info/time_within_train_step": 2.754591226577759, "step": 1058} {"train_info/time_between_train_steps": 0.006974697113037109, "step": 1058} {"info/global_step": 1059, "train_info/time_within_train_step": 2.7558066844940186, "step": 1059} {"train_info/time_between_train_steps": 0.005975008010864258, "step": 1059} {"info/global_step": 1060, "train_info/time_within_train_step": 2.7568306922912598, "step": 1060} {"train_info/time_between_train_steps": 0.0066776275634765625, "step": 1060} {"info/global_step": 1061, "train_info/time_within_train_step": 2.757145881652832, "step": 1061} {"train_info/time_between_train_steps": 0.006942272186279297, "step": 1061} {"info/global_step": 1062, "train_info/time_within_train_step": 2.754897117614746, "step": 1062} {"train_info/time_between_train_steps": 0.006934404373168945, "step": 1062} {"info/global_step": 1063, "train_info/time_within_train_step": 2.756683349609375, "step": 1063} {"train_info/time_between_train_steps": 0.006875753402709961, "step": 1063} {"info/global_step": 1064, "train_info/time_within_train_step": 2.7555434703826904, "step": 1064} {"train_info/time_between_train_steps": 0.006897926330566406, "step": 1064} {"info/global_step": 1065, "train_info/time_within_train_step": 2.7547647953033447, "step": 1065} {"train_info/time_between_train_steps": 0.0055696964263916016, "step": 1065} {"info/global_step": 1066, "train_info/time_within_train_step": 2.756176471710205, "step": 1066} {"train_info/time_between_train_steps": 0.006972551345825195, "step": 1066} {"info/global_step": 1067, "train_info/time_within_train_step": 2.755730390548706, "step": 1067} {"train_info/time_between_train_steps": 0.003503084182739258, "step": 1067} {"info/global_step": 1068, "train_info/time_within_train_step": 2.7553951740264893, "step": 1068} {"train_info/time_between_train_steps": 0.00697636604309082, "step": 1068} {"info/global_step": 1069, "train_info/time_within_train_step": 2.7558670043945312, "step": 1069} {"train_info/time_between_train_steps": 0.006712913513183594, "step": 1069} {"info/global_step": 1070, "train_info/time_within_train_step": 2.755831718444824, "step": 1070} {"train_info/time_between_train_steps": 0.005385160446166992, "step": 1070} {"info/global_step": 1071, "train_info/time_within_train_step": 2.7564985752105713, "step": 1071} {"train_info/time_between_train_steps": 0.0065097808837890625, "step": 1071} {"info/global_step": 1072, "train_info/time_within_train_step": 2.756009340286255, "step": 1072} {"train_info/time_between_train_steps": 0.0034821033477783203, "step": 1072} {"info/global_step": 1073, "train_info/time_within_train_step": 2.756823778152466, "step": 1073} {"train_info/time_between_train_steps": 0.003488302230834961, "step": 1073} {"info/global_step": 1074, "train_info/time_within_train_step": 2.7559943199157715, "step": 1074} {"train_info/time_between_train_steps": 0.00360107421875, "step": 1074} {"info/global_step": 1075, "train_info/time_within_train_step": 2.7547292709350586, "step": 1075} {"train_info/time_between_train_steps": 0.003492593765258789, "step": 1075} {"info/global_step": 1076, "train_info/time_within_train_step": 2.7499048709869385, "step": 1076} {"train_info/time_between_train_steps": 0.0034911632537841797, "step": 1076} {"info/global_step": 1077, "train_info/time_within_train_step": 2.7566123008728027, "step": 1077} {"train_info/time_between_train_steps": 0.0034799575805664062, "step": 1077} {"info/global_step": 1078, "train_info/time_within_train_step": 2.7565507888793945, "step": 1078} {"train_info/time_between_train_steps": 0.0035424232482910156, "step": 1078} {"info/global_step": 1079, "train_info/time_within_train_step": 2.7569169998168945, "step": 1079} {"train_info/time_between_train_steps": 0.0036118030548095703, "step": 1079} {"info/global_step": 1080, "train_info/time_within_train_step": 2.7554163932800293, "step": 1080} {"train_info/time_between_train_steps": 0.0035753250122070312, "step": 1080} {"info/global_step": 1081, "train_info/time_within_train_step": 2.7560837268829346, "step": 1081} {"train_info/time_between_train_steps": 0.0036242008209228516, "step": 1081} {"info/global_step": 1082, "train_info/time_within_train_step": 2.7559947967529297, "step": 1082} {"train_info/time_between_train_steps": 0.003621339797973633, "step": 1082} {"info/global_step": 1083, "train_info/time_within_train_step": 2.756817579269409, "step": 1083} {"train_info/time_between_train_steps": 0.0036962032318115234, "step": 1083} {"info/global_step": 1084, "train_info/time_within_train_step": 2.7565431594848633, "step": 1084} {"train_info/time_between_train_steps": 0.0036344528198242188, "step": 1084} {"info/global_step": 1085, "train_info/time_within_train_step": 2.757528305053711, "step": 1085} {"train_info/time_between_train_steps": 0.003800630569458008, "step": 1085} {"info/global_step": 1086, "train_info/time_within_train_step": 2.7570269107818604, "step": 1086} {"train_info/time_between_train_steps": 0.0037059783935546875, "step": 1086} {"info/global_step": 1087, "train_info/time_within_train_step": 2.7581684589385986, "step": 1087} {"train_info/time_between_train_steps": 0.003530263900756836, "step": 1087} {"info/global_step": 1088, "train_info/time_within_train_step": 2.7570033073425293, "step": 1088} {"train_info/time_between_train_steps": 0.003584623336791992, "step": 1088} {"info/global_step": 1089, "train_info/time_within_train_step": 2.7555837631225586, "step": 1089} {"train_info/time_between_train_steps": 0.0036041736602783203, "step": 1089} {"info/global_step": 1090, "train_info/time_within_train_step": 2.754239082336426, "step": 1090} {"train_info/time_between_train_steps": 0.0034868717193603516, "step": 1090} {"info/global_step": 1091, "train_info/time_within_train_step": 2.7559940814971924, "step": 1091} {"train_info/time_between_train_steps": 0.0034682750701904297, "step": 1091} {"info/global_step": 1092, "train_info/time_within_train_step": 2.7547500133514404, "step": 1092} {"train_info/time_between_train_steps": 0.003497600555419922, "step": 1092} {"info/global_step": 1093, "train_info/time_within_train_step": 2.7573957443237305, "step": 1093} {"train_info/time_between_train_steps": 0.0035605430603027344, "step": 1093} {"info/global_step": 1094, "train_info/time_within_train_step": 2.756643533706665, "step": 1094} {"train_info/time_between_train_steps": 0.0034775733947753906, "step": 1094} {"info/global_step": 1095, "train_info/time_within_train_step": 2.757021903991699, "step": 1095} {"train_info/time_between_train_steps": 0.003407001495361328, "step": 1095} {"info/global_step": 1096, "train_info/time_within_train_step": 2.7551429271698, "step": 1096} {"train_info/time_between_train_steps": 0.0035910606384277344, "step": 1096} {"info/global_step": 1097, "train_info/time_within_train_step": 2.752896308898926, "step": 1097} {"train_info/time_between_train_steps": 0.0035161972045898438, "step": 1097} {"info/global_step": 1098, "train_info/time_within_train_step": 2.755936861038208, "step": 1098} {"train_info/time_between_train_steps": 0.003492593765258789, "step": 1098} {"info/global_step": 1099, "train_info/time_within_train_step": 2.756133556365967, "step": 1099} {"train_info/time_between_train_steps": 0.003579378128051758, "step": 1099} {"info/global_step": 1100, "train_info/time_within_train_step": 2.7553255558013916, "step": 1100} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746569238, "_runtime": 3247}, "step": 1100} {"logs": {"train/loss": 4.9033, "train/learning_rate": 0.0005933333333333333, "train/epoch": 1.02, "_timestamp": 1746569238, "_runtime": 3247}, "step": 1100} {"train_info/time_between_train_steps": 0.013517141342163086, "step": 1100} {"info/global_step": 1101, "train_info/time_within_train_step": 2.757355213165283, "step": 1101} {"train_info/time_between_train_steps": 0.003541231155395508, "step": 1101} {"info/global_step": 1102, "train_info/time_within_train_step": 2.7551937103271484, "step": 1102} {"train_info/time_between_train_steps": 0.003519773483276367, "step": 1102} {"info/global_step": 1103, "train_info/time_within_train_step": 2.757514476776123, "step": 1103} {"train_info/time_between_train_steps": 0.1756587028503418, "step": 1103} {"info/global_step": 1104, "train_info/time_within_train_step": 2.755213499069214, "step": 1104} {"train_info/time_between_train_steps": 0.0033109188079833984, "step": 1104} {"info/global_step": 1105, "train_info/time_within_train_step": 2.7555630207061768, "step": 1105} {"train_info/time_between_train_steps": 0.003314971923828125, "step": 1105} {"info/global_step": 1106, "train_info/time_within_train_step": 2.7566044330596924, "step": 1106} {"train_info/time_between_train_steps": 0.0036563873291015625, "step": 1106} {"info/global_step": 1107, "train_info/time_within_train_step": 2.7576589584350586, "step": 1107} {"train_info/time_between_train_steps": 0.003700733184814453, "step": 1107} {"info/global_step": 1108, "train_info/time_within_train_step": 2.7565953731536865, "step": 1108} {"train_info/time_between_train_steps": 0.0037741661071777344, "step": 1108} {"info/global_step": 1109, "train_info/time_within_train_step": 2.7567553520202637, "step": 1109} {"train_info/time_between_train_steps": 0.0037539005279541016, "step": 1109} {"info/global_step": 1110, "train_info/time_within_train_step": 2.7576582431793213, "step": 1110} {"train_info/time_between_train_steps": 0.0037026405334472656, "step": 1110} {"info/global_step": 1111, "train_info/time_within_train_step": 2.758328914642334, "step": 1111} {"train_info/time_between_train_steps": 0.003786802291870117, "step": 1111} {"info/global_step": 1112, "train_info/time_within_train_step": 2.7573235034942627, "step": 1112} {"train_info/time_between_train_steps": 0.003733396530151367, "step": 1112} {"info/global_step": 1113, "train_info/time_within_train_step": 2.7575550079345703, "step": 1113} {"train_info/time_between_train_steps": 0.003785848617553711, "step": 1113} {"info/global_step": 1114, "train_info/time_within_train_step": 3.1174707412719727, "step": 1114} {"train_info/time_between_train_steps": 0.003459930419921875, "step": 1114} {"info/global_step": 1115, "train_info/time_within_train_step": 2.755690813064575, "step": 1115} {"train_info/time_between_train_steps": 0.0033271312713623047, "step": 1115} {"info/global_step": 1116, "train_info/time_within_train_step": 2.7544052600860596, "step": 1116} {"train_info/time_between_train_steps": 0.0033338069915771484, "step": 1116} {"info/global_step": 1117, "train_info/time_within_train_step": 2.755959987640381, "step": 1117} {"train_info/time_between_train_steps": 0.003348112106323242, "step": 1117} {"info/global_step": 1118, "train_info/time_within_train_step": 2.755248546600342, "step": 1118} {"train_info/time_between_train_steps": 0.003308534622192383, "step": 1118} {"info/global_step": 1119, "train_info/time_within_train_step": 2.755110502243042, "step": 1119} {"train_info/time_between_train_steps": 0.0035653114318847656, "step": 1119} {"info/global_step": 1120, "train_info/time_within_train_step": 2.7579591274261475, "step": 1120} {"train_info/time_between_train_steps": 0.003430604934692383, "step": 1120} {"info/global_step": 1121, "train_info/time_within_train_step": 2.7542684078216553, "step": 1121} {"train_info/time_between_train_steps": 0.0035538673400878906, "step": 1121} {"info/global_step": 1122, "train_info/time_within_train_step": 2.756770610809326, "step": 1122} {"train_info/time_between_train_steps": 0.0035266876220703125, "step": 1122} {"info/global_step": 1123, "train_info/time_within_train_step": 2.7553088665008545, "step": 1123} {"train_info/time_between_train_steps": 0.0035457611083984375, "step": 1123} {"info/global_step": 1124, "train_info/time_within_train_step": 2.754091501235962, "step": 1124} {"train_info/time_between_train_steps": 0.0035026073455810547, "step": 1124} {"info/global_step": 1125, "train_info/time_within_train_step": 2.7557590007781982, "step": 1125} {"train_info/time_between_train_steps": 0.003328561782836914, "step": 1125} {"info/global_step": 1126, "train_info/time_within_train_step": 2.7552099227905273, "step": 1126} {"train_info/time_between_train_steps": 0.003289461135864258, "step": 1126} {"info/global_step": 1127, "train_info/time_within_train_step": 2.7558963298797607, "step": 1127} {"train_info/time_between_train_steps": 0.003311634063720703, "step": 1127} {"info/global_step": 1128, "train_info/time_within_train_step": 2.757869243621826, "step": 1128} {"train_info/time_between_train_steps": 0.003317594528198242, "step": 1128} {"info/global_step": 1129, "train_info/time_within_train_step": 2.754182815551758, "step": 1129} {"train_info/time_between_train_steps": 0.0032880306243896484, "step": 1129} {"info/global_step": 1130, "train_info/time_within_train_step": 2.754380464553833, "step": 1130} {"train_info/time_between_train_steps": 0.0033288002014160156, "step": 1130} {"info/global_step": 1131, "train_info/time_within_train_step": 2.753826856613159, "step": 1131} {"train_info/time_between_train_steps": 0.0033121109008789062, "step": 1131} {"info/global_step": 1132, "train_info/time_within_train_step": 2.7557597160339355, "step": 1132} {"train_info/time_between_train_steps": 0.0033016204833984375, "step": 1132} {"info/global_step": 1133, "train_info/time_within_train_step": 2.7527501583099365, "step": 1133} {"train_info/time_between_train_steps": 0.003309011459350586, "step": 1133} {"info/global_step": 1134, "train_info/time_within_train_step": 2.754890203475952, "step": 1134} {"train_info/time_between_train_steps": 0.003296375274658203, "step": 1134} {"info/global_step": 1135, "train_info/time_within_train_step": 2.7542335987091064, "step": 1135} {"train_info/time_between_train_steps": 0.003264904022216797, "step": 1135} {"info/global_step": 1136, "train_info/time_within_train_step": 2.7558650970458984, "step": 1136} {"train_info/time_between_train_steps": 0.0033288002014160156, "step": 1136} {"info/global_step": 1137, "train_info/time_within_train_step": 2.754208564758301, "step": 1137} {"train_info/time_between_train_steps": 0.0033156871795654297, "step": 1137} {"info/global_step": 1138, "train_info/time_within_train_step": 2.754122495651245, "step": 1138} {"train_info/time_between_train_steps": 0.003295421600341797, "step": 1138} {"info/global_step": 1139, "train_info/time_within_train_step": 2.7544479370117188, "step": 1139} {"train_info/time_between_train_steps": 0.003298521041870117, "step": 1139} {"info/global_step": 1140, "train_info/time_within_train_step": 2.7526142597198486, "step": 1140} {"train_info/time_between_train_steps": 0.0032923221588134766, "step": 1140} {"info/global_step": 1141, "train_info/time_within_train_step": 2.755328893661499, "step": 1141} {"train_info/time_between_train_steps": 0.0033838748931884766, "step": 1141} {"info/global_step": 1142, "train_info/time_within_train_step": 2.755201578140259, "step": 1142} {"train_info/time_between_train_steps": 0.003346681594848633, "step": 1142} {"info/global_step": 1143, "train_info/time_within_train_step": 2.7545340061187744, "step": 1143} {"train_info/time_between_train_steps": 0.0033028125762939453, "step": 1143} {"info/global_step": 1144, "train_info/time_within_train_step": 2.7544171810150146, "step": 1144} {"train_info/time_between_train_steps": 0.0032830238342285156, "step": 1144} {"info/global_step": 1145, "train_info/time_within_train_step": 2.7550299167633057, "step": 1145} {"train_info/time_between_train_steps": 0.003318309783935547, "step": 1145} {"info/global_step": 1146, "train_info/time_within_train_step": 2.7549118995666504, "step": 1146} {"train_info/time_between_train_steps": 0.003349781036376953, "step": 1146} {"info/global_step": 1147, "train_info/time_within_train_step": 2.7558841705322266, "step": 1147} {"train_info/time_between_train_steps": 0.003304004669189453, "step": 1147} {"info/global_step": 1148, "train_info/time_within_train_step": 2.7543084621429443, "step": 1148} {"train_info/time_between_train_steps": 0.003276348114013672, "step": 1148} {"info/global_step": 1149, "train_info/time_within_train_step": 2.75321102142334, "step": 1149} {"train_info/time_between_train_steps": 0.003270387649536133, "step": 1149} {"info/global_step": 1150, "train_info/time_within_train_step": 2.7555387020111084, "step": 1150} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746569377, "_runtime": 3386}, "step": 1150} {"logs": {"train/loss": 4.8516, "train/learning_rate": 0.0005899999999999999, "train/epoch": 1.03, "_timestamp": 1746569377, "_runtime": 3386}, "step": 1150} {"train_info/time_between_train_steps": 0.012952804565429688, "step": 1150} {"info/global_step": 1151, "train_info/time_within_train_step": 2.755495548248291, "step": 1151} {"train_info/time_between_train_steps": 0.0033919811248779297, "step": 1151} {"info/global_step": 1152, "train_info/time_within_train_step": 2.7567996978759766, "step": 1152} {"train_info/time_between_train_steps": 0.003631114959716797, "step": 1152} {"info/global_step": 1153, "train_info/time_within_train_step": 2.7540109157562256, "step": 1153} {"train_info/time_between_train_steps": 0.003527402877807617, "step": 1153} {"info/global_step": 1154, "train_info/time_within_train_step": 2.755687713623047, "step": 1154} {"train_info/time_between_train_steps": 0.003648042678833008, "step": 1154} {"info/global_step": 1155, "train_info/time_within_train_step": 2.755730390548706, "step": 1155} {"train_info/time_between_train_steps": 0.003688812255859375, "step": 1155} {"info/global_step": 1156, "train_info/time_within_train_step": 2.756807327270508, "step": 1156} {"train_info/time_between_train_steps": 0.0035858154296875, "step": 1156} {"info/global_step": 1157, "train_info/time_within_train_step": 2.7567689418792725, "step": 1157} {"train_info/time_between_train_steps": 0.0035736560821533203, "step": 1157} {"info/global_step": 1158, "train_info/time_within_train_step": 2.7566041946411133, "step": 1158} {"train_info/time_between_train_steps": 0.0035414695739746094, "step": 1158} {"info/global_step": 1159, "train_info/time_within_train_step": 2.7568132877349854, "step": 1159} {"train_info/time_between_train_steps": 0.003555774688720703, "step": 1159} {"info/global_step": 1160, "train_info/time_within_train_step": 2.7553656101226807, "step": 1160} {"train_info/time_between_train_steps": 0.0034818649291992188, "step": 1160} {"info/global_step": 1161, "train_info/time_within_train_step": 2.7560834884643555, "step": 1161} {"train_info/time_between_train_steps": 0.0035812854766845703, "step": 1161} {"info/global_step": 1162, "train_info/time_within_train_step": 2.756521224975586, "step": 1162} {"train_info/time_between_train_steps": 0.0035049915313720703, "step": 1162} {"info/global_step": 1163, "train_info/time_within_train_step": 2.7556638717651367, "step": 1163} {"train_info/time_between_train_steps": 0.0036225318908691406, "step": 1163} {"info/global_step": 1164, "train_info/time_within_train_step": 2.7564544677734375, "step": 1164} {"train_info/time_between_train_steps": 0.0034856796264648438, "step": 1164} {"info/global_step": 1165, "train_info/time_within_train_step": 2.7540969848632812, "step": 1165} {"train_info/time_between_train_steps": 0.0035839080810546875, "step": 1165} {"info/global_step": 1166, "train_info/time_within_train_step": 2.941089391708374, "step": 1166} {"train_info/time_between_train_steps": 0.0032930374145507812, "step": 1166} {"info/global_step": 1167, "train_info/time_within_train_step": 2.7552144527435303, "step": 1167} {"train_info/time_between_train_steps": 0.0033767223358154297, "step": 1167} {"info/global_step": 1168, "train_info/time_within_train_step": 3.0815231800079346, "step": 1168} {"train_info/time_between_train_steps": 0.003284931182861328, "step": 1168} {"info/global_step": 1169, "train_info/time_within_train_step": 2.755720853805542, "step": 1169} {"train_info/time_between_train_steps": 0.0032808780670166016, "step": 1169} {"info/global_step": 1170, "train_info/time_within_train_step": 2.7561211585998535, "step": 1170} {"train_info/time_between_train_steps": 0.0033414363861083984, "step": 1170} {"info/global_step": 1171, "train_info/time_within_train_step": 2.7560768127441406, "step": 1171} {"train_info/time_between_train_steps": 0.003291606903076172, "step": 1171} {"info/global_step": 1172, "train_info/time_within_train_step": 2.7538678646087646, "step": 1172} {"train_info/time_between_train_steps": 0.0032312870025634766, "step": 1172} {"info/global_step": 1173, "train_info/time_within_train_step": 2.756472587585449, "step": 1173} {"train_info/time_between_train_steps": 0.003222942352294922, "step": 1173} {"info/global_step": 1174, "train_info/time_within_train_step": 2.7554216384887695, "step": 1174} {"train_info/time_between_train_steps": 0.003342866897583008, "step": 1174} {"info/global_step": 1175, "train_info/time_within_train_step": 2.7546753883361816, "step": 1175} {"train_info/time_between_train_steps": 0.0032792091369628906, "step": 1175} {"info/global_step": 1176, "train_info/time_within_train_step": 2.7549655437469482, "step": 1176} {"train_info/time_between_train_steps": 0.0035626888275146484, "step": 1176} {"info/global_step": 1177, "train_info/time_within_train_step": 2.7549808025360107, "step": 1177} {"train_info/time_between_train_steps": 0.0034923553466796875, "step": 1177} {"info/global_step": 1178, "train_info/time_within_train_step": 2.7560088634490967, "step": 1178} {"train_info/time_between_train_steps": 0.003761768341064453, "step": 1178} {"info/global_step": 1179, "train_info/time_within_train_step": 2.7561471462249756, "step": 1179} {"train_info/time_between_train_steps": 0.003632068634033203, "step": 1179} {"info/global_step": 1180, "train_info/time_within_train_step": 2.7568774223327637, "step": 1180} {"train_info/time_between_train_steps": 0.003779172897338867, "step": 1180} {"info/global_step": 1181, "train_info/time_within_train_step": 2.7561559677124023, "step": 1181} {"train_info/time_between_train_steps": 0.0037522315979003906, "step": 1181} {"info/global_step": 1182, "train_info/time_within_train_step": 2.7547318935394287, "step": 1182} {"train_info/time_between_train_steps": 0.003591299057006836, "step": 1182} {"info/global_step": 1183, "train_info/time_within_train_step": 2.755735158920288, "step": 1183} {"train_info/time_between_train_steps": 0.003633737564086914, "step": 1183} {"info/global_step": 1184, "train_info/time_within_train_step": 2.755185604095459, "step": 1184} {"train_info/time_between_train_steps": 0.003521442413330078, "step": 1184} {"info/global_step": 1185, "train_info/time_within_train_step": 2.756723642349243, "step": 1185} {"train_info/time_between_train_steps": 0.003606557846069336, "step": 1185} {"info/global_step": 1186, "train_info/time_within_train_step": 2.7554256916046143, "step": 1186} {"train_info/time_between_train_steps": 0.0034389495849609375, "step": 1186} {"info/global_step": 1187, "train_info/time_within_train_step": 2.7544872760772705, "step": 1187} {"train_info/time_between_train_steps": 0.0035080909729003906, "step": 1187} {"info/global_step": 1188, "train_info/time_within_train_step": 2.7562954425811768, "step": 1188} {"train_info/time_between_train_steps": 0.003580808639526367, "step": 1188} {"info/global_step": 1189, "train_info/time_within_train_step": 2.755302906036377, "step": 1189} {"train_info/time_between_train_steps": 0.0035257339477539062, "step": 1189} {"info/global_step": 1190, "train_info/time_within_train_step": 2.755507469177246, "step": 1190} {"train_info/time_between_train_steps": 0.003539562225341797, "step": 1190} {"info/global_step": 1191, "train_info/time_within_train_step": 2.7549684047698975, "step": 1191} {"train_info/time_between_train_steps": 0.0035431385040283203, "step": 1191} {"info/global_step": 1192, "train_info/time_within_train_step": 2.752988338470459, "step": 1192} {"train_info/time_between_train_steps": 0.0034711360931396484, "step": 1192} {"info/global_step": 1193, "train_info/time_within_train_step": 2.7550227642059326, "step": 1193} {"train_info/time_between_train_steps": 0.0035314559936523438, "step": 1193} {"info/global_step": 1194, "train_info/time_within_train_step": 2.755342483520508, "step": 1194} {"train_info/time_between_train_steps": 0.003515481948852539, "step": 1194} {"info/global_step": 1195, "train_info/time_within_train_step": 2.7550086975097656, "step": 1195} {"train_info/time_between_train_steps": 0.003522634506225586, "step": 1195} {"info/global_step": 1196, "train_info/time_within_train_step": 2.756194829940796, "step": 1196} {"train_info/time_between_train_steps": 0.0035698413848876953, "step": 1196} {"info/global_step": 1197, "train_info/time_within_train_step": 2.755276679992676, "step": 1197} {"train_info/time_between_train_steps": 0.0034112930297851562, "step": 1197} {"info/global_step": 1198, "train_info/time_within_train_step": 2.75606107711792, "step": 1198} {"train_info/time_between_train_steps": 0.0035314559936523438, "step": 1198} {"info/global_step": 1199, "train_info/time_within_train_step": 2.7533578872680664, "step": 1199} {"train_info/time_between_train_steps": 0.003652334213256836, "step": 1199} {"info/global_step": 1200, "train_info/time_within_train_step": 2.7540483474731445, "step": 1200} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746569516, "_runtime": 3525}, "step": 1200} {"logs": {"train/loss": 4.8089, "train/learning_rate": 0.0005866666666666665, "train/epoch": 1.03, "_timestamp": 1746569516, "_runtime": 3525}, "step": 1200} {"train_info/time_between_train_steps": 21.60381579399109, "step": 1200} {"info/global_step": 1201, "train_info/time_within_train_step": 2.5453109741210938, "step": 1201} {"train_info/time_between_train_steps": 0.003997325897216797, "step": 1201} {"info/global_step": 1202, "train_info/time_within_train_step": 2.5757365226745605, "step": 1202} {"train_info/time_between_train_steps": 0.0039386749267578125, "step": 1202} {"info/global_step": 1203, "train_info/time_within_train_step": 2.6941540241241455, "step": 1203} {"train_info/time_between_train_steps": 0.0041980743408203125, "step": 1203} {"info/global_step": 1204, "train_info/time_within_train_step": 2.711803913116455, "step": 1204} {"train_info/time_between_train_steps": 0.004120588302612305, "step": 1204} {"info/global_step": 1205, "train_info/time_within_train_step": 2.74177885055542, "step": 1205} {"train_info/time_between_train_steps": 0.004125833511352539, "step": 1205} {"info/global_step": 1206, "train_info/time_within_train_step": 2.7585244178771973, "step": 1206} {"train_info/time_between_train_steps": 0.004210472106933594, "step": 1206} {"info/global_step": 1207, "train_info/time_within_train_step": 3.1824939250946045, "step": 1207} {"train_info/time_between_train_steps": 0.0035202503204345703, "step": 1207} {"info/global_step": 1208, "train_info/time_within_train_step": 2.757336378097534, "step": 1208} {"train_info/time_between_train_steps": 0.003535032272338867, "step": 1208} {"info/global_step": 1209, "train_info/time_within_train_step": 2.756676435470581, "step": 1209} {"train_info/time_between_train_steps": 0.00341796875, "step": 1209} {"info/global_step": 1210, "train_info/time_within_train_step": 2.756880283355713, "step": 1210} {"train_info/time_between_train_steps": 0.003513813018798828, "step": 1210} {"info/global_step": 1211, "train_info/time_within_train_step": 2.7566494941711426, "step": 1211} {"train_info/time_between_train_steps": 0.0034766197204589844, "step": 1211} {"info/global_step": 1212, "train_info/time_within_train_step": 2.7566516399383545, "step": 1212} {"train_info/time_between_train_steps": 0.003538370132446289, "step": 1212} {"info/global_step": 1213, "train_info/time_within_train_step": 2.7563412189483643, "step": 1213} {"train_info/time_between_train_steps": 0.0036280155181884766, "step": 1213} {"info/global_step": 1214, "train_info/time_within_train_step": 2.757686138153076, "step": 1214} {"train_info/time_between_train_steps": 0.0036630630493164062, "step": 1214} {"info/global_step": 1215, "train_info/time_within_train_step": 2.7583060264587402, "step": 1215} {"train_info/time_between_train_steps": 0.004014730453491211, "step": 1215} {"info/global_step": 1216, "train_info/time_within_train_step": 2.757187843322754, "step": 1216} {"train_info/time_between_train_steps": 0.003741741180419922, "step": 1216} {"info/global_step": 1217, "train_info/time_within_train_step": 2.7573161125183105, "step": 1217} {"train_info/time_between_train_steps": 0.003757953643798828, "step": 1217} {"info/global_step": 1218, "train_info/time_within_train_step": 2.7560195922851562, "step": 1218} {"train_info/time_between_train_steps": 0.003662109375, "step": 1218} {"info/global_step": 1219, "train_info/time_within_train_step": 2.757347583770752, "step": 1219} {"train_info/time_between_train_steps": 0.0037348270416259766, "step": 1219} {"info/global_step": 1220, "train_info/time_within_train_step": 2.7554843425750732, "step": 1220} {"train_info/time_between_train_steps": 0.0036139488220214844, "step": 1220} {"info/global_step": 1221, "train_info/time_within_train_step": 2.75722599029541, "step": 1221} {"train_info/time_between_train_steps": 0.0034646987915039062, "step": 1221} {"info/global_step": 1222, "train_info/time_within_train_step": 2.757075071334839, "step": 1222} {"train_info/time_between_train_steps": 0.003496885299682617, "step": 1222} {"info/global_step": 1223, "train_info/time_within_train_step": 2.7556536197662354, "step": 1223} {"train_info/time_between_train_steps": 0.00434112548828125, "step": 1223} {"info/global_step": 1224, "train_info/time_within_train_step": 2.755418539047241, "step": 1224} {"train_info/time_between_train_steps": 0.0034112930297851562, "step": 1224} {"info/global_step": 1225, "train_info/time_within_train_step": 2.754969835281372, "step": 1225} {"train_info/time_between_train_steps": 0.0034942626953125, "step": 1225} {"info/global_step": 1226, "train_info/time_within_train_step": 2.7561066150665283, "step": 1226} {"train_info/time_between_train_steps": 0.003469705581665039, "step": 1226} {"info/global_step": 1227, "train_info/time_within_train_step": 2.7553200721740723, "step": 1227} {"train_info/time_between_train_steps": 0.003496408462524414, "step": 1227} {"info/global_step": 1228, "train_info/time_within_train_step": 2.753999948501587, "step": 1228} {"train_info/time_between_train_steps": 0.17960095405578613, "step": 1228} {"info/global_step": 1229, "train_info/time_within_train_step": 2.7554852962493896, "step": 1229} {"train_info/time_between_train_steps": 0.003406047821044922, "step": 1229} {"info/global_step": 1230, "train_info/time_within_train_step": 2.755169153213501, "step": 1230} {"train_info/time_between_train_steps": 0.003482818603515625, "step": 1230} {"info/global_step": 1231, "train_info/time_within_train_step": 2.755568027496338, "step": 1231} {"train_info/time_between_train_steps": 0.003579378128051758, "step": 1231} {"info/global_step": 1232, "train_info/time_within_train_step": 2.754547119140625, "step": 1232} {"train_info/time_between_train_steps": 0.0035414695739746094, "step": 1232} {"info/global_step": 1233, "train_info/time_within_train_step": 2.7572739124298096, "step": 1233} {"train_info/time_between_train_steps": 0.0035953521728515625, "step": 1233} {"info/global_step": 1234, "train_info/time_within_train_step": 2.7552146911621094, "step": 1234} {"train_info/time_between_train_steps": 0.0035254955291748047, "step": 1234} {"info/global_step": 1235, "train_info/time_within_train_step": 2.756671190261841, "step": 1235} {"train_info/time_between_train_steps": 0.003547191619873047, "step": 1235} {"info/global_step": 1236, "train_info/time_within_train_step": 2.753854751586914, "step": 1236} {"train_info/time_between_train_steps": 0.0035479068756103516, "step": 1236} {"info/global_step": 1237, "train_info/time_within_train_step": 2.7562990188598633, "step": 1237} {"train_info/time_between_train_steps": 0.003508329391479492, "step": 1237} {"info/global_step": 1238, "train_info/time_within_train_step": 2.7561867237091064, "step": 1238} {"train_info/time_between_train_steps": 0.0034875869750976562, "step": 1238} {"info/global_step": 1239, "train_info/time_within_train_step": 2.7565159797668457, "step": 1239} {"train_info/time_between_train_steps": 0.0034875869750976562, "step": 1239} {"info/global_step": 1240, "train_info/time_within_train_step": 2.7558233737945557, "step": 1240} {"train_info/time_between_train_steps": 0.0035250186920166016, "step": 1240} {"info/global_step": 1241, "train_info/time_within_train_step": 2.755150556564331, "step": 1241} {"train_info/time_between_train_steps": 0.003526926040649414, "step": 1241} {"info/global_step": 1242, "train_info/time_within_train_step": 2.755049228668213, "step": 1242} {"train_info/time_between_train_steps": 0.0035479068756103516, "step": 1242} {"info/global_step": 1243, "train_info/time_within_train_step": 2.754647731781006, "step": 1243} {"train_info/time_between_train_steps": 0.003555774688720703, "step": 1243} {"info/global_step": 1244, "train_info/time_within_train_step": 2.755070924758911, "step": 1244} {"train_info/time_between_train_steps": 0.003453493118286133, "step": 1244} {"info/global_step": 1245, "train_info/time_within_train_step": 2.754499673843384, "step": 1245} {"train_info/time_between_train_steps": 0.003504037857055664, "step": 1245} {"info/global_step": 1246, "train_info/time_within_train_step": 3.103872299194336, "step": 1246} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 1246} {"info/global_step": 1247, "train_info/time_within_train_step": 2.7556426525115967, "step": 1247} {"train_info/time_between_train_steps": 0.0035262107849121094, "step": 1247} {"info/global_step": 1248, "train_info/time_within_train_step": 2.7570536136627197, "step": 1248} {"train_info/time_between_train_steps": 0.0035910606384277344, "step": 1248} {"info/global_step": 1249, "train_info/time_within_train_step": 2.7572133541107178, "step": 1249} {"train_info/time_between_train_steps": 0.0035500526428222656, "step": 1249} {"info/global_step": 1250, "train_info/time_within_train_step": 3.29099440574646, "step": 1250} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746569677, "_runtime": 3686}, "step": 1250} {"logs": {"train/loss": 4.7674, "train/learning_rate": 0.0005833333333333333, "train/epoch": 1.04, "_timestamp": 1746569677, "_runtime": 3686}, "step": 1250} {"train_info/time_between_train_steps": 0.014180183410644531, "step": 1250} {"info/global_step": 1251, "train_info/time_within_train_step": 2.7549889087677, "step": 1251} {"train_info/time_between_train_steps": 0.0035207271575927734, "step": 1251} {"info/global_step": 1252, "train_info/time_within_train_step": 2.753110408782959, "step": 1252} {"train_info/time_between_train_steps": 0.0035483837127685547, "step": 1252} {"info/global_step": 1253, "train_info/time_within_train_step": 2.7541463375091553, "step": 1253} {"train_info/time_between_train_steps": 0.003578662872314453, "step": 1253} {"info/global_step": 1254, "train_info/time_within_train_step": 2.7551400661468506, "step": 1254} {"train_info/time_between_train_steps": 0.0034897327423095703, "step": 1254} {"info/global_step": 1255, "train_info/time_within_train_step": 2.755344867706299, "step": 1255} {"train_info/time_between_train_steps": 0.0035669803619384766, "step": 1255} {"info/global_step": 1256, "train_info/time_within_train_step": 2.7543094158172607, "step": 1256} {"train_info/time_between_train_steps": 0.003536701202392578, "step": 1256} {"info/global_step": 1257, "train_info/time_within_train_step": 2.7541275024414062, "step": 1257} {"train_info/time_between_train_steps": 0.0035152435302734375, "step": 1257} {"info/global_step": 1258, "train_info/time_within_train_step": 2.7549939155578613, "step": 1258} {"train_info/time_between_train_steps": 0.0036575794219970703, "step": 1258} {"info/global_step": 1259, "train_info/time_within_train_step": 2.7541091442108154, "step": 1259} {"train_info/time_between_train_steps": 0.00347900390625, "step": 1259} {"info/global_step": 1260, "train_info/time_within_train_step": 2.754584789276123, "step": 1260} {"train_info/time_between_train_steps": 0.0035572052001953125, "step": 1260} {"info/global_step": 1261, "train_info/time_within_train_step": 2.7550318241119385, "step": 1261} {"train_info/time_between_train_steps": 0.0036149024963378906, "step": 1261} {"info/global_step": 1262, "train_info/time_within_train_step": 2.756807327270508, "step": 1262} {"train_info/time_between_train_steps": 0.003686189651489258, "step": 1262} {"info/global_step": 1263, "train_info/time_within_train_step": 2.75666880607605, "step": 1263} {"train_info/time_between_train_steps": 0.0036306381225585938, "step": 1263} {"info/global_step": 1264, "train_info/time_within_train_step": 2.7556984424591064, "step": 1264} {"train_info/time_between_train_steps": 0.0036869049072265625, "step": 1264} {"info/global_step": 1265, "train_info/time_within_train_step": 2.76076602935791, "step": 1265} {"train_info/time_between_train_steps": 0.0036149024963378906, "step": 1265} {"info/global_step": 1266, "train_info/time_within_train_step": 2.7579848766326904, "step": 1266} {"train_info/time_between_train_steps": 0.0037119388580322266, "step": 1266} {"info/global_step": 1267, "train_info/time_within_train_step": 2.757154703140259, "step": 1267} {"train_info/time_between_train_steps": 0.0038170814514160156, "step": 1267} {"info/global_step": 1268, "train_info/time_within_train_step": 2.756110429763794, "step": 1268} {"train_info/time_between_train_steps": 0.0036737918853759766, "step": 1268} {"info/global_step": 1269, "train_info/time_within_train_step": 2.7564847469329834, "step": 1269} {"train_info/time_between_train_steps": 0.0036630630493164062, "step": 1269} {"info/global_step": 1270, "train_info/time_within_train_step": 2.7562623023986816, "step": 1270} {"train_info/time_between_train_steps": 0.003621339797973633, "step": 1270} {"info/global_step": 1271, "train_info/time_within_train_step": 2.7564644813537598, "step": 1271} {"train_info/time_between_train_steps": 0.003720998764038086, "step": 1271} {"info/global_step": 1272, "train_info/time_within_train_step": 2.7551605701446533, "step": 1272} {"train_info/time_between_train_steps": 0.003618001937866211, "step": 1272} {"info/global_step": 1273, "train_info/time_within_train_step": 2.7568185329437256, "step": 1273} {"train_info/time_between_train_steps": 0.0036172866821289062, "step": 1273} {"info/global_step": 1274, "train_info/time_within_train_step": 2.7560791969299316, "step": 1274} {"train_info/time_between_train_steps": 0.003671884536743164, "step": 1274} {"info/global_step": 1275, "train_info/time_within_train_step": 2.7566580772399902, "step": 1275} {"train_info/time_between_train_steps": 0.0036385059356689453, "step": 1275} {"info/global_step": 1276, "train_info/time_within_train_step": 2.7561891078948975, "step": 1276} {"train_info/time_between_train_steps": 0.003653287887573242, "step": 1276} {"info/global_step": 1277, "train_info/time_within_train_step": 2.7550904750823975, "step": 1277} {"train_info/time_between_train_steps": 0.0034627914428710938, "step": 1277} {"info/global_step": 1278, "train_info/time_within_train_step": 2.7547385692596436, "step": 1278} {"train_info/time_between_train_steps": 0.0034716129302978516, "step": 1278} {"info/global_step": 1279, "train_info/time_within_train_step": 2.75508189201355, "step": 1279} {"train_info/time_between_train_steps": 0.0035424232482910156, "step": 1279} {"info/global_step": 1280, "train_info/time_within_train_step": 2.7550251483917236, "step": 1280} {"train_info/time_between_train_steps": 0.0035049915313720703, "step": 1280} {"info/global_step": 1281, "train_info/time_within_train_step": 2.7543203830718994, "step": 1281} {"train_info/time_between_train_steps": 0.0035872459411621094, "step": 1281} {"info/global_step": 1282, "train_info/time_within_train_step": 2.7554538249969482, "step": 1282} {"train_info/time_between_train_steps": 0.0036704540252685547, "step": 1282} {"info/global_step": 1283, "train_info/time_within_train_step": 2.7555675506591797, "step": 1283} {"train_info/time_between_train_steps": 0.0036170482635498047, "step": 1283} {"info/global_step": 1284, "train_info/time_within_train_step": 2.7543513774871826, "step": 1284} {"train_info/time_between_train_steps": 0.0035729408264160156, "step": 1284} {"info/global_step": 1285, "train_info/time_within_train_step": 2.753533124923706, "step": 1285} {"train_info/time_between_train_steps": 0.003645658493041992, "step": 1285} {"info/global_step": 1286, "train_info/time_within_train_step": 2.755807399749756, "step": 1286} {"train_info/time_between_train_steps": 0.0035085678100585938, "step": 1286} {"info/global_step": 1287, "train_info/time_within_train_step": 2.754202127456665, "step": 1287} {"train_info/time_between_train_steps": 0.00345611572265625, "step": 1287} {"info/global_step": 1288, "train_info/time_within_train_step": 2.7560012340545654, "step": 1288} {"train_info/time_between_train_steps": 0.003507375717163086, "step": 1288} {"info/global_step": 1289, "train_info/time_within_train_step": 2.7559874057769775, "step": 1289} {"train_info/time_between_train_steps": 0.0035555362701416016, "step": 1289} {"info/global_step": 1290, "train_info/time_within_train_step": 2.756016254425049, "step": 1290} {"train_info/time_between_train_steps": 0.0035071372985839844, "step": 1290} {"info/global_step": 1291, "train_info/time_within_train_step": 2.9408998489379883, "step": 1291} {"train_info/time_between_train_steps": 0.003279447555541992, "step": 1291} {"info/global_step": 1292, "train_info/time_within_train_step": 2.7540996074676514, "step": 1292} {"train_info/time_between_train_steps": 0.0032770633697509766, "step": 1292} {"info/global_step": 1293, "train_info/time_within_train_step": 2.7547428607940674, "step": 1293} {"train_info/time_between_train_steps": 0.0033555030822753906, "step": 1293} {"info/global_step": 1294, "train_info/time_within_train_step": 2.7534217834472656, "step": 1294} {"train_info/time_between_train_steps": 0.003339529037475586, "step": 1294} {"info/global_step": 1295, "train_info/time_within_train_step": 2.7531189918518066, "step": 1295} {"train_info/time_between_train_steps": 0.003305673599243164, "step": 1295} {"info/global_step": 1296, "train_info/time_within_train_step": 2.751178026199341, "step": 1296} {"train_info/time_between_train_steps": 0.003322601318359375, "step": 1296} {"info/global_step": 1297, "train_info/time_within_train_step": 2.7539916038513184, "step": 1297} {"train_info/time_between_train_steps": 0.0033283233642578125, "step": 1297} {"info/global_step": 1298, "train_info/time_within_train_step": 2.753492593765259, "step": 1298} {"train_info/time_between_train_steps": 0.0032830238342285156, "step": 1298} {"info/global_step": 1299, "train_info/time_within_train_step": 2.7538557052612305, "step": 1299} {"train_info/time_between_train_steps": 0.003301382064819336, "step": 1299} {"info/global_step": 1300, "train_info/time_within_train_step": 2.754157781600952, "step": 1300} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746569815, "_runtime": 3824}, "step": 1300} {"logs": {"train/loss": 4.7077, "train/learning_rate": 0.00058, "train/epoch": 1.04, "_timestamp": 1746569815, "_runtime": 3824}, "step": 1300} {"train_info/time_between_train_steps": 0.01417994499206543, "step": 1300} {"info/global_step": 1301, "train_info/time_within_train_step": 2.7523746490478516, "step": 1301} {"train_info/time_between_train_steps": 0.0032525062561035156, "step": 1301} {"info/global_step": 1302, "train_info/time_within_train_step": 2.7542760372161865, "step": 1302} {"train_info/time_between_train_steps": 0.0033266544342041016, "step": 1302} {"info/global_step": 1303, "train_info/time_within_train_step": 2.7544238567352295, "step": 1303} {"train_info/time_between_train_steps": 0.003298521041870117, "step": 1303} {"info/global_step": 1304, "train_info/time_within_train_step": 2.754666328430176, "step": 1304} {"train_info/time_between_train_steps": 0.0032796859741210938, "step": 1304} {"info/global_step": 1305, "train_info/time_within_train_step": 2.7557451725006104, "step": 1305} {"train_info/time_between_train_steps": 0.0033638477325439453, "step": 1305} {"info/global_step": 1306, "train_info/time_within_train_step": 2.7543346881866455, "step": 1306} {"train_info/time_between_train_steps": 0.003308534622192383, "step": 1306} {"info/global_step": 1307, "train_info/time_within_train_step": 2.7537968158721924, "step": 1307} {"train_info/time_between_train_steps": 0.0034415721893310547, "step": 1307} {"info/global_step": 1308, "train_info/time_within_train_step": 2.7556426525115967, "step": 1308} {"train_info/time_between_train_steps": 0.003471851348876953, "step": 1308} {"info/global_step": 1309, "train_info/time_within_train_step": 2.7554683685302734, "step": 1309} {"train_info/time_between_train_steps": 0.0036301612854003906, "step": 1309} {"info/global_step": 1310, "train_info/time_within_train_step": 2.7564117908477783, "step": 1310} {"train_info/time_between_train_steps": 0.0035669803619384766, "step": 1310} {"info/global_step": 1311, "train_info/time_within_train_step": 2.7556967735290527, "step": 1311} {"train_info/time_between_train_steps": 0.003596782684326172, "step": 1311} {"info/global_step": 1312, "train_info/time_within_train_step": 2.7536208629608154, "step": 1312} {"train_info/time_between_train_steps": 0.0035400390625, "step": 1312} {"info/global_step": 1313, "train_info/time_within_train_step": 2.7552285194396973, "step": 1313} {"train_info/time_between_train_steps": 0.0035266876220703125, "step": 1313} {"info/global_step": 1314, "train_info/time_within_train_step": 2.7527031898498535, "step": 1314} {"train_info/time_between_train_steps": 0.0035355091094970703, "step": 1314} {"info/global_step": 1315, "train_info/time_within_train_step": 2.7527916431427, "step": 1315} {"train_info/time_between_train_steps": 0.0035033226013183594, "step": 1315} {"info/global_step": 1316, "train_info/time_within_train_step": 2.754934549331665, "step": 1316} {"train_info/time_between_train_steps": 0.0035393238067626953, "step": 1316} {"info/global_step": 1317, "train_info/time_within_train_step": 2.754747152328491, "step": 1317} {"train_info/time_between_train_steps": 0.0035219192504882812, "step": 1317} {"info/global_step": 1318, "train_info/time_within_train_step": 2.7535433769226074, "step": 1318} {"train_info/time_between_train_steps": 0.003527402877807617, "step": 1318} {"info/global_step": 1319, "train_info/time_within_train_step": 2.7549941539764404, "step": 1319} {"train_info/time_between_train_steps": 0.0036001205444335938, "step": 1319} {"info/global_step": 1320, "train_info/time_within_train_step": 2.7553179264068604, "step": 1320} {"train_info/time_between_train_steps": 0.003523588180541992, "step": 1320} {"info/global_step": 1321, "train_info/time_within_train_step": 2.7555596828460693, "step": 1321} {"train_info/time_between_train_steps": 0.003514528274536133, "step": 1321} {"info/global_step": 1322, "train_info/time_within_train_step": 2.75553035736084, "step": 1322} {"train_info/time_between_train_steps": 0.0035178661346435547, "step": 1322} {"info/global_step": 1323, "train_info/time_within_train_step": 2.7561373710632324, "step": 1323} {"train_info/time_between_train_steps": 0.00347900390625, "step": 1323} {"info/global_step": 1324, "train_info/time_within_train_step": 2.7548577785491943, "step": 1324} {"train_info/time_between_train_steps": 0.003529071807861328, "step": 1324} {"info/global_step": 1325, "train_info/time_within_train_step": 2.7548470497131348, "step": 1325} {"train_info/time_between_train_steps": 0.0035610198974609375, "step": 1325} {"info/global_step": 1326, "train_info/time_within_train_step": 2.754345655441284, "step": 1326} {"train_info/time_between_train_steps": 0.0034961700439453125, "step": 1326} {"info/global_step": 1327, "train_info/time_within_train_step": 2.7539937496185303, "step": 1327} {"train_info/time_between_train_steps": 0.0035834312438964844, "step": 1327} {"info/global_step": 1328, "train_info/time_within_train_step": 2.754929780960083, "step": 1328} {"train_info/time_between_train_steps": 0.0034661293029785156, "step": 1328} {"info/global_step": 1329, "train_info/time_within_train_step": 2.7542686462402344, "step": 1329} {"train_info/time_between_train_steps": 0.0034623146057128906, "step": 1329} {"info/global_step": 1330, "train_info/time_within_train_step": 2.754237651824951, "step": 1330} {"train_info/time_between_train_steps": 0.0034296512603759766, "step": 1330} {"info/global_step": 1331, "train_info/time_within_train_step": 2.7545390129089355, "step": 1331} {"train_info/time_between_train_steps": 0.003535032272338867, "step": 1331} {"info/global_step": 1332, "train_info/time_within_train_step": 2.7537734508514404, "step": 1332} {"train_info/time_between_train_steps": 0.00341033935546875, "step": 1332} {"info/global_step": 1333, "train_info/time_within_train_step": 2.7554142475128174, "step": 1333} {"train_info/time_between_train_steps": 0.003480195999145508, "step": 1333} {"info/global_step": 1334, "train_info/time_within_train_step": 2.753702163696289, "step": 1334} {"train_info/time_between_train_steps": 0.0035865306854248047, "step": 1334} {"info/global_step": 1335, "train_info/time_within_train_step": 3.096853494644165, "step": 1335} {"train_info/time_between_train_steps": 0.0032367706298828125, "step": 1335} {"info/global_step": 1336, "train_info/time_within_train_step": 2.7550854682922363, "step": 1336} {"train_info/time_between_train_steps": 0.003256082534790039, "step": 1336} {"info/global_step": 1337, "train_info/time_within_train_step": 2.754683256149292, "step": 1337} {"train_info/time_between_train_steps": 0.003285646438598633, "step": 1337} {"info/global_step": 1338, "train_info/time_within_train_step": 2.7537543773651123, "step": 1338} {"train_info/time_between_train_steps": 0.004118680953979492, "step": 1338} {"info/global_step": 1339, "train_info/time_within_train_step": 2.753960609436035, "step": 1339} {"train_info/time_between_train_steps": 0.0032358169555664062, "step": 1339} {"info/global_step": 1340, "train_info/time_within_train_step": 2.7546181678771973, "step": 1340} {"train_info/time_between_train_steps": 0.003281831741333008, "step": 1340} {"info/global_step": 1341, "train_info/time_within_train_step": 2.7540390491485596, "step": 1341} {"train_info/time_between_train_steps": 0.003509044647216797, "step": 1341} {"info/global_step": 1342, "train_info/time_within_train_step": 2.753664016723633, "step": 1342} {"train_info/time_between_train_steps": 0.003287076950073242, "step": 1342} {"info/global_step": 1343, "train_info/time_within_train_step": 2.7534596920013428, "step": 1343} {"train_info/time_between_train_steps": 0.003287792205810547, "step": 1343} {"info/global_step": 1344, "train_info/time_within_train_step": 2.754821538925171, "step": 1344} {"train_info/time_between_train_steps": 0.003277301788330078, "step": 1344} {"info/global_step": 1345, "train_info/time_within_train_step": 2.7546536922454834, "step": 1345} {"train_info/time_between_train_steps": 0.0033178329467773438, "step": 1345} {"info/global_step": 1346, "train_info/time_within_train_step": 2.7538089752197266, "step": 1346} {"train_info/time_between_train_steps": 0.003202199935913086, "step": 1346} {"info/global_step": 1347, "train_info/time_within_train_step": 2.756134271621704, "step": 1347} {"train_info/time_between_train_steps": 0.0032777786254882812, "step": 1347} {"info/global_step": 1348, "train_info/time_within_train_step": 2.7540855407714844, "step": 1348} {"train_info/time_between_train_steps": 0.0032892227172851562, "step": 1348} {"info/global_step": 1349, "train_info/time_within_train_step": 2.7545173168182373, "step": 1349} {"train_info/time_between_train_steps": 0.0032944679260253906, "step": 1349} {"info/global_step": 1350, "train_info/time_within_train_step": 2.754587411880493, "step": 1350} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746569954, "_runtime": 3963}, "step": 1350} {"logs": {"train/loss": 4.6788, "train/learning_rate": 0.0005766666666666666, "train/epoch": 1.05, "_timestamp": 1746569954, "_runtime": 3963}, "step": 1350} {"train_info/time_between_train_steps": 0.014238595962524414, "step": 1350} {"info/global_step": 1351, "train_info/time_within_train_step": 2.7549686431884766, "step": 1351} {"train_info/time_between_train_steps": 0.0032432079315185547, "step": 1351} {"info/global_step": 1352, "train_info/time_within_train_step": 2.755047082901001, "step": 1352} {"train_info/time_between_train_steps": 0.0032303333282470703, "step": 1352} {"info/global_step": 1353, "train_info/time_within_train_step": 2.754059076309204, "step": 1353} {"train_info/time_between_train_steps": 0.09894680976867676, "step": 1353} {"info/global_step": 1354, "train_info/time_within_train_step": 2.758518695831299, "step": 1354} {"train_info/time_between_train_steps": 0.0032300949096679688, "step": 1354} {"info/global_step": 1355, "train_info/time_within_train_step": 2.7541658878326416, "step": 1355} {"train_info/time_between_train_steps": 0.0032541751861572266, "step": 1355} {"info/global_step": 1356, "train_info/time_within_train_step": 2.753204822540283, "step": 1356} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 1356} {"info/global_step": 1357, "train_info/time_within_train_step": 2.754331350326538, "step": 1357} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 1357} {"info/global_step": 1358, "train_info/time_within_train_step": 2.7553341388702393, "step": 1358} {"train_info/time_between_train_steps": 0.0032415390014648438, "step": 1358} {"info/global_step": 1359, "train_info/time_within_train_step": 2.754427671432495, "step": 1359} {"train_info/time_between_train_steps": 0.0032088756561279297, "step": 1359} {"info/global_step": 1360, "train_info/time_within_train_step": 2.7553000450134277, "step": 1360} {"train_info/time_between_train_steps": 0.003244161605834961, "step": 1360} {"info/global_step": 1361, "train_info/time_within_train_step": 2.75427508354187, "step": 1361} {"train_info/time_between_train_steps": 0.0031871795654296875, "step": 1361} {"info/global_step": 1362, "train_info/time_within_train_step": 2.7547945976257324, "step": 1362} {"train_info/time_between_train_steps": 0.003223419189453125, "step": 1362} {"info/global_step": 1363, "train_info/time_within_train_step": 2.7544023990631104, "step": 1363} {"train_info/time_between_train_steps": 0.0032062530517578125, "step": 1363} {"info/global_step": 1364, "train_info/time_within_train_step": 2.754732847213745, "step": 1364} {"train_info/time_between_train_steps": 0.0032346248626708984, "step": 1364} {"info/global_step": 1365, "train_info/time_within_train_step": 2.7545549869537354, "step": 1365} {"train_info/time_between_train_steps": 0.003255605697631836, "step": 1365} {"info/global_step": 1366, "train_info/time_within_train_step": 2.7529022693634033, "step": 1366} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 1366} {"info/global_step": 1367, "train_info/time_within_train_step": 2.754443407058716, "step": 1367} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 1367} {"info/global_step": 1368, "train_info/time_within_train_step": 2.7537007331848145, "step": 1368} {"train_info/time_between_train_steps": 0.003270387649536133, "step": 1368} {"info/global_step": 1369, "train_info/time_within_train_step": 2.754779100418091, "step": 1369} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 1369} {"info/global_step": 1370, "train_info/time_within_train_step": 2.755129814147949, "step": 1370} {"train_info/time_between_train_steps": 0.003233671188354492, "step": 1370} {"info/global_step": 1371, "train_info/time_within_train_step": 2.7546041011810303, "step": 1371} {"train_info/time_between_train_steps": 0.0032889842987060547, "step": 1371} {"info/global_step": 1372, "train_info/time_within_train_step": 2.7544188499450684, "step": 1372} {"train_info/time_between_train_steps": 0.003232717514038086, "step": 1372} {"info/global_step": 1373, "train_info/time_within_train_step": 2.7536020278930664, "step": 1373} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 1373} {"info/global_step": 1374, "train_info/time_within_train_step": 2.7545411586761475, "step": 1374} {"train_info/time_between_train_steps": 0.003278970718383789, "step": 1374} {"info/global_step": 1375, "train_info/time_within_train_step": 2.754554033279419, "step": 1375} {"train_info/time_between_train_steps": 0.003242015838623047, "step": 1375} {"info/global_step": 1376, "train_info/time_within_train_step": 2.7556509971618652, "step": 1376} {"train_info/time_between_train_steps": 0.003368377685546875, "step": 1376} {"info/global_step": 1377, "train_info/time_within_train_step": 2.7554266452789307, "step": 1377} {"train_info/time_between_train_steps": 0.0034046173095703125, "step": 1377} {"info/global_step": 1378, "train_info/time_within_train_step": 2.753538131713867, "step": 1378} {"train_info/time_between_train_steps": 0.003469228744506836, "step": 1378} {"info/global_step": 1379, "train_info/time_within_train_step": 2.7566165924072266, "step": 1379} {"train_info/time_between_train_steps": 0.003347158432006836, "step": 1379} {"info/global_step": 1380, "train_info/time_within_train_step": 2.7557625770568848, "step": 1380} {"train_info/time_between_train_steps": 0.0033702850341796875, "step": 1380} {"info/global_step": 1381, "train_info/time_within_train_step": 2.755028009414673, "step": 1381} {"train_info/time_between_train_steps": 0.0033888816833496094, "step": 1381} {"info/global_step": 1382, "train_info/time_within_train_step": 2.75514817237854, "step": 1382} {"train_info/time_between_train_steps": 0.0034453868865966797, "step": 1382} {"info/global_step": 1383, "train_info/time_within_train_step": 2.754047393798828, "step": 1383} {"train_info/time_between_train_steps": 0.0033762454986572266, "step": 1383} {"info/global_step": 1384, "train_info/time_within_train_step": 2.755751609802246, "step": 1384} {"train_info/time_between_train_steps": 0.003329753875732422, "step": 1384} {"info/global_step": 1385, "train_info/time_within_train_step": 2.754409074783325, "step": 1385} {"train_info/time_between_train_steps": 0.0033435821533203125, "step": 1385} {"info/global_step": 1386, "train_info/time_within_train_step": 2.754075288772583, "step": 1386} {"train_info/time_between_train_steps": 0.0033130645751953125, "step": 1386} {"info/global_step": 1387, "train_info/time_within_train_step": 2.7561724185943604, "step": 1387} {"train_info/time_between_train_steps": 0.00344085693359375, "step": 1387} {"info/global_step": 1388, "train_info/time_within_train_step": 2.7557218074798584, "step": 1388} {"train_info/time_between_train_steps": 0.003450155258178711, "step": 1388} {"info/global_step": 1389, "train_info/time_within_train_step": 2.9978396892547607, "step": 1389} {"train_info/time_between_train_steps": 0.0034058094024658203, "step": 1389} {"info/global_step": 1390, "train_info/time_within_train_step": 2.7567849159240723, "step": 1390} {"train_info/time_between_train_steps": 0.0034132003784179688, "step": 1390} {"info/global_step": 1391, "train_info/time_within_train_step": 2.7563936710357666, "step": 1391} {"train_info/time_between_train_steps": 0.0034017562866210938, "step": 1391} {"info/global_step": 1392, "train_info/time_within_train_step": 2.7563960552215576, "step": 1392} {"train_info/time_between_train_steps": 0.0034220218658447266, "step": 1392} {"info/global_step": 1393, "train_info/time_within_train_step": 2.7554843425750732, "step": 1393} {"train_info/time_between_train_steps": 0.0034415721893310547, "step": 1393} {"info/global_step": 1394, "train_info/time_within_train_step": 2.755680799484253, "step": 1394} {"train_info/time_between_train_steps": 0.019977569580078125, "step": 1394} {"info/global_step": 1395, "train_info/time_within_train_step": 2.75525164604187, "step": 1395} {"train_info/time_between_train_steps": 0.003123760223388672, "step": 1395} {"info/global_step": 1396, "train_info/time_within_train_step": 2.7552120685577393, "step": 1396} {"train_info/time_between_train_steps": 0.0030226707458496094, "step": 1396} {"info/global_step": 1397, "train_info/time_within_train_step": 2.755125045776367, "step": 1397} {"train_info/time_between_train_steps": 0.003007650375366211, "step": 1397} {"info/global_step": 1398, "train_info/time_within_train_step": 2.7536110877990723, "step": 1398} {"train_info/time_between_train_steps": 0.0029556751251220703, "step": 1398} {"info/global_step": 1399, "train_info/time_within_train_step": 2.753633499145508, "step": 1399} {"train_info/time_between_train_steps": 0.002923250198364258, "step": 1399} {"info/global_step": 1400, "train_info/time_within_train_step": 2.7525343894958496, "step": 1400} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746570093, "_runtime": 4102}, "step": 1400} {"logs": {"train/loss": 4.6554, "train/learning_rate": 0.0005733333333333334, "train/epoch": 1.05, "_timestamp": 1746570093, "_runtime": 4102}, "step": 1400} {"train_info/time_between_train_steps": 18.945873737335205, "step": 1400} {"info/global_step": 1401, "train_info/time_within_train_step": 2.5378236770629883, "step": 1401} {"train_info/time_between_train_steps": 0.002911090850830078, "step": 1401} {"info/global_step": 1402, "train_info/time_within_train_step": 2.565776824951172, "step": 1402} {"train_info/time_between_train_steps": 0.0030257701873779297, "step": 1402} {"info/global_step": 1403, "train_info/time_within_train_step": 2.6839752197265625, "step": 1403} {"train_info/time_between_train_steps": 0.003054380416870117, "step": 1403} {"info/global_step": 1404, "train_info/time_within_train_step": 2.7298998832702637, "step": 1404} {"train_info/time_between_train_steps": 0.0030798912048339844, "step": 1404} {"info/global_step": 1405, "train_info/time_within_train_step": 2.7504591941833496, "step": 1405} {"train_info/time_between_train_steps": 0.003027200698852539, "step": 1405} {"info/global_step": 1406, "train_info/time_within_train_step": 2.7560884952545166, "step": 1406} {"train_info/time_between_train_steps": 0.0030324459075927734, "step": 1406} {"info/global_step": 1407, "train_info/time_within_train_step": 2.7584211826324463, "step": 1407} {"train_info/time_between_train_steps": 0.0030722618103027344, "step": 1407} {"info/global_step": 1408, "train_info/time_within_train_step": 2.754483699798584, "step": 1408} {"train_info/time_between_train_steps": 0.0030891895294189453, "step": 1408} {"info/global_step": 1409, "train_info/time_within_train_step": 2.7564260959625244, "step": 1409} {"train_info/time_between_train_steps": 0.0029900074005126953, "step": 1409} {"info/global_step": 1410, "train_info/time_within_train_step": 2.756044864654541, "step": 1410} {"train_info/time_between_train_steps": 0.0030472278594970703, "step": 1410} {"info/global_step": 1411, "train_info/time_within_train_step": 2.7555840015411377, "step": 1411} {"train_info/time_between_train_steps": 0.0029976367950439453, "step": 1411} {"info/global_step": 1412, "train_info/time_within_train_step": 2.7571890354156494, "step": 1412} {"train_info/time_between_train_steps": 0.0030527114868164062, "step": 1412} {"info/global_step": 1413, "train_info/time_within_train_step": 2.754899263381958, "step": 1413} {"train_info/time_between_train_steps": 0.0030214786529541016, "step": 1413} {"info/global_step": 1414, "train_info/time_within_train_step": 2.7560923099517822, "step": 1414} {"train_info/time_between_train_steps": 0.002885580062866211, "step": 1414} {"info/global_step": 1415, "train_info/time_within_train_step": 2.7561819553375244, "step": 1415} {"train_info/time_between_train_steps": 0.002883434295654297, "step": 1415} {"info/global_step": 1416, "train_info/time_within_train_step": 2.7563700675964355, "step": 1416} {"train_info/time_between_train_steps": 0.002909421920776367, "step": 1416} {"info/global_step": 1417, "train_info/time_within_train_step": 2.754427909851074, "step": 1417} {"train_info/time_between_train_steps": 0.0029294490814208984, "step": 1417} {"info/global_step": 1418, "train_info/time_within_train_step": 2.754891872406006, "step": 1418} {"train_info/time_between_train_steps": 0.0028939247131347656, "step": 1418} {"info/global_step": 1419, "train_info/time_within_train_step": 2.7548787593841553, "step": 1419} {"train_info/time_between_train_steps": 0.0029439926147460938, "step": 1419} {"info/global_step": 1420, "train_info/time_within_train_step": 2.7549824714660645, "step": 1420} {"train_info/time_between_train_steps": 0.0029010772705078125, "step": 1420} {"info/global_step": 1421, "train_info/time_within_train_step": 2.7552237510681152, "step": 1421} {"train_info/time_between_train_steps": 0.002915620803833008, "step": 1421} {"info/global_step": 1422, "train_info/time_within_train_step": 2.7556416988372803, "step": 1422} {"train_info/time_between_train_steps": 0.0028939247131347656, "step": 1422} {"info/global_step": 1423, "train_info/time_within_train_step": 2.7539501190185547, "step": 1423} {"train_info/time_between_train_steps": 0.002933979034423828, "step": 1423} {"info/global_step": 1424, "train_info/time_within_train_step": 2.7545673847198486, "step": 1424} {"train_info/time_between_train_steps": 0.002907991409301758, "step": 1424} {"info/global_step": 1425, "train_info/time_within_train_step": 2.7547950744628906, "step": 1425} {"train_info/time_between_train_steps": 0.0029342174530029297, "step": 1425} {"info/global_step": 1426, "train_info/time_within_train_step": 2.7555816173553467, "step": 1426} {"train_info/time_between_train_steps": 0.0029251575469970703, "step": 1426} {"info/global_step": 1427, "train_info/time_within_train_step": 2.7545018196105957, "step": 1427} {"train_info/time_between_train_steps": 0.0029006004333496094, "step": 1427} {"info/global_step": 1428, "train_info/time_within_train_step": 2.7543766498565674, "step": 1428} {"train_info/time_between_train_steps": 0.0029556751251220703, "step": 1428} {"info/global_step": 1429, "train_info/time_within_train_step": 2.754969835281372, "step": 1429} {"train_info/time_between_train_steps": 0.0029456615447998047, "step": 1429} {"info/global_step": 1430, "train_info/time_within_train_step": 2.7558250427246094, "step": 1430} {"train_info/time_between_train_steps": 0.002948284149169922, "step": 1430} {"info/global_step": 1431, "train_info/time_within_train_step": 2.7566845417022705, "step": 1431} {"train_info/time_between_train_steps": 0.002947092056274414, "step": 1431} {"info/global_step": 1432, "train_info/time_within_train_step": 2.7550745010375977, "step": 1432} {"train_info/time_between_train_steps": 0.002942800521850586, "step": 1432} {"info/global_step": 1433, "train_info/time_within_train_step": 2.7547686100006104, "step": 1433} {"train_info/time_between_train_steps": 0.0030274391174316406, "step": 1433} {"info/global_step": 1434, "train_info/time_within_train_step": 2.7557876110076904, "step": 1434} {"train_info/time_between_train_steps": 0.0029702186584472656, "step": 1434} {"info/global_step": 1435, "train_info/time_within_train_step": 2.75561785697937, "step": 1435} {"train_info/time_between_train_steps": 0.0030319690704345703, "step": 1435} {"info/global_step": 1436, "train_info/time_within_train_step": 2.7532246112823486, "step": 1436} {"train_info/time_between_train_steps": 0.0029914379119873047, "step": 1436} {"info/global_step": 1437, "train_info/time_within_train_step": 2.7549619674682617, "step": 1437} {"train_info/time_between_train_steps": 0.0030393600463867188, "step": 1437} {"info/global_step": 1438, "train_info/time_within_train_step": 2.754591703414917, "step": 1438} {"train_info/time_between_train_steps": 0.0029604434967041016, "step": 1438} {"info/global_step": 1439, "train_info/time_within_train_step": 2.7554001808166504, "step": 1439} {"train_info/time_between_train_steps": 0.002994537353515625, "step": 1439} {"info/global_step": 1440, "train_info/time_within_train_step": 2.7554244995117188, "step": 1440} {"train_info/time_between_train_steps": 0.0030281543731689453, "step": 1440} {"info/global_step": 1441, "train_info/time_within_train_step": 2.756176233291626, "step": 1441} {"train_info/time_between_train_steps": 0.003039121627807617, "step": 1441} {"info/global_step": 1442, "train_info/time_within_train_step": 2.7550981044769287, "step": 1442} {"train_info/time_between_train_steps": 0.0030400753021240234, "step": 1442} {"info/global_step": 1443, "train_info/time_within_train_step": 2.954604148864746, "step": 1443} {"train_info/time_between_train_steps": 0.0029947757720947266, "step": 1443} {"info/global_step": 1444, "train_info/time_within_train_step": 2.7554643154144287, "step": 1444} {"train_info/time_between_train_steps": 0.0029745101928710938, "step": 1444} {"info/global_step": 1445, "train_info/time_within_train_step": 2.7573020458221436, "step": 1445} {"train_info/time_between_train_steps": 0.003003835678100586, "step": 1445} {"info/global_step": 1446, "train_info/time_within_train_step": 2.755425214767456, "step": 1446} {"train_info/time_between_train_steps": 0.0029425621032714844, "step": 1446} {"info/global_step": 1447, "train_info/time_within_train_step": 2.757030963897705, "step": 1447} {"train_info/time_between_train_steps": 0.003116130828857422, "step": 1447} {"info/global_step": 1448, "train_info/time_within_train_step": 2.75795316696167, "step": 1448} {"train_info/time_between_train_steps": 0.0029993057250976562, "step": 1448} {"info/global_step": 1449, "train_info/time_within_train_step": 2.7586302757263184, "step": 1449} {"train_info/time_between_train_steps": 0.0030260086059570312, "step": 1449} {"info/global_step": 1450, "train_info/time_within_train_step": 2.757216215133667, "step": 1450} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746570250, "_runtime": 4259}, "step": 1450} {"logs": {"train/loss": 4.6246, "train/learning_rate": 0.00057, "train/epoch": 1.06, "_timestamp": 1746570250, "_runtime": 4259}, "step": 1450} {"train_info/time_between_train_steps": 0.01737809181213379, "step": 1450} {"info/global_step": 1451, "train_info/time_within_train_step": 2.7570712566375732, "step": 1451} {"train_info/time_between_train_steps": 0.0030400753021240234, "step": 1451} {"info/global_step": 1452, "train_info/time_within_train_step": 2.7590532302856445, "step": 1452} {"train_info/time_between_train_steps": 0.003022909164428711, "step": 1452} {"info/global_step": 1453, "train_info/time_within_train_step": 2.756648540496826, "step": 1453} {"train_info/time_between_train_steps": 0.003058195114135742, "step": 1453} {"info/global_step": 1454, "train_info/time_within_train_step": 2.7598729133605957, "step": 1454} {"train_info/time_between_train_steps": 0.0030481815338134766, "step": 1454} {"info/global_step": 1455, "train_info/time_within_train_step": 2.7542097568511963, "step": 1455} {"train_info/time_between_train_steps": 0.003000020980834961, "step": 1455} {"info/global_step": 1456, "train_info/time_within_train_step": 2.757441997528076, "step": 1456} {"train_info/time_between_train_steps": 0.0030570030212402344, "step": 1456} {"info/global_step": 1457, "train_info/time_within_train_step": 2.757305383682251, "step": 1457} {"train_info/time_between_train_steps": 0.002989053726196289, "step": 1457} {"info/global_step": 1458, "train_info/time_within_train_step": 2.7556262016296387, "step": 1458} {"train_info/time_between_train_steps": 0.003113985061645508, "step": 1458} {"info/global_step": 1459, "train_info/time_within_train_step": 2.756692409515381, "step": 1459} {"train_info/time_between_train_steps": 0.002878904342651367, "step": 1459} {"info/global_step": 1460, "train_info/time_within_train_step": 2.7541465759277344, "step": 1460} {"train_info/time_between_train_steps": 0.0028934478759765625, "step": 1460} {"info/global_step": 1461, "train_info/time_within_train_step": 2.754659652709961, "step": 1461} {"train_info/time_between_train_steps": 0.002912759780883789, "step": 1461} {"info/global_step": 1462, "train_info/time_within_train_step": 2.754991054534912, "step": 1462} {"train_info/time_between_train_steps": 0.002892732620239258, "step": 1462} {"info/global_step": 1463, "train_info/time_within_train_step": 2.7527077198028564, "step": 1463} {"train_info/time_between_train_steps": 0.002935171127319336, "step": 1463} {"info/global_step": 1464, "train_info/time_within_train_step": 2.7558417320251465, "step": 1464} {"train_info/time_between_train_steps": 0.002935171127319336, "step": 1464} {"info/global_step": 1465, "train_info/time_within_train_step": 2.7540740966796875, "step": 1465} {"train_info/time_between_train_steps": 0.0030612945556640625, "step": 1465} {"info/global_step": 1466, "train_info/time_within_train_step": 2.759045124053955, "step": 1466} {"train_info/time_between_train_steps": 0.0029745101928710938, "step": 1466} {"info/global_step": 1467, "train_info/time_within_train_step": 2.7578608989715576, "step": 1467} {"train_info/time_between_train_steps": 0.0030345916748046875, "step": 1467} {"info/global_step": 1468, "train_info/time_within_train_step": 2.7580366134643555, "step": 1468} {"train_info/time_between_train_steps": 0.0029702186584472656, "step": 1468} {"info/global_step": 1469, "train_info/time_within_train_step": 2.755763053894043, "step": 1469} {"train_info/time_between_train_steps": 0.0030367374420166016, "step": 1469} {"info/global_step": 1470, "train_info/time_within_train_step": 2.7565925121307373, "step": 1470} {"train_info/time_between_train_steps": 0.0030219554901123047, "step": 1470} {"info/global_step": 1471, "train_info/time_within_train_step": 2.756061553955078, "step": 1471} {"train_info/time_between_train_steps": 0.003004789352416992, "step": 1471} {"info/global_step": 1472, "train_info/time_within_train_step": 2.7567977905273438, "step": 1472} {"train_info/time_between_train_steps": 0.0030603408813476562, "step": 1472} {"info/global_step": 1473, "train_info/time_within_train_step": 2.7566449642181396, "step": 1473} {"train_info/time_between_train_steps": 0.003072023391723633, "step": 1473} {"info/global_step": 1474, "train_info/time_within_train_step": 2.7552506923675537, "step": 1474} {"train_info/time_between_train_steps": 0.0032563209533691406, "step": 1474} {"info/global_step": 1475, "train_info/time_within_train_step": 2.753941297531128, "step": 1475} {"train_info/time_between_train_steps": 0.003009319305419922, "step": 1475} {"info/global_step": 1476, "train_info/time_within_train_step": 2.7540395259857178, "step": 1476} {"train_info/time_between_train_steps": 0.002980470657348633, "step": 1476} {"info/global_step": 1477, "train_info/time_within_train_step": 2.755643129348755, "step": 1477} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 1477} {"info/global_step": 1478, "train_info/time_within_train_step": 2.7555553913116455, "step": 1478} {"train_info/time_between_train_steps": 0.003002643585205078, "step": 1478} {"info/global_step": 1479, "train_info/time_within_train_step": 2.7549140453338623, "step": 1479} {"train_info/time_between_train_steps": 0.002966165542602539, "step": 1479} {"info/global_step": 1480, "train_info/time_within_train_step": 2.7552835941314697, "step": 1480} {"train_info/time_between_train_steps": 0.002967357635498047, "step": 1480} {"info/global_step": 1481, "train_info/time_within_train_step": 2.756002426147461, "step": 1481} {"train_info/time_between_train_steps": 0.0029985904693603516, "step": 1481} {"info/global_step": 1482, "train_info/time_within_train_step": 2.755880117416382, "step": 1482} {"train_info/time_between_train_steps": 0.003007650375366211, "step": 1482} {"info/global_step": 1483, "train_info/time_within_train_step": 2.755643367767334, "step": 1483} {"train_info/time_between_train_steps": 0.002950906753540039, "step": 1483} {"info/global_step": 1484, "train_info/time_within_train_step": 2.754467725753784, "step": 1484} {"train_info/time_between_train_steps": 0.0029850006103515625, "step": 1484} {"info/global_step": 1485, "train_info/time_within_train_step": 2.925973415374756, "step": 1485} {"train_info/time_between_train_steps": 0.0029959678649902344, "step": 1485} {"info/global_step": 1486, "train_info/time_within_train_step": 2.7540223598480225, "step": 1486} {"train_info/time_between_train_steps": 0.0029609203338623047, "step": 1486} {"info/global_step": 1487, "train_info/time_within_train_step": 2.781266450881958, "step": 1487} {"train_info/time_between_train_steps": 0.002991914749145508, "step": 1487} {"info/global_step": 1488, "train_info/time_within_train_step": 2.7544281482696533, "step": 1488} {"train_info/time_between_train_steps": 0.002973318099975586, "step": 1488} {"info/global_step": 1489, "train_info/time_within_train_step": 2.7548577785491943, "step": 1489} {"train_info/time_between_train_steps": 0.0029697418212890625, "step": 1489} {"info/global_step": 1490, "train_info/time_within_train_step": 2.7544844150543213, "step": 1490} {"train_info/time_between_train_steps": 0.0029647350311279297, "step": 1490} {"info/global_step": 1491, "train_info/time_within_train_step": 2.7528765201568604, "step": 1491} {"train_info/time_between_train_steps": 0.0029654502868652344, "step": 1491} {"info/global_step": 1492, "train_info/time_within_train_step": 2.7556512355804443, "step": 1492} {"train_info/time_between_train_steps": 0.0030934810638427734, "step": 1492} {"info/global_step": 1493, "train_info/time_within_train_step": 2.755528211593628, "step": 1493} {"train_info/time_between_train_steps": 0.0029096603393554688, "step": 1493} {"info/global_step": 1494, "train_info/time_within_train_step": 2.7557497024536133, "step": 1494} {"train_info/time_between_train_steps": 0.002965688705444336, "step": 1494} {"info/global_step": 1495, "train_info/time_within_train_step": 2.7550101280212402, "step": 1495} {"train_info/time_between_train_steps": 0.003068685531616211, "step": 1495} {"info/global_step": 1496, "train_info/time_within_train_step": 2.7559902667999268, "step": 1496} {"train_info/time_between_train_steps": 0.0029702186584472656, "step": 1496} {"info/global_step": 1497, "train_info/time_within_train_step": 2.7551610469818115, "step": 1497} {"train_info/time_between_train_steps": 0.00296783447265625, "step": 1497} {"info/global_step": 1498, "train_info/time_within_train_step": 2.756140947341919, "step": 1498} {"train_info/time_between_train_steps": 0.0029671192169189453, "step": 1498} {"info/global_step": 1499, "train_info/time_within_train_step": 2.755344867706299, "step": 1499} {"train_info/time_between_train_steps": 0.003051280975341797, "step": 1499} {"info/global_step": 1500, "train_info/time_within_train_step": 3.3047373294830322, "step": 1500} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746570389, "_runtime": 4398}, "step": 1500} {"logs": {"train/loss": 4.5845, "train/learning_rate": 0.0005666666666666666, "train/epoch": 1.06, "_timestamp": 1746570389, "_runtime": 4398}, "step": 1500} {"train_info/time_between_train_steps": 0.012725353240966797, "step": 1500} {"info/global_step": 1501, "train_info/time_within_train_step": 2.75640606880188, "step": 1501} {"train_info/time_between_train_steps": 0.003109455108642578, "step": 1501} {"info/global_step": 1502, "train_info/time_within_train_step": 2.7568888664245605, "step": 1502} {"train_info/time_between_train_steps": 0.0030612945556640625, "step": 1502} {"info/global_step": 1503, "train_info/time_within_train_step": 2.7568891048431396, "step": 1503} {"train_info/time_between_train_steps": 0.0030100345611572266, "step": 1503} {"info/global_step": 1504, "train_info/time_within_train_step": 2.7560770511627197, "step": 1504} {"train_info/time_between_train_steps": 0.0030007362365722656, "step": 1504} {"info/global_step": 1505, "train_info/time_within_train_step": 2.7539596557617188, "step": 1505} {"train_info/time_between_train_steps": 0.0030837059020996094, "step": 1505} {"info/global_step": 1506, "train_info/time_within_train_step": 2.7573273181915283, "step": 1506} {"train_info/time_between_train_steps": 0.0029146671295166016, "step": 1506} {"info/global_step": 1507, "train_info/time_within_train_step": 2.7548351287841797, "step": 1507} {"train_info/time_between_train_steps": 0.0029251575469970703, "step": 1507} {"info/global_step": 1508, "train_info/time_within_train_step": 2.7539782524108887, "step": 1508} {"train_info/time_between_train_steps": 0.0029201507568359375, "step": 1508} {"info/global_step": 1509, "train_info/time_within_train_step": 2.7560696601867676, "step": 1509} {"train_info/time_between_train_steps": 0.002928018569946289, "step": 1509} {"info/global_step": 1510, "train_info/time_within_train_step": 2.7530465126037598, "step": 1510} {"train_info/time_between_train_steps": 0.0029306411743164062, "step": 1510} {"info/global_step": 1511, "train_info/time_within_train_step": 2.754640579223633, "step": 1511} {"train_info/time_between_train_steps": 0.0028715133666992188, "step": 1511} {"info/global_step": 1512, "train_info/time_within_train_step": 2.7546772956848145, "step": 1512} {"train_info/time_between_train_steps": 0.002907991409301758, "step": 1512} {"info/global_step": 1513, "train_info/time_within_train_step": 2.754894733428955, "step": 1513} {"train_info/time_between_train_steps": 0.0033257007598876953, "step": 1513} {"info/global_step": 1514, "train_info/time_within_train_step": 2.7564806938171387, "step": 1514} {"train_info/time_between_train_steps": 0.0031125545501708984, "step": 1514} {"info/global_step": 1515, "train_info/time_within_train_step": 2.7579996585845947, "step": 1515} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 1515} {"info/global_step": 1516, "train_info/time_within_train_step": 2.7556283473968506, "step": 1516} {"train_info/time_between_train_steps": 0.003133058547973633, "step": 1516} {"info/global_step": 1517, "train_info/time_within_train_step": 2.7565975189208984, "step": 1517} {"train_info/time_between_train_steps": 0.0029807090759277344, "step": 1517} {"info/global_step": 1518, "train_info/time_within_train_step": 2.753103256225586, "step": 1518} {"train_info/time_between_train_steps": 0.0030019283294677734, "step": 1518} {"info/global_step": 1519, "train_info/time_within_train_step": 2.753636121749878, "step": 1519} {"train_info/time_between_train_steps": 0.0029518604278564453, "step": 1519} {"info/global_step": 1520, "train_info/time_within_train_step": 2.753941297531128, "step": 1520} {"train_info/time_between_train_steps": 0.0029578208923339844, "step": 1520} {"info/global_step": 1521, "train_info/time_within_train_step": 2.7539303302764893, "step": 1521} {"train_info/time_between_train_steps": 0.0029692649841308594, "step": 1521} {"info/global_step": 1522, "train_info/time_within_train_step": 2.753732442855835, "step": 1522} {"train_info/time_between_train_steps": 0.002899169921875, "step": 1522} {"info/global_step": 1523, "train_info/time_within_train_step": 2.753842830657959, "step": 1523} {"train_info/time_between_train_steps": 0.002997875213623047, "step": 1523} {"info/global_step": 1524, "train_info/time_within_train_step": 2.7549283504486084, "step": 1524} {"train_info/time_between_train_steps": 0.0029854774475097656, "step": 1524} {"info/global_step": 1525, "train_info/time_within_train_step": 2.7547523975372314, "step": 1525} {"train_info/time_between_train_steps": 0.0030012130737304688, "step": 1525} {"info/global_step": 1526, "train_info/time_within_train_step": 2.7553513050079346, "step": 1526} {"train_info/time_between_train_steps": 0.0029327869415283203, "step": 1526} {"info/global_step": 1527, "train_info/time_within_train_step": 2.7546420097351074, "step": 1527} {"train_info/time_between_train_steps": 0.0029478073120117188, "step": 1527} {"info/global_step": 1528, "train_info/time_within_train_step": 2.7548279762268066, "step": 1528} {"train_info/time_between_train_steps": 0.002971172332763672, "step": 1528} {"info/global_step": 1529, "train_info/time_within_train_step": 2.753922939300537, "step": 1529} {"train_info/time_between_train_steps": 0.002938985824584961, "step": 1529} {"info/global_step": 1530, "train_info/time_within_train_step": 2.755272150039673, "step": 1530} {"train_info/time_between_train_steps": 0.00292205810546875, "step": 1530} {"info/global_step": 1531, "train_info/time_within_train_step": 2.756195545196533, "step": 1531} {"train_info/time_between_train_steps": 0.0030257701873779297, "step": 1531} {"info/global_step": 1532, "train_info/time_within_train_step": 2.756880760192871, "step": 1532} {"train_info/time_between_train_steps": 0.002954721450805664, "step": 1532} {"info/global_step": 1533, "train_info/time_within_train_step": 2.7547357082366943, "step": 1533} {"train_info/time_between_train_steps": 0.0029070377349853516, "step": 1533} {"info/global_step": 1534, "train_info/time_within_train_step": 2.753493070602417, "step": 1534} {"train_info/time_between_train_steps": 0.002907991409301758, "step": 1534} {"info/global_step": 1535, "train_info/time_within_train_step": 2.754166841506958, "step": 1535} {"train_info/time_between_train_steps": 0.002969503402709961, "step": 1535} {"info/global_step": 1536, "train_info/time_within_train_step": 2.754441738128662, "step": 1536} {"train_info/time_between_train_steps": 0.002962827682495117, "step": 1536} {"info/global_step": 1537, "train_info/time_within_train_step": 2.7538397312164307, "step": 1537} {"train_info/time_between_train_steps": 0.002987384796142578, "step": 1537} {"info/global_step": 1538, "train_info/time_within_train_step": 2.754173517227173, "step": 1538} {"train_info/time_between_train_steps": 0.0030426979064941406, "step": 1538} {"info/global_step": 1539, "train_info/time_within_train_step": 2.753781318664551, "step": 1539} {"train_info/time_between_train_steps": 0.0029151439666748047, "step": 1539} {"info/global_step": 1540, "train_info/time_within_train_step": 2.754503011703491, "step": 1540} {"train_info/time_between_train_steps": 0.0029387474060058594, "step": 1540} {"info/global_step": 1541, "train_info/time_within_train_step": 2.7545645236968994, "step": 1541} {"train_info/time_between_train_steps": 0.0028946399688720703, "step": 1541} {"info/global_step": 1542, "train_info/time_within_train_step": 2.754202127456665, "step": 1542} {"train_info/time_between_train_steps": 0.0029523372650146484, "step": 1542} {"info/global_step": 1543, "train_info/time_within_train_step": 2.753190755844116, "step": 1543} {"train_info/time_between_train_steps": 0.0029892921447753906, "step": 1543} {"info/global_step": 1544, "train_info/time_within_train_step": 2.7550599575042725, "step": 1544} {"train_info/time_between_train_steps": 0.002981901168823242, "step": 1544} {"info/global_step": 1545, "train_info/time_within_train_step": 2.7559216022491455, "step": 1545} {"train_info/time_between_train_steps": 0.003015279769897461, "step": 1545} {"info/global_step": 1546, "train_info/time_within_train_step": 2.756340742111206, "step": 1546} {"train_info/time_between_train_steps": 0.003051280975341797, "step": 1546} {"info/global_step": 1547, "train_info/time_within_train_step": 2.757364273071289, "step": 1547} {"train_info/time_between_train_steps": 0.0031070709228515625, "step": 1547} {"info/global_step": 1548, "train_info/time_within_train_step": 2.757233142852783, "step": 1548} {"train_info/time_between_train_steps": 0.003060579299926758, "step": 1548} {"info/global_step": 1549, "train_info/time_within_train_step": 2.757758378982544, "step": 1549} {"train_info/time_between_train_steps": 0.0030629634857177734, "step": 1549} {"info/global_step": 1550, "train_info/time_within_train_step": 2.7574117183685303, "step": 1550} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746570527, "_runtime": 4536}, "step": 1550} {"logs": {"train/loss": 4.5581, "train/learning_rate": 0.0005633333333333333, "train/epoch": 1.07, "_timestamp": 1746570527, "_runtime": 4536}, "step": 1550} {"train_info/time_between_train_steps": 0.01386880874633789, "step": 1550} {"info/global_step": 1551, "train_info/time_within_train_step": 2.7549078464508057, "step": 1551} {"train_info/time_between_train_steps": 0.0030944347381591797, "step": 1551} {"info/global_step": 1552, "train_info/time_within_train_step": 2.761906147003174, "step": 1552} {"train_info/time_between_train_steps": 0.0030786991119384766, "step": 1552} {"info/global_step": 1553, "train_info/time_within_train_step": 2.754089832305908, "step": 1553} {"train_info/time_between_train_steps": 0.003091096878051758, "step": 1553} {"info/global_step": 1554, "train_info/time_within_train_step": 2.762192487716675, "step": 1554} {"train_info/time_between_train_steps": 0.0030710697174072266, "step": 1554} {"info/global_step": 1555, "train_info/time_within_train_step": 2.758395195007324, "step": 1555} {"train_info/time_between_train_steps": 0.006018400192260742, "step": 1555} {"info/global_step": 1556, "train_info/time_within_train_step": 2.7545430660247803, "step": 1556} {"train_info/time_between_train_steps": 0.005947589874267578, "step": 1556} {"info/global_step": 1557, "train_info/time_within_train_step": 2.7543444633483887, "step": 1557} {"train_info/time_between_train_steps": 0.0028929710388183594, "step": 1557} {"info/global_step": 1558, "train_info/time_within_train_step": 2.753743886947632, "step": 1558} {"train_info/time_between_train_steps": 0.002968311309814453, "step": 1558} {"info/global_step": 1559, "train_info/time_within_train_step": 2.753997802734375, "step": 1559} {"train_info/time_between_train_steps": 0.00295257568359375, "step": 1559} {"info/global_step": 1560, "train_info/time_within_train_step": 2.7546558380126953, "step": 1560} {"train_info/time_between_train_steps": 0.0028939247131347656, "step": 1560} {"info/global_step": 1561, "train_info/time_within_train_step": 2.755373954772949, "step": 1561} {"train_info/time_between_train_steps": 0.002930164337158203, "step": 1561} {"info/global_step": 1562, "train_info/time_within_train_step": 2.7544102668762207, "step": 1562} {"train_info/time_between_train_steps": 0.002866506576538086, "step": 1562} {"info/global_step": 1563, "train_info/time_within_train_step": 2.753946304321289, "step": 1563} {"train_info/time_between_train_steps": 0.002874135971069336, "step": 1563} {"info/global_step": 1564, "train_info/time_within_train_step": 2.753145933151245, "step": 1564} {"train_info/time_between_train_steps": 0.002897500991821289, "step": 1564} {"info/global_step": 1565, "train_info/time_within_train_step": 2.754514455795288, "step": 1565} {"train_info/time_between_train_steps": 0.002880573272705078, "step": 1565} {"info/global_step": 1566, "train_info/time_within_train_step": 2.753790855407715, "step": 1566} {"train_info/time_between_train_steps": 0.0029227733612060547, "step": 1566} {"info/global_step": 1567, "train_info/time_within_train_step": 2.7548398971557617, "step": 1567} {"train_info/time_between_train_steps": 0.00304412841796875, "step": 1567} {"info/global_step": 1568, "train_info/time_within_train_step": 2.7537567615509033, "step": 1568} {"train_info/time_between_train_steps": 0.002933979034423828, "step": 1568} {"info/global_step": 1569, "train_info/time_within_train_step": 2.7532198429107666, "step": 1569} {"train_info/time_between_train_steps": 0.003015279769897461, "step": 1569} {"info/global_step": 1570, "train_info/time_within_train_step": 2.753818988800049, "step": 1570} {"train_info/time_between_train_steps": 0.003003358840942383, "step": 1570} {"info/global_step": 1571, "train_info/time_within_train_step": 2.7536563873291016, "step": 1571} {"train_info/time_between_train_steps": 0.0029926300048828125, "step": 1571} {"info/global_step": 1572, "train_info/time_within_train_step": 2.754061222076416, "step": 1572} {"train_info/time_between_train_steps": 0.002978086471557617, "step": 1572} {"info/global_step": 1573, "train_info/time_within_train_step": 2.7542288303375244, "step": 1573} {"train_info/time_between_train_steps": 0.002964019775390625, "step": 1573} {"info/global_step": 1574, "train_info/time_within_train_step": 2.7552032470703125, "step": 1574} {"train_info/time_between_train_steps": 0.002882719039916992, "step": 1574} {"info/global_step": 1575, "train_info/time_within_train_step": 2.75429368019104, "step": 1575} {"train_info/time_between_train_steps": 0.0028862953186035156, "step": 1575} {"info/global_step": 1576, "train_info/time_within_train_step": 2.7555348873138428, "step": 1576} {"train_info/time_between_train_steps": 0.002925395965576172, "step": 1576} {"info/global_step": 1577, "train_info/time_within_train_step": 2.755397081375122, "step": 1577} {"train_info/time_between_train_steps": 0.002930164337158203, "step": 1577} {"info/global_step": 1578, "train_info/time_within_train_step": 2.7537245750427246, "step": 1578} {"train_info/time_between_train_steps": 0.003100156784057617, "step": 1578} {"info/global_step": 1579, "train_info/time_within_train_step": 2.754596471786499, "step": 1579} {"train_info/time_between_train_steps": 0.002945423126220703, "step": 1579} {"info/global_step": 1580, "train_info/time_within_train_step": 2.761413335800171, "step": 1580} {"train_info/time_between_train_steps": 0.002935171127319336, "step": 1580} {"info/global_step": 1581, "train_info/time_within_train_step": 2.7605538368225098, "step": 1581} {"train_info/time_between_train_steps": 0.0030159950256347656, "step": 1581} {"info/global_step": 1582, "train_info/time_within_train_step": 2.7548041343688965, "step": 1582} {"train_info/time_between_train_steps": 0.0029480457305908203, "step": 1582} {"info/global_step": 1583, "train_info/time_within_train_step": 2.7547802925109863, "step": 1583} {"train_info/time_between_train_steps": 0.0029573440551757812, "step": 1583} {"info/global_step": 1584, "train_info/time_within_train_step": 2.751532793045044, "step": 1584} {"train_info/time_between_train_steps": 0.003001689910888672, "step": 1584} {"info/global_step": 1585, "train_info/time_within_train_step": 2.753185749053955, "step": 1585} {"train_info/time_between_train_steps": 0.0029866695404052734, "step": 1585} {"info/global_step": 1586, "train_info/time_within_train_step": 2.7535245418548584, "step": 1586} {"train_info/time_between_train_steps": 0.0029697418212890625, "step": 1586} {"info/global_step": 1587, "train_info/time_within_train_step": 2.86552095413208, "step": 1587} {"train_info/time_between_train_steps": 0.002994060516357422, "step": 1587} {"info/global_step": 1588, "train_info/time_within_train_step": 2.753784418106079, "step": 1588} {"train_info/time_between_train_steps": 0.002996206283569336, "step": 1588} {"info/global_step": 1589, "train_info/time_within_train_step": 2.7541449069976807, "step": 1589} {"train_info/time_between_train_steps": 0.003010988235473633, "step": 1589} {"info/global_step": 1590, "train_info/time_within_train_step": 2.7551777362823486, "step": 1590} {"train_info/time_between_train_steps": 0.002978086471557617, "step": 1590} {"info/global_step": 1591, "train_info/time_within_train_step": 2.7544572353363037, "step": 1591} {"train_info/time_between_train_steps": 0.002961397171020508, "step": 1591} {"info/global_step": 1592, "train_info/time_within_train_step": 2.754812240600586, "step": 1592} {"train_info/time_between_train_steps": 0.0029442310333251953, "step": 1592} {"info/global_step": 1593, "train_info/time_within_train_step": 2.7542290687561035, "step": 1593} {"train_info/time_between_train_steps": 0.002961397171020508, "step": 1593} {"info/global_step": 1594, "train_info/time_within_train_step": 2.754075050354004, "step": 1594} {"train_info/time_between_train_steps": 0.002949953079223633, "step": 1594} {"info/global_step": 1595, "train_info/time_within_train_step": 2.754258871078491, "step": 1595} {"train_info/time_between_train_steps": 0.002907276153564453, "step": 1595} {"info/global_step": 1596, "train_info/time_within_train_step": 2.7523982524871826, "step": 1596} {"train_info/time_between_train_steps": 0.0030133724212646484, "step": 1596} {"info/global_step": 1597, "train_info/time_within_train_step": 2.7541468143463135, "step": 1597} {"train_info/time_between_train_steps": 0.0030295848846435547, "step": 1597} {"info/global_step": 1598, "train_info/time_within_train_step": 2.7537522315979004, "step": 1598} {"train_info/time_between_train_steps": 0.002889394760131836, "step": 1598} {"info/global_step": 1599, "train_info/time_within_train_step": 2.7529428005218506, "step": 1599} {"train_info/time_between_train_steps": 0.002941131591796875, "step": 1599} {"info/global_step": 1600, "train_info/time_within_train_step": 2.754321813583374, "step": 1600} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746570666, "_runtime": 4675}, "step": 1600} {"logs": {"train/loss": 4.5352, "train/learning_rate": 0.00056, "train/epoch": 1.07, "_timestamp": 1746570666, "_runtime": 4675}, "step": 1600} {"train_info/time_between_train_steps": 24.225514888763428, "step": 1600} {"info/global_step": 1601, "train_info/time_within_train_step": 2.5341341495513916, "step": 1601} {"train_info/time_between_train_steps": 0.002999544143676758, "step": 1601} {"info/global_step": 1602, "train_info/time_within_train_step": 2.5764381885528564, "step": 1602} {"train_info/time_between_train_steps": 0.0029828548431396484, "step": 1602} {"info/global_step": 1603, "train_info/time_within_train_step": 2.7108020782470703, "step": 1603} {"train_info/time_between_train_steps": 0.0030100345611572266, "step": 1603} {"info/global_step": 1604, "train_info/time_within_train_step": 2.726712703704834, "step": 1604} {"train_info/time_between_train_steps": 0.002995014190673828, "step": 1604} {"info/global_step": 1605, "train_info/time_within_train_step": 2.7298314571380615, "step": 1605} {"train_info/time_between_train_steps": 0.0029659271240234375, "step": 1605} {"info/global_step": 1606, "train_info/time_within_train_step": 2.751950740814209, "step": 1606} {"train_info/time_between_train_steps": 0.003018617630004883, "step": 1606} {"info/global_step": 1607, "train_info/time_within_train_step": 2.7538208961486816, "step": 1607} {"train_info/time_between_train_steps": 0.0029473304748535156, "step": 1607} {"info/global_step": 1608, "train_info/time_within_train_step": 2.7538363933563232, "step": 1608} {"train_info/time_between_train_steps": 0.00299835205078125, "step": 1608} {"info/global_step": 1609, "train_info/time_within_train_step": 2.7536752223968506, "step": 1609} {"train_info/time_between_train_steps": 0.0029861927032470703, "step": 1609} {"info/global_step": 1610, "train_info/time_within_train_step": 2.754762649536133, "step": 1610} {"train_info/time_between_train_steps": 0.003025054931640625, "step": 1610} {"info/global_step": 1611, "train_info/time_within_train_step": 2.754598379135132, "step": 1611} {"train_info/time_between_train_steps": 0.0029773712158203125, "step": 1611} {"info/global_step": 1612, "train_info/time_within_train_step": 2.7530858516693115, "step": 1612} {"train_info/time_between_train_steps": 0.003000974655151367, "step": 1612} {"info/global_step": 1613, "train_info/time_within_train_step": 2.7541351318359375, "step": 1613} {"train_info/time_between_train_steps": 0.003023386001586914, "step": 1613} {"info/global_step": 1614, "train_info/time_within_train_step": 2.7561373710632324, "step": 1614} {"train_info/time_between_train_steps": 0.002981901168823242, "step": 1614} {"info/global_step": 1615, "train_info/time_within_train_step": 2.7559685707092285, "step": 1615} {"train_info/time_between_train_steps": 0.0029516220092773438, "step": 1615} {"info/global_step": 1616, "train_info/time_within_train_step": 2.755654811859131, "step": 1616} {"train_info/time_between_train_steps": 0.0029969215393066406, "step": 1616} {"info/global_step": 1617, "train_info/time_within_train_step": 2.756284475326538, "step": 1617} {"train_info/time_between_train_steps": 0.0029342174530029297, "step": 1617} {"info/global_step": 1618, "train_info/time_within_train_step": 2.7549221515655518, "step": 1618} {"train_info/time_between_train_steps": 0.002969026565551758, "step": 1618} {"info/global_step": 1619, "train_info/time_within_train_step": 2.7540459632873535, "step": 1619} {"train_info/time_between_train_steps": 0.002950906753540039, "step": 1619} {"info/global_step": 1620, "train_info/time_within_train_step": 2.7555549144744873, "step": 1620} {"train_info/time_between_train_steps": 0.0029265880584716797, "step": 1620} {"info/global_step": 1621, "train_info/time_within_train_step": 2.7553935050964355, "step": 1621} {"train_info/time_between_train_steps": 0.0029413700103759766, "step": 1621} {"info/global_step": 1622, "train_info/time_within_train_step": 2.7554593086242676, "step": 1622} {"train_info/time_between_train_steps": 0.0029337406158447266, "step": 1622} {"info/global_step": 1623, "train_info/time_within_train_step": 2.7537074089050293, "step": 1623} {"train_info/time_between_train_steps": 0.0029621124267578125, "step": 1623} {"info/global_step": 1624, "train_info/time_within_train_step": 2.754570722579956, "step": 1624} {"train_info/time_between_train_steps": 0.0028905868530273438, "step": 1624} {"info/global_step": 1625, "train_info/time_within_train_step": 2.7552902698516846, "step": 1625} {"train_info/time_between_train_steps": 0.0029358863830566406, "step": 1625} {"info/global_step": 1626, "train_info/time_within_train_step": 2.753352165222168, "step": 1626} {"train_info/time_between_train_steps": 0.0030221939086914062, "step": 1626} {"info/global_step": 1627, "train_info/time_within_train_step": 2.7553470134735107, "step": 1627} {"train_info/time_between_train_steps": 0.0029785633087158203, "step": 1627} {"info/global_step": 1628, "train_info/time_within_train_step": 2.7541465759277344, "step": 1628} {"train_info/time_between_train_steps": 0.0029439926147460938, "step": 1628} {"info/global_step": 1629, "train_info/time_within_train_step": 2.7535288333892822, "step": 1629} {"train_info/time_between_train_steps": 0.002989053726196289, "step": 1629} {"info/global_step": 1630, "train_info/time_within_train_step": 2.755152940750122, "step": 1630} {"train_info/time_between_train_steps": 0.0030286312103271484, "step": 1630} {"info/global_step": 1631, "train_info/time_within_train_step": 2.7548086643218994, "step": 1631} {"train_info/time_between_train_steps": 0.002981901168823242, "step": 1631} {"info/global_step": 1632, "train_info/time_within_train_step": 2.755326509475708, "step": 1632} {"train_info/time_between_train_steps": 0.0029921531677246094, "step": 1632} {"info/global_step": 1633, "train_info/time_within_train_step": 2.7529847621917725, "step": 1633} {"train_info/time_between_train_steps": 0.002910137176513672, "step": 1633} {"info/global_step": 1634, "train_info/time_within_train_step": 2.7542927265167236, "step": 1634} {"train_info/time_between_train_steps": 0.002943754196166992, "step": 1634} {"info/global_step": 1635, "train_info/time_within_train_step": 2.7547125816345215, "step": 1635} {"train_info/time_between_train_steps": 0.002886533737182617, "step": 1635} {"info/global_step": 1636, "train_info/time_within_train_step": 2.755047082901001, "step": 1636} {"train_info/time_between_train_steps": 0.0029556751251220703, "step": 1636} {"info/global_step": 1637, "train_info/time_within_train_step": 2.755452871322632, "step": 1637} {"train_info/time_between_train_steps": 0.0029363632202148438, "step": 1637} {"info/global_step": 1638, "train_info/time_within_train_step": 2.7550575733184814, "step": 1638} {"train_info/time_between_train_steps": 0.0029888153076171875, "step": 1638} {"info/global_step": 1639, "train_info/time_within_train_step": 2.751899003982544, "step": 1639} {"train_info/time_between_train_steps": 0.0029625892639160156, "step": 1639} {"info/global_step": 1640, "train_info/time_within_train_step": 2.752614974975586, "step": 1640} {"train_info/time_between_train_steps": 0.002981424331665039, "step": 1640} {"info/global_step": 1641, "train_info/time_within_train_step": 2.7545344829559326, "step": 1641} {"train_info/time_between_train_steps": 0.0029587745666503906, "step": 1641} {"info/global_step": 1642, "train_info/time_within_train_step": 2.752716064453125, "step": 1642} {"train_info/time_between_train_steps": 0.002965211868286133, "step": 1642} {"info/global_step": 1643, "train_info/time_within_train_step": 2.7546474933624268, "step": 1643} {"train_info/time_between_train_steps": 0.0029778480529785156, "step": 1643} {"info/global_step": 1644, "train_info/time_within_train_step": 2.7537481784820557, "step": 1644} {"train_info/time_between_train_steps": 0.0029668807983398438, "step": 1644} {"info/global_step": 1645, "train_info/time_within_train_step": 2.7539303302764893, "step": 1645} {"train_info/time_between_train_steps": 0.0029859542846679688, "step": 1645} {"info/global_step": 1646, "train_info/time_within_train_step": 2.7531111240386963, "step": 1646} {"train_info/time_between_train_steps": 0.002997875213623047, "step": 1646} {"info/global_step": 1647, "train_info/time_within_train_step": 2.7544491291046143, "step": 1647} {"train_info/time_between_train_steps": 0.003010988235473633, "step": 1647} {"info/global_step": 1648, "train_info/time_within_train_step": 2.7521018981933594, "step": 1648} {"train_info/time_between_train_steps": 0.0029754638671875, "step": 1648} {"info/global_step": 1649, "train_info/time_within_train_step": 2.7540252208709717, "step": 1649} {"train_info/time_between_train_steps": 0.003025054931640625, "step": 1649} {"info/global_step": 1650, "train_info/time_within_train_step": 2.749574661254883, "step": 1650} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746570828, "_runtime": 4837}, "step": 1650} {"logs": {"train/loss": 4.506, "train/learning_rate": 0.0005566666666666667, "train/epoch": 1.08, "_timestamp": 1746570828, "_runtime": 4837}, "step": 1650} {"train_info/time_between_train_steps": 0.015506744384765625, "step": 1650} {"info/global_step": 1651, "train_info/time_within_train_step": 2.7522220611572266, "step": 1651} {"train_info/time_between_train_steps": 0.0030074119567871094, "step": 1651} {"info/global_step": 1652, "train_info/time_within_train_step": 2.754854679107666, "step": 1652} {"train_info/time_between_train_steps": 0.0030183792114257812, "step": 1652} {"info/global_step": 1653, "train_info/time_within_train_step": 2.7533464431762695, "step": 1653} {"train_info/time_between_train_steps": 0.0030057430267333984, "step": 1653} {"info/global_step": 1654, "train_info/time_within_train_step": 2.754044532775879, "step": 1654} {"train_info/time_between_train_steps": 0.0029706954956054688, "step": 1654} {"info/global_step": 1655, "train_info/time_within_train_step": 2.754843235015869, "step": 1655} {"train_info/time_between_train_steps": 0.0030078887939453125, "step": 1655} {"info/global_step": 1656, "train_info/time_within_train_step": 2.754377841949463, "step": 1656} {"train_info/time_between_train_steps": 0.002991199493408203, "step": 1656} {"info/global_step": 1657, "train_info/time_within_train_step": 2.7546579837799072, "step": 1657} {"train_info/time_between_train_steps": 0.0029850006103515625, "step": 1657} {"info/global_step": 1658, "train_info/time_within_train_step": 2.753726005554199, "step": 1658} {"train_info/time_between_train_steps": 0.0029866695404052734, "step": 1658} {"info/global_step": 1659, "train_info/time_within_train_step": 2.7529871463775635, "step": 1659} {"train_info/time_between_train_steps": 0.0029702186584472656, "step": 1659} {"info/global_step": 1660, "train_info/time_within_train_step": 2.753023624420166, "step": 1660} {"train_info/time_between_train_steps": 0.003015279769897461, "step": 1660} {"info/global_step": 1661, "train_info/time_within_train_step": 2.7543392181396484, "step": 1661} {"train_info/time_between_train_steps": 0.002998828887939453, "step": 1661} {"info/global_step": 1662, "train_info/time_within_train_step": 2.7537457942962646, "step": 1662} {"train_info/time_between_train_steps": 0.0029790401458740234, "step": 1662} {"info/global_step": 1663, "train_info/time_within_train_step": 2.754164934158325, "step": 1663} {"train_info/time_between_train_steps": 0.002920866012573242, "step": 1663} {"info/global_step": 1664, "train_info/time_within_train_step": 2.7529470920562744, "step": 1664} {"train_info/time_between_train_steps": 0.0030565261840820312, "step": 1664} {"info/global_step": 1665, "train_info/time_within_train_step": 2.7547388076782227, "step": 1665} {"train_info/time_between_train_steps": 0.003018617630004883, "step": 1665} {"info/global_step": 1666, "train_info/time_within_train_step": 2.7548444271087646, "step": 1666} {"train_info/time_between_train_steps": 0.0030281543731689453, "step": 1666} {"info/global_step": 1667, "train_info/time_within_train_step": 2.753495454788208, "step": 1667} {"train_info/time_between_train_steps": 0.002900362014770508, "step": 1667} {"info/global_step": 1668, "train_info/time_within_train_step": 2.754190683364868, "step": 1668} {"train_info/time_between_train_steps": 0.0029723644256591797, "step": 1668} {"info/global_step": 1669, "train_info/time_within_train_step": 2.753469228744507, "step": 1669} {"train_info/time_between_train_steps": 0.002984285354614258, "step": 1669} {"info/global_step": 1670, "train_info/time_within_train_step": 2.7538814544677734, "step": 1670} {"train_info/time_between_train_steps": 0.003027677536010742, "step": 1670} {"info/global_step": 1671, "train_info/time_within_train_step": 2.8114380836486816, "step": 1671} {"train_info/time_between_train_steps": 0.0030608177185058594, "step": 1671} {"info/global_step": 1672, "train_info/time_within_train_step": 2.7542507648468018, "step": 1672} {"train_info/time_between_train_steps": 0.0030455589294433594, "step": 1672} {"info/global_step": 1673, "train_info/time_within_train_step": 2.75309157371521, "step": 1673} {"train_info/time_between_train_steps": 0.0030341148376464844, "step": 1673} {"info/global_step": 1674, "train_info/time_within_train_step": 2.75526762008667, "step": 1674} {"train_info/time_between_train_steps": 0.002953052520751953, "step": 1674} {"info/global_step": 1675, "train_info/time_within_train_step": 2.7519283294677734, "step": 1675} {"train_info/time_between_train_steps": 0.0030410289764404297, "step": 1675} {"info/global_step": 1676, "train_info/time_within_train_step": 2.7540268898010254, "step": 1676} {"train_info/time_between_train_steps": 0.003010988235473633, "step": 1676} {"info/global_step": 1677, "train_info/time_within_train_step": 2.754716396331787, "step": 1677} {"train_info/time_between_train_steps": 0.0029447078704833984, "step": 1677} {"info/global_step": 1678, "train_info/time_within_train_step": 2.7544643878936768, "step": 1678} {"train_info/time_between_train_steps": 0.003028392791748047, "step": 1678} {"info/global_step": 1679, "train_info/time_within_train_step": 2.753434896469116, "step": 1679} {"train_info/time_between_train_steps": 0.0029506683349609375, "step": 1679} {"info/global_step": 1680, "train_info/time_within_train_step": 2.758965492248535, "step": 1680} {"train_info/time_between_train_steps": 0.002873659133911133, "step": 1680} {"info/global_step": 1681, "train_info/time_within_train_step": 2.7525861263275146, "step": 1681} {"train_info/time_between_train_steps": 0.0029098987579345703, "step": 1681} {"info/global_step": 1682, "train_info/time_within_train_step": 2.752944231033325, "step": 1682} {"train_info/time_between_train_steps": 0.002958059310913086, "step": 1682} {"info/global_step": 1683, "train_info/time_within_train_step": 2.7535877227783203, "step": 1683} {"train_info/time_between_train_steps": 0.002946138381958008, "step": 1683} {"info/global_step": 1684, "train_info/time_within_train_step": 2.75219464302063, "step": 1684} {"train_info/time_between_train_steps": 0.003025054931640625, "step": 1684} {"info/global_step": 1685, "train_info/time_within_train_step": 2.754225730895996, "step": 1685} {"train_info/time_between_train_steps": 0.0030205249786376953, "step": 1685} {"info/global_step": 1686, "train_info/time_within_train_step": 2.7538676261901855, "step": 1686} {"train_info/time_between_train_steps": 0.003055095672607422, "step": 1686} {"info/global_step": 1687, "train_info/time_within_train_step": 2.754748582839966, "step": 1687} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 1687} {"info/global_step": 1688, "train_info/time_within_train_step": 2.75527024269104, "step": 1688} {"train_info/time_between_train_steps": 0.003154277801513672, "step": 1688} {"info/global_step": 1689, "train_info/time_within_train_step": 2.754605293273926, "step": 1689} {"train_info/time_between_train_steps": 0.0030717849731445312, "step": 1689} {"info/global_step": 1690, "train_info/time_within_train_step": 2.7553887367248535, "step": 1690} {"train_info/time_between_train_steps": 0.0032012462615966797, "step": 1690} {"info/global_step": 1691, "train_info/time_within_train_step": 2.754323959350586, "step": 1691} {"train_info/time_between_train_steps": 0.003272533416748047, "step": 1691} {"info/global_step": 1692, "train_info/time_within_train_step": 2.753133535385132, "step": 1692} {"train_info/time_between_train_steps": 0.0032205581665039062, "step": 1692} {"info/global_step": 1693, "train_info/time_within_train_step": 2.755376100540161, "step": 1693} {"train_info/time_between_train_steps": 0.003058910369873047, "step": 1693} {"info/global_step": 1694, "train_info/time_within_train_step": 2.7533278465270996, "step": 1694} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 1694} {"info/global_step": 1695, "train_info/time_within_train_step": 2.755715847015381, "step": 1695} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 1695} {"info/global_step": 1696, "train_info/time_within_train_step": 2.7562201023101807, "step": 1696} {"train_info/time_between_train_steps": 0.0033736228942871094, "step": 1696} {"info/global_step": 1697, "train_info/time_within_train_step": 2.755662202835083, "step": 1697} {"train_info/time_between_train_steps": 0.003926753997802734, "step": 1697} {"info/global_step": 1698, "train_info/time_within_train_step": 2.756964683532715, "step": 1698} {"train_info/time_between_train_steps": 0.0030913352966308594, "step": 1698} {"info/global_step": 1699, "train_info/time_within_train_step": 2.754641532897949, "step": 1699} {"train_info/time_between_train_steps": 0.003507375717163086, "step": 1699} {"info/global_step": 1700, "train_info/time_within_train_step": 2.7552154064178467, "step": 1700} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746570967, "_runtime": 4976}, "step": 1700} {"logs": {"train/loss": 4.4801, "train/learning_rate": 0.0005533333333333333, "train/epoch": 1.08, "_timestamp": 1746570967, "_runtime": 4976}, "step": 1700} {"train_info/time_between_train_steps": 0.014726400375366211, "step": 1700} {"info/global_step": 1701, "train_info/time_within_train_step": 2.7554473876953125, "step": 1701} {"train_info/time_between_train_steps": 0.003659486770629883, "step": 1701} {"info/global_step": 1702, "train_info/time_within_train_step": 2.7575364112854004, "step": 1702} {"train_info/time_between_train_steps": 0.003421783447265625, "step": 1702} {"info/global_step": 1703, "train_info/time_within_train_step": 2.7565085887908936, "step": 1703} {"train_info/time_between_train_steps": 0.003988027572631836, "step": 1703} {"info/global_step": 1704, "train_info/time_within_train_step": 2.7565879821777344, "step": 1704} {"train_info/time_between_train_steps": 0.003915548324584961, "step": 1704} {"info/global_step": 1705, "train_info/time_within_train_step": 2.757469654083252, "step": 1705} {"train_info/time_between_train_steps": 0.003703594207763672, "step": 1705} {"info/global_step": 1706, "train_info/time_within_train_step": 2.7563834190368652, "step": 1706} {"train_info/time_between_train_steps": 0.003788471221923828, "step": 1706} {"train_info/time_between_train_steps": 3.276606321334839, "step": 1706} {"info/global_step": 1707, "train_info/time_within_train_step": 2.6644678115844727, "step": 1707} {"train_info/time_between_train_steps": 0.003134489059448242, "step": 1707} {"info/global_step": 1708, "train_info/time_within_train_step": 2.7556395530700684, "step": 1708} {"train_info/time_between_train_steps": 0.0032317638397216797, "step": 1708} {"info/global_step": 1709, "train_info/time_within_train_step": 2.7548987865448, "step": 1709} {"train_info/time_between_train_steps": 0.0031273365020751953, "step": 1709} {"info/global_step": 1710, "train_info/time_within_train_step": 2.7547996044158936, "step": 1710} {"train_info/time_between_train_steps": 0.0031042098999023438, "step": 1710} {"info/global_step": 1711, "train_info/time_within_train_step": 2.75433611869812, "step": 1711} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 1711} {"info/global_step": 1712, "train_info/time_within_train_step": 2.7550547122955322, "step": 1712} {"train_info/time_between_train_steps": 0.003130197525024414, "step": 1712} {"info/global_step": 1713, "train_info/time_within_train_step": 2.7538905143737793, "step": 1713} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 1713} {"info/global_step": 1714, "train_info/time_within_train_step": 2.7532753944396973, "step": 1714} {"train_info/time_between_train_steps": 0.003150463104248047, "step": 1714} {"info/global_step": 1715, "train_info/time_within_train_step": 2.75380539894104, "step": 1715} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 1715} {"info/global_step": 1716, "train_info/time_within_train_step": 2.7552311420440674, "step": 1716} {"train_info/time_between_train_steps": 0.0031425952911376953, "step": 1716} {"info/global_step": 1717, "train_info/time_within_train_step": 2.7542221546173096, "step": 1717} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 1717} {"info/global_step": 1718, "train_info/time_within_train_step": 2.7547595500946045, "step": 1718} {"train_info/time_between_train_steps": 0.0031349658966064453, "step": 1718} {"info/global_step": 1719, "train_info/time_within_train_step": 2.754239082336426, "step": 1719} {"train_info/time_between_train_steps": 0.003106355667114258, "step": 1719} {"info/global_step": 1720, "train_info/time_within_train_step": 2.7546753883361816, "step": 1720} {"train_info/time_between_train_steps": 0.0031099319458007812, "step": 1720} {"info/global_step": 1721, "train_info/time_within_train_step": 2.7541215419769287, "step": 1721} {"train_info/time_between_train_steps": 0.0031316280364990234, "step": 1721} {"info/global_step": 1722, "train_info/time_within_train_step": 2.7544429302215576, "step": 1722} {"train_info/time_between_train_steps": 0.0032258033752441406, "step": 1722} {"info/global_step": 1723, "train_info/time_within_train_step": 2.7539241313934326, "step": 1723} {"train_info/time_between_train_steps": 0.0031456947326660156, "step": 1723} {"info/global_step": 1724, "train_info/time_within_train_step": 2.753675699234009, "step": 1724} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 1724} {"info/global_step": 1725, "train_info/time_within_train_step": 2.7547504901885986, "step": 1725} {"train_info/time_between_train_steps": 0.003129720687866211, "step": 1725} {"info/global_step": 1726, "train_info/time_within_train_step": 2.754171371459961, "step": 1726} {"train_info/time_between_train_steps": 0.0031235218048095703, "step": 1726} {"info/global_step": 1727, "train_info/time_within_train_step": 2.7550809383392334, "step": 1727} {"train_info/time_between_train_steps": 0.0031316280364990234, "step": 1727} {"info/global_step": 1728, "train_info/time_within_train_step": 2.75490403175354, "step": 1728} {"train_info/time_between_train_steps": 0.0032012462615966797, "step": 1728} {"info/global_step": 1729, "train_info/time_within_train_step": 2.754664182662964, "step": 1729} {"train_info/time_between_train_steps": 0.003126859664916992, "step": 1729} {"info/global_step": 1730, "train_info/time_within_train_step": 2.755460739135742, "step": 1730} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 1730} {"info/global_step": 1731, "train_info/time_within_train_step": 2.75395131111145, "step": 1731} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 1731} {"info/global_step": 1732, "train_info/time_within_train_step": 2.753972053527832, "step": 1732} {"train_info/time_between_train_steps": 0.0031981468200683594, "step": 1732} {"info/global_step": 1733, "train_info/time_within_train_step": 2.752650022506714, "step": 1733} {"train_info/time_between_train_steps": 0.003129243850708008, "step": 1733} {"info/global_step": 1734, "train_info/time_within_train_step": 2.754272937774658, "step": 1734} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 1734} {"info/global_step": 1735, "train_info/time_within_train_step": 2.7554473876953125, "step": 1735} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 1735} {"info/global_step": 1736, "train_info/time_within_train_step": 2.7545032501220703, "step": 1736} {"train_info/time_between_train_steps": 0.003196239471435547, "step": 1736} {"info/global_step": 1737, "train_info/time_within_train_step": 2.7535884380340576, "step": 1737} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 1737} {"info/global_step": 1738, "train_info/time_within_train_step": 2.7553486824035645, "step": 1738} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 1738} {"info/global_step": 1739, "train_info/time_within_train_step": 2.754486322402954, "step": 1739} {"train_info/time_between_train_steps": 0.0031280517578125, "step": 1739} {"info/global_step": 1740, "train_info/time_within_train_step": 2.7539992332458496, "step": 1740} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 1740} {"info/global_step": 1741, "train_info/time_within_train_step": 2.754385232925415, "step": 1741} {"train_info/time_between_train_steps": 0.0031430721282958984, "step": 1741} {"info/global_step": 1742, "train_info/time_within_train_step": 2.7551372051239014, "step": 1742} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 1742} {"info/global_step": 1743, "train_info/time_within_train_step": 2.753270149230957, "step": 1743} {"train_info/time_between_train_steps": 0.0032181739807128906, "step": 1743} {"info/global_step": 1744, "train_info/time_within_train_step": 2.7553505897521973, "step": 1744} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 1744} {"info/global_step": 1745, "train_info/time_within_train_step": 2.755216121673584, "step": 1745} {"train_info/time_between_train_steps": 0.0032019615173339844, "step": 1745} {"info/global_step": 1746, "train_info/time_within_train_step": 2.7569477558135986, "step": 1746} {"train_info/time_between_train_steps": 0.003147125244140625, "step": 1746} {"info/global_step": 1747, "train_info/time_within_train_step": 2.7550742626190186, "step": 1747} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 1747} {"info/global_step": 1748, "train_info/time_within_train_step": 2.7557051181793213, "step": 1748} {"train_info/time_between_train_steps": 0.003215789794921875, "step": 1748} {"info/global_step": 1749, "train_info/time_within_train_step": 3.3362162113189697, "step": 1749} {"train_info/time_between_train_steps": 0.003118753433227539, "step": 1749} {"info/global_step": 1750, "train_info/time_within_train_step": 2.7555572986602783, "step": 1750} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746571109, "_runtime": 5118}, "step": 1750} {"logs": {"train/loss": 4.5108, "train/learning_rate": 0.0005499999999999999, "train/epoch": 2.0, "_timestamp": 1746571109, "_runtime": 5118}, "step": 1750} {"train_info/time_between_train_steps": 0.011041402816772461, "step": 1750} {"info/global_step": 1751, "train_info/time_within_train_step": 2.7544000148773193, "step": 1751} {"train_info/time_between_train_steps": 0.0032215118408203125, "step": 1751} {"info/global_step": 1752, "train_info/time_within_train_step": 2.7527382373809814, "step": 1752} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 1752} {"info/global_step": 1753, "train_info/time_within_train_step": 2.755333662033081, "step": 1753} {"train_info/time_between_train_steps": 0.0032258033752441406, "step": 1753} {"info/global_step": 1754, "train_info/time_within_train_step": 2.755114793777466, "step": 1754} {"train_info/time_between_train_steps": 0.003123044967651367, "step": 1754} {"info/global_step": 1755, "train_info/time_within_train_step": 2.7551803588867188, "step": 1755} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 1755} {"info/global_step": 1756, "train_info/time_within_train_step": 2.754689931869507, "step": 1756} {"train_info/time_between_train_steps": 0.0032036304473876953, "step": 1756} {"info/global_step": 1757, "train_info/time_within_train_step": 2.7552826404571533, "step": 1757} {"train_info/time_between_train_steps": 0.003124713897705078, "step": 1757} {"info/global_step": 1758, "train_info/time_within_train_step": 2.7538881301879883, "step": 1758} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 1758} {"info/global_step": 1759, "train_info/time_within_train_step": 2.958641529083252, "step": 1759} {"train_info/time_between_train_steps": 0.0031585693359375, "step": 1759} {"info/global_step": 1760, "train_info/time_within_train_step": 2.7554962635040283, "step": 1760} {"train_info/time_between_train_steps": 0.0031871795654296875, "step": 1760} {"info/global_step": 1761, "train_info/time_within_train_step": 2.754829168319702, "step": 1761} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 1761} {"info/global_step": 1762, "train_info/time_within_train_step": 2.754350185394287, "step": 1762} {"train_info/time_between_train_steps": 0.0032205581665039062, "step": 1762} {"info/global_step": 1763, "train_info/time_within_train_step": 2.7545459270477295, "step": 1763} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 1763} {"info/global_step": 1764, "train_info/time_within_train_step": 2.7546746730804443, "step": 1764} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 1764} {"info/global_step": 1765, "train_info/time_within_train_step": 2.7556378841400146, "step": 1765} {"train_info/time_between_train_steps": 0.0032134056091308594, "step": 1765} {"info/global_step": 1766, "train_info/time_within_train_step": 2.7550148963928223, "step": 1766} {"train_info/time_between_train_steps": 0.003197908401489258, "step": 1766} {"info/global_step": 1767, "train_info/time_within_train_step": 2.755650281906128, "step": 1767} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 1767} {"info/global_step": 1768, "train_info/time_within_train_step": 2.75384521484375, "step": 1768} {"train_info/time_between_train_steps": 0.0031197071075439453, "step": 1768} {"info/global_step": 1769, "train_info/time_within_train_step": 2.8739545345306396, "step": 1769} {"train_info/time_between_train_steps": 0.0031218528747558594, "step": 1769} {"info/global_step": 1770, "train_info/time_within_train_step": 2.754957437515259, "step": 1770} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 1770} {"info/global_step": 1771, "train_info/time_within_train_step": 2.754551410675049, "step": 1771} {"train_info/time_between_train_steps": 0.0031228065490722656, "step": 1771} {"info/global_step": 1772, "train_info/time_within_train_step": 2.7547664642333984, "step": 1772} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 1772} {"info/global_step": 1773, "train_info/time_within_train_step": 2.7546095848083496, "step": 1773} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 1773} {"info/global_step": 1774, "train_info/time_within_train_step": 2.753206253051758, "step": 1774} {"train_info/time_between_train_steps": 0.0032269954681396484, "step": 1774} {"info/global_step": 1775, "train_info/time_within_train_step": 2.754369020462036, "step": 1775} {"train_info/time_between_train_steps": 0.003134012222290039, "step": 1775} {"info/global_step": 1776, "train_info/time_within_train_step": 2.7549216747283936, "step": 1776} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 1776} {"info/global_step": 1777, "train_info/time_within_train_step": 2.7519750595092773, "step": 1777} {"train_info/time_between_train_steps": 0.0032346248626708984, "step": 1777} {"info/global_step": 1778, "train_info/time_within_train_step": 2.7557034492492676, "step": 1778} {"train_info/time_between_train_steps": 0.003137826919555664, "step": 1778} {"info/global_step": 1779, "train_info/time_within_train_step": 2.755155086517334, "step": 1779} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 1779} {"info/global_step": 1780, "train_info/time_within_train_step": 2.7542316913604736, "step": 1780} {"train_info/time_between_train_steps": 0.0031321048736572266, "step": 1780} {"info/global_step": 1781, "train_info/time_within_train_step": 2.7545359134674072, "step": 1781} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 1781} {"info/global_step": 1782, "train_info/time_within_train_step": 2.7556986808776855, "step": 1782} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 1782} {"info/global_step": 1783, "train_info/time_within_train_step": 2.754453182220459, "step": 1783} {"train_info/time_between_train_steps": 0.003160238265991211, "step": 1783} {"info/global_step": 1784, "train_info/time_within_train_step": 2.751211166381836, "step": 1784} {"train_info/time_between_train_steps": 0.0031392574310302734, "step": 1784} {"info/global_step": 1785, "train_info/time_within_train_step": 2.7546212673187256, "step": 1785} {"train_info/time_between_train_steps": 0.003636598587036133, "step": 1785} {"info/global_step": 1786, "train_info/time_within_train_step": 2.7524380683898926, "step": 1786} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 1786} {"info/global_step": 1787, "train_info/time_within_train_step": 2.751729726791382, "step": 1787} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 1787} {"info/global_step": 1788, "train_info/time_within_train_step": 2.754155397415161, "step": 1788} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 1788} {"info/global_step": 1789, "train_info/time_within_train_step": 2.7545559406280518, "step": 1789} {"train_info/time_between_train_steps": 0.003098726272583008, "step": 1789} {"info/global_step": 1790, "train_info/time_within_train_step": 2.7519984245300293, "step": 1790} {"train_info/time_between_train_steps": 0.003153085708618164, "step": 1790} {"info/global_step": 1791, "train_info/time_within_train_step": 2.7531661987304688, "step": 1791} {"train_info/time_between_train_steps": 0.0031125545501708984, "step": 1791} {"info/global_step": 1792, "train_info/time_within_train_step": 2.7552223205566406, "step": 1792} {"train_info/time_between_train_steps": 0.003111124038696289, "step": 1792} {"info/global_step": 1793, "train_info/time_within_train_step": 2.7544541358947754, "step": 1793} {"train_info/time_between_train_steps": 0.0031070709228515625, "step": 1793} {"info/global_step": 1794, "train_info/time_within_train_step": 2.752857208251953, "step": 1794} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 1794} {"info/global_step": 1795, "train_info/time_within_train_step": 2.7539894580841064, "step": 1795} {"train_info/time_between_train_steps": 0.003103971481323242, "step": 1795} {"info/global_step": 1796, "train_info/time_within_train_step": 2.7549171447753906, "step": 1796} {"train_info/time_between_train_steps": 0.003153085708618164, "step": 1796} {"info/global_step": 1797, "train_info/time_within_train_step": 2.753413438796997, "step": 1797} {"train_info/time_between_train_steps": 0.0031120777130126953, "step": 1797} {"info/global_step": 1798, "train_info/time_within_train_step": 2.753904104232788, "step": 1798} {"train_info/time_between_train_steps": 0.003104686737060547, "step": 1798} {"info/global_step": 1799, "train_info/time_within_train_step": 2.754603147506714, "step": 1799} {"train_info/time_between_train_steps": 0.0031065940856933594, "step": 1799} {"info/global_step": 1800, "train_info/time_within_train_step": 2.754464864730835, "step": 1800} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746571247, "_runtime": 5256}, "step": 1800} {"logs": {"train/loss": 4.4314, "train/learning_rate": 0.0005466666666666667, "train/epoch": 2.01, "_timestamp": 1746571247, "_runtime": 5256}, "step": 1800} {"train_info/time_between_train_steps": 38.42958307266235, "step": 1800} {"info/global_step": 1801, "train_info/time_within_train_step": 2.5250189304351807, "step": 1801} {"train_info/time_between_train_steps": 0.0032711029052734375, "step": 1801} {"info/global_step": 1802, "train_info/time_within_train_step": 2.5721659660339355, "step": 1802} {"train_info/time_between_train_steps": 0.00310516357421875, "step": 1802} {"info/global_step": 1803, "train_info/time_within_train_step": 2.7105860710144043, "step": 1803} {"train_info/time_between_train_steps": 0.003139019012451172, "step": 1803} {"info/global_step": 1804, "train_info/time_within_train_step": 2.7027018070220947, "step": 1804} {"train_info/time_between_train_steps": 0.0031404495239257812, "step": 1804} {"info/global_step": 1805, "train_info/time_within_train_step": 2.7098653316497803, "step": 1805} {"train_info/time_between_train_steps": 0.003110647201538086, "step": 1805} {"info/global_step": 1806, "train_info/time_within_train_step": 2.734187364578247, "step": 1806} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 1806} {"info/global_step": 1807, "train_info/time_within_train_step": 2.7531070709228516, "step": 1807} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 1807} {"info/global_step": 1808, "train_info/time_within_train_step": 2.75582218170166, "step": 1808} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 1808} {"info/global_step": 1809, "train_info/time_within_train_step": 2.7545433044433594, "step": 1809} {"train_info/time_between_train_steps": 0.0031585693359375, "step": 1809} {"info/global_step": 1810, "train_info/time_within_train_step": 2.755838394165039, "step": 1810} {"train_info/time_between_train_steps": 0.0031075477600097656, "step": 1810} {"info/global_step": 1811, "train_info/time_within_train_step": 2.753899574279785, "step": 1811} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 1811} {"info/global_step": 1812, "train_info/time_within_train_step": 2.757497787475586, "step": 1812} {"train_info/time_between_train_steps": 0.0033473968505859375, "step": 1812} {"info/global_step": 1813, "train_info/time_within_train_step": 2.7555630207061768, "step": 1813} {"train_info/time_between_train_steps": 0.0032668113708496094, "step": 1813} {"info/global_step": 1814, "train_info/time_within_train_step": 2.756211042404175, "step": 1814} {"train_info/time_between_train_steps": 0.0032296180725097656, "step": 1814} {"info/global_step": 1815, "train_info/time_within_train_step": 2.756196975708008, "step": 1815} {"train_info/time_between_train_steps": 0.0032646656036376953, "step": 1815} {"info/global_step": 1816, "train_info/time_within_train_step": 2.7559072971343994, "step": 1816} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 1816} {"info/global_step": 1817, "train_info/time_within_train_step": 2.7564682960510254, "step": 1817} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 1817} {"info/global_step": 1818, "train_info/time_within_train_step": 2.7562332153320312, "step": 1818} {"train_info/time_between_train_steps": 0.003148317337036133, "step": 1818} {"info/global_step": 1819, "train_info/time_within_train_step": 2.7568581104278564, "step": 1819} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 1819} {"info/global_step": 1820, "train_info/time_within_train_step": 2.9981236457824707, "step": 1820} {"train_info/time_between_train_steps": 0.003276348114013672, "step": 1820} {"info/global_step": 1821, "train_info/time_within_train_step": 2.7567481994628906, "step": 1821} {"train_info/time_between_train_steps": 0.003319263458251953, "step": 1821} {"info/global_step": 1822, "train_info/time_within_train_step": 2.7544450759887695, "step": 1822} {"train_info/time_between_train_steps": 0.003280162811279297, "step": 1822} {"info/global_step": 1823, "train_info/time_within_train_step": 2.7555487155914307, "step": 1823} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 1823} {"info/global_step": 1824, "train_info/time_within_train_step": 2.7563319206237793, "step": 1824} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 1824} {"info/global_step": 1825, "train_info/time_within_train_step": 2.7556838989257812, "step": 1825} {"train_info/time_between_train_steps": 0.003270387649536133, "step": 1825} {"info/global_step": 1826, "train_info/time_within_train_step": 2.757028102874756, "step": 1826} {"train_info/time_between_train_steps": 0.0032241344451904297, "step": 1826} {"info/global_step": 1827, "train_info/time_within_train_step": 2.7572734355926514, "step": 1827} {"train_info/time_between_train_steps": 0.0032472610473632812, "step": 1827} {"info/global_step": 1828, "train_info/time_within_train_step": 2.757481575012207, "step": 1828} {"train_info/time_between_train_steps": 0.0030934810638427734, "step": 1828} {"info/global_step": 1829, "train_info/time_within_train_step": 2.7558794021606445, "step": 1829} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 1829} {"info/global_step": 1830, "train_info/time_within_train_step": 2.756279945373535, "step": 1830} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 1830} {"info/global_step": 1831, "train_info/time_within_train_step": 2.755303382873535, "step": 1831} {"train_info/time_between_train_steps": 0.13422322273254395, "step": 1831} {"info/global_step": 1832, "train_info/time_within_train_step": 2.773402690887451, "step": 1832} {"train_info/time_between_train_steps": 0.0031690597534179688, "step": 1832} {"info/global_step": 1833, "train_info/time_within_train_step": 2.7555830478668213, "step": 1833} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 1833} {"info/global_step": 1834, "train_info/time_within_train_step": 2.7564339637756348, "step": 1834} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 1834} {"info/global_step": 1835, "train_info/time_within_train_step": 2.7564857006073, "step": 1835} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 1835} {"info/global_step": 1836, "train_info/time_within_train_step": 2.756943941116333, "step": 1836} {"train_info/time_between_train_steps": 0.003117084503173828, "step": 1836} {"info/global_step": 1837, "train_info/time_within_train_step": 2.7557320594787598, "step": 1837} {"train_info/time_between_train_steps": 0.0032520294189453125, "step": 1837} {"info/global_step": 1838, "train_info/time_within_train_step": 2.755683183670044, "step": 1838} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 1838} {"info/global_step": 1839, "train_info/time_within_train_step": 2.758068561553955, "step": 1839} {"train_info/time_between_train_steps": 0.003223896026611328, "step": 1839} {"info/global_step": 1840, "train_info/time_within_train_step": 2.7555079460144043, "step": 1840} {"train_info/time_between_train_steps": 0.0032536983489990234, "step": 1840} {"info/global_step": 1841, "train_info/time_within_train_step": 2.755176544189453, "step": 1841} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 1841} {"info/global_step": 1842, "train_info/time_within_train_step": 2.754868745803833, "step": 1842} {"train_info/time_between_train_steps": 0.0032052993774414062, "step": 1842} {"info/global_step": 1843, "train_info/time_within_train_step": 2.755547523498535, "step": 1843} {"train_info/time_between_train_steps": 0.0032281875610351562, "step": 1843} {"info/global_step": 1844, "train_info/time_within_train_step": 2.755621910095215, "step": 1844} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 1844} {"info/global_step": 1845, "train_info/time_within_train_step": 2.755714178085327, "step": 1845} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 1845} {"info/global_step": 1846, "train_info/time_within_train_step": 2.7555739879608154, "step": 1846} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 1846} {"info/global_step": 1847, "train_info/time_within_train_step": 2.7549660205841064, "step": 1847} {"train_info/time_between_train_steps": 0.003123760223388672, "step": 1847} {"info/global_step": 1848, "train_info/time_within_train_step": 2.7555179595947266, "step": 1848} {"train_info/time_between_train_steps": 0.003204345703125, "step": 1848} {"info/global_step": 1849, "train_info/time_within_train_step": 2.7537965774536133, "step": 1849} {"train_info/time_between_train_steps": 0.003187417984008789, "step": 1849} {"info/global_step": 1850, "train_info/time_within_train_step": 2.7559125423431396, "step": 1850} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746571424, "_runtime": 5433}, "step": 1850} {"logs": {"train/loss": 4.408, "train/learning_rate": 0.0005433333333333333, "train/epoch": 2.01, "_timestamp": 1746571424, "_runtime": 5433}, "step": 1850} {"train_info/time_between_train_steps": 0.012602567672729492, "step": 1850} {"info/global_step": 1851, "train_info/time_within_train_step": 2.754363536834717, "step": 1851} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 1851} {"info/global_step": 1852, "train_info/time_within_train_step": 2.755547523498535, "step": 1852} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 1852} {"info/global_step": 1853, "train_info/time_within_train_step": 2.7558839321136475, "step": 1853} {"train_info/time_between_train_steps": 0.0032134056091308594, "step": 1853} {"info/global_step": 1854, "train_info/time_within_train_step": 2.756037473678589, "step": 1854} {"train_info/time_between_train_steps": 0.0031614303588867188, "step": 1854} {"info/global_step": 1855, "train_info/time_within_train_step": 2.7556042671203613, "step": 1855} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 1855} {"info/global_step": 1856, "train_info/time_within_train_step": 2.756239891052246, "step": 1856} {"train_info/time_between_train_steps": 0.0031337738037109375, "step": 1856} {"info/global_step": 1857, "train_info/time_within_train_step": 2.754323720932007, "step": 1857} {"train_info/time_between_train_steps": 0.0032303333282470703, "step": 1857} {"info/global_step": 1858, "train_info/time_within_train_step": 2.7547929286956787, "step": 1858} {"train_info/time_between_train_steps": 0.0032012462615966797, "step": 1858} {"info/global_step": 1859, "train_info/time_within_train_step": 2.7554585933685303, "step": 1859} {"train_info/time_between_train_steps": 0.0032377243041992188, "step": 1859} {"info/global_step": 1860, "train_info/time_within_train_step": 2.755934953689575, "step": 1860} {"train_info/time_between_train_steps": 0.0032312870025634766, "step": 1860} {"info/global_step": 1861, "train_info/time_within_train_step": 2.7527542114257812, "step": 1861} {"train_info/time_between_train_steps": 0.003191232681274414, "step": 1861} {"info/global_step": 1862, "train_info/time_within_train_step": 2.755763053894043, "step": 1862} {"train_info/time_between_train_steps": 0.0032415390014648438, "step": 1862} {"info/global_step": 1863, "train_info/time_within_train_step": 2.754049301147461, "step": 1863} {"train_info/time_between_train_steps": 0.003148317337036133, "step": 1863} {"info/global_step": 1864, "train_info/time_within_train_step": 2.7552270889282227, "step": 1864} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 1864} {"info/global_step": 1865, "train_info/time_within_train_step": 2.7541656494140625, "step": 1865} {"train_info/time_between_train_steps": 0.0032105445861816406, "step": 1865} {"info/global_step": 1866, "train_info/time_within_train_step": 2.755216598510742, "step": 1866} {"train_info/time_between_train_steps": 0.004676103591918945, "step": 1866} {"info/global_step": 1867, "train_info/time_within_train_step": 2.756072759628296, "step": 1867} {"train_info/time_between_train_steps": 0.003203868865966797, "step": 1867} {"info/global_step": 1868, "train_info/time_within_train_step": 2.7553012371063232, "step": 1868} {"train_info/time_between_train_steps": 0.003221273422241211, "step": 1868} {"info/global_step": 1869, "train_info/time_within_train_step": 2.7563297748565674, "step": 1869} {"train_info/time_between_train_steps": 0.003208637237548828, "step": 1869} {"info/global_step": 1870, "train_info/time_within_train_step": 2.75601863861084, "step": 1870} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 1870} {"info/global_step": 1871, "train_info/time_within_train_step": 2.7554802894592285, "step": 1871} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 1871} {"info/global_step": 1872, "train_info/time_within_train_step": 2.7561347484588623, "step": 1872} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 1872} {"info/global_step": 1873, "train_info/time_within_train_step": 2.7559847831726074, "step": 1873} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 1873} {"info/global_step": 1874, "train_info/time_within_train_step": 2.993623971939087, "step": 1874} {"train_info/time_between_train_steps": 0.003111124038696289, "step": 1874} {"info/global_step": 1875, "train_info/time_within_train_step": 2.755767345428467, "step": 1875} {"train_info/time_between_train_steps": 0.003134489059448242, "step": 1875} {"info/global_step": 1876, "train_info/time_within_train_step": 2.755343437194824, "step": 1876} {"train_info/time_between_train_steps": 0.0031304359436035156, "step": 1876} {"info/global_step": 1877, "train_info/time_within_train_step": 2.754007577896118, "step": 1877} {"train_info/time_between_train_steps": 0.0031173229217529297, "step": 1877} {"info/global_step": 1878, "train_info/time_within_train_step": 2.755065441131592, "step": 1878} {"train_info/time_between_train_steps": 0.00313568115234375, "step": 1878} {"info/global_step": 1879, "train_info/time_within_train_step": 2.7554385662078857, "step": 1879} {"train_info/time_between_train_steps": 0.0030961036682128906, "step": 1879} {"info/global_step": 1880, "train_info/time_within_train_step": 2.754979133605957, "step": 1880} {"train_info/time_between_train_steps": 0.003096342086791992, "step": 1880} {"info/global_step": 1881, "train_info/time_within_train_step": 2.7544875144958496, "step": 1881} {"train_info/time_between_train_steps": 0.0031096935272216797, "step": 1881} {"info/global_step": 1882, "train_info/time_within_train_step": 2.7560837268829346, "step": 1882} {"train_info/time_between_train_steps": 0.0031058788299560547, "step": 1882} {"info/global_step": 1883, "train_info/time_within_train_step": 2.7555813789367676, "step": 1883} {"train_info/time_between_train_steps": 0.0031173229217529297, "step": 1883} {"info/global_step": 1884, "train_info/time_within_train_step": 2.7542004585266113, "step": 1884} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 1884} {"info/global_step": 1885, "train_info/time_within_train_step": 2.756270170211792, "step": 1885} {"train_info/time_between_train_steps": 0.003118276596069336, "step": 1885} {"info/global_step": 1886, "train_info/time_within_train_step": 2.7560036182403564, "step": 1886} {"train_info/time_between_train_steps": 0.003162384033203125, "step": 1886} {"info/global_step": 1887, "train_info/time_within_train_step": 2.7543811798095703, "step": 1887} {"train_info/time_between_train_steps": 0.003100872039794922, "step": 1887} {"info/global_step": 1888, "train_info/time_within_train_step": 2.7561726570129395, "step": 1888} {"train_info/time_between_train_steps": 0.0031075477600097656, "step": 1888} {"info/global_step": 1889, "train_info/time_within_train_step": 2.7563328742980957, "step": 1889} {"train_info/time_between_train_steps": 0.0031256675720214844, "step": 1889} {"info/global_step": 1890, "train_info/time_within_train_step": 2.7558767795562744, "step": 1890} {"train_info/time_between_train_steps": 0.0031402111053466797, "step": 1890} {"info/global_step": 1891, "train_info/time_within_train_step": 2.7562546730041504, "step": 1891} {"train_info/time_between_train_steps": 0.003131866455078125, "step": 1891} {"info/global_step": 1892, "train_info/time_within_train_step": 2.7555055618286133, "step": 1892} {"train_info/time_between_train_steps": 0.003145456314086914, "step": 1892} {"info/global_step": 1893, "train_info/time_within_train_step": 2.759039878845215, "step": 1893} {"train_info/time_between_train_steps": 0.003251314163208008, "step": 1893} {"info/global_step": 1894, "train_info/time_within_train_step": 2.886793375015259, "step": 1894} {"train_info/time_between_train_steps": 0.003244638442993164, "step": 1894} {"info/global_step": 1895, "train_info/time_within_train_step": 2.75671648979187, "step": 1895} {"train_info/time_between_train_steps": 0.0033364295959472656, "step": 1895} {"info/global_step": 1896, "train_info/time_within_train_step": 2.7554874420166016, "step": 1896} {"train_info/time_between_train_steps": 0.003223896026611328, "step": 1896} {"info/global_step": 1897, "train_info/time_within_train_step": 2.7565197944641113, "step": 1897} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 1897} {"info/global_step": 1898, "train_info/time_within_train_step": 2.7550125122070312, "step": 1898} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 1898} {"info/global_step": 1899, "train_info/time_within_train_step": 2.7547147274017334, "step": 1899} {"train_info/time_between_train_steps": 0.003109455108642578, "step": 1899} {"info/global_step": 1900, "train_info/time_within_train_step": 2.754686117172241, "step": 1900} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746571563, "_runtime": 5572}, "step": 1900} {"logs": {"train/loss": 4.3868, "train/learning_rate": 0.00054, "train/epoch": 2.02, "_timestamp": 1746571563, "_runtime": 5572}, "step": 1900} {"train_info/time_between_train_steps": 0.013178110122680664, "step": 1900} {"info/global_step": 1901, "train_info/time_within_train_step": 2.7534306049346924, "step": 1901} {"train_info/time_between_train_steps": 0.0031409263610839844, "step": 1901} {"info/global_step": 1902, "train_info/time_within_train_step": 2.7546379566192627, "step": 1902} {"train_info/time_between_train_steps": 0.0031871795654296875, "step": 1902} {"info/global_step": 1903, "train_info/time_within_train_step": 2.7556540966033936, "step": 1903} {"train_info/time_between_train_steps": 0.003225564956665039, "step": 1903} {"info/global_step": 1904, "train_info/time_within_train_step": 2.7559235095977783, "step": 1904} {"train_info/time_between_train_steps": 0.0031669139862060547, "step": 1904} {"info/global_step": 1905, "train_info/time_within_train_step": 2.7552132606506348, "step": 1905} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 1905} {"info/global_step": 1906, "train_info/time_within_train_step": 2.756225109100342, "step": 1906} {"train_info/time_between_train_steps": 0.003141641616821289, "step": 1906} {"info/global_step": 1907, "train_info/time_within_train_step": 2.757108688354492, "step": 1907} {"train_info/time_between_train_steps": 0.0031359195709228516, "step": 1907} {"info/global_step": 1908, "train_info/time_within_train_step": 2.7558350563049316, "step": 1908} {"train_info/time_between_train_steps": 0.0031502246856689453, "step": 1908} {"info/global_step": 1909, "train_info/time_within_train_step": 2.7555558681488037, "step": 1909} {"train_info/time_between_train_steps": 0.003192424774169922, "step": 1909} {"info/global_step": 1910, "train_info/time_within_train_step": 2.755574941635132, "step": 1910} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 1910} {"info/global_step": 1911, "train_info/time_within_train_step": 2.7551674842834473, "step": 1911} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 1911} {"info/global_step": 1912, "train_info/time_within_train_step": 2.7557194232940674, "step": 1912} {"train_info/time_between_train_steps": 0.0031862258911132812, "step": 1912} {"info/global_step": 1913, "train_info/time_within_train_step": 2.9859981536865234, "step": 1913} {"train_info/time_between_train_steps": 0.003122568130493164, "step": 1913} {"info/global_step": 1914, "train_info/time_within_train_step": 2.753958225250244, "step": 1914} {"train_info/time_between_train_steps": 0.003101348876953125, "step": 1914} {"info/global_step": 1915, "train_info/time_within_train_step": 2.7538201808929443, "step": 1915} {"train_info/time_between_train_steps": 0.003160715103149414, "step": 1915} {"info/global_step": 1916, "train_info/time_within_train_step": 2.7527167797088623, "step": 1916} {"train_info/time_between_train_steps": 0.003125905990600586, "step": 1916} {"info/global_step": 1917, "train_info/time_within_train_step": 2.7543580532073975, "step": 1917} {"train_info/time_between_train_steps": 0.003113269805908203, "step": 1917} {"info/global_step": 1918, "train_info/time_within_train_step": 2.7541990280151367, "step": 1918} {"train_info/time_between_train_steps": 0.0031325817108154297, "step": 1918} {"info/global_step": 1919, "train_info/time_within_train_step": 2.7537484169006348, "step": 1919} {"train_info/time_between_train_steps": 0.0030889511108398438, "step": 1919} {"info/global_step": 1920, "train_info/time_within_train_step": 2.7556264400482178, "step": 1920} {"train_info/time_between_train_steps": 0.003113985061645508, "step": 1920} {"info/global_step": 1921, "train_info/time_within_train_step": 2.7805025577545166, "step": 1921} {"train_info/time_between_train_steps": 0.003153085708618164, "step": 1921} {"info/global_step": 1922, "train_info/time_within_train_step": 2.754956007003784, "step": 1922} {"train_info/time_between_train_steps": 0.0030965805053710938, "step": 1922} {"info/global_step": 1923, "train_info/time_within_train_step": 2.7548203468322754, "step": 1923} {"train_info/time_between_train_steps": 0.0031354427337646484, "step": 1923} {"info/global_step": 1924, "train_info/time_within_train_step": 2.7561168670654297, "step": 1924} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 1924} {"info/global_step": 1925, "train_info/time_within_train_step": 2.7544853687286377, "step": 1925} {"train_info/time_between_train_steps": 0.003125429153442383, "step": 1925} {"info/global_step": 1926, "train_info/time_within_train_step": 2.7579431533813477, "step": 1926} {"train_info/time_between_train_steps": 0.00313568115234375, "step": 1926} {"info/global_step": 1927, "train_info/time_within_train_step": 2.7555274963378906, "step": 1927} {"train_info/time_between_train_steps": 0.003114938735961914, "step": 1927} {"info/global_step": 1928, "train_info/time_within_train_step": 2.7550487518310547, "step": 1928} {"train_info/time_between_train_steps": 0.0031714439392089844, "step": 1928} {"info/global_step": 1929, "train_info/time_within_train_step": 2.754732131958008, "step": 1929} {"train_info/time_between_train_steps": 0.0031294822692871094, "step": 1929} {"info/global_step": 1930, "train_info/time_within_train_step": 2.753617525100708, "step": 1930} {"train_info/time_between_train_steps": 0.0031282901763916016, "step": 1930} {"info/global_step": 1931, "train_info/time_within_train_step": 2.752532958984375, "step": 1931} {"train_info/time_between_train_steps": 0.00313568115234375, "step": 1931} {"info/global_step": 1932, "train_info/time_within_train_step": 2.752869129180908, "step": 1932} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 1932} {"info/global_step": 1933, "train_info/time_within_train_step": 2.754685401916504, "step": 1933} {"train_info/time_between_train_steps": 0.003108978271484375, "step": 1933} {"info/global_step": 1934, "train_info/time_within_train_step": 2.7556560039520264, "step": 1934} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 1934} {"info/global_step": 1935, "train_info/time_within_train_step": 2.755197048187256, "step": 1935} {"train_info/time_between_train_steps": 0.003141641616821289, "step": 1935} {"info/global_step": 1936, "train_info/time_within_train_step": 2.755180835723877, "step": 1936} {"train_info/time_between_train_steps": 0.003110170364379883, "step": 1936} {"info/global_step": 1937, "train_info/time_within_train_step": 2.7551255226135254, "step": 1937} {"train_info/time_between_train_steps": 0.003113269805908203, "step": 1937} {"info/global_step": 1938, "train_info/time_within_train_step": 2.755932092666626, "step": 1938} {"train_info/time_between_train_steps": 0.003131389617919922, "step": 1938} {"info/global_step": 1939, "train_info/time_within_train_step": 2.755568027496338, "step": 1939} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 1939} {"info/global_step": 1940, "train_info/time_within_train_step": 2.75570011138916, "step": 1940} {"train_info/time_between_train_steps": 0.003099203109741211, "step": 1940} {"info/global_step": 1941, "train_info/time_within_train_step": 2.7541604042053223, "step": 1941} {"train_info/time_between_train_steps": 0.003167390823364258, "step": 1941} {"info/global_step": 1942, "train_info/time_within_train_step": 2.754155158996582, "step": 1942} {"train_info/time_between_train_steps": 0.003115415573120117, "step": 1942} {"info/global_step": 1943, "train_info/time_within_train_step": 2.756474018096924, "step": 1943} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 1943} {"info/global_step": 1944, "train_info/time_within_train_step": 2.7555952072143555, "step": 1944} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 1944} {"info/global_step": 1945, "train_info/time_within_train_step": 2.7541379928588867, "step": 1945} {"train_info/time_between_train_steps": 0.0031118392944335938, "step": 1945} {"info/global_step": 1946, "train_info/time_within_train_step": 2.7543230056762695, "step": 1946} {"train_info/time_between_train_steps": 0.003124713897705078, "step": 1946} {"info/global_step": 1947, "train_info/time_within_train_step": 2.756406784057617, "step": 1947} {"train_info/time_between_train_steps": 0.0031151771545410156, "step": 1947} {"info/global_step": 1948, "train_info/time_within_train_step": 2.7546277046203613, "step": 1948} {"train_info/time_between_train_steps": 0.0030972957611083984, "step": 1948} {"info/global_step": 1949, "train_info/time_within_train_step": 2.7551472187042236, "step": 1949} {"train_info/time_between_train_steps": 0.003122568130493164, "step": 1949} {"info/global_step": 1950, "train_info/time_within_train_step": 2.7518389225006104, "step": 1950} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746571702, "_runtime": 5711}, "step": 1950} {"logs": {"train/loss": 4.3636, "train/learning_rate": 0.0005366666666666666, "train/epoch": 2.02, "_timestamp": 1746571702, "_runtime": 5711}, "step": 1950} {"train_info/time_between_train_steps": 0.014369010925292969, "step": 1950} {"info/global_step": 1951, "train_info/time_within_train_step": 2.7559010982513428, "step": 1951} {"train_info/time_between_train_steps": 0.0031042098999023438, "step": 1951} {"info/global_step": 1952, "train_info/time_within_train_step": 2.755201578140259, "step": 1952} {"train_info/time_between_train_steps": 0.0031294822692871094, "step": 1952} {"info/global_step": 1953, "train_info/time_within_train_step": 2.7557342052459717, "step": 1953} {"train_info/time_between_train_steps": 0.003111600875854492, "step": 1953} {"info/global_step": 1954, "train_info/time_within_train_step": 2.755683660507202, "step": 1954} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 1954} {"info/global_step": 1955, "train_info/time_within_train_step": 2.7559351921081543, "step": 1955} {"train_info/time_between_train_steps": 0.003291606903076172, "step": 1955} {"info/global_step": 1956, "train_info/time_within_train_step": 2.7559196949005127, "step": 1956} {"train_info/time_between_train_steps": 0.13164949417114258, "step": 1956} {"info/global_step": 1957, "train_info/time_within_train_step": 2.7551302909851074, "step": 1957} {"train_info/time_between_train_steps": 0.0031363964080810547, "step": 1957} {"info/global_step": 1958, "train_info/time_within_train_step": 2.757535457611084, "step": 1958} {"train_info/time_between_train_steps": 0.0031404495239257812, "step": 1958} {"info/global_step": 1959, "train_info/time_within_train_step": 2.754753589630127, "step": 1959} {"train_info/time_between_train_steps": 0.003187417984008789, "step": 1959} {"info/global_step": 1960, "train_info/time_within_train_step": 2.755699872970581, "step": 1960} {"train_info/time_between_train_steps": 0.003122568130493164, "step": 1960} {"info/global_step": 1961, "train_info/time_within_train_step": 2.755242109298706, "step": 1961} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 1961} {"info/global_step": 1962, "train_info/time_within_train_step": 2.7539775371551514, "step": 1962} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 1962} {"info/global_step": 1963, "train_info/time_within_train_step": 2.750925064086914, "step": 1963} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 1963} {"info/global_step": 1964, "train_info/time_within_train_step": 2.7545342445373535, "step": 1964} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 1964} {"info/global_step": 1965, "train_info/time_within_train_step": 2.75494647026062, "step": 1965} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 1965} {"info/global_step": 1966, "train_info/time_within_train_step": 2.7561426162719727, "step": 1966} {"train_info/time_between_train_steps": 0.0031571388244628906, "step": 1966} {"info/global_step": 1967, "train_info/time_within_train_step": 2.755699634552002, "step": 1967} {"train_info/time_between_train_steps": 0.0031321048736572266, "step": 1967} {"info/global_step": 1968, "train_info/time_within_train_step": 2.755829095840454, "step": 1968} {"train_info/time_between_train_steps": 0.003138303756713867, "step": 1968} {"info/global_step": 1969, "train_info/time_within_train_step": 2.7557473182678223, "step": 1969} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 1969} {"info/global_step": 1970, "train_info/time_within_train_step": 2.7553629875183105, "step": 1970} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 1970} {"info/global_step": 1971, "train_info/time_within_train_step": 2.754739999771118, "step": 1971} {"train_info/time_between_train_steps": 0.003124713897705078, "step": 1971} {"info/global_step": 1972, "train_info/time_within_train_step": 2.7550415992736816, "step": 1972} {"train_info/time_between_train_steps": 0.003145456314086914, "step": 1972} {"info/global_step": 1973, "train_info/time_within_train_step": 2.755072832107544, "step": 1973} {"train_info/time_between_train_steps": 0.0031423568725585938, "step": 1973} {"info/global_step": 1974, "train_info/time_within_train_step": 2.7556939125061035, "step": 1974} {"train_info/time_between_train_steps": 0.0031156539916992188, "step": 1974} {"info/global_step": 1975, "train_info/time_within_train_step": 2.7538530826568604, "step": 1975} {"train_info/time_between_train_steps": 0.003143787384033203, "step": 1975} {"info/global_step": 1976, "train_info/time_within_train_step": 2.7549145221710205, "step": 1976} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 1976} {"info/global_step": 1977, "train_info/time_within_train_step": 2.7532742023468018, "step": 1977} {"train_info/time_between_train_steps": 0.0032057762145996094, "step": 1977} {"info/global_step": 1978, "train_info/time_within_train_step": 2.75514817237854, "step": 1978} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 1978} {"info/global_step": 1979, "train_info/time_within_train_step": 2.755660057067871, "step": 1979} {"train_info/time_between_train_steps": 0.0031538009643554688, "step": 1979} {"info/global_step": 1980, "train_info/time_within_train_step": 2.7550833225250244, "step": 1980} {"train_info/time_between_train_steps": 0.003125905990600586, "step": 1980} {"info/global_step": 1981, "train_info/time_within_train_step": 2.754366159439087, "step": 1981} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 1981} {"info/global_step": 1982, "train_info/time_within_train_step": 2.75455379486084, "step": 1982} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 1982} {"info/global_step": 1983, "train_info/time_within_train_step": 2.7548749446868896, "step": 1983} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 1983} {"info/global_step": 1984, "train_info/time_within_train_step": 2.754960536956787, "step": 1984} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 1984} {"info/global_step": 1985, "train_info/time_within_train_step": 2.7528076171875, "step": 1985} {"train_info/time_between_train_steps": 0.003103494644165039, "step": 1985} {"info/global_step": 1986, "train_info/time_within_train_step": 2.754364013671875, "step": 1986} {"train_info/time_between_train_steps": 0.0031228065490722656, "step": 1986} {"info/global_step": 1987, "train_info/time_within_train_step": 2.755068063735962, "step": 1987} {"train_info/time_between_train_steps": 0.0031371116638183594, "step": 1987} {"info/global_step": 1988, "train_info/time_within_train_step": 2.75575852394104, "step": 1988} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 1988} {"info/global_step": 1989, "train_info/time_within_train_step": 2.754909038543701, "step": 1989} {"train_info/time_between_train_steps": 0.003108978271484375, "step": 1989} {"info/global_step": 1990, "train_info/time_within_train_step": 2.755042791366577, "step": 1990} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 1990} {"info/global_step": 1991, "train_info/time_within_train_step": 2.7558891773223877, "step": 1991} {"train_info/time_between_train_steps": 0.003138303756713867, "step": 1991} {"info/global_step": 1992, "train_info/time_within_train_step": 2.7569215297698975, "step": 1992} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 1992} {"info/global_step": 1993, "train_info/time_within_train_step": 2.754687786102295, "step": 1993} {"train_info/time_between_train_steps": 0.0031435489654541016, "step": 1993} {"info/global_step": 1994, "train_info/time_within_train_step": 2.7551395893096924, "step": 1994} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 1994} {"info/global_step": 1995, "train_info/time_within_train_step": 2.7554497718811035, "step": 1995} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 1995} {"info/global_step": 1996, "train_info/time_within_train_step": 2.7546982765197754, "step": 1996} {"train_info/time_between_train_steps": 0.003154277801513672, "step": 1996} {"info/global_step": 1997, "train_info/time_within_train_step": 2.755215644836426, "step": 1997} {"train_info/time_between_train_steps": 0.003187417984008789, "step": 1997} {"info/global_step": 1998, "train_info/time_within_train_step": 2.754516124725342, "step": 1998} {"train_info/time_between_train_steps": 0.003197908401489258, "step": 1998} {"info/global_step": 1999, "train_info/time_within_train_step": 3.342618942260742, "step": 1999} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 1999} {"info/global_step": 2000, "train_info/time_within_train_step": 2.7512247562408447, "step": 2000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746571841, "_runtime": 5850}, "step": 2000} {"logs": {"train/loss": 4.3366, "train/learning_rate": 0.0005333333333333333, "train/epoch": 2.03, "_timestamp": 1746571841, "_runtime": 5850}, "step": 2000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746571846, "_runtime": 5855}, "step": 2000} {"logs": {"eval/loss": 4.836623191833496, "eval/runtime": 5.3861, "eval/samples_per_second": 35.276, "eval/steps_per_second": 1.114, "train/epoch": 2.03, "_timestamp": 1746571846, "_runtime": 5855}, "step": 2000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746571846, "_runtime": 5855}, "step": 2000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.836623191833496, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 126.04300923391749, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.3861, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 35.276, "train/epoch": 2.03, "_timestamp": 1746571846, "_runtime": 5855}, "step": 2000} {"train_info/time_between_train_steps": 19.507963180541992, "step": 2000} {"info/global_step": 2001, "train_info/time_within_train_step": 2.556950330734253, "step": 2001} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 2001} {"info/global_step": 2002, "train_info/time_within_train_step": 2.60054349899292, "step": 2002} {"train_info/time_between_train_steps": 0.003236055374145508, "step": 2002} {"info/global_step": 2003, "train_info/time_within_train_step": 2.7379119396209717, "step": 2003} {"train_info/time_between_train_steps": 0.003236055374145508, "step": 2003} {"info/global_step": 2004, "train_info/time_within_train_step": 2.7518608570098877, "step": 2004} {"train_info/time_between_train_steps": 0.003230571746826172, "step": 2004} {"info/global_step": 2005, "train_info/time_within_train_step": 2.7535958290100098, "step": 2005} {"train_info/time_between_train_steps": 0.0033392906188964844, "step": 2005} {"info/global_step": 2006, "train_info/time_within_train_step": 2.7547221183776855, "step": 2006} {"train_info/time_between_train_steps": 0.003194093704223633, "step": 2006} {"info/global_step": 2007, "train_info/time_within_train_step": 2.7549781799316406, "step": 2007} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 2007} {"info/global_step": 2008, "train_info/time_within_train_step": 2.755498170852661, "step": 2008} {"train_info/time_between_train_steps": 0.0032546520233154297, "step": 2008} {"info/global_step": 2009, "train_info/time_within_train_step": 2.755352258682251, "step": 2009} {"train_info/time_between_train_steps": 0.003159761428833008, "step": 2009} {"info/global_step": 2010, "train_info/time_within_train_step": 2.755648136138916, "step": 2010} {"train_info/time_between_train_steps": 0.0032012462615966797, "step": 2010} {"info/global_step": 2011, "train_info/time_within_train_step": 2.755052328109741, "step": 2011} {"train_info/time_between_train_steps": 0.003187417984008789, "step": 2011} {"info/global_step": 2012, "train_info/time_within_train_step": 2.7546913623809814, "step": 2012} {"train_info/time_between_train_steps": 0.003263235092163086, "step": 2012} {"info/global_step": 2013, "train_info/time_within_train_step": 2.755254030227661, "step": 2013} {"train_info/time_between_train_steps": 0.0032448768615722656, "step": 2013} {"info/global_step": 2014, "train_info/time_within_train_step": 2.7551982402801514, "step": 2014} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 2014} {"info/global_step": 2015, "train_info/time_within_train_step": 2.755949020385742, "step": 2015} {"train_info/time_between_train_steps": 0.0032956600189208984, "step": 2015} {"info/global_step": 2016, "train_info/time_within_train_step": 2.755711317062378, "step": 2016} {"train_info/time_between_train_steps": 0.0032711029052734375, "step": 2016} {"info/global_step": 2017, "train_info/time_within_train_step": 2.7562131881713867, "step": 2017} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 2017} {"info/global_step": 2018, "train_info/time_within_train_step": 2.754478931427002, "step": 2018} {"train_info/time_between_train_steps": 0.0032722949981689453, "step": 2018} {"info/global_step": 2019, "train_info/time_within_train_step": 2.880833387374878, "step": 2019} {"train_info/time_between_train_steps": 0.003274679183959961, "step": 2019} {"info/global_step": 2020, "train_info/time_within_train_step": 2.756809949874878, "step": 2020} {"train_info/time_between_train_steps": 0.0032405853271484375, "step": 2020} {"info/global_step": 2021, "train_info/time_within_train_step": 2.7563369274139404, "step": 2021} {"train_info/time_between_train_steps": 0.0031728744506835938, "step": 2021} {"info/global_step": 2022, "train_info/time_within_train_step": 2.7562801837921143, "step": 2022} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 2022} {"info/global_step": 2023, "train_info/time_within_train_step": 2.757384777069092, "step": 2023} {"train_info/time_between_train_steps": 0.003237485885620117, "step": 2023} {"info/global_step": 2024, "train_info/time_within_train_step": 2.755784511566162, "step": 2024} {"train_info/time_between_train_steps": 0.003155231475830078, "step": 2024} {"info/global_step": 2025, "train_info/time_within_train_step": 2.7561757564544678, "step": 2025} {"train_info/time_between_train_steps": 0.003279447555541992, "step": 2025} {"info/global_step": 2026, "train_info/time_within_train_step": 2.7550740242004395, "step": 2026} {"train_info/time_between_train_steps": 0.0032248497009277344, "step": 2026} {"info/global_step": 2027, "train_info/time_within_train_step": 2.7564120292663574, "step": 2027} {"train_info/time_between_train_steps": 0.0032689571380615234, "step": 2027} {"info/global_step": 2028, "train_info/time_within_train_step": 2.755650520324707, "step": 2028} {"train_info/time_between_train_steps": 0.0032804012298583984, "step": 2028} {"info/global_step": 2029, "train_info/time_within_train_step": 2.755038022994995, "step": 2029} {"train_info/time_between_train_steps": 0.0032279491424560547, "step": 2029} {"info/global_step": 2030, "train_info/time_within_train_step": 2.7539634704589844, "step": 2030} {"train_info/time_between_train_steps": 0.0032384395599365234, "step": 2030} {"info/global_step": 2031, "train_info/time_within_train_step": 2.7554283142089844, "step": 2031} {"train_info/time_between_train_steps": 0.0032455921173095703, "step": 2031} {"info/global_step": 2032, "train_info/time_within_train_step": 2.7551002502441406, "step": 2032} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 2032} {"info/global_step": 2033, "train_info/time_within_train_step": 2.7562975883483887, "step": 2033} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 2033} {"info/global_step": 2034, "train_info/time_within_train_step": 2.7549867630004883, "step": 2034} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 2034} {"info/global_step": 2035, "train_info/time_within_train_step": 2.7595651149749756, "step": 2035} {"train_info/time_between_train_steps": 0.003234386444091797, "step": 2035} {"info/global_step": 2036, "train_info/time_within_train_step": 2.754612922668457, "step": 2036} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 2036} {"info/global_step": 2037, "train_info/time_within_train_step": 2.7550697326660156, "step": 2037} {"train_info/time_between_train_steps": 0.003200531005859375, "step": 2037} {"info/global_step": 2038, "train_info/time_within_train_step": 2.7543656826019287, "step": 2038} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 2038} {"info/global_step": 2039, "train_info/time_within_train_step": 2.7561023235321045, "step": 2039} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 2039} {"info/global_step": 2040, "train_info/time_within_train_step": 2.7558908462524414, "step": 2040} {"train_info/time_between_train_steps": 0.003196239471435547, "step": 2040} {"info/global_step": 2041, "train_info/time_within_train_step": 2.7556943893432617, "step": 2041} {"train_info/time_between_train_steps": 0.0031294822692871094, "step": 2041} {"info/global_step": 2042, "train_info/time_within_train_step": 2.754570960998535, "step": 2042} {"train_info/time_between_train_steps": 0.0031430721282958984, "step": 2042} {"info/global_step": 2043, "train_info/time_within_train_step": 2.7559821605682373, "step": 2043} {"train_info/time_between_train_steps": 0.0031032562255859375, "step": 2043} {"info/global_step": 2044, "train_info/time_within_train_step": 2.755988597869873, "step": 2044} {"train_info/time_between_train_steps": 0.0031118392944335938, "step": 2044} {"info/global_step": 2045, "train_info/time_within_train_step": 2.755263566970825, "step": 2045} {"train_info/time_between_train_steps": 0.0031125545501708984, "step": 2045} {"info/global_step": 2046, "train_info/time_within_train_step": 2.754676342010498, "step": 2046} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 2046} {"info/global_step": 2047, "train_info/time_within_train_step": 2.754984140396118, "step": 2047} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 2047} {"info/global_step": 2048, "train_info/time_within_train_step": 2.7554383277893066, "step": 2048} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 2048} {"info/global_step": 2049, "train_info/time_within_train_step": 2.7548294067382812, "step": 2049} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 2049} {"info/global_step": 2050, "train_info/time_within_train_step": 2.7551729679107666, "step": 2050} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746571998, "_runtime": 6007}, "step": 2050} {"logs": {"train/loss": 4.3261, "train/learning_rate": 0.00053, "train/epoch": 2.03, "_timestamp": 1746571998, "_runtime": 6007}, "step": 2050} {"train_info/time_between_train_steps": 0.013577938079833984, "step": 2050} {"info/global_step": 2051, "train_info/time_within_train_step": 2.755099058151245, "step": 2051} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 2051} {"info/global_step": 2052, "train_info/time_within_train_step": 2.7543015480041504, "step": 2052} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 2052} {"info/global_step": 2053, "train_info/time_within_train_step": 2.755617380142212, "step": 2053} {"train_info/time_between_train_steps": 0.0031354427337646484, "step": 2053} {"info/global_step": 2054, "train_info/time_within_train_step": 2.754270315170288, "step": 2054} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 2054} {"info/global_step": 2055, "train_info/time_within_train_step": 2.7545955181121826, "step": 2055} {"train_info/time_between_train_steps": 0.003123044967651367, "step": 2055} {"info/global_step": 2056, "train_info/time_within_train_step": 2.7546980381011963, "step": 2056} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 2056} {"info/global_step": 2057, "train_info/time_within_train_step": 2.755460023880005, "step": 2057} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 2057} {"info/global_step": 2058, "train_info/time_within_train_step": 2.7542896270751953, "step": 2058} {"train_info/time_between_train_steps": 0.003135204315185547, "step": 2058} {"info/global_step": 2059, "train_info/time_within_train_step": 2.7542107105255127, "step": 2059} {"train_info/time_between_train_steps": 0.0031235218048095703, "step": 2059} {"info/global_step": 2060, "train_info/time_within_train_step": 2.7544634342193604, "step": 2060} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 2060} {"info/global_step": 2061, "train_info/time_within_train_step": 2.7529306411743164, "step": 2061} {"train_info/time_between_train_steps": 0.0031104087829589844, "step": 2061} {"info/global_step": 2062, "train_info/time_within_train_step": 2.75424861907959, "step": 2062} {"train_info/time_between_train_steps": 0.0031375885009765625, "step": 2062} {"info/global_step": 2063, "train_info/time_within_train_step": 2.753655195236206, "step": 2063} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 2063} {"info/global_step": 2064, "train_info/time_within_train_step": 2.753460168838501, "step": 2064} {"train_info/time_between_train_steps": 0.003195524215698242, "step": 2064} {"info/global_step": 2065, "train_info/time_within_train_step": 2.75441312789917, "step": 2065} {"train_info/time_between_train_steps": 0.003128528594970703, "step": 2065} {"info/global_step": 2066, "train_info/time_within_train_step": 2.7543182373046875, "step": 2066} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 2066} {"info/global_step": 2067, "train_info/time_within_train_step": 2.755444288253784, "step": 2067} {"train_info/time_between_train_steps": 0.0031278133392333984, "step": 2067} {"info/global_step": 2068, "train_info/time_within_train_step": 2.7545413970947266, "step": 2068} {"train_info/time_between_train_steps": 0.0031888484954833984, "step": 2068} {"info/global_step": 2069, "train_info/time_within_train_step": 2.754876136779785, "step": 2069} {"train_info/time_between_train_steps": 0.003155946731567383, "step": 2069} {"info/global_step": 2070, "train_info/time_within_train_step": 2.7543981075286865, "step": 2070} {"train_info/time_between_train_steps": 0.0031595230102539062, "step": 2070} {"info/global_step": 2071, "train_info/time_within_train_step": 2.7545948028564453, "step": 2071} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 2071} {"info/global_step": 2072, "train_info/time_within_train_step": 2.7532033920288086, "step": 2072} {"train_info/time_between_train_steps": 0.003132343292236328, "step": 2072} {"info/global_step": 2073, "train_info/time_within_train_step": 2.753837823867798, "step": 2073} {"train_info/time_between_train_steps": 0.003112316131591797, "step": 2073} {"info/global_step": 2074, "train_info/time_within_train_step": 2.7540907859802246, "step": 2074} {"train_info/time_between_train_steps": 0.003201007843017578, "step": 2074} {"info/global_step": 2075, "train_info/time_within_train_step": 2.7539219856262207, "step": 2075} {"train_info/time_between_train_steps": 0.003121614456176758, "step": 2075} {"info/global_step": 2076, "train_info/time_within_train_step": 2.754389762878418, "step": 2076} {"train_info/time_between_train_steps": 0.0031692981719970703, "step": 2076} {"info/global_step": 2077, "train_info/time_within_train_step": 2.7540154457092285, "step": 2077} {"train_info/time_between_train_steps": 0.0031402111053466797, "step": 2077} {"info/global_step": 2078, "train_info/time_within_train_step": 2.753079652786255, "step": 2078} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 2078} {"info/global_step": 2079, "train_info/time_within_train_step": 2.7536933422088623, "step": 2079} {"train_info/time_between_train_steps": 0.0031278133392333984, "step": 2079} {"info/global_step": 2080, "train_info/time_within_train_step": 2.7552452087402344, "step": 2080} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 2080} {"info/global_step": 2081, "train_info/time_within_train_step": 2.7550837993621826, "step": 2081} {"train_info/time_between_train_steps": 0.12483596801757812, "step": 2081} {"info/global_step": 2082, "train_info/time_within_train_step": 2.7547500133514404, "step": 2082} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 2082} {"info/global_step": 2083, "train_info/time_within_train_step": 2.754197359085083, "step": 2083} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 2083} {"info/global_step": 2084, "train_info/time_within_train_step": 2.7552521228790283, "step": 2084} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 2084} {"info/global_step": 2085, "train_info/time_within_train_step": 2.754755735397339, "step": 2085} {"train_info/time_between_train_steps": 0.003108501434326172, "step": 2085} {"info/global_step": 2086, "train_info/time_within_train_step": 2.9870100021362305, "step": 2086} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 2086} {"info/global_step": 2087, "train_info/time_within_train_step": 2.7542147636413574, "step": 2087} {"train_info/time_between_train_steps": 0.003114938735961914, "step": 2087} {"info/global_step": 2088, "train_info/time_within_train_step": 2.7750401496887207, "step": 2088} {"train_info/time_between_train_steps": 0.0032906532287597656, "step": 2088} {"info/global_step": 2089, "train_info/time_within_train_step": 2.753390073776245, "step": 2089} {"train_info/time_between_train_steps": 0.0031325817108154297, "step": 2089} {"info/global_step": 2090, "train_info/time_within_train_step": 2.7536139488220215, "step": 2090} {"train_info/time_between_train_steps": 0.0031261444091796875, "step": 2090} {"info/global_step": 2091, "train_info/time_within_train_step": 2.754167318344116, "step": 2091} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 2091} {"info/global_step": 2092, "train_info/time_within_train_step": 2.7550575733184814, "step": 2092} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 2092} {"info/global_step": 2093, "train_info/time_within_train_step": 2.7562103271484375, "step": 2093} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 2093} {"info/global_step": 2094, "train_info/time_within_train_step": 2.7542011737823486, "step": 2094} {"train_info/time_between_train_steps": 0.003200054168701172, "step": 2094} {"info/global_step": 2095, "train_info/time_within_train_step": 2.755239486694336, "step": 2095} {"train_info/time_between_train_steps": 0.003215789794921875, "step": 2095} {"info/global_step": 2096, "train_info/time_within_train_step": 2.7542474269866943, "step": 2096} {"train_info/time_between_train_steps": 0.0031728744506835938, "step": 2096} {"info/global_step": 2097, "train_info/time_within_train_step": 2.754765510559082, "step": 2097} {"train_info/time_between_train_steps": 0.0032477378845214844, "step": 2097} {"info/global_step": 2098, "train_info/time_within_train_step": 2.7548844814300537, "step": 2098} {"train_info/time_between_train_steps": 0.003160715103149414, "step": 2098} {"info/global_step": 2099, "train_info/time_within_train_step": 2.7543797492980957, "step": 2099} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 2099} {"info/global_step": 2100, "train_info/time_within_train_step": 2.7548654079437256, "step": 2100} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746572137, "_runtime": 6146}, "step": 2100} {"logs": {"train/loss": 4.313, "train/learning_rate": 0.0005266666666666666, "train/epoch": 2.04, "_timestamp": 1746572137, "_runtime": 6146}, "step": 2100} {"train_info/time_between_train_steps": 0.014428138732910156, "step": 2100} {"info/global_step": 2101, "train_info/time_within_train_step": 2.753458023071289, "step": 2101} {"train_info/time_between_train_steps": 0.003237009048461914, "step": 2101} {"info/global_step": 2102, "train_info/time_within_train_step": 2.7537147998809814, "step": 2102} {"train_info/time_between_train_steps": 0.0032477378845214844, "step": 2102} {"info/global_step": 2103, "train_info/time_within_train_step": 2.755220651626587, "step": 2103} {"train_info/time_between_train_steps": 0.003177165985107422, "step": 2103} {"info/global_step": 2104, "train_info/time_within_train_step": 2.7556841373443604, "step": 2104} {"train_info/time_between_train_steps": 0.003309488296508789, "step": 2104} {"info/global_step": 2105, "train_info/time_within_train_step": 2.7551674842834473, "step": 2105} {"train_info/time_between_train_steps": 0.0032782554626464844, "step": 2105} {"info/global_step": 2106, "train_info/time_within_train_step": 2.7551300525665283, "step": 2106} {"train_info/time_between_train_steps": 0.003241300582885742, "step": 2106} {"info/global_step": 2107, "train_info/time_within_train_step": 2.7549350261688232, "step": 2107} {"train_info/time_between_train_steps": 0.0032224655151367188, "step": 2107} {"info/global_step": 2108, "train_info/time_within_train_step": 2.756664514541626, "step": 2108} {"train_info/time_between_train_steps": 0.003281831741333008, "step": 2108} {"info/global_step": 2109, "train_info/time_within_train_step": 2.755505084991455, "step": 2109} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 2109} {"info/global_step": 2110, "train_info/time_within_train_step": 2.755101442337036, "step": 2110} {"train_info/time_between_train_steps": 0.003175973892211914, "step": 2110} {"info/global_step": 2111, "train_info/time_within_train_step": 2.754889488220215, "step": 2111} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 2111} {"info/global_step": 2112, "train_info/time_within_train_step": 2.755369186401367, "step": 2112} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 2112} {"info/global_step": 2113, "train_info/time_within_train_step": 2.753957986831665, "step": 2113} {"train_info/time_between_train_steps": 0.0031197071075439453, "step": 2113} {"info/global_step": 2114, "train_info/time_within_train_step": 2.7540276050567627, "step": 2114} {"train_info/time_between_train_steps": 0.0031392574310302734, "step": 2114} {"info/global_step": 2115, "train_info/time_within_train_step": 2.7548437118530273, "step": 2115} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 2115} {"info/global_step": 2116, "train_info/time_within_train_step": 2.7545158863067627, "step": 2116} {"train_info/time_between_train_steps": 0.0031480789184570312, "step": 2116} {"info/global_step": 2117, "train_info/time_within_train_step": 2.7550208568573, "step": 2117} {"train_info/time_between_train_steps": 0.0031807422637939453, "step": 2117} {"info/global_step": 2118, "train_info/time_within_train_step": 2.7538537979125977, "step": 2118} {"train_info/time_between_train_steps": 0.0030999183654785156, "step": 2118} {"info/global_step": 2119, "train_info/time_within_train_step": 2.754448175430298, "step": 2119} {"train_info/time_between_train_steps": 0.003119945526123047, "step": 2119} {"info/global_step": 2120, "train_info/time_within_train_step": 2.754875659942627, "step": 2120} {"train_info/time_between_train_steps": 0.0031020641326904297, "step": 2120} {"info/global_step": 2121, "train_info/time_within_train_step": 2.753682851791382, "step": 2121} {"train_info/time_between_train_steps": 0.0031385421752929688, "step": 2121} {"info/global_step": 2122, "train_info/time_within_train_step": 2.754683494567871, "step": 2122} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 2122} {"info/global_step": 2123, "train_info/time_within_train_step": 2.7554028034210205, "step": 2123} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 2123} {"info/global_step": 2124, "train_info/time_within_train_step": 2.757028102874756, "step": 2124} {"train_info/time_between_train_steps": 0.003194093704223633, "step": 2124} {"info/global_step": 2125, "train_info/time_within_train_step": 2.754286289215088, "step": 2125} {"train_info/time_between_train_steps": 0.003185272216796875, "step": 2125} {"info/global_step": 2126, "train_info/time_within_train_step": 2.7541394233703613, "step": 2126} {"train_info/time_between_train_steps": 0.0031523704528808594, "step": 2126} {"info/global_step": 2127, "train_info/time_within_train_step": 2.7553422451019287, "step": 2127} {"train_info/time_between_train_steps": 0.003113985061645508, "step": 2127} {"info/global_step": 2128, "train_info/time_within_train_step": 2.755547523498535, "step": 2128} {"train_info/time_between_train_steps": 0.0031585693359375, "step": 2128} {"info/global_step": 2129, "train_info/time_within_train_step": 2.755675792694092, "step": 2129} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 2129} {"info/global_step": 2130, "train_info/time_within_train_step": 2.7532856464385986, "step": 2130} {"train_info/time_between_train_steps": 0.003286123275756836, "step": 2130} {"info/global_step": 2131, "train_info/time_within_train_step": 2.7544987201690674, "step": 2131} {"train_info/time_between_train_steps": 0.0031599998474121094, "step": 2131} {"info/global_step": 2132, "train_info/time_within_train_step": 2.75130033493042, "step": 2132} {"train_info/time_between_train_steps": 0.0031473636627197266, "step": 2132} {"info/global_step": 2133, "train_info/time_within_train_step": 2.7540993690490723, "step": 2133} {"train_info/time_between_train_steps": 0.003143310546875, "step": 2133} {"info/global_step": 2134, "train_info/time_within_train_step": 2.7533888816833496, "step": 2134} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 2134} {"info/global_step": 2135, "train_info/time_within_train_step": 2.7526118755340576, "step": 2135} {"train_info/time_between_train_steps": 0.0031523704528808594, "step": 2135} {"info/global_step": 2136, "train_info/time_within_train_step": 2.7537155151367188, "step": 2136} {"train_info/time_between_train_steps": 0.003114461898803711, "step": 2136} {"info/global_step": 2137, "train_info/time_within_train_step": 2.75470232963562, "step": 2137} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 2137} {"info/global_step": 2138, "train_info/time_within_train_step": 2.7544989585876465, "step": 2138} {"train_info/time_between_train_steps": 0.0031538009643554688, "step": 2138} {"info/global_step": 2139, "train_info/time_within_train_step": 2.7539443969726562, "step": 2139} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 2139} {"info/global_step": 2140, "train_info/time_within_train_step": 2.989859104156494, "step": 2140} {"train_info/time_between_train_steps": 0.003134489059448242, "step": 2140} {"info/global_step": 2141, "train_info/time_within_train_step": 2.752230644226074, "step": 2141} {"train_info/time_between_train_steps": 0.0031135082244873047, "step": 2141} {"info/global_step": 2142, "train_info/time_within_train_step": 2.754037857055664, "step": 2142} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 2142} {"info/global_step": 2143, "train_info/time_within_train_step": 2.7546818256378174, "step": 2143} {"train_info/time_between_train_steps": 0.003104686737060547, "step": 2143} {"info/global_step": 2144, "train_info/time_within_train_step": 2.878190755844116, "step": 2144} {"train_info/time_between_train_steps": 0.0031461715698242188, "step": 2144} {"info/global_step": 2145, "train_info/time_within_train_step": 2.756690740585327, "step": 2145} {"train_info/time_between_train_steps": 0.0031404495239257812, "step": 2145} {"info/global_step": 2146, "train_info/time_within_train_step": 2.758671760559082, "step": 2146} {"train_info/time_between_train_steps": 0.003142118453979492, "step": 2146} {"info/global_step": 2147, "train_info/time_within_train_step": 2.754607915878296, "step": 2147} {"train_info/time_between_train_steps": 0.003134489059448242, "step": 2147} {"info/global_step": 2148, "train_info/time_within_train_step": 2.7544291019439697, "step": 2148} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 2148} {"info/global_step": 2149, "train_info/time_within_train_step": 2.7546117305755615, "step": 2149} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 2149} {"info/global_step": 2150, "train_info/time_within_train_step": 2.7529544830322266, "step": 2150} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746572276, "_runtime": 6285}, "step": 2150} {"logs": {"train/loss": 4.2797, "train/learning_rate": 0.0005233333333333333, "train/epoch": 2.04, "_timestamp": 1746572276, "_runtime": 6285}, "step": 2150} {"train_info/time_between_train_steps": 0.013911247253417969, "step": 2150} {"info/global_step": 2151, "train_info/time_within_train_step": 2.754696846008301, "step": 2151} {"train_info/time_between_train_steps": 0.0031692981719970703, "step": 2151} {"info/global_step": 2152, "train_info/time_within_train_step": 2.753477096557617, "step": 2152} {"train_info/time_between_train_steps": 0.0031294822692871094, "step": 2152} {"info/global_step": 2153, "train_info/time_within_train_step": 2.7541816234588623, "step": 2153} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 2153} {"info/global_step": 2154, "train_info/time_within_train_step": 2.756513833999634, "step": 2154} {"train_info/time_between_train_steps": 0.003134489059448242, "step": 2154} {"info/global_step": 2155, "train_info/time_within_train_step": 2.7549476623535156, "step": 2155} {"train_info/time_between_train_steps": 0.003124713897705078, "step": 2155} {"info/global_step": 2156, "train_info/time_within_train_step": 2.75447416305542, "step": 2156} {"train_info/time_between_train_steps": 0.003144502639770508, "step": 2156} {"info/global_step": 2157, "train_info/time_within_train_step": 2.7547316551208496, "step": 2157} {"train_info/time_between_train_steps": 0.0032215118408203125, "step": 2157} {"info/global_step": 2158, "train_info/time_within_train_step": 2.755638360977173, "step": 2158} {"train_info/time_between_train_steps": 0.0031385421752929688, "step": 2158} {"info/global_step": 2159, "train_info/time_within_train_step": 2.7544851303100586, "step": 2159} {"train_info/time_between_train_steps": 0.003153085708618164, "step": 2159} {"info/global_step": 2160, "train_info/time_within_train_step": 2.753981113433838, "step": 2160} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 2160} {"info/global_step": 2161, "train_info/time_within_train_step": 2.7543654441833496, "step": 2161} {"train_info/time_between_train_steps": 0.0031325817108154297, "step": 2161} {"info/global_step": 2162, "train_info/time_within_train_step": 2.7538833618164062, "step": 2162} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 2162} {"info/global_step": 2163, "train_info/time_within_train_step": 2.7546348571777344, "step": 2163} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 2163} {"info/global_step": 2164, "train_info/time_within_train_step": 2.753950834274292, "step": 2164} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 2164} {"info/global_step": 2165, "train_info/time_within_train_step": 2.7546727657318115, "step": 2165} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 2165} {"info/global_step": 2166, "train_info/time_within_train_step": 2.754148006439209, "step": 2166} {"train_info/time_between_train_steps": 0.003240346908569336, "step": 2166} {"info/global_step": 2167, "train_info/time_within_train_step": 2.7540030479431152, "step": 2167} {"train_info/time_between_train_steps": 0.003204822540283203, "step": 2167} {"info/global_step": 2168, "train_info/time_within_train_step": 2.7550783157348633, "step": 2168} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 2168} {"info/global_step": 2169, "train_info/time_within_train_step": 2.7549569606781006, "step": 2169} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 2169} {"info/global_step": 2170, "train_info/time_within_train_step": 2.754178524017334, "step": 2170} {"train_info/time_between_train_steps": 0.0031380653381347656, "step": 2170} {"info/global_step": 2171, "train_info/time_within_train_step": 2.7546544075012207, "step": 2171} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 2171} {"info/global_step": 2172, "train_info/time_within_train_step": 2.7544193267822266, "step": 2172} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 2172} {"info/global_step": 2173, "train_info/time_within_train_step": 2.7555577754974365, "step": 2173} {"train_info/time_between_train_steps": 0.0031223297119140625, "step": 2173} {"info/global_step": 2174, "train_info/time_within_train_step": 2.7546401023864746, "step": 2174} {"train_info/time_between_train_steps": 0.0031425952911376953, "step": 2174} {"info/global_step": 2175, "train_info/time_within_train_step": 2.755862236022949, "step": 2175} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 2175} {"info/global_step": 2176, "train_info/time_within_train_step": 2.75447678565979, "step": 2176} {"train_info/time_between_train_steps": 0.003117084503173828, "step": 2176} {"info/global_step": 2177, "train_info/time_within_train_step": 2.7546591758728027, "step": 2177} {"train_info/time_between_train_steps": 0.003185272216796875, "step": 2177} {"info/global_step": 2178, "train_info/time_within_train_step": 2.7556326389312744, "step": 2178} {"train_info/time_between_train_steps": 0.0031592845916748047, "step": 2178} {"info/global_step": 2179, "train_info/time_within_train_step": 2.98865008354187, "step": 2179} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 2179} {"info/global_step": 2180, "train_info/time_within_train_step": 2.755204677581787, "step": 2180} {"train_info/time_between_train_steps": 0.003159761428833008, "step": 2180} {"info/global_step": 2181, "train_info/time_within_train_step": 2.7545554637908936, "step": 2181} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 2181} {"info/global_step": 2182, "train_info/time_within_train_step": 2.753709554672241, "step": 2182} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 2182} {"info/global_step": 2183, "train_info/time_within_train_step": 2.7556493282318115, "step": 2183} {"train_info/time_between_train_steps": 0.0031189918518066406, "step": 2183} {"info/global_step": 2184, "train_info/time_within_train_step": 2.755211114883423, "step": 2184} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 2184} {"info/global_step": 2185, "train_info/time_within_train_step": 2.7549874782562256, "step": 2185} {"train_info/time_between_train_steps": 0.0031304359436035156, "step": 2185} {"info/global_step": 2186, "train_info/time_within_train_step": 2.756145477294922, "step": 2186} {"train_info/time_between_train_steps": 0.00312042236328125, "step": 2186} {"info/global_step": 2187, "train_info/time_within_train_step": 2.7558305263519287, "step": 2187} {"train_info/time_between_train_steps": 0.003153085708618164, "step": 2187} {"info/global_step": 2188, "train_info/time_within_train_step": 2.754800796508789, "step": 2188} {"train_info/time_between_train_steps": 0.003148794174194336, "step": 2188} {"info/global_step": 2189, "train_info/time_within_train_step": 2.7547292709350586, "step": 2189} {"train_info/time_between_train_steps": 0.0031490325927734375, "step": 2189} {"info/global_step": 2190, "train_info/time_within_train_step": 2.754709243774414, "step": 2190} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 2190} {"info/global_step": 2191, "train_info/time_within_train_step": 2.755662441253662, "step": 2191} {"train_info/time_between_train_steps": 0.003171205520629883, "step": 2191} {"info/global_step": 2192, "train_info/time_within_train_step": 2.754035711288452, "step": 2192} {"train_info/time_between_train_steps": 0.003137826919555664, "step": 2192} {"info/global_step": 2193, "train_info/time_within_train_step": 2.7556629180908203, "step": 2193} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 2193} {"info/global_step": 2194, "train_info/time_within_train_step": 2.7554168701171875, "step": 2194} {"train_info/time_between_train_steps": 0.0031599998474121094, "step": 2194} {"info/global_step": 2195, "train_info/time_within_train_step": 2.7555737495422363, "step": 2195} {"train_info/time_between_train_steps": 0.003137350082397461, "step": 2195} {"info/global_step": 2196, "train_info/time_within_train_step": 2.7553675174713135, "step": 2196} {"train_info/time_between_train_steps": 0.003125429153442383, "step": 2196} {"info/global_step": 2197, "train_info/time_within_train_step": 2.7549688816070557, "step": 2197} {"train_info/time_between_train_steps": 0.003155231475830078, "step": 2197} {"info/global_step": 2198, "train_info/time_within_train_step": 2.7551822662353516, "step": 2198} {"train_info/time_between_train_steps": 0.0031347274780273438, "step": 2198} {"info/global_step": 2199, "train_info/time_within_train_step": 2.755258798599243, "step": 2199} {"train_info/time_between_train_steps": 0.003144502639770508, "step": 2199} {"info/global_step": 2200, "train_info/time_within_train_step": 2.754999876022339, "step": 2200} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746572415, "_runtime": 6424}, "step": 2200} {"logs": {"train/loss": 4.2717, "train/learning_rate": 0.00052, "train/epoch": 2.05, "_timestamp": 1746572415, "_runtime": 6424}, "step": 2200} {"train_info/time_between_train_steps": 23.303309202194214, "step": 2200} {"info/global_step": 2201, "train_info/time_within_train_step": 2.5251176357269287, "step": 2201} {"train_info/time_between_train_steps": 0.003127574920654297, "step": 2201} {"info/global_step": 2202, "train_info/time_within_train_step": 2.5644962787628174, "step": 2202} {"train_info/time_between_train_steps": 0.003144502639770508, "step": 2202} {"info/global_step": 2203, "train_info/time_within_train_step": 2.6934473514556885, "step": 2203} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 2203} {"info/global_step": 2204, "train_info/time_within_train_step": 2.7377994060516357, "step": 2204} {"train_info/time_between_train_steps": 0.003131389617919922, "step": 2204} {"info/global_step": 2205, "train_info/time_within_train_step": 2.7502529621124268, "step": 2205} {"train_info/time_between_train_steps": 0.00313568115234375, "step": 2205} {"info/global_step": 2206, "train_info/time_within_train_step": 2.754086971282959, "step": 2206} {"train_info/time_between_train_steps": 0.08865618705749512, "step": 2206} {"info/global_step": 2207, "train_info/time_within_train_step": 2.754741668701172, "step": 2207} {"train_info/time_between_train_steps": 0.003125905990600586, "step": 2207} {"info/global_step": 2208, "train_info/time_within_train_step": 2.755167007446289, "step": 2208} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 2208} {"info/global_step": 2209, "train_info/time_within_train_step": 2.7562716007232666, "step": 2209} {"train_info/time_between_train_steps": 0.0031278133392333984, "step": 2209} {"info/global_step": 2210, "train_info/time_within_train_step": 2.755967140197754, "step": 2210} {"train_info/time_between_train_steps": 0.0031740665435791016, "step": 2210} {"info/global_step": 2211, "train_info/time_within_train_step": 2.75543212890625, "step": 2211} {"train_info/time_between_train_steps": 0.0032317638397216797, "step": 2211} {"info/global_step": 2212, "train_info/time_within_train_step": 2.7557930946350098, "step": 2212} {"train_info/time_between_train_steps": 0.0031349658966064453, "step": 2212} {"info/global_step": 2213, "train_info/time_within_train_step": 2.7566211223602295, "step": 2213} {"train_info/time_between_train_steps": 0.003143787384033203, "step": 2213} {"info/global_step": 2214, "train_info/time_within_train_step": 2.756424903869629, "step": 2214} {"train_info/time_between_train_steps": 0.0031566619873046875, "step": 2214} {"info/global_step": 2215, "train_info/time_within_train_step": 2.7561285495758057, "step": 2215} {"train_info/time_between_train_steps": 0.0031371116638183594, "step": 2215} {"info/global_step": 2216, "train_info/time_within_train_step": 2.756281852722168, "step": 2216} {"train_info/time_between_train_steps": 0.0031266212463378906, "step": 2216} {"info/global_step": 2217, "train_info/time_within_train_step": 2.756636142730713, "step": 2217} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 2217} {"info/global_step": 2218, "train_info/time_within_train_step": 2.754809856414795, "step": 2218} {"train_info/time_between_train_steps": 0.003148317337036133, "step": 2218} {"info/global_step": 2219, "train_info/time_within_train_step": 2.755826234817505, "step": 2219} {"train_info/time_between_train_steps": 0.003148317337036133, "step": 2219} {"info/global_step": 2220, "train_info/time_within_train_step": 2.7557191848754883, "step": 2220} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 2220} {"info/global_step": 2221, "train_info/time_within_train_step": 2.754972219467163, "step": 2221} {"train_info/time_between_train_steps": 0.003155946731567383, "step": 2221} {"info/global_step": 2222, "train_info/time_within_train_step": 2.756211519241333, "step": 2222} {"train_info/time_between_train_steps": 0.0032134056091308594, "step": 2222} {"info/global_step": 2223, "train_info/time_within_train_step": 2.756439447402954, "step": 2223} {"train_info/time_between_train_steps": 0.003127574920654297, "step": 2223} {"info/global_step": 2224, "train_info/time_within_train_step": 2.7552857398986816, "step": 2224} {"train_info/time_between_train_steps": 0.0031442642211914062, "step": 2224} {"info/global_step": 2225, "train_info/time_within_train_step": 2.7560956478118896, "step": 2225} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 2225} {"info/global_step": 2226, "train_info/time_within_train_step": 2.7567594051361084, "step": 2226} {"train_info/time_between_train_steps": 0.0031380653381347656, "step": 2226} {"info/global_step": 2227, "train_info/time_within_train_step": 2.755906820297241, "step": 2227} {"train_info/time_between_train_steps": 0.003127574920654297, "step": 2227} {"info/global_step": 2228, "train_info/time_within_train_step": 2.7553486824035645, "step": 2228} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 2228} {"info/global_step": 2229, "train_info/time_within_train_step": 2.757016181945801, "step": 2229} {"train_info/time_between_train_steps": 0.0031294822692871094, "step": 2229} {"info/global_step": 2230, "train_info/time_within_train_step": 2.756582498550415, "step": 2230} {"train_info/time_between_train_steps": 0.0031180381774902344, "step": 2230} {"info/global_step": 2231, "train_info/time_within_train_step": 2.9795727729797363, "step": 2231} {"train_info/time_between_train_steps": 0.003138303756713867, "step": 2231} {"info/global_step": 2232, "train_info/time_within_train_step": 2.7801249027252197, "step": 2232} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 2232} {"info/global_step": 2233, "train_info/time_within_train_step": 2.7556240558624268, "step": 2233} {"train_info/time_between_train_steps": 0.0031213760375976562, "step": 2233} {"info/global_step": 2234, "train_info/time_within_train_step": 2.7542803287506104, "step": 2234} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 2234} {"info/global_step": 2235, "train_info/time_within_train_step": 2.755286693572998, "step": 2235} {"train_info/time_between_train_steps": 0.0031397342681884766, "step": 2235} {"info/global_step": 2236, "train_info/time_within_train_step": 2.754460573196411, "step": 2236} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 2236} {"info/global_step": 2237, "train_info/time_within_train_step": 2.754201650619507, "step": 2237} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 2237} {"info/global_step": 2238, "train_info/time_within_train_step": 2.7549805641174316, "step": 2238} {"train_info/time_between_train_steps": 0.003137826919555664, "step": 2238} {"info/global_step": 2239, "train_info/time_within_train_step": 2.754187822341919, "step": 2239} {"train_info/time_between_train_steps": 0.0031380653381347656, "step": 2239} {"info/global_step": 2240, "train_info/time_within_train_step": 2.7542800903320312, "step": 2240} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 2240} {"info/global_step": 2241, "train_info/time_within_train_step": 2.7548086643218994, "step": 2241} {"train_info/time_between_train_steps": 0.003128528594970703, "step": 2241} {"info/global_step": 2242, "train_info/time_within_train_step": 2.756275177001953, "step": 2242} {"train_info/time_between_train_steps": 0.003143787384033203, "step": 2242} {"info/global_step": 2243, "train_info/time_within_train_step": 2.756474018096924, "step": 2243} {"train_info/time_between_train_steps": 0.0031363964080810547, "step": 2243} {"info/global_step": 2244, "train_info/time_within_train_step": 2.7554128170013428, "step": 2244} {"train_info/time_between_train_steps": 0.003139972686767578, "step": 2244} {"info/global_step": 2245, "train_info/time_within_train_step": 2.753082036972046, "step": 2245} {"train_info/time_between_train_steps": 0.003122091293334961, "step": 2245} {"info/global_step": 2246, "train_info/time_within_train_step": 2.7554736137390137, "step": 2246} {"train_info/time_between_train_steps": 0.003130674362182617, "step": 2246} {"info/global_step": 2247, "train_info/time_within_train_step": 2.754760980606079, "step": 2247} {"train_info/time_between_train_steps": 0.017890453338623047, "step": 2247} {"info/global_step": 2248, "train_info/time_within_train_step": 2.7543721199035645, "step": 2248} {"train_info/time_between_train_steps": 0.002886056900024414, "step": 2248} {"info/global_step": 2249, "train_info/time_within_train_step": 3.3563334941864014, "step": 2249} {"train_info/time_between_train_steps": 0.0028710365295410156, "step": 2249} {"info/global_step": 2250, "train_info/time_within_train_step": 2.7535102367401123, "step": 2250} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746572577, "_runtime": 6586}, "step": 2250} {"logs": {"train/loss": 4.2634, "train/learning_rate": 0.0005166666666666667, "train/epoch": 2.05, "_timestamp": 1746572577, "_runtime": 6586}, "step": 2250} {"train_info/time_between_train_steps": 0.012134552001953125, "step": 2250} {"info/global_step": 2251, "train_info/time_within_train_step": 2.753115653991699, "step": 2251} {"train_info/time_between_train_steps": 0.0029048919677734375, "step": 2251} {"info/global_step": 2252, "train_info/time_within_train_step": 2.753526210784912, "step": 2252} {"train_info/time_between_train_steps": 0.0028574466705322266, "step": 2252} {"info/global_step": 2253, "train_info/time_within_train_step": 2.7543017864227295, "step": 2253} {"train_info/time_between_train_steps": 0.0028357505798339844, "step": 2253} {"info/global_step": 2254, "train_info/time_within_train_step": 2.7545995712280273, "step": 2254} {"train_info/time_between_train_steps": 0.002867460250854492, "step": 2254} {"info/global_step": 2255, "train_info/time_within_train_step": 2.7545135021209717, "step": 2255} {"train_info/time_between_train_steps": 0.0028302669525146484, "step": 2255} {"info/global_step": 2256, "train_info/time_within_train_step": 2.75262713432312, "step": 2256} {"train_info/time_between_train_steps": 0.002874612808227539, "step": 2256} {"info/global_step": 2257, "train_info/time_within_train_step": 2.7550363540649414, "step": 2257} {"train_info/time_between_train_steps": 0.0028455257415771484, "step": 2257} {"info/global_step": 2258, "train_info/time_within_train_step": 2.7540035247802734, "step": 2258} {"train_info/time_between_train_steps": 0.002874612808227539, "step": 2258} {"info/global_step": 2259, "train_info/time_within_train_step": 2.754530668258667, "step": 2259} {"train_info/time_between_train_steps": 0.0028548240661621094, "step": 2259} {"info/global_step": 2260, "train_info/time_within_train_step": 2.753196954727173, "step": 2260} {"train_info/time_between_train_steps": 0.0028531551361083984, "step": 2260} {"info/global_step": 2261, "train_info/time_within_train_step": 2.7539737224578857, "step": 2261} {"train_info/time_between_train_steps": 0.0028946399688720703, "step": 2261} {"info/global_step": 2262, "train_info/time_within_train_step": 2.7534027099609375, "step": 2262} {"train_info/time_between_train_steps": 0.0029129981994628906, "step": 2262} {"info/global_step": 2263, "train_info/time_within_train_step": 2.7535526752471924, "step": 2263} {"train_info/time_between_train_steps": 0.0028426647186279297, "step": 2263} {"info/global_step": 2264, "train_info/time_within_train_step": 2.7545509338378906, "step": 2264} {"train_info/time_between_train_steps": 0.0028548240661621094, "step": 2264} {"info/global_step": 2265, "train_info/time_within_train_step": 2.7552833557128906, "step": 2265} {"train_info/time_between_train_steps": 0.0028791427612304688, "step": 2265} {"info/global_step": 2266, "train_info/time_within_train_step": 2.753368616104126, "step": 2266} {"train_info/time_between_train_steps": 0.0028684139251708984, "step": 2266} {"info/global_step": 2267, "train_info/time_within_train_step": 2.7540881633758545, "step": 2267} {"train_info/time_between_train_steps": 0.0028400421142578125, "step": 2267} {"info/global_step": 2268, "train_info/time_within_train_step": 2.7542920112609863, "step": 2268} {"train_info/time_between_train_steps": 0.0029332637786865234, "step": 2268} {"info/global_step": 2269, "train_info/time_within_train_step": 2.7556188106536865, "step": 2269} {"train_info/time_between_train_steps": 0.0028531551361083984, "step": 2269} {"info/global_step": 2270, "train_info/time_within_train_step": 2.755523443222046, "step": 2270} {"train_info/time_between_train_steps": 0.0028896331787109375, "step": 2270} {"info/global_step": 2271, "train_info/time_within_train_step": 2.7545206546783447, "step": 2271} {"train_info/time_between_train_steps": 0.0028810501098632812, "step": 2271} {"info/global_step": 2272, "train_info/time_within_train_step": 2.754786968231201, "step": 2272} {"train_info/time_between_train_steps": 0.002854585647583008, "step": 2272} {"info/global_step": 2273, "train_info/time_within_train_step": 2.7542624473571777, "step": 2273} {"train_info/time_between_train_steps": 0.002926349639892578, "step": 2273} {"info/global_step": 2274, "train_info/time_within_train_step": 2.754451274871826, "step": 2274} {"train_info/time_between_train_steps": 0.002908468246459961, "step": 2274} {"info/global_step": 2275, "train_info/time_within_train_step": 2.753523588180542, "step": 2275} {"train_info/time_between_train_steps": 0.0028448104858398438, "step": 2275} {"info/global_step": 2276, "train_info/time_within_train_step": 2.7539546489715576, "step": 2276} {"train_info/time_between_train_steps": 0.002859830856323242, "step": 2276} {"info/global_step": 2277, "train_info/time_within_train_step": 2.7544174194335938, "step": 2277} {"train_info/time_between_train_steps": 0.0028710365295410156, "step": 2277} {"info/global_step": 2278, "train_info/time_within_train_step": 2.754380464553833, "step": 2278} {"train_info/time_between_train_steps": 0.0028662681579589844, "step": 2278} {"info/global_step": 2279, "train_info/time_within_train_step": 2.754648208618164, "step": 2279} {"train_info/time_between_train_steps": 0.0028874874114990234, "step": 2279} {"info/global_step": 2280, "train_info/time_within_train_step": 2.7536544799804688, "step": 2280} {"train_info/time_between_train_steps": 0.0028748512268066406, "step": 2280} {"info/global_step": 2281, "train_info/time_within_train_step": 2.7543158531188965, "step": 2281} {"train_info/time_between_train_steps": 0.002854585647583008, "step": 2281} {"info/global_step": 2282, "train_info/time_within_train_step": 2.754926919937134, "step": 2282} {"train_info/time_between_train_steps": 0.002859354019165039, "step": 2282} {"info/global_step": 2283, "train_info/time_within_train_step": 2.753540277481079, "step": 2283} {"train_info/time_between_train_steps": 0.002872467041015625, "step": 2283} {"info/global_step": 2284, "train_info/time_within_train_step": 2.754587173461914, "step": 2284} {"train_info/time_between_train_steps": 0.002834320068359375, "step": 2284} {"info/global_step": 2285, "train_info/time_within_train_step": 2.7548036575317383, "step": 2285} {"train_info/time_between_train_steps": 0.002872467041015625, "step": 2285} {"info/global_step": 2286, "train_info/time_within_train_step": 2.754929542541504, "step": 2286} {"train_info/time_between_train_steps": 0.0028977394104003906, "step": 2286} {"info/global_step": 2287, "train_info/time_within_train_step": 2.7545077800750732, "step": 2287} {"train_info/time_between_train_steps": 0.0028760433197021484, "step": 2287} {"info/global_step": 2288, "train_info/time_within_train_step": 2.7558717727661133, "step": 2288} {"train_info/time_between_train_steps": 0.002891063690185547, "step": 2288} {"info/global_step": 2289, "train_info/time_within_train_step": 2.7554562091827393, "step": 2289} {"train_info/time_between_train_steps": 0.002885580062866211, "step": 2289} {"info/global_step": 2290, "train_info/time_within_train_step": 2.7551422119140625, "step": 2290} {"train_info/time_between_train_steps": 0.0028793811798095703, "step": 2290} {"info/global_step": 2291, "train_info/time_within_train_step": 2.755134344100952, "step": 2291} {"train_info/time_between_train_steps": 0.002905607223510742, "step": 2291} {"info/global_step": 2292, "train_info/time_within_train_step": 2.7534937858581543, "step": 2292} {"train_info/time_between_train_steps": 0.0028655529022216797, "step": 2292} {"info/global_step": 2293, "train_info/time_within_train_step": 2.75469970703125, "step": 2293} {"train_info/time_between_train_steps": 0.002849102020263672, "step": 2293} {"info/global_step": 2294, "train_info/time_within_train_step": 2.7549948692321777, "step": 2294} {"train_info/time_between_train_steps": 0.0028510093688964844, "step": 2294} {"info/global_step": 2295, "train_info/time_within_train_step": 2.754808187484741, "step": 2295} {"train_info/time_between_train_steps": 0.002915620803833008, "step": 2295} {"info/global_step": 2296, "train_info/time_within_train_step": 2.754239082336426, "step": 2296} {"train_info/time_between_train_steps": 0.002875804901123047, "step": 2296} {"info/global_step": 2297, "train_info/time_within_train_step": 2.7539737224578857, "step": 2297} {"train_info/time_between_train_steps": 0.002836465835571289, "step": 2297} {"info/global_step": 2298, "train_info/time_within_train_step": 2.754701614379883, "step": 2298} {"train_info/time_between_train_steps": 0.0028705596923828125, "step": 2298} {"info/global_step": 2299, "train_info/time_within_train_step": 2.7546451091766357, "step": 2299} {"train_info/time_between_train_steps": 0.002866983413696289, "step": 2299} {"info/global_step": 2300, "train_info/time_within_train_step": 2.7538299560546875, "step": 2300} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746572715, "_runtime": 6724}, "step": 2300} {"logs": {"train/loss": 4.248, "train/learning_rate": 0.0005133333333333333, "train/epoch": 2.06, "_timestamp": 1746572715, "_runtime": 6724}, "step": 2300} {"train_info/time_between_train_steps": 0.014352560043334961, "step": 2300} {"info/global_step": 2301, "train_info/time_within_train_step": 2.7542662620544434, "step": 2301} {"train_info/time_between_train_steps": 0.0028634071350097656, "step": 2301} {"info/global_step": 2302, "train_info/time_within_train_step": 2.755566120147705, "step": 2302} {"train_info/time_between_train_steps": 0.0029010772705078125, "step": 2302} {"info/global_step": 2303, "train_info/time_within_train_step": 2.7547311782836914, "step": 2303} {"train_info/time_between_train_steps": 0.0028829574584960938, "step": 2303} {"info/global_step": 2304, "train_info/time_within_train_step": 2.7537992000579834, "step": 2304} {"train_info/time_between_train_steps": 0.0028853416442871094, "step": 2304} {"info/global_step": 2305, "train_info/time_within_train_step": 2.753223419189453, "step": 2305} {"train_info/time_between_train_steps": 0.0028748512268066406, "step": 2305} {"info/global_step": 2306, "train_info/time_within_train_step": 2.7543423175811768, "step": 2306} {"train_info/time_between_train_steps": 0.0029494762420654297, "step": 2306} {"info/global_step": 2307, "train_info/time_within_train_step": 2.754319429397583, "step": 2307} {"train_info/time_between_train_steps": 0.002875804901123047, "step": 2307} {"info/global_step": 2308, "train_info/time_within_train_step": 2.7549126148223877, "step": 2308} {"train_info/time_between_train_steps": 0.0028839111328125, "step": 2308} {"info/global_step": 2309, "train_info/time_within_train_step": 2.7536752223968506, "step": 2309} {"train_info/time_between_train_steps": 0.002853870391845703, "step": 2309} {"info/global_step": 2310, "train_info/time_within_train_step": 2.7530148029327393, "step": 2310} {"train_info/time_between_train_steps": 0.0028486251831054688, "step": 2310} {"info/global_step": 2311, "train_info/time_within_train_step": 2.753960609436035, "step": 2311} {"train_info/time_between_train_steps": 0.0028967857360839844, "step": 2311} {"info/global_step": 2312, "train_info/time_within_train_step": 2.754777193069458, "step": 2312} {"train_info/time_between_train_steps": 0.0028524398803710938, "step": 2312} {"info/global_step": 2313, "train_info/time_within_train_step": 2.754525899887085, "step": 2313} {"train_info/time_between_train_steps": 0.002858877182006836, "step": 2313} {"info/global_step": 2314, "train_info/time_within_train_step": 2.754821300506592, "step": 2314} {"train_info/time_between_train_steps": 0.0028772354125976562, "step": 2314} {"info/global_step": 2315, "train_info/time_within_train_step": 2.754845142364502, "step": 2315} {"train_info/time_between_train_steps": 0.002849578857421875, "step": 2315} {"info/global_step": 2316, "train_info/time_within_train_step": 2.7548396587371826, "step": 2316} {"train_info/time_between_train_steps": 0.002870798110961914, "step": 2316} {"info/global_step": 2317, "train_info/time_within_train_step": 2.7548115253448486, "step": 2317} {"train_info/time_between_train_steps": 0.0029113292694091797, "step": 2317} {"info/global_step": 2318, "train_info/time_within_train_step": 2.752437114715576, "step": 2318} {"train_info/time_between_train_steps": 0.0028467178344726562, "step": 2318} {"info/global_step": 2319, "train_info/time_within_train_step": 2.7549562454223633, "step": 2319} {"train_info/time_between_train_steps": 0.0028803348541259766, "step": 2319} {"info/global_step": 2320, "train_info/time_within_train_step": 2.7535829544067383, "step": 2320} {"train_info/time_between_train_steps": 0.002866506576538086, "step": 2320} {"info/global_step": 2321, "train_info/time_within_train_step": 2.7537660598754883, "step": 2321} {"train_info/time_between_train_steps": 0.0028557777404785156, "step": 2321} {"info/global_step": 2322, "train_info/time_within_train_step": 2.7529773712158203, "step": 2322} {"train_info/time_between_train_steps": 0.0028848648071289062, "step": 2322} {"info/global_step": 2323, "train_info/time_within_train_step": 2.7546443939208984, "step": 2323} {"train_info/time_between_train_steps": 0.002862215042114258, "step": 2323} {"info/global_step": 2324, "train_info/time_within_train_step": 2.7534048557281494, "step": 2324} {"train_info/time_between_train_steps": 0.0028450489044189453, "step": 2324} {"info/global_step": 2325, "train_info/time_within_train_step": 2.7538280487060547, "step": 2325} {"train_info/time_between_train_steps": 0.002866029739379883, "step": 2325} {"info/global_step": 2326, "train_info/time_within_train_step": 2.7549901008605957, "step": 2326} {"train_info/time_between_train_steps": 0.002859354019165039, "step": 2326} {"info/global_step": 2327, "train_info/time_within_train_step": 2.7526795864105225, "step": 2327} {"train_info/time_between_train_steps": 0.0028307437896728516, "step": 2327} {"info/global_step": 2328, "train_info/time_within_train_step": 2.754549980163574, "step": 2328} {"train_info/time_between_train_steps": 0.0029191970825195312, "step": 2328} {"info/global_step": 2329, "train_info/time_within_train_step": 2.7534921169281006, "step": 2329} {"train_info/time_between_train_steps": 0.002862691879272461, "step": 2329} {"info/global_step": 2330, "train_info/time_within_train_step": 2.7529170513153076, "step": 2330} {"train_info/time_between_train_steps": 0.002853870391845703, "step": 2330} {"info/global_step": 2331, "train_info/time_within_train_step": 2.7533841133117676, "step": 2331} {"train_info/time_between_train_steps": 0.0029458999633789062, "step": 2331} {"info/global_step": 2332, "train_info/time_within_train_step": 2.7539143562316895, "step": 2332} {"train_info/time_between_train_steps": 0.0028717517852783203, "step": 2332} {"info/global_step": 2333, "train_info/time_within_train_step": 2.7528300285339355, "step": 2333} {"train_info/time_between_train_steps": 0.002837657928466797, "step": 2333} {"info/global_step": 2334, "train_info/time_within_train_step": 2.752016305923462, "step": 2334} {"train_info/time_between_train_steps": 0.0029175281524658203, "step": 2334} {"info/global_step": 2335, "train_info/time_within_train_step": 2.912320852279663, "step": 2335} {"train_info/time_between_train_steps": 0.002874135971069336, "step": 2335} {"info/global_step": 2336, "train_info/time_within_train_step": 2.752772569656372, "step": 2336} {"train_info/time_between_train_steps": 0.0028412342071533203, "step": 2336} {"info/global_step": 2337, "train_info/time_within_train_step": 2.75154447555542, "step": 2337} {"train_info/time_between_train_steps": 0.002897977828979492, "step": 2337} {"info/global_step": 2338, "train_info/time_within_train_step": 2.7537097930908203, "step": 2338} {"train_info/time_between_train_steps": 0.002853870391845703, "step": 2338} {"info/global_step": 2339, "train_info/time_within_train_step": 2.75195574760437, "step": 2339} {"train_info/time_between_train_steps": 0.002877950668334961, "step": 2339} {"info/global_step": 2340, "train_info/time_within_train_step": 2.7533302307128906, "step": 2340} {"train_info/time_between_train_steps": 0.0029180049896240234, "step": 2340} {"info/global_step": 2341, "train_info/time_within_train_step": 2.7539539337158203, "step": 2341} {"train_info/time_between_train_steps": 0.0028717517852783203, "step": 2341} {"info/global_step": 2342, "train_info/time_within_train_step": 2.754990816116333, "step": 2342} {"train_info/time_between_train_steps": 0.002863645553588867, "step": 2342} {"info/global_step": 2343, "train_info/time_within_train_step": 2.754667282104492, "step": 2343} {"train_info/time_between_train_steps": 0.0028438568115234375, "step": 2343} {"info/global_step": 2344, "train_info/time_within_train_step": 2.7531652450561523, "step": 2344} {"train_info/time_between_train_steps": 0.0028672218322753906, "step": 2344} {"info/global_step": 2345, "train_info/time_within_train_step": 2.7524683475494385, "step": 2345} {"train_info/time_between_train_steps": 0.002840757369995117, "step": 2345} {"info/global_step": 2346, "train_info/time_within_train_step": 2.7546274662017822, "step": 2346} {"train_info/time_between_train_steps": 0.002809762954711914, "step": 2346} {"info/global_step": 2347, "train_info/time_within_train_step": 2.7540953159332275, "step": 2347} {"train_info/time_between_train_steps": 0.002830982208251953, "step": 2347} {"info/global_step": 2348, "train_info/time_within_train_step": 2.754404067993164, "step": 2348} {"train_info/time_between_train_steps": 0.0028755664825439453, "step": 2348} {"info/global_step": 2349, "train_info/time_within_train_step": 2.7540738582611084, "step": 2349} {"train_info/time_between_train_steps": 0.002841472625732422, "step": 2349} {"info/global_step": 2350, "train_info/time_within_train_step": 2.7537569999694824, "step": 2350} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746572853, "_runtime": 6862}, "step": 2350} {"logs": {"train/loss": 4.2288, "train/learning_rate": 0.0005099999999999999, "train/epoch": 2.06, "_timestamp": 1746572853, "_runtime": 6862}, "step": 2350} {"train_info/time_between_train_steps": 0.010540008544921875, "step": 2350} {"info/global_step": 2351, "train_info/time_within_train_step": 2.7532360553741455, "step": 2351} {"train_info/time_between_train_steps": 0.0028388500213623047, "step": 2351} {"info/global_step": 2352, "train_info/time_within_train_step": 2.7538504600524902, "step": 2352} {"train_info/time_between_train_steps": 0.0028595924377441406, "step": 2352} {"info/global_step": 2353, "train_info/time_within_train_step": 2.7532894611358643, "step": 2353} {"train_info/time_between_train_steps": 0.0028803348541259766, "step": 2353} {"info/global_step": 2354, "train_info/time_within_train_step": 2.754146099090576, "step": 2354} {"train_info/time_between_train_steps": 0.002893686294555664, "step": 2354} {"info/global_step": 2355, "train_info/time_within_train_step": 2.753441095352173, "step": 2355} {"train_info/time_between_train_steps": 0.002876758575439453, "step": 2355} {"info/global_step": 2356, "train_info/time_within_train_step": 2.7544188499450684, "step": 2356} {"train_info/time_between_train_steps": 0.0028798580169677734, "step": 2356} {"info/global_step": 2357, "train_info/time_within_train_step": 2.7543387413024902, "step": 2357} {"train_info/time_between_train_steps": 0.0028946399688720703, "step": 2357} {"info/global_step": 2358, "train_info/time_within_train_step": 2.7534291744232178, "step": 2358} {"train_info/time_between_train_steps": 0.0028612613677978516, "step": 2358} {"info/global_step": 2359, "train_info/time_within_train_step": 2.7531116008758545, "step": 2359} {"train_info/time_between_train_steps": 0.002936840057373047, "step": 2359} {"info/global_step": 2360, "train_info/time_within_train_step": 2.7523233890533447, "step": 2360} {"train_info/time_between_train_steps": 0.0028939247131347656, "step": 2360} {"info/global_step": 2361, "train_info/time_within_train_step": 2.7533950805664062, "step": 2361} {"train_info/time_between_train_steps": 0.002868175506591797, "step": 2361} {"info/global_step": 2362, "train_info/time_within_train_step": 2.7539799213409424, "step": 2362} {"train_info/time_between_train_steps": 0.0028722286224365234, "step": 2362} {"info/global_step": 2363, "train_info/time_within_train_step": 2.7551655769348145, "step": 2363} {"train_info/time_between_train_steps": 0.0029571056365966797, "step": 2363} {"info/global_step": 2364, "train_info/time_within_train_step": 2.7539222240448, "step": 2364} {"train_info/time_between_train_steps": 0.0028793811798095703, "step": 2364} {"info/global_step": 2365, "train_info/time_within_train_step": 2.7542901039123535, "step": 2365} {"train_info/time_between_train_steps": 0.002878904342651367, "step": 2365} {"info/global_step": 2366, "train_info/time_within_train_step": 2.7530806064605713, "step": 2366} {"train_info/time_between_train_steps": 0.0028781890869140625, "step": 2366} {"info/global_step": 2367, "train_info/time_within_train_step": 2.753673791885376, "step": 2367} {"train_info/time_between_train_steps": 0.0028913021087646484, "step": 2367} {"info/global_step": 2368, "train_info/time_within_train_step": 2.7511680126190186, "step": 2368} {"train_info/time_between_train_steps": 0.0029027462005615234, "step": 2368} {"info/global_step": 2369, "train_info/time_within_train_step": 2.7543036937713623, "step": 2369} {"train_info/time_between_train_steps": 0.0028846263885498047, "step": 2369} {"info/global_step": 2370, "train_info/time_within_train_step": 2.754305839538574, "step": 2370} {"train_info/time_between_train_steps": 0.0028858184814453125, "step": 2370} {"info/global_step": 2371, "train_info/time_within_train_step": 2.7546424865722656, "step": 2371} {"train_info/time_between_train_steps": 0.002893686294555664, "step": 2371} {"info/global_step": 2372, "train_info/time_within_train_step": 2.7538297176361084, "step": 2372} {"train_info/time_between_train_steps": 0.0029201507568359375, "step": 2372} {"info/global_step": 2373, "train_info/time_within_train_step": 2.754470109939575, "step": 2373} {"train_info/time_between_train_steps": 0.002909421920776367, "step": 2373} {"info/global_step": 2374, "train_info/time_within_train_step": 2.7538020610809326, "step": 2374} {"train_info/time_between_train_steps": 0.0029523372650146484, "step": 2374} {"info/global_step": 2375, "train_info/time_within_train_step": 2.757525682449341, "step": 2375} {"train_info/time_between_train_steps": 0.003933906555175781, "step": 2375} {"info/global_step": 2376, "train_info/time_within_train_step": 2.75991153717041, "step": 2376} {"train_info/time_between_train_steps": 0.0038232803344726562, "step": 2376} {"info/global_step": 2377, "train_info/time_within_train_step": 2.7555289268493652, "step": 2377} {"train_info/time_between_train_steps": 0.002903461456298828, "step": 2377} {"info/global_step": 2378, "train_info/time_within_train_step": 2.754913568496704, "step": 2378} {"train_info/time_between_train_steps": 0.0029387474060058594, "step": 2378} {"info/global_step": 2379, "train_info/time_within_train_step": 2.7645907402038574, "step": 2379} {"train_info/time_between_train_steps": 0.0038614273071289062, "step": 2379} {"info/global_step": 2380, "train_info/time_within_train_step": 2.7569239139556885, "step": 2380} {"train_info/time_between_train_steps": 0.002918243408203125, "step": 2380} {"info/global_step": 2381, "train_info/time_within_train_step": 2.7548792362213135, "step": 2381} {"train_info/time_between_train_steps": 0.002937793731689453, "step": 2381} {"info/global_step": 2382, "train_info/time_within_train_step": 2.754422903060913, "step": 2382} {"train_info/time_between_train_steps": 0.002871990203857422, "step": 2382} {"info/global_step": 2383, "train_info/time_within_train_step": 2.7537460327148438, "step": 2383} {"train_info/time_between_train_steps": 0.0028717517852783203, "step": 2383} {"info/global_step": 2384, "train_info/time_within_train_step": 2.753730058670044, "step": 2384} {"train_info/time_between_train_steps": 0.002879619598388672, "step": 2384} {"info/global_step": 2385, "train_info/time_within_train_step": 2.753082513809204, "step": 2385} {"train_info/time_between_train_steps": 0.00286865234375, "step": 2385} {"info/global_step": 2386, "train_info/time_within_train_step": 2.7546744346618652, "step": 2386} {"train_info/time_between_train_steps": 0.0028913021087646484, "step": 2386} {"info/global_step": 2387, "train_info/time_within_train_step": 2.7520334720611572, "step": 2387} {"train_info/time_between_train_steps": 0.0028944015502929688, "step": 2387} {"info/global_step": 2388, "train_info/time_within_train_step": 2.753962993621826, "step": 2388} {"train_info/time_between_train_steps": 0.002872467041015625, "step": 2388} {"info/global_step": 2389, "train_info/time_within_train_step": 2.753455638885498, "step": 2389} {"train_info/time_between_train_steps": 0.0028781890869140625, "step": 2389} {"info/global_step": 2390, "train_info/time_within_train_step": 2.753843307495117, "step": 2390} {"train_info/time_between_train_steps": 0.0028650760650634766, "step": 2390} {"info/global_step": 2391, "train_info/time_within_train_step": 2.754800319671631, "step": 2391} {"train_info/time_between_train_steps": 0.0028853416442871094, "step": 2391} {"info/global_step": 2392, "train_info/time_within_train_step": 2.7558467388153076, "step": 2392} {"train_info/time_between_train_steps": 0.0029473304748535156, "step": 2392} {"info/global_step": 2393, "train_info/time_within_train_step": 2.878302574157715, "step": 2393} {"train_info/time_between_train_steps": 0.0028755664825439453, "step": 2393} {"info/global_step": 2394, "train_info/time_within_train_step": 2.7532410621643066, "step": 2394} {"train_info/time_between_train_steps": 0.0028848648071289062, "step": 2394} {"info/global_step": 2395, "train_info/time_within_train_step": 2.754213571548462, "step": 2395} {"train_info/time_between_train_steps": 0.002917766571044922, "step": 2395} {"info/global_step": 2396, "train_info/time_within_train_step": 2.7548747062683105, "step": 2396} {"train_info/time_between_train_steps": 0.002841472625732422, "step": 2396} {"info/global_step": 2397, "train_info/time_within_train_step": 2.7544915676116943, "step": 2397} {"train_info/time_between_train_steps": 0.002855539321899414, "step": 2397} {"info/global_step": 2398, "train_info/time_within_train_step": 2.753225326538086, "step": 2398} {"train_info/time_between_train_steps": 0.002878427505493164, "step": 2398} {"info/global_step": 2399, "train_info/time_within_train_step": 2.7531211376190186, "step": 2399} {"train_info/time_between_train_steps": 0.0028541088104248047, "step": 2399} {"info/global_step": 2400, "train_info/time_within_train_step": 2.7539005279541016, "step": 2400} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746572992, "_runtime": 7001}, "step": 2400} {"logs": {"train/loss": 4.2146, "train/learning_rate": 0.0005066666666666667, "train/epoch": 2.07, "_timestamp": 1746572992, "_runtime": 7001}, "step": 2400} {"train_info/time_between_train_steps": 33.766555070877075, "step": 2400} {"info/global_step": 2401, "train_info/time_within_train_step": 2.5343432426452637, "step": 2401} {"train_info/time_between_train_steps": 0.002868175506591797, "step": 2401} {"info/global_step": 2402, "train_info/time_within_train_step": 2.5584824085235596, "step": 2402} {"train_info/time_between_train_steps": 0.002875089645385742, "step": 2402} {"info/global_step": 2403, "train_info/time_within_train_step": 2.685892105102539, "step": 2403} {"train_info/time_between_train_steps": 0.0028753280639648438, "step": 2403} {"info/global_step": 2404, "train_info/time_within_train_step": 2.723583698272705, "step": 2404} {"train_info/time_between_train_steps": 0.0029146671295166016, "step": 2404} {"info/global_step": 2405, "train_info/time_within_train_step": 2.7234437465667725, "step": 2405} {"train_info/time_between_train_steps": 0.0028755664825439453, "step": 2405} {"info/global_step": 2406, "train_info/time_within_train_step": 2.7195634841918945, "step": 2406} {"train_info/time_between_train_steps": 0.0029060840606689453, "step": 2406} {"info/global_step": 2407, "train_info/time_within_train_step": 2.7508931159973145, "step": 2407} {"train_info/time_between_train_steps": 0.002849578857421875, "step": 2407} {"info/global_step": 2408, "train_info/time_within_train_step": 2.7523059844970703, "step": 2408} {"train_info/time_between_train_steps": 0.002869844436645508, "step": 2408} {"info/global_step": 2409, "train_info/time_within_train_step": 2.753926992416382, "step": 2409} {"train_info/time_between_train_steps": 0.002856731414794922, "step": 2409} {"info/global_step": 2410, "train_info/time_within_train_step": 2.7534735202789307, "step": 2410} {"train_info/time_between_train_steps": 0.002908468246459961, "step": 2410} {"info/global_step": 2411, "train_info/time_within_train_step": 2.7549028396606445, "step": 2411} {"train_info/time_between_train_steps": 0.0028564929962158203, "step": 2411} {"info/global_step": 2412, "train_info/time_within_train_step": 2.754135847091675, "step": 2412} {"train_info/time_between_train_steps": 0.002833843231201172, "step": 2412} {"info/global_step": 2413, "train_info/time_within_train_step": 2.7534642219543457, "step": 2413} {"train_info/time_between_train_steps": 0.0028526782989501953, "step": 2413} {"info/global_step": 2414, "train_info/time_within_train_step": 2.7546374797821045, "step": 2414} {"train_info/time_between_train_steps": 0.0028803348541259766, "step": 2414} {"info/global_step": 2415, "train_info/time_within_train_step": 2.754570960998535, "step": 2415} {"train_info/time_between_train_steps": 0.002869844436645508, "step": 2415} {"info/global_step": 2416, "train_info/time_within_train_step": 2.753828763961792, "step": 2416} {"train_info/time_between_train_steps": 0.002841472625732422, "step": 2416} {"info/global_step": 2417, "train_info/time_within_train_step": 2.754283905029297, "step": 2417} {"train_info/time_between_train_steps": 0.0029363632202148438, "step": 2417} {"info/global_step": 2418, "train_info/time_within_train_step": 2.7537569999694824, "step": 2418} {"train_info/time_between_train_steps": 0.0028603076934814453, "step": 2418} {"info/global_step": 2419, "train_info/time_within_train_step": 2.7541842460632324, "step": 2419} {"train_info/time_between_train_steps": 0.0028543472290039062, "step": 2419} {"info/global_step": 2420, "train_info/time_within_train_step": 2.7537589073181152, "step": 2420} {"train_info/time_between_train_steps": 0.002862215042114258, "step": 2420} {"info/global_step": 2421, "train_info/time_within_train_step": 2.755249261856079, "step": 2421} {"train_info/time_between_train_steps": 0.00287628173828125, "step": 2421} {"info/global_step": 2422, "train_info/time_within_train_step": 2.7602992057800293, "step": 2422} {"train_info/time_between_train_steps": 0.0028390884399414062, "step": 2422} {"info/global_step": 2423, "train_info/time_within_train_step": 2.7550618648529053, "step": 2423} {"train_info/time_between_train_steps": 0.0028524398803710938, "step": 2423} {"info/global_step": 2424, "train_info/time_within_train_step": 2.754242181777954, "step": 2424} {"train_info/time_between_train_steps": 0.0028655529022216797, "step": 2424} {"info/global_step": 2425, "train_info/time_within_train_step": 2.7535314559936523, "step": 2425} {"train_info/time_between_train_steps": 0.002844572067260742, "step": 2425} {"info/global_step": 2426, "train_info/time_within_train_step": 2.753618001937866, "step": 2426} {"train_info/time_between_train_steps": 0.0033376216888427734, "step": 2426} {"info/global_step": 2427, "train_info/time_within_train_step": 2.754661798477173, "step": 2427} {"train_info/time_between_train_steps": 0.002857208251953125, "step": 2427} {"info/global_step": 2428, "train_info/time_within_train_step": 2.754688024520874, "step": 2428} {"train_info/time_between_train_steps": 0.0028650760650634766, "step": 2428} {"info/global_step": 2429, "train_info/time_within_train_step": 2.754129648208618, "step": 2429} {"train_info/time_between_train_steps": 0.002891063690185547, "step": 2429} {"info/global_step": 2430, "train_info/time_within_train_step": 2.7558298110961914, "step": 2430} {"train_info/time_between_train_steps": 0.002855062484741211, "step": 2430} {"info/global_step": 2431, "train_info/time_within_train_step": 2.755695104598999, "step": 2431} {"train_info/time_between_train_steps": 0.0028443336486816406, "step": 2431} {"info/global_step": 2432, "train_info/time_within_train_step": 2.7552926540374756, "step": 2432} {"train_info/time_between_train_steps": 0.0028731822967529297, "step": 2432} {"info/global_step": 2433, "train_info/time_within_train_step": 2.755345106124878, "step": 2433} {"train_info/time_between_train_steps": 0.0028765201568603516, "step": 2433} {"info/global_step": 2434, "train_info/time_within_train_step": 2.755981206893921, "step": 2434} {"train_info/time_between_train_steps": 0.002905130386352539, "step": 2434} {"info/global_step": 2435, "train_info/time_within_train_step": 2.754678249359131, "step": 2435} {"train_info/time_between_train_steps": 0.0028619766235351562, "step": 2435} {"info/global_step": 2436, "train_info/time_within_train_step": 2.756608009338379, "step": 2436} {"train_info/time_between_train_steps": 0.0028564929962158203, "step": 2436} {"info/global_step": 2437, "train_info/time_within_train_step": 2.7544445991516113, "step": 2437} {"train_info/time_between_train_steps": 0.0029015541076660156, "step": 2437} {"info/global_step": 2438, "train_info/time_within_train_step": 2.754748821258545, "step": 2438} {"train_info/time_between_train_steps": 0.002872467041015625, "step": 2438} {"info/global_step": 2439, "train_info/time_within_train_step": 2.7545270919799805, "step": 2439} {"train_info/time_between_train_steps": 0.002905607223510742, "step": 2439} {"info/global_step": 2440, "train_info/time_within_train_step": 2.7543954849243164, "step": 2440} {"train_info/time_between_train_steps": 0.002900838851928711, "step": 2440} {"info/global_step": 2441, "train_info/time_within_train_step": 2.7535855770111084, "step": 2441} {"train_info/time_between_train_steps": 0.002877950668334961, "step": 2441} {"info/global_step": 2442, "train_info/time_within_train_step": 2.7527031898498535, "step": 2442} {"train_info/time_between_train_steps": 0.002919435501098633, "step": 2442} {"info/global_step": 2443, "train_info/time_within_train_step": 2.753948926925659, "step": 2443} {"train_info/time_between_train_steps": 0.002902507781982422, "step": 2443} {"info/global_step": 2444, "train_info/time_within_train_step": 2.753267288208008, "step": 2444} {"train_info/time_between_train_steps": 0.002875089645385742, "step": 2444} {"info/global_step": 2445, "train_info/time_within_train_step": 2.7533295154571533, "step": 2445} {"train_info/time_between_train_steps": 0.002851247787475586, "step": 2445} {"info/global_step": 2446, "train_info/time_within_train_step": 2.753765106201172, "step": 2446} {"train_info/time_between_train_steps": 0.0028655529022216797, "step": 2446} {"info/global_step": 2447, "train_info/time_within_train_step": 2.7557778358459473, "step": 2447} {"train_info/time_between_train_steps": 0.0028123855590820312, "step": 2447} {"info/global_step": 2448, "train_info/time_within_train_step": 2.7538115978240967, "step": 2448} {"train_info/time_between_train_steps": 0.0028502941131591797, "step": 2448} {"info/global_step": 2449, "train_info/time_within_train_step": 2.7543160915374756, "step": 2449} {"train_info/time_between_train_steps": 0.0028574466705322266, "step": 2449} {"info/global_step": 2450, "train_info/time_within_train_step": 2.7545461654663086, "step": 2450} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746573163, "_runtime": 7172}, "step": 2450} {"logs": {"train/loss": 4.1977, "train/learning_rate": 0.0005033333333333333, "train/epoch": 2.07, "_timestamp": 1746573163, "_runtime": 7172}, "step": 2450} {"train_info/time_between_train_steps": 0.013475656509399414, "step": 2450} {"info/global_step": 2451, "train_info/time_within_train_step": 2.75557804107666, "step": 2451} {"train_info/time_between_train_steps": 0.002828359603881836, "step": 2451} {"info/global_step": 2452, "train_info/time_within_train_step": 2.755962371826172, "step": 2452} {"train_info/time_between_train_steps": 0.0028696060180664062, "step": 2452} {"info/global_step": 2453, "train_info/time_within_train_step": 2.7548136711120605, "step": 2453} {"train_info/time_between_train_steps": 0.0028526782989501953, "step": 2453} {"info/global_step": 2454, "train_info/time_within_train_step": 2.759808301925659, "step": 2454} {"train_info/time_between_train_steps": 0.0028955936431884766, "step": 2454} {"info/global_step": 2455, "train_info/time_within_train_step": 2.75441312789917, "step": 2455} {"train_info/time_between_train_steps": 0.002887725830078125, "step": 2455} {"info/global_step": 2456, "train_info/time_within_train_step": 2.7549915313720703, "step": 2456} {"train_info/time_between_train_steps": 0.0028481483459472656, "step": 2456} {"info/global_step": 2457, "train_info/time_within_train_step": 2.7542285919189453, "step": 2457} {"train_info/time_between_train_steps": 0.002894878387451172, "step": 2457} {"info/global_step": 2458, "train_info/time_within_train_step": 2.7541298866271973, "step": 2458} {"train_info/time_between_train_steps": 0.0028998851776123047, "step": 2458} {"info/global_step": 2459, "train_info/time_within_train_step": 2.7536051273345947, "step": 2459} {"train_info/time_between_train_steps": 0.0028696060180664062, "step": 2459} {"info/global_step": 2460, "train_info/time_within_train_step": 2.7537269592285156, "step": 2460} {"train_info/time_between_train_steps": 0.002874612808227539, "step": 2460} {"info/global_step": 2461, "train_info/time_within_train_step": 2.7534632682800293, "step": 2461} {"train_info/time_between_train_steps": 0.0028867721557617188, "step": 2461} {"info/global_step": 2462, "train_info/time_within_train_step": 2.7550601959228516, "step": 2462} {"train_info/time_between_train_steps": 0.002899646759033203, "step": 2462} {"info/global_step": 2463, "train_info/time_within_train_step": 2.754796266555786, "step": 2463} {"train_info/time_between_train_steps": 0.0028641223907470703, "step": 2463} {"info/global_step": 2464, "train_info/time_within_train_step": 2.754246950149536, "step": 2464} {"train_info/time_between_train_steps": 0.0028629302978515625, "step": 2464} {"info/global_step": 2465, "train_info/time_within_train_step": 2.7542383670806885, "step": 2465} {"train_info/time_between_train_steps": 0.00286102294921875, "step": 2465} {"info/global_step": 2466, "train_info/time_within_train_step": 2.7550134658813477, "step": 2466} {"train_info/time_between_train_steps": 0.0028955936431884766, "step": 2466} {"info/global_step": 2467, "train_info/time_within_train_step": 2.754256010055542, "step": 2467} {"train_info/time_between_train_steps": 0.002889394760131836, "step": 2467} {"info/global_step": 2468, "train_info/time_within_train_step": 2.7548155784606934, "step": 2468} {"train_info/time_between_train_steps": 0.002900838851928711, "step": 2468} {"info/global_step": 2469, "train_info/time_within_train_step": 2.7542691230773926, "step": 2469} {"train_info/time_between_train_steps": 0.0029091835021972656, "step": 2469} {"info/global_step": 2470, "train_info/time_within_train_step": 2.7544612884521484, "step": 2470} {"train_info/time_between_train_steps": 0.0028772354125976562, "step": 2470} {"info/global_step": 2471, "train_info/time_within_train_step": 2.7555582523345947, "step": 2471} {"train_info/time_between_train_steps": 0.0028955936431884766, "step": 2471} {"info/global_step": 2472, "train_info/time_within_train_step": 2.753822088241577, "step": 2472} {"train_info/time_between_train_steps": 0.0029273033142089844, "step": 2472} {"info/global_step": 2473, "train_info/time_within_train_step": 2.7543556690216064, "step": 2473} {"train_info/time_between_train_steps": 0.002858877182006836, "step": 2473} {"info/global_step": 2474, "train_info/time_within_train_step": 2.752969980239868, "step": 2474} {"train_info/time_between_train_steps": 0.0028603076934814453, "step": 2474} {"info/global_step": 2475, "train_info/time_within_train_step": 2.75368595123291, "step": 2475} {"train_info/time_between_train_steps": 0.00289154052734375, "step": 2475} {"info/global_step": 2476, "train_info/time_within_train_step": 2.753396511077881, "step": 2476} {"train_info/time_between_train_steps": 0.0028951168060302734, "step": 2476} {"info/global_step": 2477, "train_info/time_within_train_step": 2.7541565895080566, "step": 2477} {"train_info/time_between_train_steps": 0.0028951168060302734, "step": 2477} {"info/global_step": 2478, "train_info/time_within_train_step": 2.75463604927063, "step": 2478} {"train_info/time_between_train_steps": 0.002882242202758789, "step": 2478} {"info/global_step": 2479, "train_info/time_within_train_step": 2.754092216491699, "step": 2479} {"train_info/time_between_train_steps": 0.002857208251953125, "step": 2479} {"info/global_step": 2480, "train_info/time_within_train_step": 2.754561185836792, "step": 2480} {"train_info/time_between_train_steps": 0.002881288528442383, "step": 2480} {"info/global_step": 2481, "train_info/time_within_train_step": 2.828941583633423, "step": 2481} {"train_info/time_between_train_steps": 0.0028700828552246094, "step": 2481} {"info/global_step": 2482, "train_info/time_within_train_step": 2.7537386417388916, "step": 2482} {"train_info/time_between_train_steps": 0.002863645553588867, "step": 2482} {"info/global_step": 2483, "train_info/time_within_train_step": 2.7539525032043457, "step": 2483} {"train_info/time_between_train_steps": 0.0028841495513916016, "step": 2483} {"info/global_step": 2484, "train_info/time_within_train_step": 2.755038261413574, "step": 2484} {"train_info/time_between_train_steps": 0.0028853416442871094, "step": 2484} {"info/global_step": 2485, "train_info/time_within_train_step": 2.7546987533569336, "step": 2485} {"train_info/time_between_train_steps": 0.002869129180908203, "step": 2485} {"info/global_step": 2486, "train_info/time_within_train_step": 2.7539334297180176, "step": 2486} {"train_info/time_between_train_steps": 0.0028870105743408203, "step": 2486} {"info/global_step": 2487, "train_info/time_within_train_step": 2.754708766937256, "step": 2487} {"train_info/time_between_train_steps": 0.0028574466705322266, "step": 2487} {"info/global_step": 2488, "train_info/time_within_train_step": 2.7548601627349854, "step": 2488} {"train_info/time_between_train_steps": 0.0028564929962158203, "step": 2488} {"info/global_step": 2489, "train_info/time_within_train_step": 2.7543137073516846, "step": 2489} {"train_info/time_between_train_steps": 0.0028731822967529297, "step": 2489} {"info/global_step": 2490, "train_info/time_within_train_step": 2.7539544105529785, "step": 2490} {"train_info/time_between_train_steps": 0.0028870105743408203, "step": 2490} {"info/global_step": 2491, "train_info/time_within_train_step": 2.7522411346435547, "step": 2491} {"train_info/time_between_train_steps": 0.002875089645385742, "step": 2491} {"info/global_step": 2492, "train_info/time_within_train_step": 2.753328800201416, "step": 2492} {"train_info/time_between_train_steps": 0.0028891563415527344, "step": 2492} {"info/global_step": 2493, "train_info/time_within_train_step": 2.754467010498047, "step": 2493} {"train_info/time_between_train_steps": 0.002877950668334961, "step": 2493} {"info/global_step": 2494, "train_info/time_within_train_step": 2.7542293071746826, "step": 2494} {"train_info/time_between_train_steps": 0.002866506576538086, "step": 2494} {"info/global_step": 2495, "train_info/time_within_train_step": 2.7546536922454834, "step": 2495} {"train_info/time_between_train_steps": 0.002857685089111328, "step": 2495} {"info/global_step": 2496, "train_info/time_within_train_step": 2.7546417713165283, "step": 2496} {"train_info/time_between_train_steps": 0.002862215042114258, "step": 2496} {"info/global_step": 2497, "train_info/time_within_train_step": 2.7519354820251465, "step": 2497} {"train_info/time_between_train_steps": 0.002892732620239258, "step": 2497} {"info/global_step": 2498, "train_info/time_within_train_step": 2.7550220489501953, "step": 2498} {"train_info/time_between_train_steps": 0.002873659133911133, "step": 2498} {"info/global_step": 2499, "train_info/time_within_train_step": 3.3598132133483887, "step": 2499} {"train_info/time_between_train_steps": 0.0028836727142333984, "step": 2499} {"info/global_step": 2500, "train_info/time_within_train_step": 2.7508037090301514, "step": 2500} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746573302, "_runtime": 7311}, "step": 2500} {"logs": {"train/loss": 4.1841, "train/learning_rate": 0.0005, "train/epoch": 2.08, "_timestamp": 1746573302, "_runtime": 7311}, "step": 2500} {"train_info/time_between_train_steps": 0.014342308044433594, "step": 2500} {"info/global_step": 2501, "train_info/time_within_train_step": 2.754415273666382, "step": 2501} {"train_info/time_between_train_steps": 0.002836942672729492, "step": 2501} {"info/global_step": 2502, "train_info/time_within_train_step": 2.75264835357666, "step": 2502} {"train_info/time_between_train_steps": 0.002869844436645508, "step": 2502} {"info/global_step": 2503, "train_info/time_within_train_step": 2.7538607120513916, "step": 2503} {"train_info/time_between_train_steps": 0.0028738975524902344, "step": 2503} {"info/global_step": 2504, "train_info/time_within_train_step": 2.7525699138641357, "step": 2504} {"train_info/time_between_train_steps": 0.0028755664825439453, "step": 2504} {"info/global_step": 2505, "train_info/time_within_train_step": 2.755049705505371, "step": 2505} {"train_info/time_between_train_steps": 0.0028829574584960938, "step": 2505} {"info/global_step": 2506, "train_info/time_within_train_step": 2.754420518875122, "step": 2506} {"train_info/time_between_train_steps": 0.0028793811798095703, "step": 2506} {"info/global_step": 2507, "train_info/time_within_train_step": 2.7542495727539062, "step": 2507} {"train_info/time_between_train_steps": 0.00290679931640625, "step": 2507} {"info/global_step": 2508, "train_info/time_within_train_step": 2.7525522708892822, "step": 2508} {"train_info/time_between_train_steps": 0.0029053688049316406, "step": 2508} {"info/global_step": 2509, "train_info/time_within_train_step": 2.754516124725342, "step": 2509} {"train_info/time_between_train_steps": 0.0028574466705322266, "step": 2509} {"info/global_step": 2510, "train_info/time_within_train_step": 2.7537429332733154, "step": 2510} {"train_info/time_between_train_steps": 0.002920389175415039, "step": 2510} {"info/global_step": 2511, "train_info/time_within_train_step": 2.7535817623138428, "step": 2511} {"train_info/time_between_train_steps": 0.002881765365600586, "step": 2511} {"info/global_step": 2512, "train_info/time_within_train_step": 2.754950523376465, "step": 2512} {"train_info/time_between_train_steps": 0.0029418468475341797, "step": 2512} {"info/global_step": 2513, "train_info/time_within_train_step": 2.752451181411743, "step": 2513} {"train_info/time_between_train_steps": 0.0029306411743164062, "step": 2513} {"info/global_step": 2514, "train_info/time_within_train_step": 2.7537596225738525, "step": 2514} {"train_info/time_between_train_steps": 0.00292205810546875, "step": 2514} {"info/global_step": 2515, "train_info/time_within_train_step": 2.7535316944122314, "step": 2515} {"train_info/time_between_train_steps": 0.0028810501098632812, "step": 2515} {"info/global_step": 2516, "train_info/time_within_train_step": 2.7527122497558594, "step": 2516} {"train_info/time_between_train_steps": 0.002925395965576172, "step": 2516} {"info/global_step": 2517, "train_info/time_within_train_step": 2.7533984184265137, "step": 2517} {"train_info/time_between_train_steps": 0.002885103225708008, "step": 2517} {"info/global_step": 2518, "train_info/time_within_train_step": 2.754582405090332, "step": 2518} {"train_info/time_between_train_steps": 0.003009796142578125, "step": 2518} {"info/global_step": 2519, "train_info/time_within_train_step": 2.7539329528808594, "step": 2519} {"train_info/time_between_train_steps": 0.002964019775390625, "step": 2519} {"info/global_step": 2520, "train_info/time_within_train_step": 2.753922462463379, "step": 2520} {"train_info/time_between_train_steps": 0.002977132797241211, "step": 2520} {"info/global_step": 2521, "train_info/time_within_train_step": 2.753591299057007, "step": 2521} {"train_info/time_between_train_steps": 0.003003358840942383, "step": 2521} {"info/global_step": 2522, "train_info/time_within_train_step": 2.7549211978912354, "step": 2522} {"train_info/time_between_train_steps": 0.002897977828979492, "step": 2522} {"info/global_step": 2523, "train_info/time_within_train_step": 2.754145383834839, "step": 2523} {"train_info/time_between_train_steps": 0.003017425537109375, "step": 2523} {"info/global_step": 2524, "train_info/time_within_train_step": 2.755439281463623, "step": 2524} {"train_info/time_between_train_steps": 0.0028710365295410156, "step": 2524} {"info/global_step": 2525, "train_info/time_within_train_step": 2.753824234008789, "step": 2525} {"train_info/time_between_train_steps": 0.0030143260955810547, "step": 2525} {"info/global_step": 2526, "train_info/time_within_train_step": 2.754004955291748, "step": 2526} {"train_info/time_between_train_steps": 0.0029594898223876953, "step": 2526} {"info/global_step": 2527, "train_info/time_within_train_step": 2.754239559173584, "step": 2527} {"train_info/time_between_train_steps": 0.0029535293579101562, "step": 2527} {"info/global_step": 2528, "train_info/time_within_train_step": 2.7551462650299072, "step": 2528} {"train_info/time_between_train_steps": 0.0029976367950439453, "step": 2528} {"info/global_step": 2529, "train_info/time_within_train_step": 2.753228187561035, "step": 2529} {"train_info/time_between_train_steps": 0.002843618392944336, "step": 2529} {"info/global_step": 2530, "train_info/time_within_train_step": 2.753229856491089, "step": 2530} {"train_info/time_between_train_steps": 0.002969503402709961, "step": 2530} {"info/global_step": 2531, "train_info/time_within_train_step": 2.7541589736938477, "step": 2531} {"train_info/time_between_train_steps": 0.0029723644256591797, "step": 2531} {"info/global_step": 2532, "train_info/time_within_train_step": 2.754058361053467, "step": 2532} {"train_info/time_between_train_steps": 0.0029871463775634766, "step": 2532} {"info/global_step": 2533, "train_info/time_within_train_step": 2.7543482780456543, "step": 2533} {"train_info/time_between_train_steps": 0.0029158592224121094, "step": 2533} {"info/global_step": 2534, "train_info/time_within_train_step": 2.7544822692871094, "step": 2534} {"train_info/time_between_train_steps": 0.002957582473754883, "step": 2534} {"info/global_step": 2535, "train_info/time_within_train_step": 2.799771785736084, "step": 2535} {"train_info/time_between_train_steps": 0.0029401779174804688, "step": 2535} {"info/global_step": 2536, "train_info/time_within_train_step": 2.7551701068878174, "step": 2536} {"train_info/time_between_train_steps": 0.0031304359436035156, "step": 2536} {"info/global_step": 2537, "train_info/time_within_train_step": 2.754837989807129, "step": 2537} {"train_info/time_between_train_steps": 0.003016948699951172, "step": 2537} {"info/global_step": 2538, "train_info/time_within_train_step": 2.7551047801971436, "step": 2538} {"train_info/time_between_train_steps": 0.002924680709838867, "step": 2538} {"info/global_step": 2539, "train_info/time_within_train_step": 2.754058837890625, "step": 2539} {"train_info/time_between_train_steps": 0.0030257701873779297, "step": 2539} {"info/global_step": 2540, "train_info/time_within_train_step": 2.7532601356506348, "step": 2540} {"train_info/time_between_train_steps": 0.0029752254486083984, "step": 2540} {"info/global_step": 2541, "train_info/time_within_train_step": 2.7551333904266357, "step": 2541} {"train_info/time_between_train_steps": 0.003124713897705078, "step": 2541} {"info/global_step": 2542, "train_info/time_within_train_step": 2.754873514175415, "step": 2542} {"train_info/time_between_train_steps": 0.003111124038696289, "step": 2542} {"info/global_step": 2543, "train_info/time_within_train_step": 2.754789352416992, "step": 2543} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 2543} {"info/global_step": 2544, "train_info/time_within_train_step": 2.754241466522217, "step": 2544} {"train_info/time_between_train_steps": 0.003210306167602539, "step": 2544} {"info/global_step": 2545, "train_info/time_within_train_step": 2.75563645362854, "step": 2545} {"train_info/time_between_train_steps": 0.0030946731567382812, "step": 2545} {"info/global_step": 2546, "train_info/time_within_train_step": 2.7546093463897705, "step": 2546} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 2546} {"info/global_step": 2547, "train_info/time_within_train_step": 2.754254102706909, "step": 2547} {"train_info/time_between_train_steps": 0.003109455108642578, "step": 2547} {"info/global_step": 2548, "train_info/time_within_train_step": 2.75537371635437, "step": 2548} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 2548} {"info/global_step": 2549, "train_info/time_within_train_step": 2.7559680938720703, "step": 2549} {"train_info/time_between_train_steps": 0.0031359195709228516, "step": 2549} {"info/global_step": 2550, "train_info/time_within_train_step": 2.7556087970733643, "step": 2550} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746573441, "_runtime": 7450}, "step": 2550} {"logs": {"train/loss": 4.1695, "train/learning_rate": 0.0004966666666666666, "train/epoch": 2.08, "_timestamp": 1746573441, "_runtime": 7450}, "step": 2550} {"train_info/time_between_train_steps": 0.014137744903564453, "step": 2550} {"info/global_step": 2551, "train_info/time_within_train_step": 2.756133556365967, "step": 2551} {"train_info/time_between_train_steps": 0.0030629634857177734, "step": 2551} {"info/global_step": 2552, "train_info/time_within_train_step": 2.7550508975982666, "step": 2552} {"train_info/time_between_train_steps": 0.003113985061645508, "step": 2552} {"info/global_step": 2553, "train_info/time_within_train_step": 2.7547354698181152, "step": 2553} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 2553} {"info/global_step": 2554, "train_info/time_within_train_step": 2.755645990371704, "step": 2554} {"train_info/time_between_train_steps": 0.003290414810180664, "step": 2554} {"info/global_step": 2555, "train_info/time_within_train_step": 2.7543370723724365, "step": 2555} {"train_info/time_between_train_steps": 0.0032851696014404297, "step": 2555} {"info/global_step": 2556, "train_info/time_within_train_step": 2.7554714679718018, "step": 2556} {"train_info/time_between_train_steps": 0.0035016536712646484, "step": 2556} {"info/global_step": 2557, "train_info/time_within_train_step": 2.755061388015747, "step": 2557} {"train_info/time_between_train_steps": 0.0033159255981445312, "step": 2557} {"info/global_step": 2558, "train_info/time_within_train_step": 2.756960153579712, "step": 2558} {"train_info/time_between_train_steps": 0.0033788681030273438, "step": 2558} {"info/global_step": 2559, "train_info/time_within_train_step": 2.753448247909546, "step": 2559} {"train_info/time_between_train_steps": 0.0033621788024902344, "step": 2559} {"train_info/time_between_train_steps": 3.2429685592651367, "step": 2559} {"info/global_step": 2560, "train_info/time_within_train_step": 2.6700806617736816, "step": 2560} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 2560} {"info/global_step": 2561, "train_info/time_within_train_step": 2.7545268535614014, "step": 2561} {"train_info/time_between_train_steps": 0.0031685829162597656, "step": 2561} {"info/global_step": 2562, "train_info/time_within_train_step": 2.756096839904785, "step": 2562} {"train_info/time_between_train_steps": 0.0031228065490722656, "step": 2562} {"info/global_step": 2563, "train_info/time_within_train_step": 2.755868911743164, "step": 2563} {"train_info/time_between_train_steps": 0.003129720687866211, "step": 2563} {"info/global_step": 2564, "train_info/time_within_train_step": 2.753840923309326, "step": 2564} {"train_info/time_between_train_steps": 0.0031261444091796875, "step": 2564} {"info/global_step": 2565, "train_info/time_within_train_step": 2.753296136856079, "step": 2565} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 2565} {"info/global_step": 2566, "train_info/time_within_train_step": 2.755429744720459, "step": 2566} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 2566} {"info/global_step": 2567, "train_info/time_within_train_step": 2.754080295562744, "step": 2567} {"train_info/time_between_train_steps": 0.003123760223388672, "step": 2567} {"info/global_step": 2568, "train_info/time_within_train_step": 2.7552783489227295, "step": 2568} {"train_info/time_between_train_steps": 0.003127574920654297, "step": 2568} {"info/global_step": 2569, "train_info/time_within_train_step": 2.754357099533081, "step": 2569} {"train_info/time_between_train_steps": 0.003108501434326172, "step": 2569} {"info/global_step": 2570, "train_info/time_within_train_step": 2.756807327270508, "step": 2570} {"train_info/time_between_train_steps": 0.0031366348266601562, "step": 2570} {"info/global_step": 2571, "train_info/time_within_train_step": 2.7524497509002686, "step": 2571} {"train_info/time_between_train_steps": 0.0031206607818603516, "step": 2571} {"info/global_step": 2572, "train_info/time_within_train_step": 2.7545413970947266, "step": 2572} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 2572} {"info/global_step": 2573, "train_info/time_within_train_step": 2.7919058799743652, "step": 2573} {"train_info/time_between_train_steps": 0.0031499862670898438, "step": 2573} {"info/global_step": 2574, "train_info/time_within_train_step": 2.755307197570801, "step": 2574} {"train_info/time_between_train_steps": 0.0031266212463378906, "step": 2574} {"info/global_step": 2575, "train_info/time_within_train_step": 2.7556257247924805, "step": 2575} {"train_info/time_between_train_steps": 0.0031540393829345703, "step": 2575} {"info/global_step": 2576, "train_info/time_within_train_step": 2.7549540996551514, "step": 2576} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 2576} {"info/global_step": 2577, "train_info/time_within_train_step": 2.754729747772217, "step": 2577} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 2577} {"info/global_step": 2578, "train_info/time_within_train_step": 2.756242036819458, "step": 2578} {"train_info/time_between_train_steps": 0.0031082630157470703, "step": 2578} {"info/global_step": 2579, "train_info/time_within_train_step": 2.7567784786224365, "step": 2579} {"train_info/time_between_train_steps": 0.0031266212463378906, "step": 2579} {"info/global_step": 2580, "train_info/time_within_train_step": 2.7543835639953613, "step": 2580} {"train_info/time_between_train_steps": 0.0030863285064697266, "step": 2580} {"info/global_step": 2581, "train_info/time_within_train_step": 2.7554385662078857, "step": 2581} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 2581} {"info/global_step": 2582, "train_info/time_within_train_step": 2.7555792331695557, "step": 2582} {"train_info/time_between_train_steps": 0.003133535385131836, "step": 2582} {"info/global_step": 2583, "train_info/time_within_train_step": 2.756031036376953, "step": 2583} {"train_info/time_between_train_steps": 0.0031156539916992188, "step": 2583} {"info/global_step": 2584, "train_info/time_within_train_step": 2.7560324668884277, "step": 2584} {"train_info/time_between_train_steps": 0.0031490325927734375, "step": 2584} {"info/global_step": 2585, "train_info/time_within_train_step": 2.7541961669921875, "step": 2585} {"train_info/time_between_train_steps": 0.0031311511993408203, "step": 2585} {"info/global_step": 2586, "train_info/time_within_train_step": 2.75301194190979, "step": 2586} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 2586} {"info/global_step": 2587, "train_info/time_within_train_step": 2.7555158138275146, "step": 2587} {"train_info/time_between_train_steps": 0.0031347274780273438, "step": 2587} {"info/global_step": 2588, "train_info/time_within_train_step": 2.7558295726776123, "step": 2588} {"train_info/time_between_train_steps": 0.0031740665435791016, "step": 2588} {"info/global_step": 2589, "train_info/time_within_train_step": 2.7551190853118896, "step": 2589} {"train_info/time_between_train_steps": 0.003126382827758789, "step": 2589} {"info/global_step": 2590, "train_info/time_within_train_step": 2.755275011062622, "step": 2590} {"train_info/time_between_train_steps": 0.0031163692474365234, "step": 2590} {"info/global_step": 2591, "train_info/time_within_train_step": 2.75488543510437, "step": 2591} {"train_info/time_between_train_steps": 0.0030961036682128906, "step": 2591} {"info/global_step": 2592, "train_info/time_within_train_step": 2.7554118633270264, "step": 2592} {"train_info/time_between_train_steps": 0.003099679946899414, "step": 2592} {"info/global_step": 2593, "train_info/time_within_train_step": 2.7558350563049316, "step": 2593} {"train_info/time_between_train_steps": 0.003129243850708008, "step": 2593} {"info/global_step": 2594, "train_info/time_within_train_step": 2.9551517963409424, "step": 2594} {"train_info/time_between_train_steps": 0.003105640411376953, "step": 2594} {"info/global_step": 2595, "train_info/time_within_train_step": 2.7559566497802734, "step": 2595} {"train_info/time_between_train_steps": 0.006285429000854492, "step": 2595} {"info/global_step": 2596, "train_info/time_within_train_step": 2.7568626403808594, "step": 2596} {"train_info/time_between_train_steps": 0.006285905838012695, "step": 2596} {"info/global_step": 2597, "train_info/time_within_train_step": 2.7560787200927734, "step": 2597} {"train_info/time_between_train_steps": 0.0032224655151367188, "step": 2597} {"info/global_step": 2598, "train_info/time_within_train_step": 2.7561397552490234, "step": 2598} {"train_info/time_between_train_steps": 0.0031478404998779297, "step": 2598} {"info/global_step": 2599, "train_info/time_within_train_step": 2.755676507949829, "step": 2599} {"train_info/time_between_train_steps": 0.003124237060546875, "step": 2599} {"info/global_step": 2600, "train_info/time_within_train_step": 2.75480055809021, "step": 2600} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746573582, "_runtime": 7591}, "step": 2600} {"logs": {"train/loss": 4.209, "train/learning_rate": 0.0004933333333333333, "train/epoch": 3.0, "_timestamp": 1746573582, "_runtime": 7591}, "step": 2600} {"train_info/time_between_train_steps": 23.918346166610718, "step": 2600} {"info/global_step": 2601, "train_info/time_within_train_step": 2.5314128398895264, "step": 2601} {"train_info/time_between_train_steps": 0.0031585693359375, "step": 2601} {"info/global_step": 2602, "train_info/time_within_train_step": 2.573089361190796, "step": 2602} {"train_info/time_between_train_steps": 0.003142118453979492, "step": 2602} {"info/global_step": 2603, "train_info/time_within_train_step": 2.6987838745117188, "step": 2603} {"train_info/time_between_train_steps": 0.003156423568725586, "step": 2603} {"info/global_step": 2604, "train_info/time_within_train_step": 2.71079683303833, "step": 2604} {"train_info/time_between_train_steps": 0.0031261444091796875, "step": 2604} {"info/global_step": 2605, "train_info/time_within_train_step": 2.746802568435669, "step": 2605} {"train_info/time_between_train_steps": 0.003145456314086914, "step": 2605} {"info/global_step": 2606, "train_info/time_within_train_step": 2.7547965049743652, "step": 2606} {"train_info/time_between_train_steps": 0.003112316131591797, "step": 2606} {"info/global_step": 2607, "train_info/time_within_train_step": 2.7538974285125732, "step": 2607} {"train_info/time_between_train_steps": 0.0031189918518066406, "step": 2607} {"info/global_step": 2608, "train_info/time_within_train_step": 2.7536537647247314, "step": 2608} {"train_info/time_between_train_steps": 0.003158092498779297, "step": 2608} {"info/global_step": 2609, "train_info/time_within_train_step": 2.7534525394439697, "step": 2609} {"train_info/time_between_train_steps": 0.0031299591064453125, "step": 2609} {"info/global_step": 2610, "train_info/time_within_train_step": 2.7533349990844727, "step": 2610} {"train_info/time_between_train_steps": 0.0031251907348632812, "step": 2610} {"info/global_step": 2611, "train_info/time_within_train_step": 2.754666328430176, "step": 2611} {"train_info/time_between_train_steps": 0.0031175613403320312, "step": 2611} {"info/global_step": 2612, "train_info/time_within_train_step": 2.7534561157226562, "step": 2612} {"train_info/time_between_train_steps": 0.0031495094299316406, "step": 2612} {"info/global_step": 2613, "train_info/time_within_train_step": 2.7528586387634277, "step": 2613} {"train_info/time_between_train_steps": 0.0031392574310302734, "step": 2613} {"info/global_step": 2614, "train_info/time_within_train_step": 2.7541942596435547, "step": 2614} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 2614} {"info/global_step": 2615, "train_info/time_within_train_step": 2.754225254058838, "step": 2615} {"train_info/time_between_train_steps": 0.003162384033203125, "step": 2615} {"info/global_step": 2616, "train_info/time_within_train_step": 2.756518602371216, "step": 2616} {"train_info/time_between_train_steps": 0.003159761428833008, "step": 2616} {"info/global_step": 2617, "train_info/time_within_train_step": 2.754789352416992, "step": 2617} {"train_info/time_between_train_steps": 0.0031294822692871094, "step": 2617} {"info/global_step": 2618, "train_info/time_within_train_step": 2.7555174827575684, "step": 2618} {"train_info/time_between_train_steps": 0.0031251907348632812, "step": 2618} {"info/global_step": 2619, "train_info/time_within_train_step": 2.7554125785827637, "step": 2619} {"train_info/time_between_train_steps": 0.0031249523162841797, "step": 2619} {"info/global_step": 2620, "train_info/time_within_train_step": 2.7554829120635986, "step": 2620} {"train_info/time_between_train_steps": 0.0031316280364990234, "step": 2620} {"info/global_step": 2621, "train_info/time_within_train_step": 2.755079984664917, "step": 2621} {"train_info/time_between_train_steps": 0.003124713897705078, "step": 2621} {"info/global_step": 2622, "train_info/time_within_train_step": 2.8737003803253174, "step": 2622} {"train_info/time_between_train_steps": 0.0031266212463378906, "step": 2622} {"info/global_step": 2623, "train_info/time_within_train_step": 2.755981922149658, "step": 2623} {"train_info/time_between_train_steps": 0.0032143592834472656, "step": 2623} {"info/global_step": 2624, "train_info/time_within_train_step": 2.754967212677002, "step": 2624} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 2624} {"info/global_step": 2625, "train_info/time_within_train_step": 2.7548718452453613, "step": 2625} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 2625} {"info/global_step": 2626, "train_info/time_within_train_step": 2.7539994716644287, "step": 2626} {"train_info/time_between_train_steps": 0.003602743148803711, "step": 2626} {"info/global_step": 2627, "train_info/time_within_train_step": 2.755007028579712, "step": 2627} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 2627} {"info/global_step": 2628, "train_info/time_within_train_step": 2.7534384727478027, "step": 2628} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 2628} {"info/global_step": 2629, "train_info/time_within_train_step": 2.7549374103546143, "step": 2629} {"train_info/time_between_train_steps": 0.003140687942504883, "step": 2629} {"info/global_step": 2630, "train_info/time_within_train_step": 2.754951238632202, "step": 2630} {"train_info/time_between_train_steps": 0.0031371116638183594, "step": 2630} {"info/global_step": 2631, "train_info/time_within_train_step": 2.755786180496216, "step": 2631} {"train_info/time_between_train_steps": 0.003149747848510742, "step": 2631} {"info/global_step": 2632, "train_info/time_within_train_step": 2.7555129528045654, "step": 2632} {"train_info/time_between_train_steps": 0.003220796585083008, "step": 2632} {"info/global_step": 2633, "train_info/time_within_train_step": 2.7550318241119385, "step": 2633} {"train_info/time_between_train_steps": 0.003149271011352539, "step": 2633} {"info/global_step": 2634, "train_info/time_within_train_step": 2.7556755542755127, "step": 2634} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 2634} {"info/global_step": 2635, "train_info/time_within_train_step": 2.755385637283325, "step": 2635} {"train_info/time_between_train_steps": 0.003167390823364258, "step": 2635} {"info/global_step": 2636, "train_info/time_within_train_step": 2.7558248043060303, "step": 2636} {"train_info/time_between_train_steps": 0.0031685829162597656, "step": 2636} {"info/global_step": 2637, "train_info/time_within_train_step": 2.755524158477783, "step": 2637} {"train_info/time_between_train_steps": 0.00313568115234375, "step": 2637} {"info/global_step": 2638, "train_info/time_within_train_step": 2.755812644958496, "step": 2638} {"train_info/time_between_train_steps": 0.0031311511993408203, "step": 2638} {"info/global_step": 2639, "train_info/time_within_train_step": 2.7537424564361572, "step": 2639} {"train_info/time_between_train_steps": 0.003159761428833008, "step": 2639} {"info/global_step": 2640, "train_info/time_within_train_step": 2.7544565200805664, "step": 2640} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 2640} {"info/global_step": 2641, "train_info/time_within_train_step": 2.753484010696411, "step": 2641} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 2641} {"info/global_step": 2642, "train_info/time_within_train_step": 2.753305435180664, "step": 2642} {"train_info/time_between_train_steps": 0.003129720687866211, "step": 2642} {"info/global_step": 2643, "train_info/time_within_train_step": 2.753812551498413, "step": 2643} {"train_info/time_between_train_steps": 0.0031385421752929688, "step": 2643} {"info/global_step": 2644, "train_info/time_within_train_step": 2.75425124168396, "step": 2644} {"train_info/time_between_train_steps": 0.003139972686767578, "step": 2644} {"info/global_step": 2645, "train_info/time_within_train_step": 2.7543351650238037, "step": 2645} {"train_info/time_between_train_steps": 0.003135204315185547, "step": 2645} {"info/global_step": 2646, "train_info/time_within_train_step": 2.7546560764312744, "step": 2646} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 2646} {"info/global_step": 2647, "train_info/time_within_train_step": 2.754547119140625, "step": 2647} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 2647} {"info/global_step": 2648, "train_info/time_within_train_step": 2.754329204559326, "step": 2648} {"train_info/time_between_train_steps": 0.003116130828857422, "step": 2648} {"info/global_step": 2649, "train_info/time_within_train_step": 2.7549681663513184, "step": 2649} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 2649} {"info/global_step": 2650, "train_info/time_within_train_step": 2.7544875144958496, "step": 2650} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746573744, "_runtime": 7753}, "step": 2650} {"logs": {"train/loss": 4.1427, "train/learning_rate": 0.00049, "train/epoch": 3.01, "_timestamp": 1746573744, "_runtime": 7753}, "step": 2650} {"train_info/time_between_train_steps": 0.013477325439453125, "step": 2650} {"info/global_step": 2651, "train_info/time_within_train_step": 2.7545325756073, "step": 2651} {"train_info/time_between_train_steps": 0.003114461898803711, "step": 2651} {"info/global_step": 2652, "train_info/time_within_train_step": 2.7555644512176514, "step": 2652} {"train_info/time_between_train_steps": 0.0031359195709228516, "step": 2652} {"info/global_step": 2653, "train_info/time_within_train_step": 2.754699468612671, "step": 2653} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 2653} {"info/global_step": 2654, "train_info/time_within_train_step": 2.755044460296631, "step": 2654} {"train_info/time_between_train_steps": 0.0031342506408691406, "step": 2654} {"info/global_step": 2655, "train_info/time_within_train_step": 2.753925323486328, "step": 2655} {"train_info/time_between_train_steps": 0.003160715103149414, "step": 2655} {"info/global_step": 2656, "train_info/time_within_train_step": 2.752929925918579, "step": 2656} {"train_info/time_between_train_steps": 0.0031206607818603516, "step": 2656} {"info/global_step": 2657, "train_info/time_within_train_step": 2.7547852993011475, "step": 2657} {"train_info/time_between_train_steps": 0.003141641616821289, "step": 2657} {"info/global_step": 2658, "train_info/time_within_train_step": 2.75174617767334, "step": 2658} {"train_info/time_between_train_steps": 0.003201007843017578, "step": 2658} {"info/global_step": 2659, "train_info/time_within_train_step": 2.7525739669799805, "step": 2659} {"train_info/time_between_train_steps": 0.003133535385131836, "step": 2659} {"info/global_step": 2660, "train_info/time_within_train_step": 2.7545876502990723, "step": 2660} {"train_info/time_between_train_steps": 0.003129243850708008, "step": 2660} {"info/global_step": 2661, "train_info/time_within_train_step": 2.7552037239074707, "step": 2661} {"train_info/time_between_train_steps": 0.003141164779663086, "step": 2661} {"info/global_step": 2662, "train_info/time_within_train_step": 2.7547855377197266, "step": 2662} {"train_info/time_between_train_steps": 0.003118276596069336, "step": 2662} {"info/global_step": 2663, "train_info/time_within_train_step": 2.7550582885742188, "step": 2663} {"train_info/time_between_train_steps": 0.0031440258026123047, "step": 2663} {"info/global_step": 2664, "train_info/time_within_train_step": 2.7549962997436523, "step": 2664} {"train_info/time_between_train_steps": 0.0031495094299316406, "step": 2664} {"info/global_step": 2665, "train_info/time_within_train_step": 2.7551708221435547, "step": 2665} {"train_info/time_between_train_steps": 0.0031256675720214844, "step": 2665} {"info/global_step": 2666, "train_info/time_within_train_step": 2.7539849281311035, "step": 2666} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 2666} {"info/global_step": 2667, "train_info/time_within_train_step": 2.7535815238952637, "step": 2667} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 2667} {"info/global_step": 2668, "train_info/time_within_train_step": 2.7549855709075928, "step": 2668} {"train_info/time_between_train_steps": 0.003113269805908203, "step": 2668} {"info/global_step": 2669, "train_info/time_within_train_step": 2.754232883453369, "step": 2669} {"train_info/time_between_train_steps": 0.003130674362182617, "step": 2669} {"info/global_step": 2670, "train_info/time_within_train_step": 2.7545385360717773, "step": 2670} {"train_info/time_between_train_steps": 0.003115415573120117, "step": 2670} {"info/global_step": 2671, "train_info/time_within_train_step": 2.7541439533233643, "step": 2671} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 2671} {"info/global_step": 2672, "train_info/time_within_train_step": 2.7537572383880615, "step": 2672} {"train_info/time_between_train_steps": 0.003124237060546875, "step": 2672} {"info/global_step": 2673, "train_info/time_within_train_step": 2.751732349395752, "step": 2673} {"train_info/time_between_train_steps": 0.003107309341430664, "step": 2673} {"info/global_step": 2674, "train_info/time_within_train_step": 2.7535979747772217, "step": 2674} {"train_info/time_between_train_steps": 0.0031523704528808594, "step": 2674} {"info/global_step": 2675, "train_info/time_within_train_step": 2.965712070465088, "step": 2675} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 2675} {"info/global_step": 2676, "train_info/time_within_train_step": 2.754077434539795, "step": 2676} {"train_info/time_between_train_steps": 0.003108978271484375, "step": 2676} {"info/global_step": 2677, "train_info/time_within_train_step": 2.7526426315307617, "step": 2677} {"train_info/time_between_train_steps": 0.0031228065490722656, "step": 2677} {"info/global_step": 2678, "train_info/time_within_train_step": 2.7543532848358154, "step": 2678} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 2678} {"info/global_step": 2679, "train_info/time_within_train_step": 2.7548766136169434, "step": 2679} {"train_info/time_between_train_steps": 0.0031282901763916016, "step": 2679} {"info/global_step": 2680, "train_info/time_within_train_step": 2.7520101070404053, "step": 2680} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 2680} {"info/global_step": 2681, "train_info/time_within_train_step": 2.754391670227051, "step": 2681} {"train_info/time_between_train_steps": 0.0031528472900390625, "step": 2681} {"info/global_step": 2682, "train_info/time_within_train_step": 2.754060745239258, "step": 2682} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 2682} {"info/global_step": 2683, "train_info/time_within_train_step": 2.753894567489624, "step": 2683} {"train_info/time_between_train_steps": 0.0031456947326660156, "step": 2683} {"info/global_step": 2684, "train_info/time_within_train_step": 2.7536888122558594, "step": 2684} {"train_info/time_between_train_steps": 0.12305355072021484, "step": 2684} {"info/global_step": 2685, "train_info/time_within_train_step": 2.753497838973999, "step": 2685} {"train_info/time_between_train_steps": 0.0031316280364990234, "step": 2685} {"info/global_step": 2686, "train_info/time_within_train_step": 2.752833127975464, "step": 2686} {"train_info/time_between_train_steps": 0.0032122135162353516, "step": 2686} {"info/global_step": 2687, "train_info/time_within_train_step": 2.7527077198028564, "step": 2687} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 2687} {"info/global_step": 2688, "train_info/time_within_train_step": 2.7516891956329346, "step": 2688} {"train_info/time_between_train_steps": 0.003136157989501953, "step": 2688} {"info/global_step": 2689, "train_info/time_within_train_step": 2.752023935317993, "step": 2689} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 2689} {"info/global_step": 2690, "train_info/time_within_train_step": 2.753627300262451, "step": 2690} {"train_info/time_between_train_steps": 0.003143310546875, "step": 2690} {"info/global_step": 2691, "train_info/time_within_train_step": 2.7528316974639893, "step": 2691} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 2691} {"info/global_step": 2692, "train_info/time_within_train_step": 2.7534146308898926, "step": 2692} {"train_info/time_between_train_steps": 0.0031354427337646484, "step": 2692} {"info/global_step": 2693, "train_info/time_within_train_step": 2.7540442943573, "step": 2693} {"train_info/time_between_train_steps": 0.003127574920654297, "step": 2693} {"info/global_step": 2694, "train_info/time_within_train_step": 2.754399538040161, "step": 2694} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 2694} {"info/global_step": 2695, "train_info/time_within_train_step": 2.7522292137145996, "step": 2695} {"train_info/time_between_train_steps": 0.0031578540802001953, "step": 2695} {"info/global_step": 2696, "train_info/time_within_train_step": 2.754210948944092, "step": 2696} {"train_info/time_between_train_steps": 0.003132343292236328, "step": 2696} {"info/global_step": 2697, "train_info/time_within_train_step": 2.75597882270813, "step": 2697} {"train_info/time_between_train_steps": 0.0031380653381347656, "step": 2697} {"info/global_step": 2698, "train_info/time_within_train_step": 2.754368782043457, "step": 2698} {"train_info/time_between_train_steps": 0.003196239471435547, "step": 2698} {"info/global_step": 2699, "train_info/time_within_train_step": 2.7530767917633057, "step": 2699} {"train_info/time_between_train_steps": 0.0031270980834960938, "step": 2699} {"info/global_step": 2700, "train_info/time_within_train_step": 2.753692388534546, "step": 2700} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746573883, "_runtime": 7892}, "step": 2700} {"logs": {"train/loss": 4.1279, "train/learning_rate": 0.0004866666666666666, "train/epoch": 3.01, "_timestamp": 1746573883, "_runtime": 7892}, "step": 2700} {"train_info/time_between_train_steps": 0.013303995132446289, "step": 2700} {"info/global_step": 2701, "train_info/time_within_train_step": 2.753418207168579, "step": 2701} {"train_info/time_between_train_steps": 0.003144502639770508, "step": 2701} {"info/global_step": 2702, "train_info/time_within_train_step": 2.754242181777954, "step": 2702} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 2702} {"info/global_step": 2703, "train_info/time_within_train_step": 2.755138397216797, "step": 2703} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 2703} {"info/global_step": 2704, "train_info/time_within_train_step": 2.7533767223358154, "step": 2704} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 2704} {"info/global_step": 2705, "train_info/time_within_train_step": 2.7540738582611084, "step": 2705} {"train_info/time_between_train_steps": 0.00313568115234375, "step": 2705} {"info/global_step": 2706, "train_info/time_within_train_step": 2.7536444664001465, "step": 2706} {"train_info/time_between_train_steps": 0.003136157989501953, "step": 2706} {"info/global_step": 2707, "train_info/time_within_train_step": 2.7535972595214844, "step": 2707} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 2707} {"info/global_step": 2708, "train_info/time_within_train_step": 2.754239797592163, "step": 2708} {"train_info/time_between_train_steps": 0.0031299591064453125, "step": 2708} {"info/global_step": 2709, "train_info/time_within_train_step": 2.7543773651123047, "step": 2709} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 2709} {"info/global_step": 2710, "train_info/time_within_train_step": 2.754239797592163, "step": 2710} {"train_info/time_between_train_steps": 0.0031495094299316406, "step": 2710} {"info/global_step": 2711, "train_info/time_within_train_step": 2.7550172805786133, "step": 2711} {"train_info/time_between_train_steps": 0.0031235218048095703, "step": 2711} {"info/global_step": 2712, "train_info/time_within_train_step": 2.754523277282715, "step": 2712} {"train_info/time_between_train_steps": 0.0031402111053466797, "step": 2712} {"info/global_step": 2713, "train_info/time_within_train_step": 2.7540433406829834, "step": 2713} {"train_info/time_between_train_steps": 0.0031232833862304688, "step": 2713} {"info/global_step": 2714, "train_info/time_within_train_step": 2.753795862197876, "step": 2714} {"train_info/time_between_train_steps": 0.0031898021697998047, "step": 2714} {"info/global_step": 2715, "train_info/time_within_train_step": 2.7545783519744873, "step": 2715} {"train_info/time_between_train_steps": 0.003232240676879883, "step": 2715} {"info/global_step": 2716, "train_info/time_within_train_step": 2.7542757987976074, "step": 2716} {"train_info/time_between_train_steps": 0.003239154815673828, "step": 2716} {"info/global_step": 2717, "train_info/time_within_train_step": 2.752776622772217, "step": 2717} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 2717} {"info/global_step": 2718, "train_info/time_within_train_step": 2.754782199859619, "step": 2718} {"train_info/time_between_train_steps": 0.0032377243041992188, "step": 2718} {"info/global_step": 2719, "train_info/time_within_train_step": 2.753856658935547, "step": 2719} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 2719} {"info/global_step": 2720, "train_info/time_within_train_step": 2.7544164657592773, "step": 2720} {"train_info/time_between_train_steps": 0.003221750259399414, "step": 2720} {"info/global_step": 2721, "train_info/time_within_train_step": 2.7534821033477783, "step": 2721} {"train_info/time_between_train_steps": 0.0032258033752441406, "step": 2721} {"info/global_step": 2722, "train_info/time_within_train_step": 2.7540414333343506, "step": 2722} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 2722} {"info/global_step": 2723, "train_info/time_within_train_step": 2.7539525032043457, "step": 2723} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 2723} {"info/global_step": 2724, "train_info/time_within_train_step": 2.7522804737091064, "step": 2724} {"train_info/time_between_train_steps": 0.0032029151916503906, "step": 2724} {"info/global_step": 2725, "train_info/time_within_train_step": 2.754127025604248, "step": 2725} {"train_info/time_between_train_steps": 0.0031304359436035156, "step": 2725} {"info/global_step": 2726, "train_info/time_within_train_step": 2.7531676292419434, "step": 2726} {"train_info/time_between_train_steps": 0.003184795379638672, "step": 2726} {"info/global_step": 2727, "train_info/time_within_train_step": 2.7545015811920166, "step": 2727} {"train_info/time_between_train_steps": 0.0031499862670898438, "step": 2727} {"info/global_step": 2728, "train_info/time_within_train_step": 2.753239393234253, "step": 2728} {"train_info/time_between_train_steps": 0.003119945526123047, "step": 2728} {"info/global_step": 2729, "train_info/time_within_train_step": 2.975782871246338, "step": 2729} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 2729} {"info/global_step": 2730, "train_info/time_within_train_step": 2.753239870071411, "step": 2730} {"train_info/time_between_train_steps": 0.003130197525024414, "step": 2730} {"info/global_step": 2731, "train_info/time_within_train_step": 2.7529280185699463, "step": 2731} {"train_info/time_between_train_steps": 0.0031549930572509766, "step": 2731} {"info/global_step": 2732, "train_info/time_within_train_step": 2.7554287910461426, "step": 2732} {"train_info/time_between_train_steps": 0.0031442642211914062, "step": 2732} {"info/global_step": 2733, "train_info/time_within_train_step": 2.754725694656372, "step": 2733} {"train_info/time_between_train_steps": 0.003194093704223633, "step": 2733} {"info/global_step": 2734, "train_info/time_within_train_step": 2.7532384395599365, "step": 2734} {"train_info/time_between_train_steps": 0.0031023025512695312, "step": 2734} {"info/global_step": 2735, "train_info/time_within_train_step": 2.7536866664886475, "step": 2735} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 2735} {"info/global_step": 2736, "train_info/time_within_train_step": 2.753617525100708, "step": 2736} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 2736} {"info/global_step": 2737, "train_info/time_within_train_step": 2.756194829940796, "step": 2737} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 2737} {"info/global_step": 2738, "train_info/time_within_train_step": 2.754032850265503, "step": 2738} {"train_info/time_between_train_steps": 0.0032129287719726562, "step": 2738} {"info/global_step": 2739, "train_info/time_within_train_step": 2.7520711421966553, "step": 2739} {"train_info/time_between_train_steps": 0.0032405853271484375, "step": 2739} {"info/global_step": 2740, "train_info/time_within_train_step": 2.7535693645477295, "step": 2740} {"train_info/time_between_train_steps": 0.003228425979614258, "step": 2740} {"info/global_step": 2741, "train_info/time_within_train_step": 2.753143787384033, "step": 2741} {"train_info/time_between_train_steps": 0.003214120864868164, "step": 2741} {"info/global_step": 2742, "train_info/time_within_train_step": 2.7532787322998047, "step": 2742} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 2742} {"info/global_step": 2743, "train_info/time_within_train_step": 2.753108501434326, "step": 2743} {"train_info/time_between_train_steps": 0.0032541751861572266, "step": 2743} {"info/global_step": 2744, "train_info/time_within_train_step": 2.754112482070923, "step": 2744} {"train_info/time_between_train_steps": 0.003198385238647461, "step": 2744} {"info/global_step": 2745, "train_info/time_within_train_step": 2.753926992416382, "step": 2745} {"train_info/time_between_train_steps": 0.003153085708618164, "step": 2745} {"info/global_step": 2746, "train_info/time_within_train_step": 2.7537434101104736, "step": 2746} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 2746} {"info/global_step": 2747, "train_info/time_within_train_step": 2.9015588760375977, "step": 2747} {"train_info/time_between_train_steps": 0.0033233165740966797, "step": 2747} {"info/global_step": 2748, "train_info/time_within_train_step": 2.755185604095459, "step": 2748} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 2748} {"info/global_step": 2749, "train_info/time_within_train_step": 3.3677048683166504, "step": 2749} {"train_info/time_between_train_steps": 0.0032150745391845703, "step": 2749} {"info/global_step": 2750, "train_info/time_within_train_step": 2.7545454502105713, "step": 2750} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746574022, "_runtime": 8031}, "step": 2750} {"logs": {"train/loss": 4.1095, "train/learning_rate": 0.0004833333333333333, "train/epoch": 3.02, "_timestamp": 1746574022, "_runtime": 8031}, "step": 2750} {"train_info/time_between_train_steps": 0.012844085693359375, "step": 2750} {"info/global_step": 2751, "train_info/time_within_train_step": 2.754420518875122, "step": 2751} {"train_info/time_between_train_steps": 0.003432750701904297, "step": 2751} {"info/global_step": 2752, "train_info/time_within_train_step": 2.7547383308410645, "step": 2752} {"train_info/time_between_train_steps": 0.003315448760986328, "step": 2752} {"info/global_step": 2753, "train_info/time_within_train_step": 2.7558276653289795, "step": 2753} {"train_info/time_between_train_steps": 0.003534078598022461, "step": 2753} {"info/global_step": 2754, "train_info/time_within_train_step": 2.753960132598877, "step": 2754} {"train_info/time_between_train_steps": 0.003689289093017578, "step": 2754} {"info/global_step": 2755, "train_info/time_within_train_step": 2.754883050918579, "step": 2755} {"train_info/time_between_train_steps": 0.0035839080810546875, "step": 2755} {"info/global_step": 2756, "train_info/time_within_train_step": 2.7552754878997803, "step": 2756} {"train_info/time_between_train_steps": 0.0036017894744873047, "step": 2756} {"info/global_step": 2757, "train_info/time_within_train_step": 2.753756284713745, "step": 2757} {"train_info/time_between_train_steps": 0.0035953521728515625, "step": 2757} {"info/global_step": 2758, "train_info/time_within_train_step": 2.754760265350342, "step": 2758} {"train_info/time_between_train_steps": 0.00348663330078125, "step": 2758} {"info/global_step": 2759, "train_info/time_within_train_step": 2.7549219131469727, "step": 2759} {"train_info/time_between_train_steps": 0.003534555435180664, "step": 2759} {"info/global_step": 2760, "train_info/time_within_train_step": 2.7557504177093506, "step": 2760} {"train_info/time_between_train_steps": 0.0035233497619628906, "step": 2760} {"info/global_step": 2761, "train_info/time_within_train_step": 2.7531356811523438, "step": 2761} {"train_info/time_between_train_steps": 0.003498077392578125, "step": 2761} {"info/global_step": 2762, "train_info/time_within_train_step": 2.754753351211548, "step": 2762} {"train_info/time_between_train_steps": 0.003553628921508789, "step": 2762} {"info/global_step": 2763, "train_info/time_within_train_step": 2.7550039291381836, "step": 2763} {"train_info/time_between_train_steps": 0.0034782886505126953, "step": 2763} {"info/global_step": 2764, "train_info/time_within_train_step": 2.755234479904175, "step": 2764} {"train_info/time_between_train_steps": 0.0036144256591796875, "step": 2764} {"info/global_step": 2765, "train_info/time_within_train_step": 2.7551889419555664, "step": 2765} {"train_info/time_between_train_steps": 0.003575563430786133, "step": 2765} {"info/global_step": 2766, "train_info/time_within_train_step": 2.7550904750823975, "step": 2766} {"train_info/time_between_train_steps": 0.0036466121673583984, "step": 2766} {"info/global_step": 2767, "train_info/time_within_train_step": 2.753166437149048, "step": 2767} {"train_info/time_between_train_steps": 0.0035064220428466797, "step": 2767} {"info/global_step": 2768, "train_info/time_within_train_step": 3.068704605102539, "step": 2768} {"train_info/time_between_train_steps": 0.0033452510833740234, "step": 2768} {"info/global_step": 2769, "train_info/time_within_train_step": 2.751880407333374, "step": 2769} {"train_info/time_between_train_steps": 0.003276348114013672, "step": 2769} {"info/global_step": 2770, "train_info/time_within_train_step": 2.753602981567383, "step": 2770} {"train_info/time_between_train_steps": 0.0032553672790527344, "step": 2770} {"info/global_step": 2771, "train_info/time_within_train_step": 2.7544729709625244, "step": 2771} {"train_info/time_between_train_steps": 0.0032911300659179688, "step": 2771} {"info/global_step": 2772, "train_info/time_within_train_step": 2.754713535308838, "step": 2772} {"train_info/time_between_train_steps": 0.003247499465942383, "step": 2772} {"info/global_step": 2773, "train_info/time_within_train_step": 2.754831075668335, "step": 2773} {"train_info/time_between_train_steps": 0.003345012664794922, "step": 2773} {"info/global_step": 2774, "train_info/time_within_train_step": 2.7543840408325195, "step": 2774} {"train_info/time_between_train_steps": 0.0032529830932617188, "step": 2774} {"info/global_step": 2775, "train_info/time_within_train_step": 2.7543575763702393, "step": 2775} {"train_info/time_between_train_steps": 0.0034437179565429688, "step": 2775} {"info/global_step": 2776, "train_info/time_within_train_step": 2.7545831203460693, "step": 2776} {"train_info/time_between_train_steps": 0.0033111572265625, "step": 2776} {"info/global_step": 2777, "train_info/time_within_train_step": 2.755254030227661, "step": 2777} {"train_info/time_between_train_steps": 0.0033462047576904297, "step": 2777} {"info/global_step": 2778, "train_info/time_within_train_step": 2.7535860538482666, "step": 2778} {"train_info/time_between_train_steps": 0.0033025741577148438, "step": 2778} {"info/global_step": 2779, "train_info/time_within_train_step": 2.7545485496520996, "step": 2779} {"train_info/time_between_train_steps": 0.003286600112915039, "step": 2779} {"info/global_step": 2780, "train_info/time_within_train_step": 2.7548608779907227, "step": 2780} {"train_info/time_between_train_steps": 0.003340482711791992, "step": 2780} {"info/global_step": 2781, "train_info/time_within_train_step": 2.7539143562316895, "step": 2781} {"train_info/time_between_train_steps": 0.0033402442932128906, "step": 2781} {"info/global_step": 2782, "train_info/time_within_train_step": 2.7555019855499268, "step": 2782} {"train_info/time_between_train_steps": 0.003337860107421875, "step": 2782} {"info/global_step": 2783, "train_info/time_within_train_step": 2.7540910243988037, "step": 2783} {"train_info/time_between_train_steps": 0.003454446792602539, "step": 2783} {"info/global_step": 2784, "train_info/time_within_train_step": 2.7540841102600098, "step": 2784} {"train_info/time_between_train_steps": 0.0034372806549072266, "step": 2784} {"info/global_step": 2785, "train_info/time_within_train_step": 2.7540700435638428, "step": 2785} {"train_info/time_between_train_steps": 0.003391742706298828, "step": 2785} {"info/global_step": 2786, "train_info/time_within_train_step": 2.755084276199341, "step": 2786} {"train_info/time_between_train_steps": 0.0033004283905029297, "step": 2786} {"info/global_step": 2787, "train_info/time_within_train_step": 2.7558610439300537, "step": 2787} {"train_info/time_between_train_steps": 0.0032372474670410156, "step": 2787} {"info/global_step": 2788, "train_info/time_within_train_step": 2.754603624343872, "step": 2788} {"train_info/time_between_train_steps": 0.003398418426513672, "step": 2788} {"info/global_step": 2789, "train_info/time_within_train_step": 2.754237651824951, "step": 2789} {"train_info/time_between_train_steps": 0.0032923221588134766, "step": 2789} {"info/global_step": 2790, "train_info/time_within_train_step": 2.7538068294525146, "step": 2790} {"train_info/time_between_train_steps": 0.003377199172973633, "step": 2790} {"info/global_step": 2791, "train_info/time_within_train_step": 2.753849983215332, "step": 2791} {"train_info/time_between_train_steps": 0.00328826904296875, "step": 2791} {"info/global_step": 2792, "train_info/time_within_train_step": 2.753911256790161, "step": 2792} {"train_info/time_between_train_steps": 0.0032966136932373047, "step": 2792} {"info/global_step": 2793, "train_info/time_within_train_step": 2.755035877227783, "step": 2793} {"train_info/time_between_train_steps": 0.0032858848571777344, "step": 2793} {"info/global_step": 2794, "train_info/time_within_train_step": 2.7537922859191895, "step": 2794} {"train_info/time_between_train_steps": 0.0032629966735839844, "step": 2794} {"info/global_step": 2795, "train_info/time_within_train_step": 2.7549564838409424, "step": 2795} {"train_info/time_between_train_steps": 0.0034122467041015625, "step": 2795} {"info/global_step": 2796, "train_info/time_within_train_step": 2.754148244857788, "step": 2796} {"train_info/time_between_train_steps": 0.0032618045806884766, "step": 2796} {"info/global_step": 2797, "train_info/time_within_train_step": 2.755152463912964, "step": 2797} {"train_info/time_between_train_steps": 0.003306150436401367, "step": 2797} {"info/global_step": 2798, "train_info/time_within_train_step": 2.753049373626709, "step": 2798} {"train_info/time_between_train_steps": 0.0032842159271240234, "step": 2798} {"info/global_step": 2799, "train_info/time_within_train_step": 2.754399538040161, "step": 2799} {"train_info/time_between_train_steps": 0.0034236907958984375, "step": 2799} {"info/global_step": 2800, "train_info/time_within_train_step": 2.7546591758728027, "step": 2800} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746574161, "_runtime": 8170}, "step": 2800} {"logs": {"train/loss": 4.1, "train/learning_rate": 0.00047999999999999996, "train/epoch": 3.02, "_timestamp": 1746574161, "_runtime": 8170}, "step": 2800} {"train_info/time_between_train_steps": 14.78260588645935, "step": 2800} {"info/global_step": 2801, "train_info/time_within_train_step": 2.5316689014434814, "step": 2801} {"train_info/time_between_train_steps": 0.003271818161010742, "step": 2801} {"info/global_step": 2802, "train_info/time_within_train_step": 2.589722156524658, "step": 2802} {"train_info/time_between_train_steps": 0.0032455921173095703, "step": 2802} {"info/global_step": 2803, "train_info/time_within_train_step": 2.7310948371887207, "step": 2803} {"train_info/time_between_train_steps": 0.0032651424407958984, "step": 2803} {"info/global_step": 2804, "train_info/time_within_train_step": 2.7510690689086914, "step": 2804} {"train_info/time_between_train_steps": 0.003347635269165039, "step": 2804} {"info/global_step": 2805, "train_info/time_within_train_step": 2.7533702850341797, "step": 2805} {"train_info/time_between_train_steps": 0.003375530242919922, "step": 2805} {"info/global_step": 2806, "train_info/time_within_train_step": 2.754636287689209, "step": 2806} {"train_info/time_between_train_steps": 0.0032320022583007812, "step": 2806} {"info/global_step": 2807, "train_info/time_within_train_step": 2.7551238536834717, "step": 2807} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 2807} {"info/global_step": 2808, "train_info/time_within_train_step": 2.755110502243042, "step": 2808} {"train_info/time_between_train_steps": 0.00324249267578125, "step": 2808} {"info/global_step": 2809, "train_info/time_within_train_step": 2.7559688091278076, "step": 2809} {"train_info/time_between_train_steps": 0.13964176177978516, "step": 2809} {"info/global_step": 2810, "train_info/time_within_train_step": 2.7767443656921387, "step": 2810} {"train_info/time_between_train_steps": 0.003333568572998047, "step": 2810} {"info/global_step": 2811, "train_info/time_within_train_step": 2.75608491897583, "step": 2811} {"train_info/time_between_train_steps": 0.003234386444091797, "step": 2811} {"info/global_step": 2812, "train_info/time_within_train_step": 2.7564847469329834, "step": 2812} {"train_info/time_between_train_steps": 0.0032875537872314453, "step": 2812} {"info/global_step": 2813, "train_info/time_within_train_step": 2.757148265838623, "step": 2813} {"train_info/time_between_train_steps": 0.0032835006713867188, "step": 2813} {"info/global_step": 2814, "train_info/time_within_train_step": 2.7558555603027344, "step": 2814} {"train_info/time_between_train_steps": 0.0033779144287109375, "step": 2814} {"info/global_step": 2815, "train_info/time_within_train_step": 2.7546627521514893, "step": 2815} {"train_info/time_between_train_steps": 0.0032792091369628906, "step": 2815} {"info/global_step": 2816, "train_info/time_within_train_step": 2.754991292953491, "step": 2816} {"train_info/time_between_train_steps": 0.0033016204833984375, "step": 2816} {"info/global_step": 2817, "train_info/time_within_train_step": 2.7547788619995117, "step": 2817} {"train_info/time_between_train_steps": 0.0032668113708496094, "step": 2817} {"info/global_step": 2818, "train_info/time_within_train_step": 2.755098581314087, "step": 2818} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 2818} {"info/global_step": 2819, "train_info/time_within_train_step": 2.7546796798706055, "step": 2819} {"train_info/time_between_train_steps": 0.003314971923828125, "step": 2819} {"info/global_step": 2820, "train_info/time_within_train_step": 2.755542039871216, "step": 2820} {"train_info/time_between_train_steps": 0.0032918453216552734, "step": 2820} {"info/global_step": 2821, "train_info/time_within_train_step": 2.7551798820495605, "step": 2821} {"train_info/time_between_train_steps": 0.0033044815063476562, "step": 2821} {"info/global_step": 2822, "train_info/time_within_train_step": 2.755293607711792, "step": 2822} {"train_info/time_between_train_steps": 0.0032396316528320312, "step": 2822} {"info/global_step": 2823, "train_info/time_within_train_step": 2.756314992904663, "step": 2823} {"train_info/time_between_train_steps": 0.0032820701599121094, "step": 2823} {"info/global_step": 2824, "train_info/time_within_train_step": 2.755753993988037, "step": 2824} {"train_info/time_between_train_steps": 0.003278493881225586, "step": 2824} {"info/global_step": 2825, "train_info/time_within_train_step": 2.756180763244629, "step": 2825} {"train_info/time_between_train_steps": 0.0032536983489990234, "step": 2825} {"info/global_step": 2826, "train_info/time_within_train_step": 2.7562546730041504, "step": 2826} {"train_info/time_between_train_steps": 0.003307342529296875, "step": 2826} {"info/global_step": 2827, "train_info/time_within_train_step": 2.7549936771392822, "step": 2827} {"train_info/time_between_train_steps": 0.0032629966735839844, "step": 2827} {"info/global_step": 2828, "train_info/time_within_train_step": 2.7546045780181885, "step": 2828} {"train_info/time_between_train_steps": 0.0032968521118164062, "step": 2828} {"info/global_step": 2829, "train_info/time_within_train_step": 2.755845785140991, "step": 2829} {"train_info/time_between_train_steps": 0.0032863616943359375, "step": 2829} {"info/global_step": 2830, "train_info/time_within_train_step": 2.7554304599761963, "step": 2830} {"train_info/time_between_train_steps": 0.0032088756561279297, "step": 2830} {"info/global_step": 2831, "train_info/time_within_train_step": 2.7563765048980713, "step": 2831} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 2831} {"info/global_step": 2832, "train_info/time_within_train_step": 2.755434989929199, "step": 2832} {"train_info/time_between_train_steps": 0.003242969512939453, "step": 2832} {"info/global_step": 2833, "train_info/time_within_train_step": 2.7549710273742676, "step": 2833} {"train_info/time_between_train_steps": 0.0032126903533935547, "step": 2833} {"info/global_step": 2834, "train_info/time_within_train_step": 2.7555909156799316, "step": 2834} {"train_info/time_between_train_steps": 0.003227710723876953, "step": 2834} {"info/global_step": 2835, "train_info/time_within_train_step": 2.9997360706329346, "step": 2835} {"train_info/time_between_train_steps": 0.0032579898834228516, "step": 2835} {"info/global_step": 2836, "train_info/time_within_train_step": 2.7548155784606934, "step": 2836} {"train_info/time_between_train_steps": 0.003287792205810547, "step": 2836} {"info/global_step": 2837, "train_info/time_within_train_step": 2.7536942958831787, "step": 2837} {"train_info/time_between_train_steps": 0.003202199935913086, "step": 2837} {"info/global_step": 2838, "train_info/time_within_train_step": 2.755974054336548, "step": 2838} {"train_info/time_between_train_steps": 0.003782033920288086, "step": 2838} {"info/global_step": 2839, "train_info/time_within_train_step": 2.7554867267608643, "step": 2839} {"train_info/time_between_train_steps": 0.003306150436401367, "step": 2839} {"info/global_step": 2840, "train_info/time_within_train_step": 2.75714111328125, "step": 2840} {"train_info/time_between_train_steps": 0.0032448768615722656, "step": 2840} {"info/global_step": 2841, "train_info/time_within_train_step": 2.7562203407287598, "step": 2841} {"train_info/time_between_train_steps": 0.003289461135864258, "step": 2841} {"info/global_step": 2842, "train_info/time_within_train_step": 2.7560534477233887, "step": 2842} {"train_info/time_between_train_steps": 0.0032584667205810547, "step": 2842} {"info/global_step": 2843, "train_info/time_within_train_step": 2.756343126296997, "step": 2843} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 2843} {"info/global_step": 2844, "train_info/time_within_train_step": 2.7563817501068115, "step": 2844} {"train_info/time_between_train_steps": 0.003262042999267578, "step": 2844} {"info/global_step": 2845, "train_info/time_within_train_step": 2.7556755542755127, "step": 2845} {"train_info/time_between_train_steps": 0.0032815933227539062, "step": 2845} {"info/global_step": 2846, "train_info/time_within_train_step": 2.7547435760498047, "step": 2846} {"train_info/time_between_train_steps": 0.003273487091064453, "step": 2846} {"info/global_step": 2847, "train_info/time_within_train_step": 2.7559053897857666, "step": 2847} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 2847} {"info/global_step": 2848, "train_info/time_within_train_step": 2.751779079437256, "step": 2848} {"train_info/time_between_train_steps": 0.003200054168701172, "step": 2848} {"info/global_step": 2849, "train_info/time_within_train_step": 2.75478196144104, "step": 2849} {"train_info/time_between_train_steps": 0.0032613277435302734, "step": 2849} {"info/global_step": 2850, "train_info/time_within_train_step": 2.7556464672088623, "step": 2850} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746574314, "_runtime": 8323}, "step": 2850} {"logs": {"train/loss": 4.0765, "train/learning_rate": 0.0004766666666666666, "train/epoch": 3.03, "_timestamp": 1746574314, "_runtime": 8323}, "step": 2850} {"train_info/time_between_train_steps": 0.012656688690185547, "step": 2850} {"info/global_step": 2851, "train_info/time_within_train_step": 2.755232334136963, "step": 2851} {"train_info/time_between_train_steps": 0.0032701492309570312, "step": 2851} {"info/global_step": 2852, "train_info/time_within_train_step": 2.755147933959961, "step": 2852} {"train_info/time_between_train_steps": 0.003281831741333008, "step": 2852} {"info/global_step": 2853, "train_info/time_within_train_step": 2.7537899017333984, "step": 2853} {"train_info/time_between_train_steps": 0.0032835006713867188, "step": 2853} {"info/global_step": 2854, "train_info/time_within_train_step": 2.754887342453003, "step": 2854} {"train_info/time_between_train_steps": 0.0033121109008789062, "step": 2854} {"info/global_step": 2855, "train_info/time_within_train_step": 2.7562272548675537, "step": 2855} {"train_info/time_between_train_steps": 0.0038530826568603516, "step": 2855} {"info/global_step": 2856, "train_info/time_within_train_step": 2.7557578086853027, "step": 2856} {"train_info/time_between_train_steps": 0.003340482711791992, "step": 2856} {"info/global_step": 2857, "train_info/time_within_train_step": 2.7565438747406006, "step": 2857} {"train_info/time_between_train_steps": 0.0032978057861328125, "step": 2857} {"info/global_step": 2858, "train_info/time_within_train_step": 2.7573258876800537, "step": 2858} {"train_info/time_between_train_steps": 0.0033044815063476562, "step": 2858} {"info/global_step": 2859, "train_info/time_within_train_step": 2.756761312484741, "step": 2859} {"train_info/time_between_train_steps": 0.0033292770385742188, "step": 2859} {"info/global_step": 2860, "train_info/time_within_train_step": 2.756560802459717, "step": 2860} {"train_info/time_between_train_steps": 0.0033402442932128906, "step": 2860} {"info/global_step": 2861, "train_info/time_within_train_step": 2.757584810256958, "step": 2861} {"train_info/time_between_train_steps": 0.0033082962036132812, "step": 2861} {"info/global_step": 2862, "train_info/time_within_train_step": 2.756866931915283, "step": 2862} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 2862} {"info/global_step": 2863, "train_info/time_within_train_step": 2.756007194519043, "step": 2863} {"train_info/time_between_train_steps": 0.0031862258911132812, "step": 2863} {"info/global_step": 2864, "train_info/time_within_train_step": 2.7566771507263184, "step": 2864} {"train_info/time_between_train_steps": 0.003328084945678711, "step": 2864} {"info/global_step": 2865, "train_info/time_within_train_step": 2.756974697113037, "step": 2865} {"train_info/time_between_train_steps": 0.0033452510833740234, "step": 2865} {"info/global_step": 2866, "train_info/time_within_train_step": 2.7555952072143555, "step": 2866} {"train_info/time_between_train_steps": 0.0033054351806640625, "step": 2866} {"info/global_step": 2867, "train_info/time_within_train_step": 2.755730152130127, "step": 2867} {"train_info/time_between_train_steps": 0.0033431053161621094, "step": 2867} {"info/global_step": 2868, "train_info/time_within_train_step": 2.756140947341919, "step": 2868} {"train_info/time_between_train_steps": 0.0033102035522460938, "step": 2868} {"info/global_step": 2869, "train_info/time_within_train_step": 2.7562310695648193, "step": 2869} {"train_info/time_between_train_steps": 0.0033111572265625, "step": 2869} {"info/global_step": 2870, "train_info/time_within_train_step": 2.7561042308807373, "step": 2870} {"train_info/time_between_train_steps": 0.003335237503051758, "step": 2870} {"info/global_step": 2871, "train_info/time_within_train_step": 2.7562789916992188, "step": 2871} {"train_info/time_between_train_steps": 0.0033261775970458984, "step": 2871} {"info/global_step": 2872, "train_info/time_within_train_step": 2.8777663707733154, "step": 2872} {"train_info/time_between_train_steps": 0.003191232681274414, "step": 2872} {"info/global_step": 2873, "train_info/time_within_train_step": 2.7540178298950195, "step": 2873} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 2873} {"info/global_step": 2874, "train_info/time_within_train_step": 2.754754066467285, "step": 2874} {"train_info/time_between_train_steps": 0.0032134056091308594, "step": 2874} {"info/global_step": 2875, "train_info/time_within_train_step": 2.9841830730438232, "step": 2875} {"train_info/time_between_train_steps": 0.003188610076904297, "step": 2875} {"info/global_step": 2876, "train_info/time_within_train_step": 2.755169630050659, "step": 2876} {"train_info/time_between_train_steps": 0.003210783004760742, "step": 2876} {"info/global_step": 2877, "train_info/time_within_train_step": 2.755936861038208, "step": 2877} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 2877} {"info/global_step": 2878, "train_info/time_within_train_step": 2.7546722888946533, "step": 2878} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 2878} {"info/global_step": 2879, "train_info/time_within_train_step": 2.7533228397369385, "step": 2879} {"train_info/time_between_train_steps": 0.0031845569610595703, "step": 2879} {"info/global_step": 2880, "train_info/time_within_train_step": 2.7544314861297607, "step": 2880} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 2880} {"info/global_step": 2881, "train_info/time_within_train_step": 2.7555553913116455, "step": 2881} {"train_info/time_between_train_steps": 0.0032494068145751953, "step": 2881} {"info/global_step": 2882, "train_info/time_within_train_step": 2.7556262016296387, "step": 2882} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 2882} {"info/global_step": 2883, "train_info/time_within_train_step": 2.7551238536834717, "step": 2883} {"train_info/time_between_train_steps": 0.0031943321228027344, "step": 2883} {"info/global_step": 2884, "train_info/time_within_train_step": 2.75459885597229, "step": 2884} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 2884} {"info/global_step": 2885, "train_info/time_within_train_step": 2.754918098449707, "step": 2885} {"train_info/time_between_train_steps": 0.0032618045806884766, "step": 2885} {"info/global_step": 2886, "train_info/time_within_train_step": 2.756715774536133, "step": 2886} {"train_info/time_between_train_steps": 0.0031540393829345703, "step": 2886} {"info/global_step": 2887, "train_info/time_within_train_step": 2.7787563800811768, "step": 2887} {"train_info/time_between_train_steps": 0.0032393932342529297, "step": 2887} {"info/global_step": 2888, "train_info/time_within_train_step": 2.754303455352783, "step": 2888} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 2888} {"info/global_step": 2889, "train_info/time_within_train_step": 2.7542498111724854, "step": 2889} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 2889} {"info/global_step": 2890, "train_info/time_within_train_step": 2.754007339477539, "step": 2890} {"train_info/time_between_train_steps": 0.003228902816772461, "step": 2890} {"info/global_step": 2891, "train_info/time_within_train_step": 2.7547454833984375, "step": 2891} {"train_info/time_between_train_steps": 0.0031685829162597656, "step": 2891} {"info/global_step": 2892, "train_info/time_within_train_step": 2.7535512447357178, "step": 2892} {"train_info/time_between_train_steps": 0.0031592845916748047, "step": 2892} {"info/global_step": 2893, "train_info/time_within_train_step": 2.7568655014038086, "step": 2893} {"train_info/time_between_train_steps": 0.0033965110778808594, "step": 2893} {"info/global_step": 2894, "train_info/time_within_train_step": 2.757140636444092, "step": 2894} {"train_info/time_between_train_steps": 0.003312826156616211, "step": 2894} {"info/global_step": 2895, "train_info/time_within_train_step": 2.7553865909576416, "step": 2895} {"train_info/time_between_train_steps": 0.003317117691040039, "step": 2895} {"info/global_step": 2896, "train_info/time_within_train_step": 2.757176637649536, "step": 2896} {"train_info/time_between_train_steps": 0.0033931732177734375, "step": 2896} {"info/global_step": 2897, "train_info/time_within_train_step": 2.7560689449310303, "step": 2897} {"train_info/time_between_train_steps": 0.0033943653106689453, "step": 2897} {"info/global_step": 2898, "train_info/time_within_train_step": 2.7568464279174805, "step": 2898} {"train_info/time_between_train_steps": 0.0034012794494628906, "step": 2898} {"info/global_step": 2899, "train_info/time_within_train_step": 2.75689435005188, "step": 2899} {"train_info/time_between_train_steps": 0.003407716751098633, "step": 2899} {"info/global_step": 2900, "train_info/time_within_train_step": 2.75736141204834, "step": 2900} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746574453, "_runtime": 8462}, "step": 2900} {"logs": {"train/loss": 4.075, "train/learning_rate": 0.00047333333333333326, "train/epoch": 3.03, "_timestamp": 1746574453, "_runtime": 8462}, "step": 2900} {"train_info/time_between_train_steps": 0.013862848281860352, "step": 2900} {"info/global_step": 2901, "train_info/time_within_train_step": 2.7568390369415283, "step": 2901} {"train_info/time_between_train_steps": 0.003395557403564453, "step": 2901} {"info/global_step": 2902, "train_info/time_within_train_step": 2.7570855617523193, "step": 2902} {"train_info/time_between_train_steps": 0.003420591354370117, "step": 2902} {"info/global_step": 2903, "train_info/time_within_train_step": 2.755603313446045, "step": 2903} {"train_info/time_between_train_steps": 0.003391742706298828, "step": 2903} {"info/global_step": 2904, "train_info/time_within_train_step": 2.756390333175659, "step": 2904} {"train_info/time_between_train_steps": 0.0033566951751708984, "step": 2904} {"info/global_step": 2905, "train_info/time_within_train_step": 2.756103277206421, "step": 2905} {"train_info/time_between_train_steps": 0.003399372100830078, "step": 2905} {"info/global_step": 2906, "train_info/time_within_train_step": 2.7547707557678223, "step": 2906} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 2906} {"info/global_step": 2907, "train_info/time_within_train_step": 2.7548699378967285, "step": 2907} {"train_info/time_between_train_steps": 0.0032410621643066406, "step": 2907} {"info/global_step": 2908, "train_info/time_within_train_step": 2.7552144527435303, "step": 2908} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 2908} {"info/global_step": 2909, "train_info/time_within_train_step": 2.7556004524230957, "step": 2909} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 2909} {"info/global_step": 2910, "train_info/time_within_train_step": 2.7560441493988037, "step": 2910} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 2910} {"info/global_step": 2911, "train_info/time_within_train_step": 2.7562053203582764, "step": 2911} {"train_info/time_between_train_steps": 0.003194093704223633, "step": 2911} {"info/global_step": 2912, "train_info/time_within_train_step": 2.755923271179199, "step": 2912} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 2912} {"info/global_step": 2913, "train_info/time_within_train_step": 2.755892276763916, "step": 2913} {"train_info/time_between_train_steps": 0.0032300949096679688, "step": 2913} {"info/global_step": 2914, "train_info/time_within_train_step": 2.755690813064575, "step": 2914} {"train_info/time_between_train_steps": 0.003173828125, "step": 2914} {"info/global_step": 2915, "train_info/time_within_train_step": 2.755371570587158, "step": 2915} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 2915} {"info/global_step": 2916, "train_info/time_within_train_step": 2.7564949989318848, "step": 2916} {"train_info/time_between_train_steps": 0.0033478736877441406, "step": 2916} {"info/global_step": 2917, "train_info/time_within_train_step": 2.754391670227051, "step": 2917} {"train_info/time_between_train_steps": 0.003417491912841797, "step": 2917} {"info/global_step": 2918, "train_info/time_within_train_step": 2.7559566497802734, "step": 2918} {"train_info/time_between_train_steps": 0.0034475326538085938, "step": 2918} {"info/global_step": 2919, "train_info/time_within_train_step": 2.756427764892578, "step": 2919} {"train_info/time_between_train_steps": 0.003392934799194336, "step": 2919} {"info/global_step": 2920, "train_info/time_within_train_step": 2.7557952404022217, "step": 2920} {"train_info/time_between_train_steps": 0.0033919811248779297, "step": 2920} {"info/global_step": 2921, "train_info/time_within_train_step": 2.7562570571899414, "step": 2921} {"train_info/time_between_train_steps": 0.003368854522705078, "step": 2921} {"info/global_step": 2922, "train_info/time_within_train_step": 2.75590181350708, "step": 2922} {"train_info/time_between_train_steps": 0.0033957958221435547, "step": 2922} {"info/global_step": 2923, "train_info/time_within_train_step": 2.75504207611084, "step": 2923} {"train_info/time_between_train_steps": 0.0033202171325683594, "step": 2923} {"info/global_step": 2924, "train_info/time_within_train_step": 2.755457878112793, "step": 2924} {"train_info/time_between_train_steps": 0.0033173561096191406, "step": 2924} {"info/global_step": 2925, "train_info/time_within_train_step": 2.756004571914673, "step": 2925} {"train_info/time_between_train_steps": 0.0033566951751708984, "step": 2925} {"info/global_step": 2926, "train_info/time_within_train_step": 2.756016254425049, "step": 2926} {"train_info/time_between_train_steps": 0.0033059120178222656, "step": 2926} {"info/global_step": 2927, "train_info/time_within_train_step": 2.7561514377593994, "step": 2927} {"train_info/time_between_train_steps": 0.0033054351806640625, "step": 2927} {"info/global_step": 2928, "train_info/time_within_train_step": 2.754869222640991, "step": 2928} {"train_info/time_between_train_steps": 0.003196239471435547, "step": 2928} {"info/global_step": 2929, "train_info/time_within_train_step": 2.755295991897583, "step": 2929} {"train_info/time_between_train_steps": 0.003237485885620117, "step": 2929} {"info/global_step": 2930, "train_info/time_within_train_step": 2.755859136581421, "step": 2930} {"train_info/time_between_train_steps": 0.0033082962036132812, "step": 2930} {"info/global_step": 2931, "train_info/time_within_train_step": 2.75757098197937, "step": 2931} {"train_info/time_between_train_steps": 0.0033524036407470703, "step": 2931} {"info/global_step": 2932, "train_info/time_within_train_step": 2.7555770874023438, "step": 2932} {"train_info/time_between_train_steps": 0.003325223922729492, "step": 2932} {"info/global_step": 2933, "train_info/time_within_train_step": 2.758049964904785, "step": 2933} {"train_info/time_between_train_steps": 0.0033369064331054688, "step": 2933} {"info/global_step": 2934, "train_info/time_within_train_step": 2.7561333179473877, "step": 2934} {"train_info/time_between_train_steps": 0.12645316123962402, "step": 2934} {"info/global_step": 2935, "train_info/time_within_train_step": 2.756408214569092, "step": 2935} {"train_info/time_between_train_steps": 0.0033364295959472656, "step": 2935} {"info/global_step": 2936, "train_info/time_within_train_step": 2.7563905715942383, "step": 2936} {"train_info/time_between_train_steps": 0.0033643245697021484, "step": 2936} {"info/global_step": 2937, "train_info/time_within_train_step": 2.757105588912964, "step": 2937} {"train_info/time_between_train_steps": 0.0033288002014160156, "step": 2937} {"info/global_step": 2938, "train_info/time_within_train_step": 2.7559242248535156, "step": 2938} {"train_info/time_between_train_steps": 0.0033092498779296875, "step": 2938} {"info/global_step": 2939, "train_info/time_within_train_step": 2.7563345432281494, "step": 2939} {"train_info/time_between_train_steps": 0.0033316612243652344, "step": 2939} {"info/global_step": 2940, "train_info/time_within_train_step": 2.7550852298736572, "step": 2940} {"train_info/time_between_train_steps": 0.0033407211303710938, "step": 2940} {"info/global_step": 2941, "train_info/time_within_train_step": 2.756551742553711, "step": 2941} {"train_info/time_between_train_steps": 0.0033249855041503906, "step": 2941} {"info/global_step": 2942, "train_info/time_within_train_step": 2.7558460235595703, "step": 2942} {"train_info/time_between_train_steps": 0.0033528804779052734, "step": 2942} {"info/global_step": 2943, "train_info/time_within_train_step": 2.7549710273742676, "step": 2943} {"train_info/time_between_train_steps": 0.0034737586975097656, "step": 2943} {"info/global_step": 2944, "train_info/time_within_train_step": 2.7566661834716797, "step": 2944} {"train_info/time_between_train_steps": 0.0033304691314697266, "step": 2944} {"info/global_step": 2945, "train_info/time_within_train_step": 2.7559783458709717, "step": 2945} {"train_info/time_between_train_steps": 0.0033745765686035156, "step": 2945} {"info/global_step": 2946, "train_info/time_within_train_step": 2.7569425106048584, "step": 2946} {"train_info/time_between_train_steps": 0.0033218860626220703, "step": 2946} {"info/global_step": 2947, "train_info/time_within_train_step": 2.756903648376465, "step": 2947} {"train_info/time_between_train_steps": 0.003458261489868164, "step": 2947} {"info/global_step": 2948, "train_info/time_within_train_step": 2.757066249847412, "step": 2948} {"train_info/time_between_train_steps": 0.0035109519958496094, "step": 2948} {"info/global_step": 2949, "train_info/time_within_train_step": 2.755401611328125, "step": 2949} {"train_info/time_between_train_steps": 0.0034711360931396484, "step": 2949} {"info/global_step": 2950, "train_info/time_within_train_step": 2.7576968669891357, "step": 2950} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746574591, "_runtime": 8600}, "step": 2950} {"logs": {"train/loss": 4.0639, "train/learning_rate": 0.00046999999999999993, "train/epoch": 3.04, "_timestamp": 1746574591, "_runtime": 8600}, "step": 2950} {"train_info/time_between_train_steps": 0.01328897476196289, "step": 2950} {"info/global_step": 2951, "train_info/time_within_train_step": 2.7572176456451416, "step": 2951} {"train_info/time_between_train_steps": 0.003694772720336914, "step": 2951} {"info/global_step": 2952, "train_info/time_within_train_step": 2.757805824279785, "step": 2952} {"train_info/time_between_train_steps": 0.003654003143310547, "step": 2952} {"info/global_step": 2953, "train_info/time_within_train_step": 2.7554030418395996, "step": 2953} {"train_info/time_between_train_steps": 0.0036499500274658203, "step": 2953} {"info/global_step": 2954, "train_info/time_within_train_step": 2.7558178901672363, "step": 2954} {"train_info/time_between_train_steps": 0.003645658493041992, "step": 2954} {"info/global_step": 2955, "train_info/time_within_train_step": 2.756503105163574, "step": 2955} {"train_info/time_between_train_steps": 0.0036449432373046875, "step": 2955} {"info/global_step": 2956, "train_info/time_within_train_step": 2.7568273544311523, "step": 2956} {"train_info/time_between_train_steps": 0.0038285255432128906, "step": 2956} {"info/global_step": 2957, "train_info/time_within_train_step": 2.756234884262085, "step": 2957} {"train_info/time_between_train_steps": 0.003567934036254883, "step": 2957} {"info/global_step": 2958, "train_info/time_within_train_step": 2.758624792098999, "step": 2958} {"train_info/time_between_train_steps": 0.003554821014404297, "step": 2958} {"info/global_step": 2959, "train_info/time_within_train_step": 2.756378650665283, "step": 2959} {"train_info/time_between_train_steps": 0.003615856170654297, "step": 2959} {"info/global_step": 2960, "train_info/time_within_train_step": 2.7556095123291016, "step": 2960} {"train_info/time_between_train_steps": 0.0033652782440185547, "step": 2960} {"info/global_step": 2961, "train_info/time_within_train_step": 2.7554590702056885, "step": 2961} {"train_info/time_between_train_steps": 0.0034379959106445312, "step": 2961} {"info/global_step": 2962, "train_info/time_within_train_step": 2.754920721054077, "step": 2962} {"train_info/time_between_train_steps": 0.0034227371215820312, "step": 2962} {"info/global_step": 2963, "train_info/time_within_train_step": 2.754595994949341, "step": 2963} {"train_info/time_between_train_steps": 0.003414154052734375, "step": 2963} {"info/global_step": 2964, "train_info/time_within_train_step": 3.0724401473999023, "step": 2964} {"train_info/time_between_train_steps": 0.0032219886779785156, "step": 2964} {"info/global_step": 2965, "train_info/time_within_train_step": 2.755488634109497, "step": 2965} {"train_info/time_between_train_steps": 0.00321197509765625, "step": 2965} {"info/global_step": 2966, "train_info/time_within_train_step": 2.7549614906311035, "step": 2966} {"train_info/time_between_train_steps": 0.0032188892364501953, "step": 2966} {"info/global_step": 2967, "train_info/time_within_train_step": 2.7559003829956055, "step": 2967} {"train_info/time_between_train_steps": 0.003231525421142578, "step": 2967} {"info/global_step": 2968, "train_info/time_within_train_step": 2.7549755573272705, "step": 2968} {"train_info/time_between_train_steps": 0.0032694339752197266, "step": 2968} {"info/global_step": 2969, "train_info/time_within_train_step": 2.754920482635498, "step": 2969} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 2969} {"info/global_step": 2970, "train_info/time_within_train_step": 2.7555220127105713, "step": 2970} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 2970} {"info/global_step": 2971, "train_info/time_within_train_step": 2.7541728019714355, "step": 2971} {"train_info/time_between_train_steps": 0.0032432079315185547, "step": 2971} {"info/global_step": 2972, "train_info/time_within_train_step": 2.754652500152588, "step": 2972} {"train_info/time_between_train_steps": 0.0032210350036621094, "step": 2972} {"info/global_step": 2973, "train_info/time_within_train_step": 2.755955457687378, "step": 2973} {"train_info/time_between_train_steps": 0.0034530162811279297, "step": 2973} {"info/global_step": 2974, "train_info/time_within_train_step": 2.778989553451538, "step": 2974} {"train_info/time_between_train_steps": 0.003447294235229492, "step": 2974} {"info/global_step": 2975, "train_info/time_within_train_step": 2.7557640075683594, "step": 2975} {"train_info/time_between_train_steps": 0.003621339797973633, "step": 2975} {"info/global_step": 2976, "train_info/time_within_train_step": 2.7539098262786865, "step": 2976} {"train_info/time_between_train_steps": 0.003450155258178711, "step": 2976} {"info/global_step": 2977, "train_info/time_within_train_step": 2.755599021911621, "step": 2977} {"train_info/time_between_train_steps": 0.003465414047241211, "step": 2977} {"info/global_step": 2978, "train_info/time_within_train_step": 2.755908727645874, "step": 2978} {"train_info/time_between_train_steps": 0.003478527069091797, "step": 2978} {"info/global_step": 2979, "train_info/time_within_train_step": 2.7541208267211914, "step": 2979} {"train_info/time_between_train_steps": 0.0034787654876708984, "step": 2979} {"info/global_step": 2980, "train_info/time_within_train_step": 2.756039619445801, "step": 2980} {"train_info/time_between_train_steps": 0.0034177303314208984, "step": 2980} {"info/global_step": 2981, "train_info/time_within_train_step": 2.754157304763794, "step": 2981} {"train_info/time_between_train_steps": 0.0034215450286865234, "step": 2981} {"info/global_step": 2982, "train_info/time_within_train_step": 2.7556819915771484, "step": 2982} {"train_info/time_between_train_steps": 0.0034589767456054688, "step": 2982} {"info/global_step": 2983, "train_info/time_within_train_step": 2.7566797733306885, "step": 2983} {"train_info/time_between_train_steps": 0.003422260284423828, "step": 2983} {"info/global_step": 2984, "train_info/time_within_train_step": 2.75795316696167, "step": 2984} {"train_info/time_between_train_steps": 0.0034084320068359375, "step": 2984} {"info/global_step": 2985, "train_info/time_within_train_step": 2.7552552223205566, "step": 2985} {"train_info/time_between_train_steps": 0.003445148468017578, "step": 2985} {"info/global_step": 2986, "train_info/time_within_train_step": 2.756988286972046, "step": 2986} {"train_info/time_between_train_steps": 0.0034427642822265625, "step": 2986} {"info/global_step": 2987, "train_info/time_within_train_step": 2.7555088996887207, "step": 2987} {"train_info/time_between_train_steps": 0.003431081771850586, "step": 2987} {"info/global_step": 2988, "train_info/time_within_train_step": 2.7566943168640137, "step": 2988} {"train_info/time_between_train_steps": 0.0034699440002441406, "step": 2988} {"info/global_step": 2989, "train_info/time_within_train_step": 2.7559430599212646, "step": 2989} {"train_info/time_between_train_steps": 0.0034139156341552734, "step": 2989} {"info/global_step": 2990, "train_info/time_within_train_step": 2.7563185691833496, "step": 2990} {"train_info/time_between_train_steps": 0.0035037994384765625, "step": 2990} {"info/global_step": 2991, "train_info/time_within_train_step": 2.755814552307129, "step": 2991} {"train_info/time_between_train_steps": 0.0034050941467285156, "step": 2991} {"info/global_step": 2992, "train_info/time_within_train_step": 2.758589267730713, "step": 2992} {"train_info/time_between_train_steps": 0.003444671630859375, "step": 2992} {"info/global_step": 2993, "train_info/time_within_train_step": 2.7562735080718994, "step": 2993} {"train_info/time_between_train_steps": 0.003506898880004883, "step": 2993} {"info/global_step": 2994, "train_info/time_within_train_step": 2.754878282546997, "step": 2994} {"train_info/time_between_train_steps": 0.0034067630767822266, "step": 2994} {"info/global_step": 2995, "train_info/time_within_train_step": 2.755730390548706, "step": 2995} {"train_info/time_between_train_steps": 0.003503561019897461, "step": 2995} {"info/global_step": 2996, "train_info/time_within_train_step": 2.75677752494812, "step": 2996} {"train_info/time_between_train_steps": 0.003429412841796875, "step": 2996} {"info/global_step": 2997, "train_info/time_within_train_step": 2.887866497039795, "step": 2997} {"train_info/time_between_train_steps": 0.0034117698669433594, "step": 2997} {"info/global_step": 2998, "train_info/time_within_train_step": 2.7560689449310303, "step": 2998} {"train_info/time_between_train_steps": 0.003395557403564453, "step": 2998} {"info/global_step": 2999, "train_info/time_within_train_step": 3.3573737144470215, "step": 2999} {"train_info/time_between_train_steps": 0.003352642059326172, "step": 2999} {"info/global_step": 3000, "train_info/time_within_train_step": 2.75594162940979, "step": 3000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746574731, "_runtime": 8740}, "step": 3000} {"logs": {"train/loss": 4.0424, "train/learning_rate": 0.0004666666666666666, "train/epoch": 3.04, "_timestamp": 1746574731, "_runtime": 8740}, "step": 3000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746574736, "_runtime": 8745}, "step": 3000} {"logs": {"eval/loss": 4.674428462982178, "eval/runtime": 5.1598, "eval/samples_per_second": 36.823, "eval/steps_per_second": 1.163, "train/epoch": 3.04, "_timestamp": 1746574736, "_runtime": 8745}, "step": 3000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746574736, "_runtime": 8745}, "step": 3000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.674428462982178, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 107.17129722110278, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1598, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 36.823, "train/epoch": 3.04, "_timestamp": 1746574736, "_runtime": 8745}, "step": 3000} {"train_info/time_between_train_steps": 21.609498262405396, "step": 3000} {"info/global_step": 3001, "train_info/time_within_train_step": 2.542548656463623, "step": 3001} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 3001} {"info/global_step": 3002, "train_info/time_within_train_step": 2.5936520099639893, "step": 3002} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 3002} {"info/global_step": 3003, "train_info/time_within_train_step": 2.6963250637054443, "step": 3003} {"train_info/time_between_train_steps": 0.0032262802124023438, "step": 3003} {"info/global_step": 3004, "train_info/time_within_train_step": 2.7504689693450928, "step": 3004} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 3004} {"info/global_step": 3005, "train_info/time_within_train_step": 2.751535177230835, "step": 3005} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 3005} {"info/global_step": 3006, "train_info/time_within_train_step": 2.7552878856658936, "step": 3006} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 3006} {"info/global_step": 3007, "train_info/time_within_train_step": 2.7563064098358154, "step": 3007} {"train_info/time_between_train_steps": 0.0032105445861816406, "step": 3007} {"info/global_step": 3008, "train_info/time_within_train_step": 2.757833957672119, "step": 3008} {"train_info/time_between_train_steps": 0.003404855728149414, "step": 3008} {"info/global_step": 3009, "train_info/time_within_train_step": 2.756804943084717, "step": 3009} {"train_info/time_between_train_steps": 0.003465890884399414, "step": 3009} {"info/global_step": 3010, "train_info/time_within_train_step": 2.7577579021453857, "step": 3010} {"train_info/time_between_train_steps": 0.0034041404724121094, "step": 3010} {"info/global_step": 3011, "train_info/time_within_train_step": 2.759213447570801, "step": 3011} {"train_info/time_between_train_steps": 0.003472566604614258, "step": 3011} {"info/global_step": 3012, "train_info/time_within_train_step": 2.758430004119873, "step": 3012} {"train_info/time_between_train_steps": 0.003430604934692383, "step": 3012} {"info/global_step": 3013, "train_info/time_within_train_step": 2.757389545440674, "step": 3013} {"train_info/time_between_train_steps": 0.003345012664794922, "step": 3013} {"info/global_step": 3014, "train_info/time_within_train_step": 2.757915735244751, "step": 3014} {"train_info/time_between_train_steps": 0.003488779067993164, "step": 3014} {"info/global_step": 3015, "train_info/time_within_train_step": 2.758025646209717, "step": 3015} {"train_info/time_between_train_steps": 0.003439188003540039, "step": 3015} {"info/global_step": 3016, "train_info/time_within_train_step": 2.7580626010894775, "step": 3016} {"train_info/time_between_train_steps": 0.00353240966796875, "step": 3016} {"info/global_step": 3017, "train_info/time_within_train_step": 2.758725643157959, "step": 3017} {"train_info/time_between_train_steps": 0.0035905838012695312, "step": 3017} {"info/global_step": 3018, "train_info/time_within_train_step": 2.7598109245300293, "step": 3018} {"train_info/time_between_train_steps": 0.003478527069091797, "step": 3018} {"info/global_step": 3019, "train_info/time_within_train_step": 2.757830858230591, "step": 3019} {"train_info/time_between_train_steps": 0.003663778305053711, "step": 3019} {"info/global_step": 3020, "train_info/time_within_train_step": 2.759732484817505, "step": 3020} {"train_info/time_between_train_steps": 0.003742218017578125, "step": 3020} {"info/global_step": 3021, "train_info/time_within_train_step": 2.759263753890991, "step": 3021} {"train_info/time_between_train_steps": 0.0036134719848632812, "step": 3021} {"info/global_step": 3022, "train_info/time_within_train_step": 2.7601571083068848, "step": 3022} {"train_info/time_between_train_steps": 0.003801584243774414, "step": 3022} {"info/global_step": 3023, "train_info/time_within_train_step": 2.759415626525879, "step": 3023} {"train_info/time_between_train_steps": 0.003610372543334961, "step": 3023} {"info/global_step": 3024, "train_info/time_within_train_step": 2.759582757949829, "step": 3024} {"train_info/time_between_train_steps": 0.0036437511444091797, "step": 3024} {"info/global_step": 3025, "train_info/time_within_train_step": 2.7593326568603516, "step": 3025} {"train_info/time_between_train_steps": 0.003711700439453125, "step": 3025} {"info/global_step": 3026, "train_info/time_within_train_step": 3.0995004177093506, "step": 3026} {"train_info/time_between_train_steps": 0.003422260284423828, "step": 3026} {"info/global_step": 3027, "train_info/time_within_train_step": 2.7590088844299316, "step": 3027} {"train_info/time_between_train_steps": 0.0034742355346679688, "step": 3027} {"info/global_step": 3028, "train_info/time_within_train_step": 2.757702350616455, "step": 3028} {"train_info/time_between_train_steps": 0.003471851348876953, "step": 3028} {"info/global_step": 3029, "train_info/time_within_train_step": 2.756819725036621, "step": 3029} {"train_info/time_between_train_steps": 0.0035941600799560547, "step": 3029} {"info/global_step": 3030, "train_info/time_within_train_step": 2.756901741027832, "step": 3030} {"train_info/time_between_train_steps": 0.0033867359161376953, "step": 3030} {"info/global_step": 3031, "train_info/time_within_train_step": 2.7583765983581543, "step": 3031} {"train_info/time_between_train_steps": 0.0034461021423339844, "step": 3031} {"info/global_step": 3032, "train_info/time_within_train_step": 2.7564330101013184, "step": 3032} {"train_info/time_between_train_steps": 0.003397703170776367, "step": 3032} {"info/global_step": 3033, "train_info/time_within_train_step": 2.7577619552612305, "step": 3033} {"train_info/time_between_train_steps": 0.003390073776245117, "step": 3033} {"info/global_step": 3034, "train_info/time_within_train_step": 2.756833553314209, "step": 3034} {"train_info/time_between_train_steps": 0.003374338150024414, "step": 3034} {"info/global_step": 3035, "train_info/time_within_train_step": 2.758192539215088, "step": 3035} {"train_info/time_between_train_steps": 0.0033664703369140625, "step": 3035} {"info/global_step": 3036, "train_info/time_within_train_step": 2.7567710876464844, "step": 3036} {"train_info/time_between_train_steps": 0.0033719539642333984, "step": 3036} {"info/global_step": 3037, "train_info/time_within_train_step": 2.758249521255493, "step": 3037} {"train_info/time_between_train_steps": 0.0035240650177001953, "step": 3037} {"info/global_step": 3038, "train_info/time_within_train_step": 2.7585840225219727, "step": 3038} {"train_info/time_between_train_steps": 0.0034363269805908203, "step": 3038} {"info/global_step": 3039, "train_info/time_within_train_step": 2.758005380630493, "step": 3039} {"train_info/time_between_train_steps": 0.003607034683227539, "step": 3039} {"info/global_step": 3040, "train_info/time_within_train_step": 2.7575652599334717, "step": 3040} {"train_info/time_between_train_steps": 0.003442525863647461, "step": 3040} {"info/global_step": 3041, "train_info/time_within_train_step": 2.7572388648986816, "step": 3041} {"train_info/time_between_train_steps": 0.0033423900604248047, "step": 3041} {"info/global_step": 3042, "train_info/time_within_train_step": 2.756354808807373, "step": 3042} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 3042} {"info/global_step": 3043, "train_info/time_within_train_step": 2.756373167037964, "step": 3043} {"train_info/time_between_train_steps": 0.0032601356506347656, "step": 3043} {"info/global_step": 3044, "train_info/time_within_train_step": 2.7567803859710693, "step": 3044} {"train_info/time_between_train_steps": 0.003322601318359375, "step": 3044} {"info/global_step": 3045, "train_info/time_within_train_step": 2.755894899368286, "step": 3045} {"train_info/time_between_train_steps": 0.0033075809478759766, "step": 3045} {"info/global_step": 3046, "train_info/time_within_train_step": 2.7563130855560303, "step": 3046} {"train_info/time_between_train_steps": 0.0033004283905029297, "step": 3046} {"info/global_step": 3047, "train_info/time_within_train_step": 2.755936861038208, "step": 3047} {"train_info/time_between_train_steps": 0.0035517215728759766, "step": 3047} {"info/global_step": 3048, "train_info/time_within_train_step": 2.7562191486358643, "step": 3048} {"train_info/time_between_train_steps": 0.0034933090209960938, "step": 3048} {"info/global_step": 3049, "train_info/time_within_train_step": 2.7562313079833984, "step": 3049} {"train_info/time_between_train_steps": 0.003665447235107422, "step": 3049} {"info/global_step": 3050, "train_info/time_within_train_step": 2.7554144859313965, "step": 3050} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746574891, "_runtime": 8900}, "step": 3050} {"logs": {"train/loss": 4.038, "train/learning_rate": 0.00046333333333333334, "train/epoch": 3.05, "_timestamp": 1746574891, "_runtime": 8900}, "step": 3050} {"train_info/time_between_train_steps": 0.013653039932250977, "step": 3050} {"info/global_step": 3051, "train_info/time_within_train_step": 2.756345272064209, "step": 3051} {"train_info/time_between_train_steps": 0.0034677982330322266, "step": 3051} {"info/global_step": 3052, "train_info/time_within_train_step": 2.7578110694885254, "step": 3052} {"train_info/time_between_train_steps": 0.0033881664276123047, "step": 3052} {"info/global_step": 3053, "train_info/time_within_train_step": 2.756763219833374, "step": 3053} {"train_info/time_between_train_steps": 0.0034193992614746094, "step": 3053} {"info/global_step": 3054, "train_info/time_within_train_step": 2.757011651992798, "step": 3054} {"train_info/time_between_train_steps": 0.003458261489868164, "step": 3054} {"info/global_step": 3055, "train_info/time_within_train_step": 2.7571399211883545, "step": 3055} {"train_info/time_between_train_steps": 0.0033800601959228516, "step": 3055} {"info/global_step": 3056, "train_info/time_within_train_step": 2.7550160884857178, "step": 3056} {"train_info/time_between_train_steps": 0.0033228397369384766, "step": 3056} {"info/global_step": 3057, "train_info/time_within_train_step": 2.755826234817505, "step": 3057} {"train_info/time_between_train_steps": 0.0034508705139160156, "step": 3057} {"info/global_step": 3058, "train_info/time_within_train_step": 2.7558343410491943, "step": 3058} {"train_info/time_between_train_steps": 0.003386259078979492, "step": 3058} {"info/global_step": 3059, "train_info/time_within_train_step": 2.7557573318481445, "step": 3059} {"train_info/time_between_train_steps": 0.12480282783508301, "step": 3059} {"info/global_step": 3060, "train_info/time_within_train_step": 2.7548818588256836, "step": 3060} {"train_info/time_between_train_steps": 0.003336191177368164, "step": 3060} {"info/global_step": 3061, "train_info/time_within_train_step": 2.754901170730591, "step": 3061} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 3061} {"info/global_step": 3062, "train_info/time_within_train_step": 2.755565643310547, "step": 3062} {"train_info/time_between_train_steps": 0.003305673599243164, "step": 3062} {"info/global_step": 3063, "train_info/time_within_train_step": 2.7559421062469482, "step": 3063} {"train_info/time_between_train_steps": 0.003256082534790039, "step": 3063} {"info/global_step": 3064, "train_info/time_within_train_step": 2.7555105686187744, "step": 3064} {"train_info/time_between_train_steps": 0.00325775146484375, "step": 3064} {"info/global_step": 3065, "train_info/time_within_train_step": 2.7560102939605713, "step": 3065} {"train_info/time_between_train_steps": 0.003286600112915039, "step": 3065} {"info/global_step": 3066, "train_info/time_within_train_step": 2.755316972732544, "step": 3066} {"train_info/time_between_train_steps": 0.0032787322998046875, "step": 3066} {"info/global_step": 3067, "train_info/time_within_train_step": 2.7562544345855713, "step": 3067} {"train_info/time_between_train_steps": 0.003253936767578125, "step": 3067} {"info/global_step": 3068, "train_info/time_within_train_step": 2.7552809715270996, "step": 3068} {"train_info/time_between_train_steps": 0.003307819366455078, "step": 3068} {"info/global_step": 3069, "train_info/time_within_train_step": 2.755532741546631, "step": 3069} {"train_info/time_between_train_steps": 0.0033016204833984375, "step": 3069} {"info/global_step": 3070, "train_info/time_within_train_step": 2.7559635639190674, "step": 3070} {"train_info/time_between_train_steps": 0.0032472610473632812, "step": 3070} {"info/global_step": 3071, "train_info/time_within_train_step": 2.756218671798706, "step": 3071} {"train_info/time_between_train_steps": 0.0033364295959472656, "step": 3071} {"info/global_step": 3072, "train_info/time_within_train_step": 2.755889654159546, "step": 3072} {"train_info/time_between_train_steps": 0.0032677650451660156, "step": 3072} {"info/global_step": 3073, "train_info/time_within_train_step": 2.756146192550659, "step": 3073} {"train_info/time_between_train_steps": 0.0032303333282470703, "step": 3073} {"info/global_step": 3074, "train_info/time_within_train_step": 2.754848003387451, "step": 3074} {"train_info/time_between_train_steps": 0.003280162811279297, "step": 3074} {"info/global_step": 3075, "train_info/time_within_train_step": 2.7805047035217285, "step": 3075} {"train_info/time_between_train_steps": 0.0032684803009033203, "step": 3075} {"info/global_step": 3076, "train_info/time_within_train_step": 2.755171775817871, "step": 3076} {"train_info/time_between_train_steps": 0.003253459930419922, "step": 3076} {"info/global_step": 3077, "train_info/time_within_train_step": 2.756899118423462, "step": 3077} {"train_info/time_between_train_steps": 0.003274202346801758, "step": 3077} {"info/global_step": 3078, "train_info/time_within_train_step": 2.7559781074523926, "step": 3078} {"train_info/time_between_train_steps": 0.003265380859375, "step": 3078} {"info/global_step": 3079, "train_info/time_within_train_step": 2.7543985843658447, "step": 3079} {"train_info/time_between_train_steps": 0.003276824951171875, "step": 3079} {"info/global_step": 3080, "train_info/time_within_train_step": 2.7565574645996094, "step": 3080} {"train_info/time_between_train_steps": 0.003281831741333008, "step": 3080} {"info/global_step": 3081, "train_info/time_within_train_step": 3.046905279159546, "step": 3081} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 3081} {"info/global_step": 3082, "train_info/time_within_train_step": 2.756805181503296, "step": 3082} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 3082} {"info/global_step": 3083, "train_info/time_within_train_step": 2.7569332122802734, "step": 3083} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 3083} {"info/global_step": 3084, "train_info/time_within_train_step": 2.75585675239563, "step": 3084} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 3084} {"info/global_step": 3085, "train_info/time_within_train_step": 2.7560067176818848, "step": 3085} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 3085} {"info/global_step": 3086, "train_info/time_within_train_step": 2.755553960800171, "step": 3086} {"train_info/time_between_train_steps": 0.0031588077545166016, "step": 3086} {"info/global_step": 3087, "train_info/time_within_train_step": 2.7556862831115723, "step": 3087} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 3087} {"info/global_step": 3088, "train_info/time_within_train_step": 2.755808115005493, "step": 3088} {"train_info/time_between_train_steps": 0.003220081329345703, "step": 3088} {"info/global_step": 3089, "train_info/time_within_train_step": 2.756411075592041, "step": 3089} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 3089} {"info/global_step": 3090, "train_info/time_within_train_step": 2.7548916339874268, "step": 3090} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 3090} {"info/global_step": 3091, "train_info/time_within_train_step": 2.7558913230895996, "step": 3091} {"train_info/time_between_train_steps": 0.003214597702026367, "step": 3091} {"info/global_step": 3092, "train_info/time_within_train_step": 2.7553465366363525, "step": 3092} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 3092} {"info/global_step": 3093, "train_info/time_within_train_step": 2.756256341934204, "step": 3093} {"train_info/time_between_train_steps": 0.003214597702026367, "step": 3093} {"info/global_step": 3094, "train_info/time_within_train_step": 2.756950855255127, "step": 3094} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 3094} {"info/global_step": 3095, "train_info/time_within_train_step": 2.7554216384887695, "step": 3095} {"train_info/time_between_train_steps": 0.003173828125, "step": 3095} {"info/global_step": 3096, "train_info/time_within_train_step": 2.7556979656219482, "step": 3096} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 3096} {"info/global_step": 3097, "train_info/time_within_train_step": 2.75653076171875, "step": 3097} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 3097} {"info/global_step": 3098, "train_info/time_within_train_step": 2.7551770210266113, "step": 3098} {"train_info/time_between_train_steps": 0.0033369064331054688, "step": 3098} {"info/global_step": 3099, "train_info/time_within_train_step": 2.756110906600952, "step": 3099} {"train_info/time_between_train_steps": 0.003353595733642578, "step": 3099} {"info/global_step": 3100, "train_info/time_within_train_step": 2.7566092014312744, "step": 3100} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746575030, "_runtime": 9039}, "step": 3100} {"logs": {"train/loss": 4.0295, "train/learning_rate": 0.00046, "train/epoch": 3.05, "_timestamp": 1746575030, "_runtime": 9039}, "step": 3100} {"train_info/time_between_train_steps": 0.029670000076293945, "step": 3100} {"info/global_step": 3101, "train_info/time_within_train_step": 2.7560572624206543, "step": 3101} {"train_info/time_between_train_steps": 0.0029718875885009766, "step": 3101} {"info/global_step": 3102, "train_info/time_within_train_step": 2.755410671234131, "step": 3102} {"train_info/time_between_train_steps": 0.002955198287963867, "step": 3102} {"info/global_step": 3103, "train_info/time_within_train_step": 2.755463123321533, "step": 3103} {"train_info/time_between_train_steps": 0.0030145645141601562, "step": 3103} {"info/global_step": 3104, "train_info/time_within_train_step": 2.7554612159729004, "step": 3104} {"train_info/time_between_train_steps": 0.002962827682495117, "step": 3104} {"info/global_step": 3105, "train_info/time_within_train_step": 2.7538344860076904, "step": 3105} {"train_info/time_between_train_steps": 0.002978086471557617, "step": 3105} {"info/global_step": 3106, "train_info/time_within_train_step": 2.753817558288574, "step": 3106} {"train_info/time_between_train_steps": 0.0029709339141845703, "step": 3106} {"info/global_step": 3107, "train_info/time_within_train_step": 2.755251884460449, "step": 3107} {"train_info/time_between_train_steps": 0.0029754638671875, "step": 3107} {"info/global_step": 3108, "train_info/time_within_train_step": 2.7562317848205566, "step": 3108} {"train_info/time_between_train_steps": 0.0029926300048828125, "step": 3108} {"info/global_step": 3109, "train_info/time_within_train_step": 2.75561785697937, "step": 3109} {"train_info/time_between_train_steps": 0.002959012985229492, "step": 3109} {"info/global_step": 3110, "train_info/time_within_train_step": 2.7556426525115967, "step": 3110} {"train_info/time_between_train_steps": 0.002985715866088867, "step": 3110} {"info/global_step": 3111, "train_info/time_within_train_step": 2.7553765773773193, "step": 3111} {"train_info/time_between_train_steps": 0.002988576889038086, "step": 3111} {"info/global_step": 3112, "train_info/time_within_train_step": 2.755530834197998, "step": 3112} {"train_info/time_between_train_steps": 0.002960205078125, "step": 3112} {"info/global_step": 3113, "train_info/time_within_train_step": 2.756619930267334, "step": 3113} {"train_info/time_between_train_steps": 0.0030515193939208984, "step": 3113} {"info/global_step": 3114, "train_info/time_within_train_step": 2.7552573680877686, "step": 3114} {"train_info/time_between_train_steps": 0.0030252933502197266, "step": 3114} {"info/global_step": 3115, "train_info/time_within_train_step": 2.7553374767303467, "step": 3115} {"train_info/time_between_train_steps": 0.003088235855102539, "step": 3115} {"info/global_step": 3116, "train_info/time_within_train_step": 2.7554280757904053, "step": 3116} {"train_info/time_between_train_steps": 0.0031108856201171875, "step": 3116} {"info/global_step": 3117, "train_info/time_within_train_step": 2.755868911743164, "step": 3117} {"train_info/time_between_train_steps": 0.0032303333282470703, "step": 3117} {"info/global_step": 3118, "train_info/time_within_train_step": 2.7554354667663574, "step": 3118} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 3118} {"info/global_step": 3119, "train_info/time_within_train_step": 2.7560086250305176, "step": 3119} {"train_info/time_between_train_steps": 0.003208637237548828, "step": 3119} {"info/global_step": 3120, "train_info/time_within_train_step": 2.7552804946899414, "step": 3120} {"train_info/time_between_train_steps": 0.0032138824462890625, "step": 3120} {"info/global_step": 3121, "train_info/time_within_train_step": 2.7552359104156494, "step": 3121} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 3121} {"info/global_step": 3122, "train_info/time_within_train_step": 3.0415639877319336, "step": 3122} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 3122} {"info/global_step": 3123, "train_info/time_within_train_step": 2.755418062210083, "step": 3123} {"train_info/time_between_train_steps": 0.003052234649658203, "step": 3123} {"info/global_step": 3124, "train_info/time_within_train_step": 2.7558436393737793, "step": 3124} {"train_info/time_between_train_steps": 0.0030455589294433594, "step": 3124} {"info/global_step": 3125, "train_info/time_within_train_step": 2.7552716732025146, "step": 3125} {"train_info/time_between_train_steps": 0.0030264854431152344, "step": 3125} {"info/global_step": 3126, "train_info/time_within_train_step": 2.7556469440460205, "step": 3126} {"train_info/time_between_train_steps": 0.0030155181884765625, "step": 3126} {"info/global_step": 3127, "train_info/time_within_train_step": 2.756319046020508, "step": 3127} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 3127} {"info/global_step": 3128, "train_info/time_within_train_step": 2.755821466445923, "step": 3128} {"train_info/time_between_train_steps": 0.0030913352966308594, "step": 3128} {"info/global_step": 3129, "train_info/time_within_train_step": 2.7557764053344727, "step": 3129} {"train_info/time_between_train_steps": 0.0032830238342285156, "step": 3129} {"info/global_step": 3130, "train_info/time_within_train_step": 2.7566349506378174, "step": 3130} {"train_info/time_between_train_steps": 0.003137826919555664, "step": 3130} {"info/global_step": 3131, "train_info/time_within_train_step": 2.755570888519287, "step": 3131} {"train_info/time_between_train_steps": 0.0032863616943359375, "step": 3131} {"info/global_step": 3132, "train_info/time_within_train_step": 2.7553517818450928, "step": 3132} {"train_info/time_between_train_steps": 0.0032224655151367188, "step": 3132} {"info/global_step": 3133, "train_info/time_within_train_step": 2.755643367767334, "step": 3133} {"train_info/time_between_train_steps": 0.0032105445861816406, "step": 3133} {"info/global_step": 3134, "train_info/time_within_train_step": 2.7545676231384277, "step": 3134} {"train_info/time_between_train_steps": 0.0032088756561279297, "step": 3134} {"info/global_step": 3135, "train_info/time_within_train_step": 2.75535249710083, "step": 3135} {"train_info/time_between_train_steps": 0.003160238265991211, "step": 3135} {"info/global_step": 3136, "train_info/time_within_train_step": 2.755300760269165, "step": 3136} {"train_info/time_between_train_steps": 0.0032281875610351562, "step": 3136} {"info/global_step": 3137, "train_info/time_within_train_step": 2.755364418029785, "step": 3137} {"train_info/time_between_train_steps": 0.0031232833862304688, "step": 3137} {"info/global_step": 3138, "train_info/time_within_train_step": 2.755737781524658, "step": 3138} {"train_info/time_between_train_steps": 0.0031816959381103516, "step": 3138} {"info/global_step": 3139, "train_info/time_within_train_step": 2.7556302547454834, "step": 3139} {"train_info/time_between_train_steps": 0.0032057762145996094, "step": 3139} {"info/global_step": 3140, "train_info/time_within_train_step": 2.779919385910034, "step": 3140} {"train_info/time_between_train_steps": 0.0032241344451904297, "step": 3140} {"info/global_step": 3141, "train_info/time_within_train_step": 2.7559521198272705, "step": 3141} {"train_info/time_between_train_steps": 0.003214597702026367, "step": 3141} {"info/global_step": 3142, "train_info/time_within_train_step": 2.7550532817840576, "step": 3142} {"train_info/time_between_train_steps": 0.003068685531616211, "step": 3142} {"info/global_step": 3143, "train_info/time_within_train_step": 2.7549641132354736, "step": 3143} {"train_info/time_between_train_steps": 0.0030074119567871094, "step": 3143} {"info/global_step": 3144, "train_info/time_within_train_step": 2.7543704509735107, "step": 3144} {"train_info/time_between_train_steps": 0.0030558109283447266, "step": 3144} {"info/global_step": 3145, "train_info/time_within_train_step": 2.7542362213134766, "step": 3145} {"train_info/time_between_train_steps": 0.0030012130737304688, "step": 3145} {"info/global_step": 3146, "train_info/time_within_train_step": 2.7551591396331787, "step": 3146} {"train_info/time_between_train_steps": 0.002988576889038086, "step": 3146} {"info/global_step": 3147, "train_info/time_within_train_step": 2.754704475402832, "step": 3147} {"train_info/time_between_train_steps": 0.0030527114868164062, "step": 3147} {"info/global_step": 3148, "train_info/time_within_train_step": 2.7538187503814697, "step": 3148} {"train_info/time_between_train_steps": 0.003106355667114258, "step": 3148} {"info/global_step": 3149, "train_info/time_within_train_step": 2.7550835609436035, "step": 3149} {"train_info/time_between_train_steps": 0.0030231475830078125, "step": 3149} {"info/global_step": 3150, "train_info/time_within_train_step": 2.7552309036254883, "step": 3150} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746575169, "_runtime": 9178}, "step": 3150} {"logs": {"train/loss": 4.0219, "train/learning_rate": 0.0004566666666666666, "train/epoch": 3.06, "_timestamp": 1746575169, "_runtime": 9178}, "step": 3150} {"train_info/time_between_train_steps": 0.01323390007019043, "step": 3150} {"info/global_step": 3151, "train_info/time_within_train_step": 2.7552008628845215, "step": 3151} {"train_info/time_between_train_steps": 0.003094196319580078, "step": 3151} {"info/global_step": 3152, "train_info/time_within_train_step": 2.754828453063965, "step": 3152} {"train_info/time_between_train_steps": 0.0034165382385253906, "step": 3152} {"info/global_step": 3153, "train_info/time_within_train_step": 2.755059003829956, "step": 3153} {"train_info/time_between_train_steps": 0.0031020641326904297, "step": 3153} {"info/global_step": 3154, "train_info/time_within_train_step": 2.7561869621276855, "step": 3154} {"train_info/time_between_train_steps": 0.003065824508666992, "step": 3154} {"info/global_step": 3155, "train_info/time_within_train_step": 2.7534899711608887, "step": 3155} {"train_info/time_between_train_steps": 0.0030570030212402344, "step": 3155} {"info/global_step": 3156, "train_info/time_within_train_step": 2.7553341388702393, "step": 3156} {"train_info/time_between_train_steps": 0.003034353256225586, "step": 3156} {"info/global_step": 3157, "train_info/time_within_train_step": 2.7563228607177734, "step": 3157} {"train_info/time_between_train_steps": 0.0030291080474853516, "step": 3157} {"info/global_step": 3158, "train_info/time_within_train_step": 2.7555367946624756, "step": 3158} {"train_info/time_between_train_steps": 0.003031015396118164, "step": 3158} {"info/global_step": 3159, "train_info/time_within_train_step": 2.7544353008270264, "step": 3159} {"train_info/time_between_train_steps": 0.003078937530517578, "step": 3159} {"info/global_step": 3160, "train_info/time_within_train_step": 2.7553160190582275, "step": 3160} {"train_info/time_between_train_steps": 0.003061532974243164, "step": 3160} {"info/global_step": 3161, "train_info/time_within_train_step": 2.7542989253997803, "step": 3161} {"train_info/time_between_train_steps": 0.0030562877655029297, "step": 3161} {"info/global_step": 3162, "train_info/time_within_train_step": 2.7551536560058594, "step": 3162} {"train_info/time_between_train_steps": 0.003081083297729492, "step": 3162} {"info/global_step": 3163, "train_info/time_within_train_step": 2.755713701248169, "step": 3163} {"train_info/time_between_train_steps": 0.0030088424682617188, "step": 3163} {"info/global_step": 3164, "train_info/time_within_train_step": 2.7542872428894043, "step": 3164} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 3164} {"info/global_step": 3165, "train_info/time_within_train_step": 2.753737688064575, "step": 3165} {"train_info/time_between_train_steps": 0.0030329227447509766, "step": 3165} {"info/global_step": 3166, "train_info/time_within_train_step": 2.752919912338257, "step": 3166} {"train_info/time_between_train_steps": 0.0030989646911621094, "step": 3166} {"info/global_step": 3167, "train_info/time_within_train_step": 2.7575111389160156, "step": 3167} {"train_info/time_between_train_steps": 0.0030210018157958984, "step": 3167} {"info/global_step": 3168, "train_info/time_within_train_step": 2.75430965423584, "step": 3168} {"train_info/time_between_train_steps": 0.0030431747436523438, "step": 3168} {"info/global_step": 3169, "train_info/time_within_train_step": 2.7547755241394043, "step": 3169} {"train_info/time_between_train_steps": 0.003038644790649414, "step": 3169} {"info/global_step": 3170, "train_info/time_within_train_step": 2.7561898231506348, "step": 3170} {"train_info/time_between_train_steps": 0.003039836883544922, "step": 3170} {"info/global_step": 3171, "train_info/time_within_train_step": 2.7555158138275146, "step": 3171} {"train_info/time_between_train_steps": 0.003076791763305664, "step": 3171} {"info/global_step": 3172, "train_info/time_within_train_step": 2.7552683353424072, "step": 3172} {"train_info/time_between_train_steps": 0.0030813217163085938, "step": 3172} {"info/global_step": 3173, "train_info/time_within_train_step": 2.753974199295044, "step": 3173} {"train_info/time_between_train_steps": 0.0030634403228759766, "step": 3173} {"info/global_step": 3174, "train_info/time_within_train_step": 2.755427360534668, "step": 3174} {"train_info/time_between_train_steps": 0.0030364990234375, "step": 3174} {"info/global_step": 3175, "train_info/time_within_train_step": 2.7562148571014404, "step": 3175} {"train_info/time_between_train_steps": 0.003042936325073242, "step": 3175} {"info/global_step": 3176, "train_info/time_within_train_step": 2.754970073699951, "step": 3176} {"train_info/time_between_train_steps": 0.003016233444213867, "step": 3176} {"info/global_step": 3177, "train_info/time_within_train_step": 2.755406141281128, "step": 3177} {"train_info/time_between_train_steps": 0.0033180713653564453, "step": 3177} {"info/global_step": 3178, "train_info/time_within_train_step": 2.7549517154693604, "step": 3178} {"train_info/time_between_train_steps": 0.003021717071533203, "step": 3178} {"info/global_step": 3179, "train_info/time_within_train_step": 2.754758358001709, "step": 3179} {"train_info/time_between_train_steps": 0.003032207489013672, "step": 3179} {"info/global_step": 3180, "train_info/time_within_train_step": 2.75386118888855, "step": 3180} {"train_info/time_between_train_steps": 0.002993345260620117, "step": 3180} {"info/global_step": 3181, "train_info/time_within_train_step": 2.7543816566467285, "step": 3181} {"train_info/time_between_train_steps": 0.0029997825622558594, "step": 3181} {"info/global_step": 3182, "train_info/time_within_train_step": 2.75398588180542, "step": 3182} {"train_info/time_between_train_steps": 0.003019094467163086, "step": 3182} {"info/global_step": 3183, "train_info/time_within_train_step": 2.75443172454834, "step": 3183} {"train_info/time_between_train_steps": 0.0030202865600585938, "step": 3183} {"info/global_step": 3184, "train_info/time_within_train_step": 2.7538881301879883, "step": 3184} {"train_info/time_between_train_steps": 0.0029976367950439453, "step": 3184} {"info/global_step": 3185, "train_info/time_within_train_step": 2.7548341751098633, "step": 3185} {"train_info/time_between_train_steps": 0.0030367374420166016, "step": 3185} {"info/global_step": 3186, "train_info/time_within_train_step": 2.754289388656616, "step": 3186} {"train_info/time_between_train_steps": 0.0030488967895507812, "step": 3186} {"info/global_step": 3187, "train_info/time_within_train_step": 2.754272699356079, "step": 3187} {"train_info/time_between_train_steps": 0.0030372142791748047, "step": 3187} {"info/global_step": 3188, "train_info/time_within_train_step": 2.753923177719116, "step": 3188} {"train_info/time_between_train_steps": 0.0031156539916992188, "step": 3188} {"info/global_step": 3189, "train_info/time_within_train_step": 2.754192590713501, "step": 3189} {"train_info/time_between_train_steps": 0.0029249191284179688, "step": 3189} {"info/global_step": 3190, "train_info/time_within_train_step": 2.753887891769409, "step": 3190} {"train_info/time_between_train_steps": 0.002976655960083008, "step": 3190} {"info/global_step": 3191, "train_info/time_within_train_step": 2.754554510116577, "step": 3191} {"train_info/time_between_train_steps": 0.0029959678649902344, "step": 3191} {"info/global_step": 3192, "train_info/time_within_train_step": 2.7552828788757324, "step": 3192} {"train_info/time_between_train_steps": 0.002989530563354492, "step": 3192} {"info/global_step": 3193, "train_info/time_within_train_step": 2.7549211978912354, "step": 3193} {"train_info/time_between_train_steps": 0.0029625892639160156, "step": 3193} {"info/global_step": 3194, "train_info/time_within_train_step": 2.754725217819214, "step": 3194} {"train_info/time_between_train_steps": 0.002989053726196289, "step": 3194} {"info/global_step": 3195, "train_info/time_within_train_step": 2.7539255619049072, "step": 3195} {"train_info/time_between_train_steps": 0.0030090808868408203, "step": 3195} {"info/global_step": 3196, "train_info/time_within_train_step": 2.7540953159332275, "step": 3196} {"train_info/time_between_train_steps": 0.0030007362365722656, "step": 3196} {"info/global_step": 3197, "train_info/time_within_train_step": 2.7544567584991455, "step": 3197} {"train_info/time_between_train_steps": 0.003036975860595703, "step": 3197} {"info/global_step": 3198, "train_info/time_within_train_step": 2.7543442249298096, "step": 3198} {"train_info/time_between_train_steps": 0.0029463768005371094, "step": 3198} {"info/global_step": 3199, "train_info/time_within_train_step": 2.75319766998291, "step": 3199} {"train_info/time_between_train_steps": 0.002980947494506836, "step": 3199} {"info/global_step": 3200, "train_info/time_within_train_step": 2.754321336746216, "step": 3200} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746575307, "_runtime": 9316}, "step": 3200} {"logs": {"train/loss": 4.003, "train/learning_rate": 0.00045333333333333326, "train/epoch": 3.06, "_timestamp": 1746575307, "_runtime": 9316}, "step": 3200} {"train_info/time_between_train_steps": 19.595653295516968, "step": 3200} {"info/global_step": 3201, "train_info/time_within_train_step": 2.5386734008789062, "step": 3201} {"train_info/time_between_train_steps": 0.0029649734497070312, "step": 3201} {"info/global_step": 3202, "train_info/time_within_train_step": 2.5894205570220947, "step": 3202} {"train_info/time_between_train_steps": 0.002953767776489258, "step": 3202} {"info/global_step": 3203, "train_info/time_within_train_step": 2.7217354774475098, "step": 3203} {"train_info/time_between_train_steps": 0.002940654754638672, "step": 3203} {"info/global_step": 3204, "train_info/time_within_train_step": 2.733454704284668, "step": 3204} {"train_info/time_between_train_steps": 0.0029473304748535156, "step": 3204} {"info/global_step": 3205, "train_info/time_within_train_step": 2.7515792846679688, "step": 3205} {"train_info/time_between_train_steps": 0.0030128955841064453, "step": 3205} {"info/global_step": 3206, "train_info/time_within_train_step": 2.7564799785614014, "step": 3206} {"train_info/time_between_train_steps": 0.0030472278594970703, "step": 3206} {"info/global_step": 3207, "train_info/time_within_train_step": 2.757025718688965, "step": 3207} {"train_info/time_between_train_steps": 0.0030775070190429688, "step": 3207} {"info/global_step": 3208, "train_info/time_within_train_step": 2.756155252456665, "step": 3208} {"train_info/time_between_train_steps": 0.0030384063720703125, "step": 3208} {"info/global_step": 3209, "train_info/time_within_train_step": 2.7559871673583984, "step": 3209} {"train_info/time_between_train_steps": 0.0029985904693603516, "step": 3209} {"info/global_step": 3210, "train_info/time_within_train_step": 2.7557296752929688, "step": 3210} {"train_info/time_between_train_steps": 0.0030527114868164062, "step": 3210} {"info/global_step": 3211, "train_info/time_within_train_step": 2.756294012069702, "step": 3211} {"train_info/time_between_train_steps": 0.002989053726196289, "step": 3211} {"info/global_step": 3212, "train_info/time_within_train_step": 2.9301373958587646, "step": 3212} {"train_info/time_between_train_steps": 0.002980947494506836, "step": 3212} {"info/global_step": 3213, "train_info/time_within_train_step": 2.756676197052002, "step": 3213} {"train_info/time_between_train_steps": 0.0029726028442382812, "step": 3213} {"info/global_step": 3214, "train_info/time_within_train_step": 2.756887197494507, "step": 3214} {"train_info/time_between_train_steps": 0.0031118392944335938, "step": 3214} {"info/global_step": 3215, "train_info/time_within_train_step": 2.756591796875, "step": 3215} {"train_info/time_between_train_steps": 0.002971172332763672, "step": 3215} {"info/global_step": 3216, "train_info/time_within_train_step": 2.7579195499420166, "step": 3216} {"train_info/time_between_train_steps": 0.002859354019165039, "step": 3216} {"info/global_step": 3217, "train_info/time_within_train_step": 2.754671573638916, "step": 3217} {"train_info/time_between_train_steps": 0.002891063690185547, "step": 3217} {"info/global_step": 3218, "train_info/time_within_train_step": 2.7558746337890625, "step": 3218} {"train_info/time_between_train_steps": 0.002916574478149414, "step": 3218} {"info/global_step": 3219, "train_info/time_within_train_step": 2.756277322769165, "step": 3219} {"train_info/time_between_train_steps": 0.0029404163360595703, "step": 3219} {"info/global_step": 3220, "train_info/time_within_train_step": 2.7560958862304688, "step": 3220} {"train_info/time_between_train_steps": 0.0029289722442626953, "step": 3220} {"info/global_step": 3221, "train_info/time_within_train_step": 2.7558579444885254, "step": 3221} {"train_info/time_between_train_steps": 0.002998828887939453, "step": 3221} {"info/global_step": 3222, "train_info/time_within_train_step": 2.7572062015533447, "step": 3222} {"train_info/time_between_train_steps": 0.0029511451721191406, "step": 3222} {"info/global_step": 3223, "train_info/time_within_train_step": 2.7571020126342773, "step": 3223} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 3223} {"info/global_step": 3224, "train_info/time_within_train_step": 2.7569310665130615, "step": 3224} {"train_info/time_between_train_steps": 0.0030138492584228516, "step": 3224} {"info/global_step": 3225, "train_info/time_within_train_step": 2.7572286128997803, "step": 3225} {"train_info/time_between_train_steps": 0.002968311309814453, "step": 3225} {"info/global_step": 3226, "train_info/time_within_train_step": 2.757124423980713, "step": 3226} {"train_info/time_between_train_steps": 0.0029511451721191406, "step": 3226} {"info/global_step": 3227, "train_info/time_within_train_step": 2.756209135055542, "step": 3227} {"train_info/time_between_train_steps": 0.002990245819091797, "step": 3227} {"info/global_step": 3228, "train_info/time_within_train_step": 2.755612850189209, "step": 3228} {"train_info/time_between_train_steps": 0.0028672218322753906, "step": 3228} {"info/global_step": 3229, "train_info/time_within_train_step": 2.754347324371338, "step": 3229} {"train_info/time_between_train_steps": 0.0029065608978271484, "step": 3229} {"info/global_step": 3230, "train_info/time_within_train_step": 2.755093574523926, "step": 3230} {"train_info/time_between_train_steps": 0.002882242202758789, "step": 3230} {"info/global_step": 3231, "train_info/time_within_train_step": 2.7545735836029053, "step": 3231} {"train_info/time_between_train_steps": 0.002922534942626953, "step": 3231} {"info/global_step": 3232, "train_info/time_within_train_step": 2.7542076110839844, "step": 3232} {"train_info/time_between_train_steps": 0.002914905548095703, "step": 3232} {"info/global_step": 3233, "train_info/time_within_train_step": 2.7558298110961914, "step": 3233} {"train_info/time_between_train_steps": 0.0029468536376953125, "step": 3233} {"info/global_step": 3234, "train_info/time_within_train_step": 2.7547109127044678, "step": 3234} {"train_info/time_between_train_steps": 0.0028989315032958984, "step": 3234} {"info/global_step": 3235, "train_info/time_within_train_step": 2.7549872398376465, "step": 3235} {"train_info/time_between_train_steps": 0.003060579299926758, "step": 3235} {"info/global_step": 3236, "train_info/time_within_train_step": 2.755640745162964, "step": 3236} {"train_info/time_between_train_steps": 0.0029642581939697266, "step": 3236} {"info/global_step": 3237, "train_info/time_within_train_step": 2.75614070892334, "step": 3237} {"train_info/time_between_train_steps": 0.002910137176513672, "step": 3237} {"info/global_step": 3238, "train_info/time_within_train_step": 2.755854845046997, "step": 3238} {"train_info/time_between_train_steps": 0.0029871463775634766, "step": 3238} {"info/global_step": 3239, "train_info/time_within_train_step": 2.756385087966919, "step": 3239} {"train_info/time_between_train_steps": 0.0029230117797851562, "step": 3239} {"info/global_step": 3240, "train_info/time_within_train_step": 2.755934476852417, "step": 3240} {"train_info/time_between_train_steps": 0.002932310104370117, "step": 3240} {"info/global_step": 3241, "train_info/time_within_train_step": 2.754915714263916, "step": 3241} {"train_info/time_between_train_steps": 0.0029342174530029297, "step": 3241} {"info/global_step": 3242, "train_info/time_within_train_step": 2.7538352012634277, "step": 3242} {"train_info/time_between_train_steps": 0.0029332637786865234, "step": 3242} {"info/global_step": 3243, "train_info/time_within_train_step": 2.7547316551208496, "step": 3243} {"train_info/time_between_train_steps": 0.0029764175415039062, "step": 3243} {"info/global_step": 3244, "train_info/time_within_train_step": 2.754697799682617, "step": 3244} {"train_info/time_between_train_steps": 0.0028853416442871094, "step": 3244} {"info/global_step": 3245, "train_info/time_within_train_step": 2.7543201446533203, "step": 3245} {"train_info/time_between_train_steps": 0.0029621124267578125, "step": 3245} {"info/global_step": 3246, "train_info/time_within_train_step": 2.753756046295166, "step": 3246} {"train_info/time_between_train_steps": 0.0028753280639648438, "step": 3246} {"info/global_step": 3247, "train_info/time_within_train_step": 2.7553012371063232, "step": 3247} {"train_info/time_between_train_steps": 0.0029091835021972656, "step": 3247} {"info/global_step": 3248, "train_info/time_within_train_step": 2.7544219493865967, "step": 3248} {"train_info/time_between_train_steps": 0.0029113292694091797, "step": 3248} {"info/global_step": 3249, "train_info/time_within_train_step": 3.341045618057251, "step": 3249} {"train_info/time_between_train_steps": 0.0029075145721435547, "step": 3249} {"info/global_step": 3250, "train_info/time_within_train_step": 2.754894971847534, "step": 3250} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746575465, "_runtime": 9474}, "step": 3250} {"logs": {"train/loss": 3.995, "train/learning_rate": 0.00045, "train/epoch": 3.07, "_timestamp": 1746575465, "_runtime": 9474}, "step": 3250} {"train_info/time_between_train_steps": 0.01405954360961914, "step": 3250} {"info/global_step": 3251, "train_info/time_within_train_step": 2.7533035278320312, "step": 3251} {"train_info/time_between_train_steps": 0.0029129981994628906, "step": 3251} {"info/global_step": 3252, "train_info/time_within_train_step": 2.7536985874176025, "step": 3252} {"train_info/time_between_train_steps": 0.002919912338256836, "step": 3252} {"info/global_step": 3253, "train_info/time_within_train_step": 2.753774881362915, "step": 3253} {"train_info/time_between_train_steps": 0.002868175506591797, "step": 3253} {"info/global_step": 3254, "train_info/time_within_train_step": 2.754592180252075, "step": 3254} {"train_info/time_between_train_steps": 0.0029380321502685547, "step": 3254} {"info/global_step": 3255, "train_info/time_within_train_step": 2.754607915878296, "step": 3255} {"train_info/time_between_train_steps": 0.002955198287963867, "step": 3255} {"info/global_step": 3256, "train_info/time_within_train_step": 2.754608631134033, "step": 3256} {"train_info/time_between_train_steps": 0.0028901100158691406, "step": 3256} {"info/global_step": 3257, "train_info/time_within_train_step": 2.7546868324279785, "step": 3257} {"train_info/time_between_train_steps": 0.002896547317504883, "step": 3257} {"info/global_step": 3258, "train_info/time_within_train_step": 2.75410532951355, "step": 3258} {"train_info/time_between_train_steps": 0.0029065608978271484, "step": 3258} {"info/global_step": 3259, "train_info/time_within_train_step": 2.7544569969177246, "step": 3259} {"train_info/time_between_train_steps": 0.0028777122497558594, "step": 3259} {"info/global_step": 3260, "train_info/time_within_train_step": 2.7548341751098633, "step": 3260} {"train_info/time_between_train_steps": 0.0028972625732421875, "step": 3260} {"info/global_step": 3261, "train_info/time_within_train_step": 2.7536675930023193, "step": 3261} {"train_info/time_between_train_steps": 0.0029006004333496094, "step": 3261} {"info/global_step": 3262, "train_info/time_within_train_step": 2.7544431686401367, "step": 3262} {"train_info/time_between_train_steps": 0.0029397010803222656, "step": 3262} {"info/global_step": 3263, "train_info/time_within_train_step": 2.7540669441223145, "step": 3263} {"train_info/time_between_train_steps": 0.002910614013671875, "step": 3263} {"info/global_step": 3264, "train_info/time_within_train_step": 2.753204107284546, "step": 3264} {"train_info/time_between_train_steps": 0.0028641223907470703, "step": 3264} {"info/global_step": 3265, "train_info/time_within_train_step": 2.754054307937622, "step": 3265} {"train_info/time_between_train_steps": 0.002856016159057617, "step": 3265} {"info/global_step": 3266, "train_info/time_within_train_step": 2.7550883293151855, "step": 3266} {"train_info/time_between_train_steps": 0.0029265880584716797, "step": 3266} {"info/global_step": 3267, "train_info/time_within_train_step": 2.7512269020080566, "step": 3267} {"train_info/time_between_train_steps": 0.0029125213623046875, "step": 3267} {"info/global_step": 3268, "train_info/time_within_train_step": 2.753786087036133, "step": 3268} {"train_info/time_between_train_steps": 0.0028913021087646484, "step": 3268} {"info/global_step": 3269, "train_info/time_within_train_step": 2.7541823387145996, "step": 3269} {"train_info/time_between_train_steps": 0.0029289722442626953, "step": 3269} {"info/global_step": 3270, "train_info/time_within_train_step": 2.754626512527466, "step": 3270} {"train_info/time_between_train_steps": 0.002911090850830078, "step": 3270} {"info/global_step": 3271, "train_info/time_within_train_step": 2.754080295562744, "step": 3271} {"train_info/time_between_train_steps": 0.002911806106567383, "step": 3271} {"info/global_step": 3272, "train_info/time_within_train_step": 2.754408359527588, "step": 3272} {"train_info/time_between_train_steps": 0.0028905868530273438, "step": 3272} {"info/global_step": 3273, "train_info/time_within_train_step": 2.754855155944824, "step": 3273} {"train_info/time_between_train_steps": 0.0029168128967285156, "step": 3273} {"info/global_step": 3274, "train_info/time_within_train_step": 2.754585027694702, "step": 3274} {"train_info/time_between_train_steps": 0.0028977394104003906, "step": 3274} {"info/global_step": 3275, "train_info/time_within_train_step": 2.7536675930023193, "step": 3275} {"train_info/time_between_train_steps": 0.0029296875, "step": 3275} {"info/global_step": 3276, "train_info/time_within_train_step": 2.7550106048583984, "step": 3276} {"train_info/time_between_train_steps": 0.0029473304748535156, "step": 3276} {"info/global_step": 3277, "train_info/time_within_train_step": 2.7524802684783936, "step": 3277} {"train_info/time_between_train_steps": 0.002865314483642578, "step": 3277} {"info/global_step": 3278, "train_info/time_within_train_step": 2.7534492015838623, "step": 3278} {"train_info/time_between_train_steps": 0.002922534942626953, "step": 3278} {"info/global_step": 3279, "train_info/time_within_train_step": 2.753493547439575, "step": 3279} {"train_info/time_between_train_steps": 0.002908468246459961, "step": 3279} {"info/global_step": 3280, "train_info/time_within_train_step": 2.7536404132843018, "step": 3280} {"train_info/time_between_train_steps": 0.002866506576538086, "step": 3280} {"info/global_step": 3281, "train_info/time_within_train_step": 2.7535462379455566, "step": 3281} {"train_info/time_between_train_steps": 0.003317117691040039, "step": 3281} {"info/global_step": 3282, "train_info/time_within_train_step": 2.7546749114990234, "step": 3282} {"train_info/time_between_train_steps": 0.0028848648071289062, "step": 3282} {"info/global_step": 3283, "train_info/time_within_train_step": 2.7547755241394043, "step": 3283} {"train_info/time_between_train_steps": 0.002912759780883789, "step": 3283} {"info/global_step": 3284, "train_info/time_within_train_step": 2.754680633544922, "step": 3284} {"train_info/time_between_train_steps": 0.0028824806213378906, "step": 3284} {"info/global_step": 3285, "train_info/time_within_train_step": 2.7538955211639404, "step": 3285} {"train_info/time_between_train_steps": 0.0028874874114990234, "step": 3285} {"info/global_step": 3286, "train_info/time_within_train_step": 2.7551093101501465, "step": 3286} {"train_info/time_between_train_steps": 0.0029096603393554688, "step": 3286} {"info/global_step": 3287, "train_info/time_within_train_step": 2.7548458576202393, "step": 3287} {"train_info/time_between_train_steps": 0.0029273033142089844, "step": 3287} {"info/global_step": 3288, "train_info/time_within_train_step": 2.755220413208008, "step": 3288} {"train_info/time_between_train_steps": 0.0029754638671875, "step": 3288} {"info/global_step": 3289, "train_info/time_within_train_step": 2.7557427883148193, "step": 3289} {"train_info/time_between_train_steps": 0.0029997825622558594, "step": 3289} {"info/global_step": 3290, "train_info/time_within_train_step": 2.7555830478668213, "step": 3290} {"train_info/time_between_train_steps": 0.0030062198638916016, "step": 3290} {"info/global_step": 3291, "train_info/time_within_train_step": 2.7526488304138184, "step": 3291} {"train_info/time_between_train_steps": 0.0030100345611572266, "step": 3291} {"info/global_step": 3292, "train_info/time_within_train_step": 2.756070613861084, "step": 3292} {"train_info/time_between_train_steps": 0.002989053726196289, "step": 3292} {"info/global_step": 3293, "train_info/time_within_train_step": 2.753600835800171, "step": 3293} {"train_info/time_between_train_steps": 0.002985239028930664, "step": 3293} {"info/global_step": 3294, "train_info/time_within_train_step": 2.755490779876709, "step": 3294} {"train_info/time_between_train_steps": 0.0030257701873779297, "step": 3294} {"info/global_step": 3295, "train_info/time_within_train_step": 2.754852294921875, "step": 3295} {"train_info/time_between_train_steps": 0.00298309326171875, "step": 3295} {"info/global_step": 3296, "train_info/time_within_train_step": 2.7555124759674072, "step": 3296} {"train_info/time_between_train_steps": 0.0031135082244873047, "step": 3296} {"info/global_step": 3297, "train_info/time_within_train_step": 2.7559423446655273, "step": 3297} {"train_info/time_between_train_steps": 0.003009319305419922, "step": 3297} {"info/global_step": 3298, "train_info/time_within_train_step": 2.754171371459961, "step": 3298} {"train_info/time_between_train_steps": 0.003039836883544922, "step": 3298} {"info/global_step": 3299, "train_info/time_within_train_step": 2.755711793899536, "step": 3299} {"train_info/time_between_train_steps": 0.002965211868286133, "step": 3299} {"info/global_step": 3300, "train_info/time_within_train_step": 2.755180835723877, "step": 3300} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746575604, "_runtime": 9613}, "step": 3300} {"logs": {"train/loss": 3.9829, "train/learning_rate": 0.00044666666666666666, "train/epoch": 3.07, "_timestamp": 1746575604, "_runtime": 9613}, "step": 3300} {"train_info/time_between_train_steps": 0.015035629272460938, "step": 3300} {"info/global_step": 3301, "train_info/time_within_train_step": 2.755824089050293, "step": 3301} {"train_info/time_between_train_steps": 0.0029926300048828125, "step": 3301} {"info/global_step": 3302, "train_info/time_within_train_step": 2.755525827407837, "step": 3302} {"train_info/time_between_train_steps": 0.0029878616333007812, "step": 3302} {"info/global_step": 3303, "train_info/time_within_train_step": 2.755969524383545, "step": 3303} {"train_info/time_between_train_steps": 0.003003358840942383, "step": 3303} {"info/global_step": 3304, "train_info/time_within_train_step": 2.75532865524292, "step": 3304} {"train_info/time_between_train_steps": 0.0030536651611328125, "step": 3304} {"info/global_step": 3305, "train_info/time_within_train_step": 2.7547600269317627, "step": 3305} {"train_info/time_between_train_steps": 0.0030400753021240234, "step": 3305} {"info/global_step": 3306, "train_info/time_within_train_step": 2.7556204795837402, "step": 3306} {"train_info/time_between_train_steps": 0.0029740333557128906, "step": 3306} {"info/global_step": 3307, "train_info/time_within_train_step": 2.7559568881988525, "step": 3307} {"train_info/time_between_train_steps": 0.0030014514923095703, "step": 3307} {"info/global_step": 3308, "train_info/time_within_train_step": 2.7563865184783936, "step": 3308} {"train_info/time_between_train_steps": 0.0030002593994140625, "step": 3308} {"info/global_step": 3309, "train_info/time_within_train_step": 2.756409168243408, "step": 3309} {"train_info/time_between_train_steps": 0.003027200698852539, "step": 3309} {"info/global_step": 3310, "train_info/time_within_train_step": 2.7551474571228027, "step": 3310} {"train_info/time_between_train_steps": 0.002993345260620117, "step": 3310} {"info/global_step": 3311, "train_info/time_within_train_step": 2.755859851837158, "step": 3311} {"train_info/time_between_train_steps": 0.0030210018157958984, "step": 3311} {"info/global_step": 3312, "train_info/time_within_train_step": 2.756382465362549, "step": 3312} {"train_info/time_between_train_steps": 0.0029821395874023438, "step": 3312} {"info/global_step": 3313, "train_info/time_within_train_step": 2.754507064819336, "step": 3313} {"train_info/time_between_train_steps": 0.003415822982788086, "step": 3313} {"info/global_step": 3314, "train_info/time_within_train_step": 2.8418757915496826, "step": 3314} {"train_info/time_between_train_steps": 0.003010272979736328, "step": 3314} {"info/global_step": 3315, "train_info/time_within_train_step": 2.753554344177246, "step": 3315} {"train_info/time_between_train_steps": 0.0029578208923339844, "step": 3315} {"info/global_step": 3316, "train_info/time_within_train_step": 2.7533957958221436, "step": 3316} {"train_info/time_between_train_steps": 0.0029876232147216797, "step": 3316} {"info/global_step": 3317, "train_info/time_within_train_step": 2.753258228302002, "step": 3317} {"train_info/time_between_train_steps": 0.0029442310333251953, "step": 3317} {"info/global_step": 3318, "train_info/time_within_train_step": 2.75492262840271, "step": 3318} {"train_info/time_between_train_steps": 0.003020048141479492, "step": 3318} {"info/global_step": 3319, "train_info/time_within_train_step": 2.7541892528533936, "step": 3319} {"train_info/time_between_train_steps": 0.0030798912048339844, "step": 3319} {"info/global_step": 3320, "train_info/time_within_train_step": 2.7531585693359375, "step": 3320} {"train_info/time_between_train_steps": 0.0029904842376708984, "step": 3320} {"info/global_step": 3321, "train_info/time_within_train_step": 2.7536847591400146, "step": 3321} {"train_info/time_between_train_steps": 0.0029861927032470703, "step": 3321} {"info/global_step": 3322, "train_info/time_within_train_step": 2.7556405067443848, "step": 3322} {"train_info/time_between_train_steps": 0.0029954910278320312, "step": 3322} {"info/global_step": 3323, "train_info/time_within_train_step": 2.755098581314087, "step": 3323} {"train_info/time_between_train_steps": 0.0029664039611816406, "step": 3323} {"info/global_step": 3324, "train_info/time_within_train_step": 2.756798028945923, "step": 3324} {"train_info/time_between_train_steps": 0.0029611587524414062, "step": 3324} {"info/global_step": 3325, "train_info/time_within_train_step": 2.755995750427246, "step": 3325} {"train_info/time_between_train_steps": 0.0029685497283935547, "step": 3325} {"info/global_step": 3326, "train_info/time_within_train_step": 2.756840229034424, "step": 3326} {"train_info/time_between_train_steps": 0.0029833316802978516, "step": 3326} {"info/global_step": 3327, "train_info/time_within_train_step": 2.755702257156372, "step": 3327} {"train_info/time_between_train_steps": 0.002939462661743164, "step": 3327} {"info/global_step": 3328, "train_info/time_within_train_step": 2.753999710083008, "step": 3328} {"train_info/time_between_train_steps": 0.0028421878814697266, "step": 3328} {"info/global_step": 3329, "train_info/time_within_train_step": 2.754302740097046, "step": 3329} {"train_info/time_between_train_steps": 0.002907991409301758, "step": 3329} {"info/global_step": 3330, "train_info/time_within_train_step": 2.752708673477173, "step": 3330} {"train_info/time_between_train_steps": 0.0028700828552246094, "step": 3330} {"info/global_step": 3331, "train_info/time_within_train_step": 2.7537026405334473, "step": 3331} {"train_info/time_between_train_steps": 0.0029082298278808594, "step": 3331} {"info/global_step": 3332, "train_info/time_within_train_step": 2.7527852058410645, "step": 3332} {"train_info/time_between_train_steps": 0.002888202667236328, "step": 3332} {"info/global_step": 3333, "train_info/time_within_train_step": 2.752699375152588, "step": 3333} {"train_info/time_between_train_steps": 0.002848386764526367, "step": 3333} {"info/global_step": 3334, "train_info/time_within_train_step": 2.753683567047119, "step": 3334} {"train_info/time_between_train_steps": 0.002834796905517578, "step": 3334} {"info/global_step": 3335, "train_info/time_within_train_step": 2.7540786266326904, "step": 3335} {"train_info/time_between_train_steps": 0.0028433799743652344, "step": 3335} {"info/global_step": 3336, "train_info/time_within_train_step": 2.7539939880371094, "step": 3336} {"train_info/time_between_train_steps": 0.002963542938232422, "step": 3336} {"info/global_step": 3337, "train_info/time_within_train_step": 2.7550809383392334, "step": 3337} {"train_info/time_between_train_steps": 0.002953052520751953, "step": 3337} {"info/global_step": 3338, "train_info/time_within_train_step": 2.7553412914276123, "step": 3338} {"train_info/time_between_train_steps": 0.002964496612548828, "step": 3338} {"info/global_step": 3339, "train_info/time_within_train_step": 2.7547593116760254, "step": 3339} {"train_info/time_between_train_steps": 0.002959012985229492, "step": 3339} {"info/global_step": 3340, "train_info/time_within_train_step": 2.752871513366699, "step": 3340} {"train_info/time_between_train_steps": 0.002907276153564453, "step": 3340} {"info/global_step": 3341, "train_info/time_within_train_step": 2.7533669471740723, "step": 3341} {"train_info/time_between_train_steps": 0.0028901100158691406, "step": 3341} {"info/global_step": 3342, "train_info/time_within_train_step": 2.7545933723449707, "step": 3342} {"train_info/time_between_train_steps": 0.003015279769897461, "step": 3342} {"info/global_step": 3343, "train_info/time_within_train_step": 2.755612850189209, "step": 3343} {"train_info/time_between_train_steps": 0.0029449462890625, "step": 3343} {"info/global_step": 3344, "train_info/time_within_train_step": 2.7553811073303223, "step": 3344} {"train_info/time_between_train_steps": 0.0029723644256591797, "step": 3344} {"info/global_step": 3345, "train_info/time_within_train_step": 2.754584789276123, "step": 3345} {"train_info/time_between_train_steps": 0.0029757022857666016, "step": 3345} {"info/global_step": 3346, "train_info/time_within_train_step": 2.7552103996276855, "step": 3346} {"train_info/time_between_train_steps": 0.0029888153076171875, "step": 3346} {"info/global_step": 3347, "train_info/time_within_train_step": 2.754565954208374, "step": 3347} {"train_info/time_between_train_steps": 0.002971649169921875, "step": 3347} {"info/global_step": 3348, "train_info/time_within_train_step": 2.7558774948120117, "step": 3348} {"train_info/time_between_train_steps": 0.003000020980834961, "step": 3348} {"info/global_step": 3349, "train_info/time_within_train_step": 2.754136800765991, "step": 3349} {"train_info/time_between_train_steps": 0.0030226707458496094, "step": 3349} {"info/global_step": 3350, "train_info/time_within_train_step": 2.7560510635375977, "step": 3350} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746575742, "_runtime": 9751}, "step": 3350} {"logs": {"train/loss": 3.9694, "train/learning_rate": 0.00044333333333333334, "train/epoch": 3.08, "_timestamp": 1746575742, "_runtime": 9751}, "step": 3350} {"train_info/time_between_train_steps": 0.013107061386108398, "step": 3350} {"info/global_step": 3351, "train_info/time_within_train_step": 2.752657890319824, "step": 3351} {"train_info/time_between_train_steps": 0.0030291080474853516, "step": 3351} {"info/global_step": 3352, "train_info/time_within_train_step": 2.7561440467834473, "step": 3352} {"train_info/time_between_train_steps": 0.002981901168823242, "step": 3352} {"info/global_step": 3353, "train_info/time_within_train_step": 2.7555856704711914, "step": 3353} {"train_info/time_between_train_steps": 0.0030088424682617188, "step": 3353} {"info/global_step": 3354, "train_info/time_within_train_step": 2.754725933074951, "step": 3354} {"train_info/time_between_train_steps": 0.002867460250854492, "step": 3354} {"info/global_step": 3355, "train_info/time_within_train_step": 2.754026174545288, "step": 3355} {"train_info/time_between_train_steps": 0.0028793811798095703, "step": 3355} {"info/global_step": 3356, "train_info/time_within_train_step": 2.755124092102051, "step": 3356} {"train_info/time_between_train_steps": 0.002870321273803711, "step": 3356} {"info/global_step": 3357, "train_info/time_within_train_step": 2.7542965412139893, "step": 3357} {"train_info/time_between_train_steps": 0.002927541732788086, "step": 3357} {"info/global_step": 3358, "train_info/time_within_train_step": 2.754575729370117, "step": 3358} {"train_info/time_between_train_steps": 0.002870798110961914, "step": 3358} {"info/global_step": 3359, "train_info/time_within_train_step": 2.7534046173095703, "step": 3359} {"train_info/time_between_train_steps": 0.002866983413696289, "step": 3359} {"info/global_step": 3360, "train_info/time_within_train_step": 2.753591775894165, "step": 3360} {"train_info/time_between_train_steps": 0.0028734207153320312, "step": 3360} {"info/global_step": 3361, "train_info/time_within_train_step": 2.75469970703125, "step": 3361} {"train_info/time_between_train_steps": 0.002937793731689453, "step": 3361} {"info/global_step": 3362, "train_info/time_within_train_step": 2.7521908283233643, "step": 3362} {"train_info/time_between_train_steps": 0.0029294490814208984, "step": 3362} {"info/global_step": 3363, "train_info/time_within_train_step": 2.753207206726074, "step": 3363} {"train_info/time_between_train_steps": 0.002857208251953125, "step": 3363} {"info/global_step": 3364, "train_info/time_within_train_step": 2.7555742263793945, "step": 3364} {"train_info/time_between_train_steps": 0.002881765365600586, "step": 3364} {"info/global_step": 3365, "train_info/time_within_train_step": 2.7540643215179443, "step": 3365} {"train_info/time_between_train_steps": 0.0030031204223632812, "step": 3365} {"info/global_step": 3366, "train_info/time_within_train_step": 2.754640579223633, "step": 3366} {"train_info/time_between_train_steps": 0.002857208251953125, "step": 3366} {"info/global_step": 3367, "train_info/time_within_train_step": 2.7543678283691406, "step": 3367} {"train_info/time_between_train_steps": 0.002905607223510742, "step": 3367} {"info/global_step": 3368, "train_info/time_within_train_step": 2.755699872970581, "step": 3368} {"train_info/time_between_train_steps": 0.0029289722442626953, "step": 3368} {"info/global_step": 3369, "train_info/time_within_train_step": 2.810589551925659, "step": 3369} {"train_info/time_between_train_steps": 0.002899646759033203, "step": 3369} {"info/global_step": 3370, "train_info/time_within_train_step": 2.755143165588379, "step": 3370} {"train_info/time_between_train_steps": 0.0029997825622558594, "step": 3370} {"info/global_step": 3371, "train_info/time_within_train_step": 2.7566394805908203, "step": 3371} {"train_info/time_between_train_steps": 0.002968311309814453, "step": 3371} {"info/global_step": 3372, "train_info/time_within_train_step": 2.7558393478393555, "step": 3372} {"train_info/time_between_train_steps": 0.0029654502868652344, "step": 3372} {"info/global_step": 3373, "train_info/time_within_train_step": 2.755124092102051, "step": 3373} {"train_info/time_between_train_steps": 0.0030431747436523438, "step": 3373} {"info/global_step": 3374, "train_info/time_within_train_step": 2.756209135055542, "step": 3374} {"train_info/time_between_train_steps": 0.002913236618041992, "step": 3374} {"info/global_step": 3375, "train_info/time_within_train_step": 2.7549924850463867, "step": 3375} {"train_info/time_between_train_steps": 0.002972841262817383, "step": 3375} {"info/global_step": 3376, "train_info/time_within_train_step": 2.7557520866394043, "step": 3376} {"train_info/time_between_train_steps": 0.0029745101928710938, "step": 3376} {"info/global_step": 3377, "train_info/time_within_train_step": 2.753221273422241, "step": 3377} {"train_info/time_between_train_steps": 0.002928018569946289, "step": 3377} {"info/global_step": 3378, "train_info/time_within_train_step": 2.7547929286956787, "step": 3378} {"train_info/time_between_train_steps": 0.003080606460571289, "step": 3378} {"info/global_step": 3379, "train_info/time_within_train_step": 2.7548561096191406, "step": 3379} {"train_info/time_between_train_steps": 0.003037691116333008, "step": 3379} {"info/global_step": 3380, "train_info/time_within_train_step": 2.7553107738494873, "step": 3380} {"train_info/time_between_train_steps": 0.002946615219116211, "step": 3380} {"info/global_step": 3381, "train_info/time_within_train_step": 2.755598545074463, "step": 3381} {"train_info/time_between_train_steps": 0.0030956268310546875, "step": 3381} {"info/global_step": 3382, "train_info/time_within_train_step": 2.7544190883636475, "step": 3382} {"train_info/time_between_train_steps": 0.0029680728912353516, "step": 3382} {"info/global_step": 3383, "train_info/time_within_train_step": 2.755263090133667, "step": 3383} {"train_info/time_between_train_steps": 0.003020048141479492, "step": 3383} {"info/global_step": 3384, "train_info/time_within_train_step": 2.7548131942749023, "step": 3384} {"train_info/time_between_train_steps": 0.003016948699951172, "step": 3384} {"info/global_step": 3385, "train_info/time_within_train_step": 2.7535061836242676, "step": 3385} {"train_info/time_between_train_steps": 0.003109455108642578, "step": 3385} {"info/global_step": 3386, "train_info/time_within_train_step": 2.7568256855010986, "step": 3386} {"train_info/time_between_train_steps": 0.003081798553466797, "step": 3386} {"info/global_step": 3387, "train_info/time_within_train_step": 2.7551538944244385, "step": 3387} {"train_info/time_between_train_steps": 0.003017425537109375, "step": 3387} {"info/global_step": 3388, "train_info/time_within_train_step": 2.7559940814971924, "step": 3388} {"train_info/time_between_train_steps": 0.0031156539916992188, "step": 3388} {"info/global_step": 3389, "train_info/time_within_train_step": 2.7544960975646973, "step": 3389} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 3389} {"info/global_step": 3390, "train_info/time_within_train_step": 2.754051685333252, "step": 3390} {"train_info/time_between_train_steps": 0.002990245819091797, "step": 3390} {"info/global_step": 3391, "train_info/time_within_train_step": 2.754258871078491, "step": 3391} {"train_info/time_between_train_steps": 0.0031299591064453125, "step": 3391} {"info/global_step": 3392, "train_info/time_within_train_step": 2.7562339305877686, "step": 3392} {"train_info/time_between_train_steps": 0.0031807422637939453, "step": 3392} {"info/global_step": 3393, "train_info/time_within_train_step": 2.7551984786987305, "step": 3393} {"train_info/time_between_train_steps": 0.0031578540802001953, "step": 3393} {"info/global_step": 3394, "train_info/time_within_train_step": 2.754014492034912, "step": 3394} {"train_info/time_between_train_steps": 0.0030562877655029297, "step": 3394} {"info/global_step": 3395, "train_info/time_within_train_step": 2.7563703060150146, "step": 3395} {"train_info/time_between_train_steps": 0.0030434131622314453, "step": 3395} {"info/global_step": 3396, "train_info/time_within_train_step": 2.7554891109466553, "step": 3396} {"train_info/time_between_train_steps": 0.0031464099884033203, "step": 3396} {"info/global_step": 3397, "train_info/time_within_train_step": 2.7561240196228027, "step": 3397} {"train_info/time_between_train_steps": 0.0032231807708740234, "step": 3397} {"info/global_step": 3398, "train_info/time_within_train_step": 2.755425453186035, "step": 3398} {"train_info/time_between_train_steps": 0.0030908584594726562, "step": 3398} {"info/global_step": 3399, "train_info/time_within_train_step": 2.7549989223480225, "step": 3399} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 3399} {"info/global_step": 3400, "train_info/time_within_train_step": 2.7568140029907227, "step": 3400} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746575881, "_runtime": 9890}, "step": 3400} {"logs": {"train/loss": 3.9581, "train/learning_rate": 0.0004399999999999999, "train/epoch": 3.08, "_timestamp": 1746575881, "_runtime": 9890}, "step": 3400} {"train_info/time_between_train_steps": 17.77196192741394, "step": 3400} {"info/global_step": 3401, "train_info/time_within_train_step": 2.5413713455200195, "step": 3401} {"train_info/time_between_train_steps": 0.003238201141357422, "step": 3401} {"info/global_step": 3402, "train_info/time_within_train_step": 2.5802268981933594, "step": 3402} {"train_info/time_between_train_steps": 0.0033731460571289062, "step": 3402} {"info/global_step": 3403, "train_info/time_within_train_step": 2.6985511779785156, "step": 3403} {"train_info/time_between_train_steps": 0.0033769607543945312, "step": 3403} {"info/global_step": 3404, "train_info/time_within_train_step": 2.747187376022339, "step": 3404} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 3404} {"info/global_step": 3405, "train_info/time_within_train_step": 2.751241445541382, "step": 3405} {"train_info/time_between_train_steps": 0.003358125686645508, "step": 3405} {"info/global_step": 3406, "train_info/time_within_train_step": 2.7553954124450684, "step": 3406} {"train_info/time_between_train_steps": 0.003319263458251953, "step": 3406} {"info/global_step": 3407, "train_info/time_within_train_step": 2.756420850753784, "step": 3407} {"train_info/time_between_train_steps": 0.0033135414123535156, "step": 3407} {"info/global_step": 3408, "train_info/time_within_train_step": 2.7569382190704346, "step": 3408} {"train_info/time_between_train_steps": 0.0033004283905029297, "step": 3408} {"info/global_step": 3409, "train_info/time_within_train_step": 2.788527250289917, "step": 3409} {"train_info/time_between_train_steps": 0.0033512115478515625, "step": 3409} {"info/global_step": 3410, "train_info/time_within_train_step": 2.755331516265869, "step": 3410} {"train_info/time_between_train_steps": 0.003340005874633789, "step": 3410} {"info/global_step": 3411, "train_info/time_within_train_step": 2.755728244781494, "step": 3411} {"train_info/time_between_train_steps": 0.003406047821044922, "step": 3411} {"info/global_step": 3412, "train_info/time_within_train_step": 2.757222890853882, "step": 3412} {"train_info/time_between_train_steps": 0.0033578872680664062, "step": 3412} {"train_info/time_between_train_steps": 3.106525182723999, "step": 3412} {"info/global_step": 3413, "train_info/time_within_train_step": 2.7409884929656982, "step": 3413} {"train_info/time_between_train_steps": 0.0032417774200439453, "step": 3413} {"info/global_step": 3414, "train_info/time_within_train_step": 2.7555110454559326, "step": 3414} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 3414} {"info/global_step": 3415, "train_info/time_within_train_step": 2.755678653717041, "step": 3415} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 3415} {"info/global_step": 3416, "train_info/time_within_train_step": 2.7574145793914795, "step": 3416} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 3416} {"info/global_step": 3417, "train_info/time_within_train_step": 2.7549376487731934, "step": 3417} {"train_info/time_between_train_steps": 0.0031599998474121094, "step": 3417} {"info/global_step": 3418, "train_info/time_within_train_step": 2.75612473487854, "step": 3418} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 3418} {"info/global_step": 3419, "train_info/time_within_train_step": 2.753476858139038, "step": 3419} {"train_info/time_between_train_steps": 0.003197908401489258, "step": 3419} {"info/global_step": 3420, "train_info/time_within_train_step": 2.754861354827881, "step": 3420} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 3420} {"info/global_step": 3421, "train_info/time_within_train_step": 2.7563962936401367, "step": 3421} {"train_info/time_between_train_steps": 0.0031540393829345703, "step": 3421} {"info/global_step": 3422, "train_info/time_within_train_step": 2.7548835277557373, "step": 3422} {"train_info/time_between_train_steps": 0.0031681060791015625, "step": 3422} {"info/global_step": 3423, "train_info/time_within_train_step": 2.7541520595550537, "step": 3423} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 3423} {"info/global_step": 3424, "train_info/time_within_train_step": 2.9725489616394043, "step": 3424} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 3424} {"info/global_step": 3425, "train_info/time_within_train_step": 2.7557194232940674, "step": 3425} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 3425} {"info/global_step": 3426, "train_info/time_within_train_step": 2.755073070526123, "step": 3426} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 3426} {"info/global_step": 3427, "train_info/time_within_train_step": 2.756152391433716, "step": 3427} {"train_info/time_between_train_steps": 0.0034461021423339844, "step": 3427} {"info/global_step": 3428, "train_info/time_within_train_step": 2.7577550411224365, "step": 3428} {"train_info/time_between_train_steps": 0.003358125686645508, "step": 3428} {"info/global_step": 3429, "train_info/time_within_train_step": 2.7566006183624268, "step": 3429} {"train_info/time_between_train_steps": 0.003299713134765625, "step": 3429} {"info/global_step": 3430, "train_info/time_within_train_step": 2.7567436695098877, "step": 3430} {"train_info/time_between_train_steps": 0.0033211708068847656, "step": 3430} {"info/global_step": 3431, "train_info/time_within_train_step": 2.756519079208374, "step": 3431} {"train_info/time_between_train_steps": 0.003324747085571289, "step": 3431} {"info/global_step": 3432, "train_info/time_within_train_step": 2.75614595413208, "step": 3432} {"train_info/time_between_train_steps": 0.0034999847412109375, "step": 3432} {"info/global_step": 3433, "train_info/time_within_train_step": 2.756976366043091, "step": 3433} {"train_info/time_between_train_steps": 0.003309965133666992, "step": 3433} {"info/global_step": 3434, "train_info/time_within_train_step": 2.757380247116089, "step": 3434} {"train_info/time_between_train_steps": 0.0033271312713623047, "step": 3434} {"info/global_step": 3435, "train_info/time_within_train_step": 2.756736993789673, "step": 3435} {"train_info/time_between_train_steps": 0.00331878662109375, "step": 3435} {"info/global_step": 3436, "train_info/time_within_train_step": 2.757089138031006, "step": 3436} {"train_info/time_between_train_steps": 0.00336456298828125, "step": 3436} {"info/global_step": 3437, "train_info/time_within_train_step": 2.756352663040161, "step": 3437} {"train_info/time_between_train_steps": 0.0033097267150878906, "step": 3437} {"info/global_step": 3438, "train_info/time_within_train_step": 2.7559447288513184, "step": 3438} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 3438} {"info/global_step": 3439, "train_info/time_within_train_step": 2.7553417682647705, "step": 3439} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 3439} {"info/global_step": 3440, "train_info/time_within_train_step": 2.7561261653900146, "step": 3440} {"train_info/time_between_train_steps": 0.003165721893310547, "step": 3440} {"info/global_step": 3441, "train_info/time_within_train_step": 2.754641532897949, "step": 3441} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 3441} {"info/global_step": 3442, "train_info/time_within_train_step": 2.7556262016296387, "step": 3442} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 3442} {"info/global_step": 3443, "train_info/time_within_train_step": 2.754929304122925, "step": 3443} {"train_info/time_between_train_steps": 0.0031404495239257812, "step": 3443} {"info/global_step": 3444, "train_info/time_within_train_step": 2.7550597190856934, "step": 3444} {"train_info/time_between_train_steps": 0.003137826919555664, "step": 3444} {"info/global_step": 3445, "train_info/time_within_train_step": 2.7539331912994385, "step": 3445} {"train_info/time_between_train_steps": 0.0031197071075439453, "step": 3445} {"info/global_step": 3446, "train_info/time_within_train_step": 2.753934860229492, "step": 3446} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 3446} {"info/global_step": 3447, "train_info/time_within_train_step": 2.7554092407226562, "step": 3447} {"train_info/time_between_train_steps": 0.0033638477325439453, "step": 3447} {"info/global_step": 3448, "train_info/time_within_train_step": 2.7561748027801514, "step": 3448} {"train_info/time_between_train_steps": 0.0033044815063476562, "step": 3448} {"info/global_step": 3449, "train_info/time_within_train_step": 2.7554566860198975, "step": 3449} {"train_info/time_between_train_steps": 0.0032966136932373047, "step": 3449} {"info/global_step": 3450, "train_info/time_within_train_step": 2.7560245990753174, "step": 3450} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746576040, "_runtime": 10049}, "step": 3450} {"logs": {"train/loss": 3.9998, "train/learning_rate": 0.0004366666666666666, "train/epoch": 4.0, "_timestamp": 1746576040, "_runtime": 10049}, "step": 3450} {"train_info/time_between_train_steps": 0.013991117477416992, "step": 3450} {"info/global_step": 3451, "train_info/time_within_train_step": 2.755694627761841, "step": 3451} {"train_info/time_between_train_steps": 0.003280162811279297, "step": 3451} {"info/global_step": 3452, "train_info/time_within_train_step": 2.755178213119507, "step": 3452} {"train_info/time_between_train_steps": 0.0033211708068847656, "step": 3452} {"info/global_step": 3453, "train_info/time_within_train_step": 2.7563719749450684, "step": 3453} {"train_info/time_between_train_steps": 0.0032901763916015625, "step": 3453} {"info/global_step": 3454, "train_info/time_within_train_step": 2.7563185691833496, "step": 3454} {"train_info/time_between_train_steps": 0.003403186798095703, "step": 3454} {"info/global_step": 3455, "train_info/time_within_train_step": 2.756821393966675, "step": 3455} {"train_info/time_between_train_steps": 0.003317117691040039, "step": 3455} {"info/global_step": 3456, "train_info/time_within_train_step": 2.7567522525787354, "step": 3456} {"train_info/time_between_train_steps": 0.003280162811279297, "step": 3456} {"info/global_step": 3457, "train_info/time_within_train_step": 2.7565062046051025, "step": 3457} {"train_info/time_between_train_steps": 0.0033006668090820312, "step": 3457} {"info/global_step": 3458, "train_info/time_within_train_step": 2.754279613494873, "step": 3458} {"train_info/time_between_train_steps": 0.0031585693359375, "step": 3458} {"info/global_step": 3459, "train_info/time_within_train_step": 2.754291296005249, "step": 3459} {"train_info/time_between_train_steps": 0.0031397342681884766, "step": 3459} {"info/global_step": 3460, "train_info/time_within_train_step": 2.7544140815734863, "step": 3460} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 3460} {"info/global_step": 3461, "train_info/time_within_train_step": 2.7540228366851807, "step": 3461} {"train_info/time_between_train_steps": 0.003652334213256836, "step": 3461} {"info/global_step": 3462, "train_info/time_within_train_step": 2.7550063133239746, "step": 3462} {"train_info/time_between_train_steps": 0.0031332969665527344, "step": 3462} {"info/global_step": 3463, "train_info/time_within_train_step": 2.753450632095337, "step": 3463} {"train_info/time_between_train_steps": 0.0031349658966064453, "step": 3463} {"info/global_step": 3464, "train_info/time_within_train_step": 2.7540416717529297, "step": 3464} {"train_info/time_between_train_steps": 0.0031790733337402344, "step": 3464} {"info/global_step": 3465, "train_info/time_within_train_step": 2.755150318145752, "step": 3465} {"train_info/time_between_train_steps": 0.003173828125, "step": 3465} {"info/global_step": 3466, "train_info/time_within_train_step": 2.7548892498016357, "step": 3466} {"train_info/time_between_train_steps": 0.003125905990600586, "step": 3466} {"info/global_step": 3467, "train_info/time_within_train_step": 2.75639271736145, "step": 3467} {"train_info/time_between_train_steps": 0.0034024715423583984, "step": 3467} {"info/global_step": 3468, "train_info/time_within_train_step": 2.7567687034606934, "step": 3468} {"train_info/time_between_train_steps": 0.0033757686614990234, "step": 3468} {"info/global_step": 3469, "train_info/time_within_train_step": 2.75614333152771, "step": 3469} {"train_info/time_between_train_steps": 0.003269672393798828, "step": 3469} {"info/global_step": 3470, "train_info/time_within_train_step": 2.7553012371063232, "step": 3470} {"train_info/time_between_train_steps": 0.0033655166625976562, "step": 3470} {"info/global_step": 3471, "train_info/time_within_train_step": 2.7557411193847656, "step": 3471} {"train_info/time_between_train_steps": 0.0033235549926757812, "step": 3471} {"info/global_step": 3472, "train_info/time_within_train_step": 2.7552785873413086, "step": 3472} {"train_info/time_between_train_steps": 0.003297090530395508, "step": 3472} {"info/global_step": 3473, "train_info/time_within_train_step": 2.7561895847320557, "step": 3473} {"train_info/time_between_train_steps": 0.003435850143432617, "step": 3473} {"info/global_step": 3474, "train_info/time_within_train_step": 2.756046772003174, "step": 3474} {"train_info/time_between_train_steps": 0.003392934799194336, "step": 3474} {"info/global_step": 3475, "train_info/time_within_train_step": 2.89971661567688, "step": 3475} {"train_info/time_between_train_steps": 0.0034422874450683594, "step": 3475} {"info/global_step": 3476, "train_info/time_within_train_step": 2.7542221546173096, "step": 3476} {"train_info/time_between_train_steps": 0.0031943321228027344, "step": 3476} {"info/global_step": 3477, "train_info/time_within_train_step": 2.7535512447357178, "step": 3477} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 3477} {"info/global_step": 3478, "train_info/time_within_train_step": 2.7537972927093506, "step": 3478} {"train_info/time_between_train_steps": 0.0032052993774414062, "step": 3478} {"info/global_step": 3479, "train_info/time_within_train_step": 2.987049102783203, "step": 3479} {"train_info/time_between_train_steps": 0.0032532215118408203, "step": 3479} {"info/global_step": 3480, "train_info/time_within_train_step": 2.7548444271087646, "step": 3480} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 3480} {"info/global_step": 3481, "train_info/time_within_train_step": 2.7537758350372314, "step": 3481} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 3481} {"info/global_step": 3482, "train_info/time_within_train_step": 2.7552645206451416, "step": 3482} {"train_info/time_between_train_steps": 0.0031461715698242188, "step": 3482} {"info/global_step": 3483, "train_info/time_within_train_step": 2.7548608779907227, "step": 3483} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 3483} {"info/global_step": 3484, "train_info/time_within_train_step": 2.7544667720794678, "step": 3484} {"train_info/time_between_train_steps": 0.003214597702026367, "step": 3484} {"info/global_step": 3485, "train_info/time_within_train_step": 2.7530243396759033, "step": 3485} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 3485} {"info/global_step": 3486, "train_info/time_within_train_step": 2.755368709564209, "step": 3486} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 3486} {"info/global_step": 3487, "train_info/time_within_train_step": 2.7545621395111084, "step": 3487} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 3487} {"info/global_step": 3488, "train_info/time_within_train_step": 2.7533652782440186, "step": 3488} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 3488} {"info/global_step": 3489, "train_info/time_within_train_step": 2.754578113555908, "step": 3489} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 3489} {"info/global_step": 3490, "train_info/time_within_train_step": 2.7545082569122314, "step": 3490} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 3490} {"info/global_step": 3491, "train_info/time_within_train_step": 2.75518798828125, "step": 3491} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 3491} {"info/global_step": 3492, "train_info/time_within_train_step": 2.7536606788635254, "step": 3492} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 3492} {"info/global_step": 3493, "train_info/time_within_train_step": 2.7539844512939453, "step": 3493} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 3493} {"info/global_step": 3494, "train_info/time_within_train_step": 2.754181146621704, "step": 3494} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 3494} {"info/global_step": 3495, "train_info/time_within_train_step": 2.753990650177002, "step": 3495} {"train_info/time_between_train_steps": 0.003165721893310547, "step": 3495} {"info/global_step": 3496, "train_info/time_within_train_step": 2.753816843032837, "step": 3496} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 3496} {"info/global_step": 3497, "train_info/time_within_train_step": 2.7541539669036865, "step": 3497} {"train_info/time_between_train_steps": 0.0031592845916748047, "step": 3497} {"info/global_step": 3498, "train_info/time_within_train_step": 3.3624589443206787, "step": 3498} {"train_info/time_between_train_steps": 0.003206014633178711, "step": 3498} {"info/global_step": 3499, "train_info/time_within_train_step": 2.7503511905670166, "step": 3499} {"train_info/time_between_train_steps": 0.0032253265380859375, "step": 3499} {"info/global_step": 3500, "train_info/time_within_train_step": 2.7560510635375977, "step": 3500} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746576179, "_runtime": 10188}, "step": 3500} {"logs": {"train/loss": 3.9367, "train/learning_rate": 0.0004333333333333333, "train/epoch": 4.01, "_timestamp": 1746576179, "_runtime": 10188}, "step": 3500} {"train_info/time_between_train_steps": 0.01262211799621582, "step": 3500} {"info/global_step": 3501, "train_info/time_within_train_step": 2.7532103061676025, "step": 3501} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 3501} {"info/global_step": 3502, "train_info/time_within_train_step": 2.752070665359497, "step": 3502} {"train_info/time_between_train_steps": 0.0031304359436035156, "step": 3502} {"info/global_step": 3503, "train_info/time_within_train_step": 2.7531020641326904, "step": 3503} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 3503} {"info/global_step": 3504, "train_info/time_within_train_step": 2.7530994415283203, "step": 3504} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 3504} {"info/global_step": 3505, "train_info/time_within_train_step": 2.754086494445801, "step": 3505} {"train_info/time_between_train_steps": 0.003125905990600586, "step": 3505} {"info/global_step": 3506, "train_info/time_within_train_step": 2.754135847091675, "step": 3506} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 3506} {"info/global_step": 3507, "train_info/time_within_train_step": 2.7529799938201904, "step": 3507} {"train_info/time_between_train_steps": 0.003133058547973633, "step": 3507} {"info/global_step": 3508, "train_info/time_within_train_step": 2.753422260284424, "step": 3508} {"train_info/time_between_train_steps": 0.0031404495239257812, "step": 3508} {"info/global_step": 3509, "train_info/time_within_train_step": 2.753878593444824, "step": 3509} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 3509} {"info/global_step": 3510, "train_info/time_within_train_step": 2.7545523643493652, "step": 3510} {"train_info/time_between_train_steps": 0.003232717514038086, "step": 3510} {"info/global_step": 3511, "train_info/time_within_train_step": 2.753743886947632, "step": 3511} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 3511} {"info/global_step": 3512, "train_info/time_within_train_step": 2.7538278102874756, "step": 3512} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 3512} {"info/global_step": 3513, "train_info/time_within_train_step": 2.7533657550811768, "step": 3513} {"train_info/time_between_train_steps": 0.003151416778564453, "step": 3513} {"info/global_step": 3514, "train_info/time_within_train_step": 2.7560503482818604, "step": 3514} {"train_info/time_between_train_steps": 0.0031919479370117188, "step": 3514} {"info/global_step": 3515, "train_info/time_within_train_step": 2.753242015838623, "step": 3515} {"train_info/time_between_train_steps": 0.003139019012451172, "step": 3515} {"info/global_step": 3516, "train_info/time_within_train_step": 2.754155158996582, "step": 3516} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 3516} {"info/global_step": 3517, "train_info/time_within_train_step": 2.753899335861206, "step": 3517} {"train_info/time_between_train_steps": 0.003154277801513672, "step": 3517} {"info/global_step": 3518, "train_info/time_within_train_step": 2.7545812129974365, "step": 3518} {"train_info/time_between_train_steps": 0.0031604766845703125, "step": 3518} {"info/global_step": 3519, "train_info/time_within_train_step": 2.753744602203369, "step": 3519} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 3519} {"info/global_step": 3520, "train_info/time_within_train_step": 2.9790475368499756, "step": 3520} {"train_info/time_between_train_steps": 0.003155946731567383, "step": 3520} {"info/global_step": 3521, "train_info/time_within_train_step": 2.7532131671905518, "step": 3521} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 3521} {"info/global_step": 3522, "train_info/time_within_train_step": 2.753828525543213, "step": 3522} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 3522} {"info/global_step": 3523, "train_info/time_within_train_step": 2.7541332244873047, "step": 3523} {"train_info/time_between_train_steps": 0.0036351680755615234, "step": 3523} {"info/global_step": 3524, "train_info/time_within_train_step": 2.7537195682525635, "step": 3524} {"train_info/time_between_train_steps": 0.003143787384033203, "step": 3524} {"info/global_step": 3525, "train_info/time_within_train_step": 2.7545952796936035, "step": 3525} {"train_info/time_between_train_steps": 0.0031566619873046875, "step": 3525} {"info/global_step": 3526, "train_info/time_within_train_step": 2.7537572383880615, "step": 3526} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 3526} {"info/global_step": 3527, "train_info/time_within_train_step": 2.754882574081421, "step": 3527} {"train_info/time_between_train_steps": 0.003150463104248047, "step": 3527} {"info/global_step": 3528, "train_info/time_within_train_step": 2.755034923553467, "step": 3528} {"train_info/time_between_train_steps": 0.003160238265991211, "step": 3528} {"info/global_step": 3529, "train_info/time_within_train_step": 2.7557616233825684, "step": 3529} {"train_info/time_between_train_steps": 0.0031728744506835938, "step": 3529} {"info/global_step": 3530, "train_info/time_within_train_step": 2.7539498805999756, "step": 3530} {"train_info/time_between_train_steps": 0.003143310546875, "step": 3530} {"info/global_step": 3531, "train_info/time_within_train_step": 2.754462480545044, "step": 3531} {"train_info/time_between_train_steps": 0.0031516551971435547, "step": 3531} {"info/global_step": 3532, "train_info/time_within_train_step": 2.7550528049468994, "step": 3532} {"train_info/time_between_train_steps": 0.0032210350036621094, "step": 3532} {"info/global_step": 3533, "train_info/time_within_train_step": 2.754376173019409, "step": 3533} {"train_info/time_between_train_steps": 0.0031251907348632812, "step": 3533} {"info/global_step": 3534, "train_info/time_within_train_step": 2.7568259239196777, "step": 3534} {"train_info/time_between_train_steps": 0.0031921863555908203, "step": 3534} {"info/global_step": 3535, "train_info/time_within_train_step": 2.7539353370666504, "step": 3535} {"train_info/time_between_train_steps": 0.0031397342681884766, "step": 3535} {"info/global_step": 3536, "train_info/time_within_train_step": 2.7547590732574463, "step": 3536} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 3536} {"info/global_step": 3537, "train_info/time_within_train_step": 2.753325939178467, "step": 3537} {"train_info/time_between_train_steps": 0.12650442123413086, "step": 3537} {"info/global_step": 3538, "train_info/time_within_train_step": 2.7550435066223145, "step": 3538} {"train_info/time_between_train_steps": 0.0031464099884033203, "step": 3538} {"info/global_step": 3539, "train_info/time_within_train_step": 2.7542788982391357, "step": 3539} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 3539} {"info/global_step": 3540, "train_info/time_within_train_step": 2.755413770675659, "step": 3540} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 3540} {"info/global_step": 3541, "train_info/time_within_train_step": 2.7550463676452637, "step": 3541} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 3541} {"info/global_step": 3542, "train_info/time_within_train_step": 2.754842758178711, "step": 3542} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 3542} {"info/global_step": 3543, "train_info/time_within_train_step": 2.7545087337493896, "step": 3543} {"train_info/time_between_train_steps": 0.003233194351196289, "step": 3543} {"info/global_step": 3544, "train_info/time_within_train_step": 2.7534983158111572, "step": 3544} {"train_info/time_between_train_steps": 0.003159046173095703, "step": 3544} {"info/global_step": 3545, "train_info/time_within_train_step": 2.753582239151001, "step": 3545} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 3545} {"info/global_step": 3546, "train_info/time_within_train_step": 2.7546517848968506, "step": 3546} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 3546} {"info/global_step": 3547, "train_info/time_within_train_step": 2.7542264461517334, "step": 3547} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 3547} {"info/global_step": 3548, "train_info/time_within_train_step": 2.7550439834594727, "step": 3548} {"train_info/time_between_train_steps": 0.003163576126098633, "step": 3548} {"info/global_step": 3549, "train_info/time_within_train_step": 2.7562124729156494, "step": 3549} {"train_info/time_between_train_steps": 0.0032033920288085938, "step": 3549} {"info/global_step": 3550, "train_info/time_within_train_step": 2.7541840076446533, "step": 3550} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746576318, "_runtime": 10327}, "step": 3550} {"logs": {"train/loss": 3.9272, "train/learning_rate": 0.00043, "train/epoch": 4.01, "_timestamp": 1746576318, "_runtime": 10327}, "step": 3550} {"train_info/time_between_train_steps": 0.013531208038330078, "step": 3550} {"info/global_step": 3551, "train_info/time_within_train_step": 2.756758689880371, "step": 3551} {"train_info/time_between_train_steps": 0.0031664371490478516, "step": 3551} {"info/global_step": 3552, "train_info/time_within_train_step": 2.75516939163208, "step": 3552} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 3552} {"info/global_step": 3553, "train_info/time_within_train_step": 2.753922700881958, "step": 3553} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 3553} {"info/global_step": 3554, "train_info/time_within_train_step": 2.754786491394043, "step": 3554} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 3554} {"info/global_step": 3555, "train_info/time_within_train_step": 2.7545089721679688, "step": 3555} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 3555} {"info/global_step": 3556, "train_info/time_within_train_step": 2.754526138305664, "step": 3556} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 3556} {"info/global_step": 3557, "train_info/time_within_train_step": 2.755594491958618, "step": 3557} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 3557} {"info/global_step": 3558, "train_info/time_within_train_step": 2.7550716400146484, "step": 3558} {"train_info/time_between_train_steps": 0.003213644027709961, "step": 3558} {"info/global_step": 3559, "train_info/time_within_train_step": 2.7548446655273438, "step": 3559} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 3559} {"info/global_step": 3560, "train_info/time_within_train_step": 2.7552833557128906, "step": 3560} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 3560} {"info/global_step": 3561, "train_info/time_within_train_step": 2.755364418029785, "step": 3561} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 3561} {"info/global_step": 3562, "train_info/time_within_train_step": 2.753952741622925, "step": 3562} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 3562} {"info/global_step": 3563, "train_info/time_within_train_step": 2.752903461456299, "step": 3563} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 3563} {"info/global_step": 3564, "train_info/time_within_train_step": 2.754958152770996, "step": 3564} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 3564} {"info/global_step": 3565, "train_info/time_within_train_step": 2.7547073364257812, "step": 3565} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 3565} {"info/global_step": 3566, "train_info/time_within_train_step": 2.7541263103485107, "step": 3566} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 3566} {"info/global_step": 3567, "train_info/time_within_train_step": 2.7528722286224365, "step": 3567} {"train_info/time_between_train_steps": 0.003131866455078125, "step": 3567} {"info/global_step": 3568, "train_info/time_within_train_step": 2.7544987201690674, "step": 3568} {"train_info/time_between_train_steps": 0.0031409263610839844, "step": 3568} {"info/global_step": 3569, "train_info/time_within_train_step": 2.7537808418273926, "step": 3569} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 3569} {"info/global_step": 3570, "train_info/time_within_train_step": 2.7545361518859863, "step": 3570} {"train_info/time_between_train_steps": 0.003160238265991211, "step": 3570} {"info/global_step": 3571, "train_info/time_within_train_step": 2.755434274673462, "step": 3571} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 3571} {"info/global_step": 3572, "train_info/time_within_train_step": 2.754607915878296, "step": 3572} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 3572} {"info/global_step": 3573, "train_info/time_within_train_step": 2.7548656463623047, "step": 3573} {"train_info/time_between_train_steps": 0.0031282901763916016, "step": 3573} {"info/global_step": 3574, "train_info/time_within_train_step": 2.7538933753967285, "step": 3574} {"train_info/time_between_train_steps": 0.003199338912963867, "step": 3574} {"info/global_step": 3575, "train_info/time_within_train_step": 2.7541344165802, "step": 3575} {"train_info/time_between_train_steps": 0.003137350082397461, "step": 3575} {"info/global_step": 3576, "train_info/time_within_train_step": 2.7541139125823975, "step": 3576} {"train_info/time_between_train_steps": 0.0031363964080810547, "step": 3576} {"info/global_step": 3577, "train_info/time_within_train_step": 2.7525551319122314, "step": 3577} {"train_info/time_between_train_steps": 0.003159761428833008, "step": 3577} {"info/global_step": 3578, "train_info/time_within_train_step": 2.754694700241089, "step": 3578} {"train_info/time_between_train_steps": 0.003144502639770508, "step": 3578} {"info/global_step": 3579, "train_info/time_within_train_step": 2.754884958267212, "step": 3579} {"train_info/time_between_train_steps": 0.003153085708618164, "step": 3579} {"info/global_step": 3580, "train_info/time_within_train_step": 2.7550947666168213, "step": 3580} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 3580} {"info/global_step": 3581, "train_info/time_within_train_step": 2.7542107105255127, "step": 3581} {"train_info/time_between_train_steps": 0.003159046173095703, "step": 3581} {"info/global_step": 3582, "train_info/time_within_train_step": 2.753847122192383, "step": 3582} {"train_info/time_between_train_steps": 0.003287076950073242, "step": 3582} {"info/global_step": 3583, "train_info/time_within_train_step": 2.7553648948669434, "step": 3583} {"train_info/time_between_train_steps": 0.0033528804779052734, "step": 3583} {"info/global_step": 3584, "train_info/time_within_train_step": 2.755420207977295, "step": 3584} {"train_info/time_between_train_steps": 0.003294229507446289, "step": 3584} {"info/global_step": 3585, "train_info/time_within_train_step": 2.7545528411865234, "step": 3585} {"train_info/time_between_train_steps": 0.0032935142517089844, "step": 3585} {"info/global_step": 3586, "train_info/time_within_train_step": 2.755722761154175, "step": 3586} {"train_info/time_between_train_steps": 0.003332853317260742, "step": 3586} {"info/global_step": 3587, "train_info/time_within_train_step": 2.7557051181793213, "step": 3587} {"train_info/time_between_train_steps": 0.003322601318359375, "step": 3587} {"info/global_step": 3588, "train_info/time_within_train_step": 2.7550625801086426, "step": 3588} {"train_info/time_between_train_steps": 0.0032927989959716797, "step": 3588} {"info/global_step": 3589, "train_info/time_within_train_step": 2.754878044128418, "step": 3589} {"train_info/time_between_train_steps": 0.0033049583435058594, "step": 3589} {"info/global_step": 3590, "train_info/time_within_train_step": 2.7557036876678467, "step": 3590} {"train_info/time_between_train_steps": 0.0032846927642822266, "step": 3590} {"info/global_step": 3591, "train_info/time_within_train_step": 2.7546207904815674, "step": 3591} {"train_info/time_between_train_steps": 0.003269672393798828, "step": 3591} {"info/global_step": 3592, "train_info/time_within_train_step": 2.754844903945923, "step": 3592} {"train_info/time_between_train_steps": 0.003281116485595703, "step": 3592} {"info/global_step": 3593, "train_info/time_within_train_step": 2.7563929557800293, "step": 3593} {"train_info/time_between_train_steps": 0.0032711029052734375, "step": 3593} {"info/global_step": 3594, "train_info/time_within_train_step": 2.7543675899505615, "step": 3594} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 3594} {"info/global_step": 3595, "train_info/time_within_train_step": 2.7543208599090576, "step": 3595} {"train_info/time_between_train_steps": 0.003171205520629883, "step": 3595} {"info/global_step": 3596, "train_info/time_within_train_step": 2.7553482055664062, "step": 3596} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 3596} {"info/global_step": 3597, "train_info/time_within_train_step": 2.7554523944854736, "step": 3597} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 3597} {"info/global_step": 3598, "train_info/time_within_train_step": 2.7546536922454834, "step": 3598} {"train_info/time_between_train_steps": 0.0032181739807128906, "step": 3598} {"info/global_step": 3599, "train_info/time_within_train_step": 2.754652261734009, "step": 3599} {"train_info/time_between_train_steps": 0.0031425952911376953, "step": 3599} {"info/global_step": 3600, "train_info/time_within_train_step": 2.877769708633423, "step": 3600} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746576456, "_runtime": 10465}, "step": 3600} {"logs": {"train/loss": 3.909, "train/learning_rate": 0.00042666666666666667, "train/epoch": 4.02, "_timestamp": 1746576456, "_runtime": 10465}, "step": 3600} {"train_info/time_between_train_steps": 27.714879751205444, "step": 3600} {"info/global_step": 3601, "train_info/time_within_train_step": 2.530014753341675, "step": 3601} {"train_info/time_between_train_steps": 0.003325939178466797, "step": 3601} {"info/global_step": 3602, "train_info/time_within_train_step": 2.5886423587799072, "step": 3602} {"train_info/time_between_train_steps": 0.003328084945678711, "step": 3602} {"info/global_step": 3603, "train_info/time_within_train_step": 2.713024854660034, "step": 3603} {"train_info/time_between_train_steps": 0.0033104419708251953, "step": 3603} {"info/global_step": 3604, "train_info/time_within_train_step": 2.9250805377960205, "step": 3604} {"train_info/time_between_train_steps": 0.0033974647521972656, "step": 3604} {"info/global_step": 3605, "train_info/time_within_train_step": 2.6959898471832275, "step": 3605} {"train_info/time_between_train_steps": 0.003331899642944336, "step": 3605} {"info/global_step": 3606, "train_info/time_within_train_step": 2.753917932510376, "step": 3606} {"train_info/time_between_train_steps": 0.0033168792724609375, "step": 3606} {"info/global_step": 3607, "train_info/time_within_train_step": 2.7568044662475586, "step": 3607} {"train_info/time_between_train_steps": 0.003298044204711914, "step": 3607} {"info/global_step": 3608, "train_info/time_within_train_step": 2.756667137145996, "step": 3608} {"train_info/time_between_train_steps": 0.0033562183380126953, "step": 3608} {"info/global_step": 3609, "train_info/time_within_train_step": 2.756610631942749, "step": 3609} {"train_info/time_between_train_steps": 0.0033075809478759766, "step": 3609} {"info/global_step": 3610, "train_info/time_within_train_step": 2.756089448928833, "step": 3610} {"train_info/time_between_train_steps": 0.0033478736877441406, "step": 3610} {"info/global_step": 3611, "train_info/time_within_train_step": 2.7564809322357178, "step": 3611} {"train_info/time_between_train_steps": 0.0032036304473876953, "step": 3611} {"info/global_step": 3612, "train_info/time_within_train_step": 2.7554097175598145, "step": 3612} {"train_info/time_between_train_steps": 0.003141641616821289, "step": 3612} {"info/global_step": 3613, "train_info/time_within_train_step": 2.755579710006714, "step": 3613} {"train_info/time_between_train_steps": 0.003147125244140625, "step": 3613} {"info/global_step": 3614, "train_info/time_within_train_step": 2.7552151679992676, "step": 3614} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 3614} {"info/global_step": 3615, "train_info/time_within_train_step": 2.7548553943634033, "step": 3615} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 3615} {"info/global_step": 3616, "train_info/time_within_train_step": 2.754737377166748, "step": 3616} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 3616} {"info/global_step": 3617, "train_info/time_within_train_step": 2.756044864654541, "step": 3617} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 3617} {"info/global_step": 3618, "train_info/time_within_train_step": 2.756741762161255, "step": 3618} {"train_info/time_between_train_steps": 0.0031681060791015625, "step": 3618} {"info/global_step": 3619, "train_info/time_within_train_step": 2.756495237350464, "step": 3619} {"train_info/time_between_train_steps": 0.003192424774169922, "step": 3619} {"info/global_step": 3620, "train_info/time_within_train_step": 2.7583096027374268, "step": 3620} {"train_info/time_between_train_steps": 0.0031681060791015625, "step": 3620} {"info/global_step": 3621, "train_info/time_within_train_step": 2.7575438022613525, "step": 3621} {"train_info/time_between_train_steps": 0.003337860107421875, "step": 3621} {"info/global_step": 3622, "train_info/time_within_train_step": 2.758270263671875, "step": 3622} {"train_info/time_between_train_steps": 0.003337383270263672, "step": 3622} {"info/global_step": 3623, "train_info/time_within_train_step": 2.758925676345825, "step": 3623} {"train_info/time_between_train_steps": 0.003306150436401367, "step": 3623} {"info/global_step": 3624, "train_info/time_within_train_step": 2.7565786838531494, "step": 3624} {"train_info/time_between_train_steps": 0.0033147335052490234, "step": 3624} {"info/global_step": 3625, "train_info/time_within_train_step": 2.7575833797454834, "step": 3625} {"train_info/time_between_train_steps": 0.003315448760986328, "step": 3625} {"info/global_step": 3626, "train_info/time_within_train_step": 2.756923198699951, "step": 3626} {"train_info/time_between_train_steps": 0.003358602523803711, "step": 3626} {"info/global_step": 3627, "train_info/time_within_train_step": 2.7570912837982178, "step": 3627} {"train_info/time_between_train_steps": 0.0032973289489746094, "step": 3627} {"info/global_step": 3628, "train_info/time_within_train_step": 2.7578132152557373, "step": 3628} {"train_info/time_between_train_steps": 0.0033664703369140625, "step": 3628} {"info/global_step": 3629, "train_info/time_within_train_step": 2.7566893100738525, "step": 3629} {"train_info/time_between_train_steps": 0.003289461135864258, "step": 3629} {"info/global_step": 3630, "train_info/time_within_train_step": 2.7552084922790527, "step": 3630} {"train_info/time_between_train_steps": 0.003300905227661133, "step": 3630} {"info/global_step": 3631, "train_info/time_within_train_step": 2.7575531005859375, "step": 3631} {"train_info/time_between_train_steps": 0.003340005874633789, "step": 3631} {"info/global_step": 3632, "train_info/time_within_train_step": 2.756840705871582, "step": 3632} {"train_info/time_between_train_steps": 0.003305196762084961, "step": 3632} {"info/global_step": 3633, "train_info/time_within_train_step": 2.757115125656128, "step": 3633} {"train_info/time_between_train_steps": 0.0032906532287597656, "step": 3633} {"info/global_step": 3634, "train_info/time_within_train_step": 2.758230447769165, "step": 3634} {"train_info/time_between_train_steps": 0.0033593177795410156, "step": 3634} {"info/global_step": 3635, "train_info/time_within_train_step": 2.7562263011932373, "step": 3635} {"train_info/time_between_train_steps": 0.0033233165740966797, "step": 3635} {"info/global_step": 3636, "train_info/time_within_train_step": 2.7560672760009766, "step": 3636} {"train_info/time_between_train_steps": 0.0033195018768310547, "step": 3636} {"info/global_step": 3637, "train_info/time_within_train_step": 2.757614850997925, "step": 3637} {"train_info/time_between_train_steps": 0.0033464431762695312, "step": 3637} {"info/global_step": 3638, "train_info/time_within_train_step": 2.756373882293701, "step": 3638} {"train_info/time_between_train_steps": 0.0033330917358398438, "step": 3638} {"info/global_step": 3639, "train_info/time_within_train_step": 2.755218267440796, "step": 3639} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 3639} {"info/global_step": 3640, "train_info/time_within_train_step": 2.7563350200653076, "step": 3640} {"train_info/time_between_train_steps": 0.003252744674682617, "step": 3640} {"info/global_step": 3641, "train_info/time_within_train_step": 2.7536051273345947, "step": 3641} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 3641} {"info/global_step": 3642, "train_info/time_within_train_step": 2.7540793418884277, "step": 3642} {"train_info/time_between_train_steps": 0.0033385753631591797, "step": 3642} {"info/global_step": 3643, "train_info/time_within_train_step": 2.7561354637145996, "step": 3643} {"train_info/time_between_train_steps": 0.0033397674560546875, "step": 3643} {"info/global_step": 3644, "train_info/time_within_train_step": 2.755725622177124, "step": 3644} {"train_info/time_between_train_steps": 0.0033257007598876953, "step": 3644} {"info/global_step": 3645, "train_info/time_within_train_step": 2.7574684619903564, "step": 3645} {"train_info/time_between_train_steps": 0.003311634063720703, "step": 3645} {"info/global_step": 3646, "train_info/time_within_train_step": 2.7563254833221436, "step": 3646} {"train_info/time_between_train_steps": 0.0033206939697265625, "step": 3646} {"info/global_step": 3647, "train_info/time_within_train_step": 2.756589412689209, "step": 3647} {"train_info/time_between_train_steps": 0.0032958984375, "step": 3647} {"info/global_step": 3648, "train_info/time_within_train_step": 2.7552924156188965, "step": 3648} {"train_info/time_between_train_steps": 0.003312826156616211, "step": 3648} {"info/global_step": 3649, "train_info/time_within_train_step": 2.7554008960723877, "step": 3649} {"train_info/time_between_train_steps": 0.0031440258026123047, "step": 3649} {"info/global_step": 3650, "train_info/time_within_train_step": 2.754905939102173, "step": 3650} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746576622, "_runtime": 10631}, "step": 3650} {"logs": {"train/loss": 3.9032, "train/learning_rate": 0.00042333333333333334, "train/epoch": 4.02, "_timestamp": 1746576622, "_runtime": 10631}, "step": 3650} {"train_info/time_between_train_steps": 0.01317143440246582, "step": 3650} {"info/global_step": 3651, "train_info/time_within_train_step": 2.7547154426574707, "step": 3651} {"train_info/time_between_train_steps": 0.003148794174194336, "step": 3651} {"info/global_step": 3652, "train_info/time_within_train_step": 2.755533218383789, "step": 3652} {"train_info/time_between_train_steps": 0.0031464099884033203, "step": 3652} {"info/global_step": 3653, "train_info/time_within_train_step": 2.754701852798462, "step": 3653} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 3653} {"info/global_step": 3654, "train_info/time_within_train_step": 2.7541470527648926, "step": 3654} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 3654} {"info/global_step": 3655, "train_info/time_within_train_step": 2.7547998428344727, "step": 3655} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 3655} {"info/global_step": 3656, "train_info/time_within_train_step": 2.755160331726074, "step": 3656} {"train_info/time_between_train_steps": 0.003194093704223633, "step": 3656} {"info/global_step": 3657, "train_info/time_within_train_step": 2.75398850440979, "step": 3657} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 3657} {"info/global_step": 3658, "train_info/time_within_train_step": 2.7548558712005615, "step": 3658} {"train_info/time_between_train_steps": 0.003141164779663086, "step": 3658} {"info/global_step": 3659, "train_info/time_within_train_step": 2.754127264022827, "step": 3659} {"train_info/time_between_train_steps": 0.0031189918518066406, "step": 3659} {"info/global_step": 3660, "train_info/time_within_train_step": 2.755007743835449, "step": 3660} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 3660} {"info/global_step": 3661, "train_info/time_within_train_step": 2.7546679973602295, "step": 3661} {"train_info/time_between_train_steps": 0.003206014633178711, "step": 3661} {"info/global_step": 3662, "train_info/time_within_train_step": 2.7562355995178223, "step": 3662} {"train_info/time_between_train_steps": 0.12900257110595703, "step": 3662} {"info/global_step": 3663, "train_info/time_within_train_step": 2.755811929702759, "step": 3663} {"train_info/time_between_train_steps": 0.0032296180725097656, "step": 3663} {"info/global_step": 3664, "train_info/time_within_train_step": 2.755898952484131, "step": 3664} {"train_info/time_between_train_steps": 0.0032083988189697266, "step": 3664} {"info/global_step": 3665, "train_info/time_within_train_step": 2.7552740573883057, "step": 3665} {"train_info/time_between_train_steps": 0.0032682418823242188, "step": 3665} {"info/global_step": 3666, "train_info/time_within_train_step": 2.7561776638031006, "step": 3666} {"train_info/time_between_train_steps": 0.0033309459686279297, "step": 3666} {"info/global_step": 3667, "train_info/time_within_train_step": 2.757389545440674, "step": 3667} {"train_info/time_between_train_steps": 0.0033273696899414062, "step": 3667} {"info/global_step": 3668, "train_info/time_within_train_step": 2.7566776275634766, "step": 3668} {"train_info/time_between_train_steps": 0.0033407211303710938, "step": 3668} {"info/global_step": 3669, "train_info/time_within_train_step": 2.7554290294647217, "step": 3669} {"train_info/time_between_train_steps": 0.003328084945678711, "step": 3669} {"info/global_step": 3670, "train_info/time_within_train_step": 2.7553136348724365, "step": 3670} {"train_info/time_between_train_steps": 0.003309488296508789, "step": 3670} {"info/global_step": 3671, "train_info/time_within_train_step": 2.755457878112793, "step": 3671} {"train_info/time_between_train_steps": 0.003358125686645508, "step": 3671} {"info/global_step": 3672, "train_info/time_within_train_step": 2.7560877799987793, "step": 3672} {"train_info/time_between_train_steps": 0.003317594528198242, "step": 3672} {"info/global_step": 3673, "train_info/time_within_train_step": 2.754568576812744, "step": 3673} {"train_info/time_between_train_steps": 0.003298521041870117, "step": 3673} {"info/global_step": 3674, "train_info/time_within_train_step": 2.755444049835205, "step": 3674} {"train_info/time_between_train_steps": 0.0033435821533203125, "step": 3674} {"info/global_step": 3675, "train_info/time_within_train_step": 2.754801034927368, "step": 3675} {"train_info/time_between_train_steps": 0.0033228397369384766, "step": 3675} {"info/global_step": 3676, "train_info/time_within_train_step": 2.755615234375, "step": 3676} {"train_info/time_between_train_steps": 0.003336191177368164, "step": 3676} {"info/global_step": 3677, "train_info/time_within_train_step": 2.7559595108032227, "step": 3677} {"train_info/time_between_train_steps": 0.0033385753631591797, "step": 3677} {"info/global_step": 3678, "train_info/time_within_train_step": 2.756316661834717, "step": 3678} {"train_info/time_between_train_steps": 0.003370523452758789, "step": 3678} {"info/global_step": 3679, "train_info/time_within_train_step": 2.7557637691497803, "step": 3679} {"train_info/time_between_train_steps": 0.003331422805786133, "step": 3679} {"info/global_step": 3680, "train_info/time_within_train_step": 2.756924629211426, "step": 3680} {"train_info/time_between_train_steps": 0.0033359527587890625, "step": 3680} {"info/global_step": 3681, "train_info/time_within_train_step": 2.756544589996338, "step": 3681} {"train_info/time_between_train_steps": 0.0033392906188964844, "step": 3681} {"info/global_step": 3682, "train_info/time_within_train_step": 2.757473945617676, "step": 3682} {"train_info/time_between_train_steps": 0.003319978713989258, "step": 3682} {"info/global_step": 3683, "train_info/time_within_train_step": 2.7552483081817627, "step": 3683} {"train_info/time_between_train_steps": 0.0034651756286621094, "step": 3683} {"info/global_step": 3684, "train_info/time_within_train_step": 2.7575278282165527, "step": 3684} {"train_info/time_between_train_steps": 0.003316164016723633, "step": 3684} {"info/global_step": 3685, "train_info/time_within_train_step": 2.7558038234710693, "step": 3685} {"train_info/time_between_train_steps": 0.003374338150024414, "step": 3685} {"info/global_step": 3686, "train_info/time_within_train_step": 2.756265640258789, "step": 3686} {"train_info/time_between_train_steps": 0.0033423900604248047, "step": 3686} {"info/global_step": 3687, "train_info/time_within_train_step": 2.754798173904419, "step": 3687} {"train_info/time_between_train_steps": 0.0033075809478759766, "step": 3687} {"info/global_step": 3688, "train_info/time_within_train_step": 2.7568063735961914, "step": 3688} {"train_info/time_between_train_steps": 0.0033769607543945312, "step": 3688} {"info/global_step": 3689, "train_info/time_within_train_step": 2.756648302078247, "step": 3689} {"train_info/time_between_train_steps": 0.003326892852783203, "step": 3689} {"info/global_step": 3690, "train_info/time_within_train_step": 2.7541630268096924, "step": 3690} {"train_info/time_between_train_steps": 0.003313779830932617, "step": 3690} {"info/global_step": 3691, "train_info/time_within_train_step": 2.7548470497131348, "step": 3691} {"train_info/time_between_train_steps": 0.003326892852783203, "step": 3691} {"info/global_step": 3692, "train_info/time_within_train_step": 2.756222724914551, "step": 3692} {"train_info/time_between_train_steps": 0.003364086151123047, "step": 3692} {"info/global_step": 3693, "train_info/time_within_train_step": 2.7571332454681396, "step": 3693} {"train_info/time_between_train_steps": 0.0033016204833984375, "step": 3693} {"info/global_step": 3694, "train_info/time_within_train_step": 3.001363515853882, "step": 3694} {"train_info/time_between_train_steps": 0.003404378890991211, "step": 3694} {"info/global_step": 3695, "train_info/time_within_train_step": 2.7565109729766846, "step": 3695} {"train_info/time_between_train_steps": 0.0033152103424072266, "step": 3695} {"info/global_step": 3696, "train_info/time_within_train_step": 2.7551817893981934, "step": 3696} {"train_info/time_between_train_steps": 0.0033042430877685547, "step": 3696} {"info/global_step": 3697, "train_info/time_within_train_step": 2.7553980350494385, "step": 3697} {"train_info/time_between_train_steps": 0.0033185482025146484, "step": 3697} {"info/global_step": 3698, "train_info/time_within_train_step": 2.7590982913970947, "step": 3698} {"train_info/time_between_train_steps": 0.0033524036407470703, "step": 3698} {"info/global_step": 3699, "train_info/time_within_train_step": 2.756381034851074, "step": 3699} {"train_info/time_between_train_steps": 0.003332853317260742, "step": 3699} {"info/global_step": 3700, "train_info/time_within_train_step": 2.7542717456817627, "step": 3700} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746576761, "_runtime": 10770}, "step": 3700} {"logs": {"train/loss": 3.8791, "train/learning_rate": 0.00041999999999999996, "train/epoch": 4.03, "_timestamp": 1746576761, "_runtime": 10770}, "step": 3700} {"train_info/time_between_train_steps": 0.013991832733154297, "step": 3700} {"info/global_step": 3701, "train_info/time_within_train_step": 2.7545554637908936, "step": 3701} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 3701} {"info/global_step": 3702, "train_info/time_within_train_step": 2.754633665084839, "step": 3702} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 3702} {"info/global_step": 3703, "train_info/time_within_train_step": 2.7553303241729736, "step": 3703} {"train_info/time_between_train_steps": 0.003234386444091797, "step": 3703} {"info/global_step": 3704, "train_info/time_within_train_step": 2.7556915283203125, "step": 3704} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 3704} {"info/global_step": 3705, "train_info/time_within_train_step": 2.754574775695801, "step": 3705} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 3705} {"info/global_step": 3706, "train_info/time_within_train_step": 2.7553822994232178, "step": 3706} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 3706} {"info/global_step": 3707, "train_info/time_within_train_step": 2.7576887607574463, "step": 3707} {"train_info/time_between_train_steps": 0.0033664703369140625, "step": 3707} {"info/global_step": 3708, "train_info/time_within_train_step": 2.7556638717651367, "step": 3708} {"train_info/time_between_train_steps": 0.0033011436462402344, "step": 3708} {"info/global_step": 3709, "train_info/time_within_train_step": 2.755934953689575, "step": 3709} {"train_info/time_between_train_steps": 0.0033257007598876953, "step": 3709} {"info/global_step": 3710, "train_info/time_within_train_step": 2.7563602924346924, "step": 3710} {"train_info/time_between_train_steps": 0.0033371448516845703, "step": 3710} {"info/global_step": 3711, "train_info/time_within_train_step": 2.7560174465179443, "step": 3711} {"train_info/time_between_train_steps": 0.003337383270263672, "step": 3711} {"info/global_step": 3712, "train_info/time_within_train_step": 2.7562942504882812, "step": 3712} {"train_info/time_between_train_steps": 0.003292560577392578, "step": 3712} {"info/global_step": 3713, "train_info/time_within_train_step": 2.7555630207061768, "step": 3713} {"train_info/time_between_train_steps": 0.0033206939697265625, "step": 3713} {"info/global_step": 3714, "train_info/time_within_train_step": 2.756389856338501, "step": 3714} {"train_info/time_between_train_steps": 0.003380298614501953, "step": 3714} {"info/global_step": 3715, "train_info/time_within_train_step": 2.757575750350952, "step": 3715} {"train_info/time_between_train_steps": 0.0032911300659179688, "step": 3715} {"info/global_step": 3716, "train_info/time_within_train_step": 2.7558817863464355, "step": 3716} {"train_info/time_between_train_steps": 0.0032966136932373047, "step": 3716} {"info/global_step": 3717, "train_info/time_within_train_step": 2.755838632583618, "step": 3717} {"train_info/time_between_train_steps": 0.0033152103424072266, "step": 3717} {"info/global_step": 3718, "train_info/time_within_train_step": 2.755930185317993, "step": 3718} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 3718} {"info/global_step": 3719, "train_info/time_within_train_step": 2.7554447650909424, "step": 3719} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 3719} {"info/global_step": 3720, "train_info/time_within_train_step": 2.7547767162323, "step": 3720} {"train_info/time_between_train_steps": 0.0031473636627197266, "step": 3720} {"info/global_step": 3721, "train_info/time_within_train_step": 2.7546753883361816, "step": 3721} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 3721} {"info/global_step": 3722, "train_info/time_within_train_step": 2.7552921772003174, "step": 3722} {"train_info/time_between_train_steps": 0.003146648406982422, "step": 3722} {"info/global_step": 3723, "train_info/time_within_train_step": 2.7548797130584717, "step": 3723} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 3723} {"info/global_step": 3724, "train_info/time_within_train_step": 2.7553694248199463, "step": 3724} {"train_info/time_between_train_steps": 0.003158092498779297, "step": 3724} {"info/global_step": 3725, "train_info/time_within_train_step": 2.8795058727264404, "step": 3725} {"train_info/time_between_train_steps": 0.0032567977905273438, "step": 3725} {"info/global_step": 3726, "train_info/time_within_train_step": 2.7549259662628174, "step": 3726} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 3726} {"info/global_step": 3727, "train_info/time_within_train_step": 2.755368709564209, "step": 3727} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 3727} {"info/global_step": 3728, "train_info/time_within_train_step": 2.754403591156006, "step": 3728} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 3728} {"info/global_step": 3729, "train_info/time_within_train_step": 2.754084348678589, "step": 3729} {"train_info/time_between_train_steps": 0.0032262802124023438, "step": 3729} {"info/global_step": 3730, "train_info/time_within_train_step": 2.754455089569092, "step": 3730} {"train_info/time_between_train_steps": 0.003160715103149414, "step": 3730} {"info/global_step": 3731, "train_info/time_within_train_step": 2.755200147628784, "step": 3731} {"train_info/time_between_train_steps": 0.0032181739807128906, "step": 3731} {"info/global_step": 3732, "train_info/time_within_train_step": 2.7554473876953125, "step": 3732} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 3732} {"info/global_step": 3733, "train_info/time_within_train_step": 2.755293130874634, "step": 3733} {"train_info/time_between_train_steps": 0.003223896026611328, "step": 3733} {"info/global_step": 3734, "train_info/time_within_train_step": 2.755457878112793, "step": 3734} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 3734} {"info/global_step": 3735, "train_info/time_within_train_step": 2.753826856613159, "step": 3735} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 3735} {"info/global_step": 3736, "train_info/time_within_train_step": 2.7554166316986084, "step": 3736} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 3736} {"info/global_step": 3737, "train_info/time_within_train_step": 2.7558834552764893, "step": 3737} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 3737} {"info/global_step": 3738, "train_info/time_within_train_step": 2.755114793777466, "step": 3738} {"train_info/time_between_train_steps": 0.003231048583984375, "step": 3738} {"info/global_step": 3739, "train_info/time_within_train_step": 2.754254102706909, "step": 3739} {"train_info/time_between_train_steps": 0.003141164779663086, "step": 3739} {"info/global_step": 3740, "train_info/time_within_train_step": 2.755415439605713, "step": 3740} {"train_info/time_between_train_steps": 0.003255128860473633, "step": 3740} {"info/global_step": 3741, "train_info/time_within_train_step": 2.7560782432556152, "step": 3741} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 3741} {"info/global_step": 3742, "train_info/time_within_train_step": 2.7551205158233643, "step": 3742} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 3742} {"info/global_step": 3743, "train_info/time_within_train_step": 2.755380630493164, "step": 3743} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 3743} {"info/global_step": 3744, "train_info/time_within_train_step": 2.7553930282592773, "step": 3744} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 3744} {"info/global_step": 3745, "train_info/time_within_train_step": 2.7558016777038574, "step": 3745} {"train_info/time_between_train_steps": 0.0033681392669677734, "step": 3745} {"info/global_step": 3746, "train_info/time_within_train_step": 2.756636619567871, "step": 3746} {"train_info/time_between_train_steps": 0.0033540725708007812, "step": 3746} {"info/global_step": 3747, "train_info/time_within_train_step": 2.757040023803711, "step": 3747} {"train_info/time_between_train_steps": 0.0033507347106933594, "step": 3747} {"info/global_step": 3748, "train_info/time_within_train_step": 3.352221965789795, "step": 3748} {"train_info/time_between_train_steps": 0.003356456756591797, "step": 3748} {"info/global_step": 3749, "train_info/time_within_train_step": 3.008141040802002, "step": 3749} {"train_info/time_between_train_steps": 0.0034308433532714844, "step": 3749} {"info/global_step": 3750, "train_info/time_within_train_step": 2.7567005157470703, "step": 3750} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746576900, "_runtime": 10909}, "step": 3750} {"logs": {"train/loss": 3.8824, "train/learning_rate": 0.00041666666666666664, "train/epoch": 4.03, "_timestamp": 1746576900, "_runtime": 10909}, "step": 3750} {"train_info/time_between_train_steps": 0.015002250671386719, "step": 3750} {"info/global_step": 3751, "train_info/time_within_train_step": 2.7569923400878906, "step": 3751} {"train_info/time_between_train_steps": 0.003345012664794922, "step": 3751} {"info/global_step": 3752, "train_info/time_within_train_step": 2.7824020385742188, "step": 3752} {"train_info/time_between_train_steps": 0.0033257007598876953, "step": 3752} {"info/global_step": 3753, "train_info/time_within_train_step": 2.7573912143707275, "step": 3753} {"train_info/time_between_train_steps": 0.0033674240112304688, "step": 3753} {"info/global_step": 3754, "train_info/time_within_train_step": 2.7558178901672363, "step": 3754} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 3754} {"info/global_step": 3755, "train_info/time_within_train_step": 2.753551721572876, "step": 3755} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 3755} {"info/global_step": 3756, "train_info/time_within_train_step": 2.7549562454223633, "step": 3756} {"train_info/time_between_train_steps": 0.003243684768676758, "step": 3756} {"info/global_step": 3757, "train_info/time_within_train_step": 2.7543516159057617, "step": 3757} {"train_info/time_between_train_steps": 0.003167390823364258, "step": 3757} {"info/global_step": 3758, "train_info/time_within_train_step": 2.7544729709625244, "step": 3758} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 3758} {"info/global_step": 3759, "train_info/time_within_train_step": 2.755061388015747, "step": 3759} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 3759} {"info/global_step": 3760, "train_info/time_within_train_step": 2.755554676055908, "step": 3760} {"train_info/time_between_train_steps": 0.0031614303588867188, "step": 3760} {"info/global_step": 3761, "train_info/time_within_train_step": 2.7556328773498535, "step": 3761} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 3761} {"info/global_step": 3762, "train_info/time_within_train_step": 2.7558438777923584, "step": 3762} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 3762} {"info/global_step": 3763, "train_info/time_within_train_step": 2.756890296936035, "step": 3763} {"train_info/time_between_train_steps": 0.0033321380615234375, "step": 3763} {"info/global_step": 3764, "train_info/time_within_train_step": 2.7565762996673584, "step": 3764} {"train_info/time_between_train_steps": 0.003334522247314453, "step": 3764} {"info/global_step": 3765, "train_info/time_within_train_step": 2.7548906803131104, "step": 3765} {"train_info/time_between_train_steps": 0.003316164016723633, "step": 3765} {"info/global_step": 3766, "train_info/time_within_train_step": 2.756561040878296, "step": 3766} {"train_info/time_between_train_steps": 0.003455638885498047, "step": 3766} {"info/global_step": 3767, "train_info/time_within_train_step": 2.756666421890259, "step": 3767} {"train_info/time_between_train_steps": 0.0033545494079589844, "step": 3767} {"info/global_step": 3768, "train_info/time_within_train_step": 2.756923198699951, "step": 3768} {"train_info/time_between_train_steps": 0.003305673599243164, "step": 3768} {"info/global_step": 3769, "train_info/time_within_train_step": 2.7554914951324463, "step": 3769} {"train_info/time_between_train_steps": 0.0032873153686523438, "step": 3769} {"info/global_step": 3770, "train_info/time_within_train_step": 2.756706953048706, "step": 3770} {"train_info/time_between_train_steps": 0.0033495426177978516, "step": 3770} {"info/global_step": 3771, "train_info/time_within_train_step": 2.7551491260528564, "step": 3771} {"train_info/time_between_train_steps": 0.0033130645751953125, "step": 3771} {"info/global_step": 3772, "train_info/time_within_train_step": 2.7565696239471436, "step": 3772} {"train_info/time_between_train_steps": 0.0033359527587890625, "step": 3772} {"info/global_step": 3773, "train_info/time_within_train_step": 2.7559919357299805, "step": 3773} {"train_info/time_between_train_steps": 0.0033617019653320312, "step": 3773} {"info/global_step": 3774, "train_info/time_within_train_step": 2.756922960281372, "step": 3774} {"train_info/time_between_train_steps": 0.003346681594848633, "step": 3774} {"info/global_step": 3775, "train_info/time_within_train_step": 2.756749391555786, "step": 3775} {"train_info/time_between_train_steps": 0.0033762454986572266, "step": 3775} {"info/global_step": 3776, "train_info/time_within_train_step": 2.756808042526245, "step": 3776} {"train_info/time_between_train_steps": 0.003375530242919922, "step": 3776} {"info/global_step": 3777, "train_info/time_within_train_step": 2.7561697959899902, "step": 3777} {"train_info/time_between_train_steps": 0.0033159255981445312, "step": 3777} {"info/global_step": 3778, "train_info/time_within_train_step": 2.757070302963257, "step": 3778} {"train_info/time_between_train_steps": 0.0033380985260009766, "step": 3778} {"info/global_step": 3779, "train_info/time_within_train_step": 2.7560436725616455, "step": 3779} {"train_info/time_between_train_steps": 0.003353118896484375, "step": 3779} {"info/global_step": 3780, "train_info/time_within_train_step": 2.756223440170288, "step": 3780} {"train_info/time_between_train_steps": 0.003373861312866211, "step": 3780} {"info/global_step": 3781, "train_info/time_within_train_step": 2.756314754486084, "step": 3781} {"train_info/time_between_train_steps": 0.0033097267150878906, "step": 3781} {"info/global_step": 3782, "train_info/time_within_train_step": 2.7558836936950684, "step": 3782} {"train_info/time_between_train_steps": 0.003331422805786133, "step": 3782} {"info/global_step": 3783, "train_info/time_within_train_step": 2.7548580169677734, "step": 3783} {"train_info/time_between_train_steps": 0.0033044815063476562, "step": 3783} {"info/global_step": 3784, "train_info/time_within_train_step": 2.7534525394439697, "step": 3784} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 3784} {"info/global_step": 3785, "train_info/time_within_train_step": 2.7539992332458496, "step": 3785} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 3785} {"info/global_step": 3786, "train_info/time_within_train_step": 2.7531392574310303, "step": 3786} {"train_info/time_between_train_steps": 0.0031659603118896484, "step": 3786} {"info/global_step": 3787, "train_info/time_within_train_step": 2.754629135131836, "step": 3787} {"train_info/time_between_train_steps": 0.1478900909423828, "step": 3787} {"info/global_step": 3788, "train_info/time_within_train_step": 2.7728936672210693, "step": 3788} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 3788} {"info/global_step": 3789, "train_info/time_within_train_step": 2.762603282928467, "step": 3789} {"train_info/time_between_train_steps": 0.003208160400390625, "step": 3789} {"info/global_step": 3790, "train_info/time_within_train_step": 2.755366563796997, "step": 3790} {"train_info/time_between_train_steps": 0.003197908401489258, "step": 3790} {"info/global_step": 3791, "train_info/time_within_train_step": 2.7583820819854736, "step": 3791} {"train_info/time_between_train_steps": 0.0033559799194335938, "step": 3791} {"info/global_step": 3792, "train_info/time_within_train_step": 2.7564306259155273, "step": 3792} {"train_info/time_between_train_steps": 0.003319978713989258, "step": 3792} {"info/global_step": 3793, "train_info/time_within_train_step": 2.7561020851135254, "step": 3793} {"train_info/time_between_train_steps": 0.003343820571899414, "step": 3793} {"info/global_step": 3794, "train_info/time_within_train_step": 2.75665545463562, "step": 3794} {"train_info/time_between_train_steps": 0.0033445358276367188, "step": 3794} {"info/global_step": 3795, "train_info/time_within_train_step": 2.7555341720581055, "step": 3795} {"train_info/time_between_train_steps": 0.003336668014526367, "step": 3795} {"info/global_step": 3796, "train_info/time_within_train_step": 2.7559192180633545, "step": 3796} {"train_info/time_between_train_steps": 0.0033469200134277344, "step": 3796} {"info/global_step": 3797, "train_info/time_within_train_step": 2.7561192512512207, "step": 3797} {"train_info/time_between_train_steps": 0.0033211708068847656, "step": 3797} {"info/global_step": 3798, "train_info/time_within_train_step": 2.7563397884368896, "step": 3798} {"train_info/time_between_train_steps": 0.0033338069915771484, "step": 3798} {"info/global_step": 3799, "train_info/time_within_train_step": 2.755587100982666, "step": 3799} {"train_info/time_between_train_steps": 0.003343343734741211, "step": 3799} {"info/global_step": 3800, "train_info/time_within_train_step": 2.755960702896118, "step": 3800} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746577039, "_runtime": 11048}, "step": 3800} {"logs": {"train/loss": 3.8765, "train/learning_rate": 0.0004133333333333333, "train/epoch": 4.04, "_timestamp": 1746577039, "_runtime": 11048}, "step": 3800} {"train_info/time_between_train_steps": 19.70453977584839, "step": 3800} {"info/global_step": 3801, "train_info/time_within_train_step": 2.527770757675171, "step": 3801} {"train_info/time_between_train_steps": 0.003374814987182617, "step": 3801} {"info/global_step": 3802, "train_info/time_within_train_step": 2.6054563522338867, "step": 3802} {"train_info/time_between_train_steps": 0.0033376216888427734, "step": 3802} {"info/global_step": 3803, "train_info/time_within_train_step": 2.712095022201538, "step": 3803} {"train_info/time_between_train_steps": 0.0033423900604248047, "step": 3803} {"info/global_step": 3804, "train_info/time_within_train_step": 2.749807596206665, "step": 3804} {"train_info/time_between_train_steps": 0.0033893585205078125, "step": 3804} {"info/global_step": 3805, "train_info/time_within_train_step": 3.00484037399292, "step": 3805} {"train_info/time_between_train_steps": 0.0031478404998779297, "step": 3805} {"info/global_step": 3806, "train_info/time_within_train_step": 2.7549586296081543, "step": 3806} {"train_info/time_between_train_steps": 0.0031769275665283203, "step": 3806} {"info/global_step": 3807, "train_info/time_within_train_step": 2.7557713985443115, "step": 3807} {"train_info/time_between_train_steps": 0.0035805702209472656, "step": 3807} {"info/global_step": 3808, "train_info/time_within_train_step": 2.7550854682922363, "step": 3808} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 3808} {"info/global_step": 3809, "train_info/time_within_train_step": 2.7559735774993896, "step": 3809} {"train_info/time_between_train_steps": 0.003305673599243164, "step": 3809} {"info/global_step": 3810, "train_info/time_within_train_step": 2.7565431594848633, "step": 3810} {"train_info/time_between_train_steps": 0.0032596588134765625, "step": 3810} {"info/global_step": 3811, "train_info/time_within_train_step": 2.7554337978363037, "step": 3811} {"train_info/time_between_train_steps": 0.0032694339752197266, "step": 3811} {"info/global_step": 3812, "train_info/time_within_train_step": 2.756051540374756, "step": 3812} {"train_info/time_between_train_steps": 0.0032758712768554688, "step": 3812} {"info/global_step": 3813, "train_info/time_within_train_step": 2.757297992706299, "step": 3813} {"train_info/time_between_train_steps": 0.0032694339752197266, "step": 3813} {"info/global_step": 3814, "train_info/time_within_train_step": 2.7563390731811523, "step": 3814} {"train_info/time_between_train_steps": 0.0032498836517333984, "step": 3814} {"info/global_step": 3815, "train_info/time_within_train_step": 2.755493640899658, "step": 3815} {"train_info/time_between_train_steps": 0.0032224655151367188, "step": 3815} {"info/global_step": 3816, "train_info/time_within_train_step": 2.7554116249084473, "step": 3816} {"train_info/time_between_train_steps": 0.0032083988189697266, "step": 3816} {"info/global_step": 3817, "train_info/time_within_train_step": 2.756967067718506, "step": 3817} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 3817} {"info/global_step": 3818, "train_info/time_within_train_step": 2.7568020820617676, "step": 3818} {"train_info/time_between_train_steps": 0.0032253265380859375, "step": 3818} {"info/global_step": 3819, "train_info/time_within_train_step": 2.756768226623535, "step": 3819} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 3819} {"info/global_step": 3820, "train_info/time_within_train_step": 2.756807327270508, "step": 3820} {"train_info/time_between_train_steps": 0.00323486328125, "step": 3820} {"info/global_step": 3821, "train_info/time_within_train_step": 2.755805492401123, "step": 3821} {"train_info/time_between_train_steps": 0.003229379653930664, "step": 3821} {"info/global_step": 3822, "train_info/time_within_train_step": 2.7562015056610107, "step": 3822} {"train_info/time_between_train_steps": 0.003303050994873047, "step": 3822} {"info/global_step": 3823, "train_info/time_within_train_step": 2.7563228607177734, "step": 3823} {"train_info/time_between_train_steps": 0.0032231807708740234, "step": 3823} {"info/global_step": 3824, "train_info/time_within_train_step": 2.756042003631592, "step": 3824} {"train_info/time_between_train_steps": 0.003290891647338867, "step": 3824} {"info/global_step": 3825, "train_info/time_within_train_step": 2.7562618255615234, "step": 3825} {"train_info/time_between_train_steps": 0.003298044204711914, "step": 3825} {"info/global_step": 3826, "train_info/time_within_train_step": 2.757188558578491, "step": 3826} {"train_info/time_between_train_steps": 0.0033121109008789062, "step": 3826} {"info/global_step": 3827, "train_info/time_within_train_step": 2.7545506954193115, "step": 3827} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 3827} {"info/global_step": 3828, "train_info/time_within_train_step": 2.755417823791504, "step": 3828} {"train_info/time_between_train_steps": 0.0032453536987304688, "step": 3828} {"info/global_step": 3829, "train_info/time_within_train_step": 2.755343198776245, "step": 3829} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 3829} {"info/global_step": 3830, "train_info/time_within_train_step": 2.7549493312835693, "step": 3830} {"train_info/time_between_train_steps": 0.003261566162109375, "step": 3830} {"info/global_step": 3831, "train_info/time_within_train_step": 2.755904197692871, "step": 3831} {"train_info/time_between_train_steps": 0.0032150745391845703, "step": 3831} {"info/global_step": 3832, "train_info/time_within_train_step": 2.7562005519866943, "step": 3832} {"train_info/time_between_train_steps": 0.0032913684844970703, "step": 3832} {"info/global_step": 3833, "train_info/time_within_train_step": 2.7553598880767822, "step": 3833} {"train_info/time_between_train_steps": 0.003325223922729492, "step": 3833} {"info/global_step": 3834, "train_info/time_within_train_step": 2.7546815872192383, "step": 3834} {"train_info/time_between_train_steps": 0.0032694339752197266, "step": 3834} {"info/global_step": 3835, "train_info/time_within_train_step": 2.755504608154297, "step": 3835} {"train_info/time_between_train_steps": 0.003328561782836914, "step": 3835} {"info/global_step": 3836, "train_info/time_within_train_step": 2.756312370300293, "step": 3836} {"train_info/time_between_train_steps": 0.0032329559326171875, "step": 3836} {"info/global_step": 3837, "train_info/time_within_train_step": 2.7546157836914062, "step": 3837} {"train_info/time_between_train_steps": 0.003240346908569336, "step": 3837} {"info/global_step": 3838, "train_info/time_within_train_step": 2.75414776802063, "step": 3838} {"train_info/time_between_train_steps": 0.003258943557739258, "step": 3838} {"info/global_step": 3839, "train_info/time_within_train_step": 2.7548367977142334, "step": 3839} {"train_info/time_between_train_steps": 0.0031473636627197266, "step": 3839} {"info/global_step": 3840, "train_info/time_within_train_step": 2.753911018371582, "step": 3840} {"train_info/time_between_train_steps": 0.0032079219818115234, "step": 3840} {"info/global_step": 3841, "train_info/time_within_train_step": 2.7559292316436768, "step": 3841} {"train_info/time_between_train_steps": 0.003220796585083008, "step": 3841} {"info/global_step": 3842, "train_info/time_within_train_step": 2.7554047107696533, "step": 3842} {"train_info/time_between_train_steps": 0.0032434463500976562, "step": 3842} {"info/global_step": 3843, "train_info/time_within_train_step": 2.7548165321350098, "step": 3843} {"train_info/time_between_train_steps": 0.003243684768676758, "step": 3843} {"info/global_step": 3844, "train_info/time_within_train_step": 2.7538938522338867, "step": 3844} {"train_info/time_between_train_steps": 0.0033349990844726562, "step": 3844} {"info/global_step": 3845, "train_info/time_within_train_step": 2.7542028427124023, "step": 3845} {"train_info/time_between_train_steps": 0.0032002925872802734, "step": 3845} {"info/global_step": 3846, "train_info/time_within_train_step": 2.755596876144409, "step": 3846} {"train_info/time_between_train_steps": 0.003297090530395508, "step": 3846} {"info/global_step": 3847, "train_info/time_within_train_step": 2.7557485103607178, "step": 3847} {"train_info/time_between_train_steps": 0.003204345703125, "step": 3847} {"info/global_step": 3848, "train_info/time_within_train_step": 2.7561235427856445, "step": 3848} {"train_info/time_between_train_steps": 0.003443479537963867, "step": 3848} {"info/global_step": 3849, "train_info/time_within_train_step": 2.7573904991149902, "step": 3849} {"train_info/time_between_train_steps": 0.0033690929412841797, "step": 3849} {"info/global_step": 3850, "train_info/time_within_train_step": 2.918703556060791, "step": 3850} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746577197, "_runtime": 11206}, "step": 3850} {"logs": {"train/loss": 3.8536, "train/learning_rate": 0.00041, "train/epoch": 4.04, "_timestamp": 1746577197, "_runtime": 11206}, "step": 3850} {"train_info/time_between_train_steps": 0.01334524154663086, "step": 3850} {"info/global_step": 3851, "train_info/time_within_train_step": 2.7585134506225586, "step": 3851} {"train_info/time_between_train_steps": 0.0034432411193847656, "step": 3851} {"info/global_step": 3852, "train_info/time_within_train_step": 2.7569520473480225, "step": 3852} {"train_info/time_between_train_steps": 0.003343343734741211, "step": 3852} {"info/global_step": 3853, "train_info/time_within_train_step": 2.757059335708618, "step": 3853} {"train_info/time_between_train_steps": 0.0033757686614990234, "step": 3853} {"info/global_step": 3854, "train_info/time_within_train_step": 2.7555603981018066, "step": 3854} {"train_info/time_between_train_steps": 0.0033566951751708984, "step": 3854} {"info/global_step": 3855, "train_info/time_within_train_step": 2.7568678855895996, "step": 3855} {"train_info/time_between_train_steps": 0.003403186798095703, "step": 3855} {"info/global_step": 3856, "train_info/time_within_train_step": 2.756075143814087, "step": 3856} {"train_info/time_between_train_steps": 0.0041654109954833984, "step": 3856} {"info/global_step": 3857, "train_info/time_within_train_step": 2.755988836288452, "step": 3857} {"train_info/time_between_train_steps": 0.003370523452758789, "step": 3857} {"info/global_step": 3858, "train_info/time_within_train_step": 2.755927324295044, "step": 3858} {"train_info/time_between_train_steps": 0.0033674240112304688, "step": 3858} {"info/global_step": 3859, "train_info/time_within_train_step": 2.755366325378418, "step": 3859} {"train_info/time_between_train_steps": 0.003340482711791992, "step": 3859} {"info/global_step": 3860, "train_info/time_within_train_step": 3.0380287170410156, "step": 3860} {"train_info/time_between_train_steps": 0.003355264663696289, "step": 3860} {"info/global_step": 3861, "train_info/time_within_train_step": 2.7558305263519287, "step": 3861} {"train_info/time_between_train_steps": 0.003351449966430664, "step": 3861} {"info/global_step": 3862, "train_info/time_within_train_step": 2.7552292346954346, "step": 3862} {"train_info/time_between_train_steps": 0.0033326148986816406, "step": 3862} {"info/global_step": 3863, "train_info/time_within_train_step": 2.7544665336608887, "step": 3863} {"train_info/time_between_train_steps": 0.003175973892211914, "step": 3863} {"info/global_step": 3864, "train_info/time_within_train_step": 2.7542738914489746, "step": 3864} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 3864} {"info/global_step": 3865, "train_info/time_within_train_step": 2.754861831665039, "step": 3865} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 3865} {"info/global_step": 3866, "train_info/time_within_train_step": 2.754925489425659, "step": 3866} {"train_info/time_between_train_steps": 0.003224611282348633, "step": 3866} {"info/global_step": 3867, "train_info/time_within_train_step": 2.7560503482818604, "step": 3867} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 3867} {"info/global_step": 3868, "train_info/time_within_train_step": 2.755005359649658, "step": 3868} {"train_info/time_between_train_steps": 0.003204345703125, "step": 3868} {"info/global_step": 3869, "train_info/time_within_train_step": 2.7554564476013184, "step": 3869} {"train_info/time_between_train_steps": 0.003191232681274414, "step": 3869} {"info/global_step": 3870, "train_info/time_within_train_step": 2.754894733428955, "step": 3870} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 3870} {"info/global_step": 3871, "train_info/time_within_train_step": 2.75439190864563, "step": 3871} {"train_info/time_between_train_steps": 0.0031638145446777344, "step": 3871} {"info/global_step": 3872, "train_info/time_within_train_step": 2.755420446395874, "step": 3872} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 3872} {"info/global_step": 3873, "train_info/time_within_train_step": 2.7547760009765625, "step": 3873} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 3873} {"info/global_step": 3874, "train_info/time_within_train_step": 2.7542879581451416, "step": 3874} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 3874} {"info/global_step": 3875, "train_info/time_within_train_step": 2.7547447681427, "step": 3875} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 3875} {"info/global_step": 3876, "train_info/time_within_train_step": 2.754837989807129, "step": 3876} {"train_info/time_between_train_steps": 0.0031561851501464844, "step": 3876} {"info/global_step": 3877, "train_info/time_within_train_step": 2.7533576488494873, "step": 3877} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 3877} {"info/global_step": 3878, "train_info/time_within_train_step": 2.7549521923065186, "step": 3878} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 3878} {"info/global_step": 3879, "train_info/time_within_train_step": 2.7549116611480713, "step": 3879} {"train_info/time_between_train_steps": 0.003235340118408203, "step": 3879} {"info/global_step": 3880, "train_info/time_within_train_step": 2.754655122756958, "step": 3880} {"train_info/time_between_train_steps": 0.0032181739807128906, "step": 3880} {"info/global_step": 3881, "train_info/time_within_train_step": 2.7555484771728516, "step": 3881} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 3881} {"info/global_step": 3882, "train_info/time_within_train_step": 2.755077600479126, "step": 3882} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 3882} {"info/global_step": 3883, "train_info/time_within_train_step": 2.7557373046875, "step": 3883} {"train_info/time_between_train_steps": 0.003237009048461914, "step": 3883} {"info/global_step": 3884, "train_info/time_within_train_step": 2.7546753883361816, "step": 3884} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 3884} {"info/global_step": 3885, "train_info/time_within_train_step": 2.754662036895752, "step": 3885} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 3885} {"info/global_step": 3886, "train_info/time_within_train_step": 2.7560031414031982, "step": 3886} {"train_info/time_between_train_steps": 0.003370523452758789, "step": 3886} {"info/global_step": 3887, "train_info/time_within_train_step": 2.755647659301758, "step": 3887} {"train_info/time_between_train_steps": 0.0032515525817871094, "step": 3887} {"info/global_step": 3888, "train_info/time_within_train_step": 2.7559473514556885, "step": 3888} {"train_info/time_between_train_steps": 0.0032117366790771484, "step": 3888} {"info/global_step": 3889, "train_info/time_within_train_step": 2.7541534900665283, "step": 3889} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 3889} {"info/global_step": 3890, "train_info/time_within_train_step": 2.754906177520752, "step": 3890} {"train_info/time_between_train_steps": 0.0032355785369873047, "step": 3890} {"info/global_step": 3891, "train_info/time_within_train_step": 2.754986047744751, "step": 3891} {"train_info/time_between_train_steps": 0.003177165985107422, "step": 3891} {"info/global_step": 3892, "train_info/time_within_train_step": 2.7546002864837646, "step": 3892} {"train_info/time_between_train_steps": 0.0032753944396972656, "step": 3892} {"info/global_step": 3893, "train_info/time_within_train_step": 2.7555079460144043, "step": 3893} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 3893} {"info/global_step": 3894, "train_info/time_within_train_step": 2.754579544067383, "step": 3894} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 3894} {"info/global_step": 3895, "train_info/time_within_train_step": 2.754143476486206, "step": 3895} {"train_info/time_between_train_steps": 0.003228902816772461, "step": 3895} {"info/global_step": 3896, "train_info/time_within_train_step": 2.752006769180298, "step": 3896} {"train_info/time_between_train_steps": 0.0032227039337158203, "step": 3896} {"info/global_step": 3897, "train_info/time_within_train_step": 2.7548179626464844, "step": 3897} {"train_info/time_between_train_steps": 0.0032415390014648438, "step": 3897} {"info/global_step": 3898, "train_info/time_within_train_step": 2.755363702774048, "step": 3898} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 3898} {"info/global_step": 3899, "train_info/time_within_train_step": 2.754072666168213, "step": 3899} {"train_info/time_between_train_steps": 0.0032143592834472656, "step": 3899} {"info/global_step": 3900, "train_info/time_within_train_step": 3.044452428817749, "step": 3900} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746577336, "_runtime": 11345}, "step": 3900} {"logs": {"train/loss": 3.8509, "train/learning_rate": 0.00040666666666666667, "train/epoch": 4.05, "_timestamp": 1746577336, "_runtime": 11345}, "step": 3900} {"train_info/time_between_train_steps": 0.013185501098632812, "step": 3900} {"info/global_step": 3901, "train_info/time_within_train_step": 2.7554636001586914, "step": 3901} {"train_info/time_between_train_steps": 0.003351449966430664, "step": 3901} {"info/global_step": 3902, "train_info/time_within_train_step": 2.7550559043884277, "step": 3902} {"train_info/time_between_train_steps": 0.0033311843872070312, "step": 3902} {"info/global_step": 3903, "train_info/time_within_train_step": 2.7554593086242676, "step": 3903} {"train_info/time_between_train_steps": 0.0033257007598876953, "step": 3903} {"info/global_step": 3904, "train_info/time_within_train_step": 2.7561750411987305, "step": 3904} {"train_info/time_between_train_steps": 0.003359079360961914, "step": 3904} {"info/global_step": 3905, "train_info/time_within_train_step": 2.7563023567199707, "step": 3905} {"train_info/time_between_train_steps": 0.0034720897674560547, "step": 3905} {"info/global_step": 3906, "train_info/time_within_train_step": 2.7556538581848145, "step": 3906} {"train_info/time_between_train_steps": 0.0034821033477783203, "step": 3906} {"info/global_step": 3907, "train_info/time_within_train_step": 2.7560923099517822, "step": 3907} {"train_info/time_between_train_steps": 0.003459453582763672, "step": 3907} {"info/global_step": 3908, "train_info/time_within_train_step": 2.7551987171173096, "step": 3908} {"train_info/time_between_train_steps": 0.0034291744232177734, "step": 3908} {"info/global_step": 3909, "train_info/time_within_train_step": 2.7547976970672607, "step": 3909} {"train_info/time_between_train_steps": 0.003377199172973633, "step": 3909} {"info/global_step": 3910, "train_info/time_within_train_step": 2.7555065155029297, "step": 3910} {"train_info/time_between_train_steps": 0.003412961959838867, "step": 3910} {"info/global_step": 3911, "train_info/time_within_train_step": 2.755760431289673, "step": 3911} {"train_info/time_between_train_steps": 0.003365755081176758, "step": 3911} {"info/global_step": 3912, "train_info/time_within_train_step": 2.7548208236694336, "step": 3912} {"train_info/time_between_train_steps": 0.10083723068237305, "step": 3912} {"info/global_step": 3913, "train_info/time_within_train_step": 2.755689859390259, "step": 3913} {"train_info/time_between_train_steps": 0.003371000289916992, "step": 3913} {"info/global_step": 3914, "train_info/time_within_train_step": 2.757256031036377, "step": 3914} {"train_info/time_between_train_steps": 0.0034284591674804688, "step": 3914} {"info/global_step": 3915, "train_info/time_within_train_step": 2.755803346633911, "step": 3915} {"train_info/time_between_train_steps": 0.003373861312866211, "step": 3915} {"info/global_step": 3916, "train_info/time_within_train_step": 2.7579963207244873, "step": 3916} {"train_info/time_between_train_steps": 0.0033690929412841797, "step": 3916} {"info/global_step": 3917, "train_info/time_within_train_step": 2.7586429119110107, "step": 3917} {"train_info/time_between_train_steps": 0.0034470558166503906, "step": 3917} {"info/global_step": 3918, "train_info/time_within_train_step": 2.7569596767425537, "step": 3918} {"train_info/time_between_train_steps": 0.0033507347106933594, "step": 3918} {"info/global_step": 3919, "train_info/time_within_train_step": 2.7812726497650146, "step": 3919} {"train_info/time_between_train_steps": 0.0033338069915771484, "step": 3919} {"info/global_step": 3920, "train_info/time_within_train_step": 2.7568955421447754, "step": 3920} {"train_info/time_between_train_steps": 0.0034089088439941406, "step": 3920} {"info/global_step": 3921, "train_info/time_within_train_step": 2.754772424697876, "step": 3921} {"train_info/time_between_train_steps": 0.0034241676330566406, "step": 3921} {"info/global_step": 3922, "train_info/time_within_train_step": 2.7562639713287354, "step": 3922} {"train_info/time_between_train_steps": 0.0033288002014160156, "step": 3922} {"info/global_step": 3923, "train_info/time_within_train_step": 2.755678653717041, "step": 3923} {"train_info/time_between_train_steps": 0.0033826828002929688, "step": 3923} {"info/global_step": 3924, "train_info/time_within_train_step": 2.755026340484619, "step": 3924} {"train_info/time_between_train_steps": 0.0033948421478271484, "step": 3924} {"info/global_step": 3925, "train_info/time_within_train_step": 2.7558400630950928, "step": 3925} {"train_info/time_between_train_steps": 0.0033838748931884766, "step": 3925} {"info/global_step": 3926, "train_info/time_within_train_step": 2.756441116333008, "step": 3926} {"train_info/time_between_train_steps": 0.0033617019653320312, "step": 3926} {"info/global_step": 3927, "train_info/time_within_train_step": 2.755863666534424, "step": 3927} {"train_info/time_between_train_steps": 0.0033407211303710938, "step": 3927} {"info/global_step": 3928, "train_info/time_within_train_step": 2.7540721893310547, "step": 3928} {"train_info/time_between_train_steps": 0.003370523452758789, "step": 3928} {"info/global_step": 3929, "train_info/time_within_train_step": 2.7523059844970703, "step": 3929} {"train_info/time_between_train_steps": 0.003404855728149414, "step": 3929} {"info/global_step": 3930, "train_info/time_within_train_step": 2.7547590732574463, "step": 3930} {"train_info/time_between_train_steps": 0.0033452510833740234, "step": 3930} {"info/global_step": 3931, "train_info/time_within_train_step": 2.7554373741149902, "step": 3931} {"train_info/time_between_train_steps": 0.003376483917236328, "step": 3931} {"info/global_step": 3932, "train_info/time_within_train_step": 2.7551589012145996, "step": 3932} {"train_info/time_between_train_steps": 0.0034151077270507812, "step": 3932} {"info/global_step": 3933, "train_info/time_within_train_step": 2.7566256523132324, "step": 3933} {"train_info/time_between_train_steps": 0.0033643245697021484, "step": 3933} {"info/global_step": 3934, "train_info/time_within_train_step": 2.755095958709717, "step": 3934} {"train_info/time_between_train_steps": 0.0033478736877441406, "step": 3934} {"info/global_step": 3935, "train_info/time_within_train_step": 2.756253480911255, "step": 3935} {"train_info/time_between_train_steps": 0.003343820571899414, "step": 3935} {"info/global_step": 3936, "train_info/time_within_train_step": 2.75738525390625, "step": 3936} {"train_info/time_between_train_steps": 0.0033562183380126953, "step": 3936} {"info/global_step": 3937, "train_info/time_within_train_step": 2.7554099559783936, "step": 3937} {"train_info/time_between_train_steps": 0.003387451171875, "step": 3937} {"info/global_step": 3938, "train_info/time_within_train_step": 2.756101369857788, "step": 3938} {"train_info/time_between_train_steps": 0.003355264663696289, "step": 3938} {"info/global_step": 3939, "train_info/time_within_train_step": 2.7551562786102295, "step": 3939} {"train_info/time_between_train_steps": 0.003355741500854492, "step": 3939} {"info/global_step": 3940, "train_info/time_within_train_step": 3.038551092147827, "step": 3940} {"train_info/time_between_train_steps": 0.0034520626068115234, "step": 3940} {"info/global_step": 3941, "train_info/time_within_train_step": 2.7548182010650635, "step": 3941} {"train_info/time_between_train_steps": 0.003340005874633789, "step": 3941} {"info/global_step": 3942, "train_info/time_within_train_step": 2.7553422451019287, "step": 3942} {"train_info/time_between_train_steps": 0.003330230712890625, "step": 3942} {"info/global_step": 3943, "train_info/time_within_train_step": 2.756636142730713, "step": 3943} {"train_info/time_between_train_steps": 0.0034613609313964844, "step": 3943} {"info/global_step": 3944, "train_info/time_within_train_step": 2.754699230194092, "step": 3944} {"train_info/time_between_train_steps": 0.003206014633178711, "step": 3944} {"info/global_step": 3945, "train_info/time_within_train_step": 2.7540810108184814, "step": 3945} {"train_info/time_between_train_steps": 0.004026174545288086, "step": 3945} {"info/global_step": 3946, "train_info/time_within_train_step": 2.753753662109375, "step": 3946} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 3946} {"info/global_step": 3947, "train_info/time_within_train_step": 2.7544612884521484, "step": 3947} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 3947} {"info/global_step": 3948, "train_info/time_within_train_step": 2.75476336479187, "step": 3948} {"train_info/time_between_train_steps": 0.003233671188354492, "step": 3948} {"info/global_step": 3949, "train_info/time_within_train_step": 2.754244327545166, "step": 3949} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 3949} {"info/global_step": 3950, "train_info/time_within_train_step": 2.7544667720794678, "step": 3950} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746577475, "_runtime": 11484}, "step": 3950} {"logs": {"train/loss": 3.8418, "train/learning_rate": 0.00040333333333333334, "train/epoch": 4.05, "_timestamp": 1746577475, "_runtime": 11484}, "step": 3950} {"train_info/time_between_train_steps": 0.013407468795776367, "step": 3950} {"info/global_step": 3951, "train_info/time_within_train_step": 2.7566964626312256, "step": 3951} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 3951} {"info/global_step": 3952, "train_info/time_within_train_step": 2.7555906772613525, "step": 3952} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 3952} {"info/global_step": 3953, "train_info/time_within_train_step": 2.7544150352478027, "step": 3953} {"train_info/time_between_train_steps": 0.01994490623474121, "step": 3953} {"info/global_step": 3954, "train_info/time_within_train_step": 2.7535829544067383, "step": 3954} {"train_info/time_between_train_steps": 0.002897500991821289, "step": 3954} {"info/global_step": 3955, "train_info/time_within_train_step": 2.7536280155181885, "step": 3955} {"train_info/time_between_train_steps": 0.0028793811798095703, "step": 3955} {"info/global_step": 3956, "train_info/time_within_train_step": 2.7537147998809814, "step": 3956} {"train_info/time_between_train_steps": 0.0028810501098632812, "step": 3956} {"info/global_step": 3957, "train_info/time_within_train_step": 2.7547245025634766, "step": 3957} {"train_info/time_between_train_steps": 0.0030241012573242188, "step": 3957} {"info/global_step": 3958, "train_info/time_within_train_step": 2.755620241165161, "step": 3958} {"train_info/time_between_train_steps": 0.0029535293579101562, "step": 3958} {"info/global_step": 3959, "train_info/time_within_train_step": 2.753929853439331, "step": 3959} {"train_info/time_between_train_steps": 0.002998828887939453, "step": 3959} {"info/global_step": 3960, "train_info/time_within_train_step": 2.7550032138824463, "step": 3960} {"train_info/time_between_train_steps": 0.0029587745666503906, "step": 3960} {"info/global_step": 3961, "train_info/time_within_train_step": 2.7540805339813232, "step": 3961} {"train_info/time_between_train_steps": 0.003011941909790039, "step": 3961} {"info/global_step": 3962, "train_info/time_within_train_step": 2.7555932998657227, "step": 3962} {"train_info/time_between_train_steps": 0.0029435157775878906, "step": 3962} {"info/global_step": 3963, "train_info/time_within_train_step": 2.754807949066162, "step": 3963} {"train_info/time_between_train_steps": 0.003030538558959961, "step": 3963} {"info/global_step": 3964, "train_info/time_within_train_step": 2.7553658485412598, "step": 3964} {"train_info/time_between_train_steps": 0.003009796142578125, "step": 3964} {"info/global_step": 3965, "train_info/time_within_train_step": 2.754852771759033, "step": 3965} {"train_info/time_between_train_steps": 0.0029616355895996094, "step": 3965} {"info/global_step": 3966, "train_info/time_within_train_step": 2.755183219909668, "step": 3966} {"train_info/time_between_train_steps": 0.0030145645141601562, "step": 3966} {"info/global_step": 3967, "train_info/time_within_train_step": 2.7539188861846924, "step": 3967} {"train_info/time_between_train_steps": 0.0029408931732177734, "step": 3967} {"info/global_step": 3968, "train_info/time_within_train_step": 2.7539432048797607, "step": 3968} {"train_info/time_between_train_steps": 0.0029418468475341797, "step": 3968} {"info/global_step": 3969, "train_info/time_within_train_step": 2.756399154663086, "step": 3969} {"train_info/time_between_train_steps": 0.002956390380859375, "step": 3969} {"info/global_step": 3970, "train_info/time_within_train_step": 2.7562415599823, "step": 3970} {"train_info/time_between_train_steps": 0.0029745101928710938, "step": 3970} {"info/global_step": 3971, "train_info/time_within_train_step": 2.7553014755249023, "step": 3971} {"train_info/time_between_train_steps": 0.003011941909790039, "step": 3971} {"info/global_step": 3972, "train_info/time_within_train_step": 2.7556560039520264, "step": 3972} {"train_info/time_between_train_steps": 0.003039121627807617, "step": 3972} {"info/global_step": 3973, "train_info/time_within_train_step": 2.7561194896698, "step": 3973} {"train_info/time_between_train_steps": 0.003130197525024414, "step": 3973} {"info/global_step": 3974, "train_info/time_within_train_step": 2.7559077739715576, "step": 3974} {"train_info/time_between_train_steps": 0.002978086471557617, "step": 3974} {"info/global_step": 3975, "train_info/time_within_train_step": 2.7549030780792236, "step": 3975} {"train_info/time_between_train_steps": 0.0029592514038085938, "step": 3975} {"info/global_step": 3976, "train_info/time_within_train_step": 2.7552430629730225, "step": 3976} {"train_info/time_between_train_steps": 0.0029556751251220703, "step": 3976} {"info/global_step": 3977, "train_info/time_within_train_step": 2.75480318069458, "step": 3977} {"train_info/time_between_train_steps": 0.0029973983764648438, "step": 3977} {"info/global_step": 3978, "train_info/time_within_train_step": 2.7551698684692383, "step": 3978} {"train_info/time_between_train_steps": 0.0029473304748535156, "step": 3978} {"info/global_step": 3979, "train_info/time_within_train_step": 2.7528443336486816, "step": 3979} {"train_info/time_between_train_steps": 0.0029473304748535156, "step": 3979} {"info/global_step": 3980, "train_info/time_within_train_step": 2.754490613937378, "step": 3980} {"train_info/time_between_train_steps": 0.002997875213623047, "step": 3980} {"info/global_step": 3981, "train_info/time_within_train_step": 2.753836154937744, "step": 3981} {"train_info/time_between_train_steps": 0.002841472625732422, "step": 3981} {"info/global_step": 3982, "train_info/time_within_train_step": 2.7546133995056152, "step": 3982} {"train_info/time_between_train_steps": 0.002881288528442383, "step": 3982} {"info/global_step": 3983, "train_info/time_within_train_step": 2.753617525100708, "step": 3983} {"train_info/time_between_train_steps": 0.0029053688049316406, "step": 3983} {"info/global_step": 3984, "train_info/time_within_train_step": 2.754577875137329, "step": 3984} {"train_info/time_between_train_steps": 0.0028879642486572266, "step": 3984} {"info/global_step": 3985, "train_info/time_within_train_step": 2.754150152206421, "step": 3985} {"train_info/time_between_train_steps": 0.0028710365295410156, "step": 3985} {"info/global_step": 3986, "train_info/time_within_train_step": 2.7544820308685303, "step": 3986} {"train_info/time_between_train_steps": 0.002885103225708008, "step": 3986} {"info/global_step": 3987, "train_info/time_within_train_step": 2.7552437782287598, "step": 3987} {"train_info/time_between_train_steps": 0.0028612613677978516, "step": 3987} {"info/global_step": 3988, "train_info/time_within_train_step": 2.7547121047973633, "step": 3988} {"train_info/time_between_train_steps": 0.0028862953186035156, "step": 3988} {"info/global_step": 3989, "train_info/time_within_train_step": 2.754009485244751, "step": 3989} {"train_info/time_between_train_steps": 0.002909421920776367, "step": 3989} {"info/global_step": 3990, "train_info/time_within_train_step": 2.755321741104126, "step": 3990} {"train_info/time_between_train_steps": 0.002859354019165039, "step": 3990} {"info/global_step": 3991, "train_info/time_within_train_step": 2.7536706924438477, "step": 3991} {"train_info/time_between_train_steps": 0.0029163360595703125, "step": 3991} {"info/global_step": 3992, "train_info/time_within_train_step": 2.7534985542297363, "step": 3992} {"train_info/time_between_train_steps": 0.0029413700103759766, "step": 3992} {"info/global_step": 3993, "train_info/time_within_train_step": 2.754457473754883, "step": 3993} {"train_info/time_between_train_steps": 0.0028667449951171875, "step": 3993} {"info/global_step": 3994, "train_info/time_within_train_step": 2.753922939300537, "step": 3994} {"train_info/time_between_train_steps": 0.0030295848846435547, "step": 3994} {"info/global_step": 3995, "train_info/time_within_train_step": 2.7533130645751953, "step": 3995} {"train_info/time_between_train_steps": 0.0029053688049316406, "step": 3995} {"info/global_step": 3996, "train_info/time_within_train_step": 2.754300594329834, "step": 3996} {"train_info/time_between_train_steps": 0.002900838851928711, "step": 3996} {"info/global_step": 3997, "train_info/time_within_train_step": 2.7552173137664795, "step": 3997} {"train_info/time_between_train_steps": 0.0028922557830810547, "step": 3997} {"info/global_step": 3998, "train_info/time_within_train_step": 3.3408823013305664, "step": 3998} {"train_info/time_between_train_steps": 0.002909421920776367, "step": 3998} {"info/global_step": 3999, "train_info/time_within_train_step": 2.754779100418091, "step": 3999} {"train_info/time_between_train_steps": 0.002888917922973633, "step": 3999} {"info/global_step": 4000, "train_info/time_within_train_step": 2.755019187927246, "step": 4000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746577614, "_runtime": 11623}, "step": 4000} {"logs": {"train/loss": 3.8372, "train/learning_rate": 0.00039999999999999996, "train/epoch": 4.06, "_timestamp": 1746577614, "_runtime": 11623}, "step": 4000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746577619, "_runtime": 11628}, "step": 4000} {"logs": {"eval/loss": 4.649745464324951, "eval/runtime": 5.1626, "eval/samples_per_second": 36.803, "eval/steps_per_second": 1.162, "train/epoch": 4.06, "_timestamp": 1746577619, "_runtime": 11628}, "step": 4000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746577619, "_runtime": 11628}, "step": 4000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.649745464324951, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 104.55836835487037, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1626, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 36.803, "train/epoch": 4.06, "_timestamp": 1746577619, "_runtime": 11628}, "step": 4000} {"train_info/time_between_train_steps": 24.357934713363647, "step": 4000} {"info/global_step": 4001, "train_info/time_within_train_step": 2.5431156158447266, "step": 4001} {"train_info/time_between_train_steps": 0.0029022693634033203, "step": 4001} {"info/global_step": 4002, "train_info/time_within_train_step": 2.5605692863464355, "step": 4002} {"train_info/time_between_train_steps": 0.0028846263885498047, "step": 4002} {"info/global_step": 4003, "train_info/time_within_train_step": 2.691675901412964, "step": 4003} {"train_info/time_between_train_steps": 0.0029196739196777344, "step": 4003} {"info/global_step": 4004, "train_info/time_within_train_step": 2.749863386154175, "step": 4004} {"train_info/time_between_train_steps": 0.0028879642486572266, "step": 4004} {"info/global_step": 4005, "train_info/time_within_train_step": 2.753871440887451, "step": 4005} {"train_info/time_between_train_steps": 0.0028536319732666016, "step": 4005} {"info/global_step": 4006, "train_info/time_within_train_step": 2.7540621757507324, "step": 4006} {"train_info/time_between_train_steps": 0.002894878387451172, "step": 4006} {"info/global_step": 4007, "train_info/time_within_train_step": 2.7537553310394287, "step": 4007} {"train_info/time_between_train_steps": 0.0028994083404541016, "step": 4007} {"info/global_step": 4008, "train_info/time_within_train_step": 2.753727912902832, "step": 4008} {"train_info/time_between_train_steps": 0.002907991409301758, "step": 4008} {"info/global_step": 4009, "train_info/time_within_train_step": 2.7517294883728027, "step": 4009} {"train_info/time_between_train_steps": 0.002879619598388672, "step": 4009} {"info/global_step": 4010, "train_info/time_within_train_step": 2.754173755645752, "step": 4010} {"train_info/time_between_train_steps": 0.0028848648071289062, "step": 4010} {"info/global_step": 4011, "train_info/time_within_train_step": 2.7535746097564697, "step": 4011} {"train_info/time_between_train_steps": 0.0028913021087646484, "step": 4011} {"info/global_step": 4012, "train_info/time_within_train_step": 2.753725051879883, "step": 4012} {"train_info/time_between_train_steps": 0.002897977828979492, "step": 4012} {"info/global_step": 4013, "train_info/time_within_train_step": 2.7553024291992188, "step": 4013} {"train_info/time_between_train_steps": 0.0028862953186035156, "step": 4013} {"info/global_step": 4014, "train_info/time_within_train_step": 2.754432201385498, "step": 4014} {"train_info/time_between_train_steps": 0.002874612808227539, "step": 4014} {"info/global_step": 4015, "train_info/time_within_train_step": 2.7543857097625732, "step": 4015} {"train_info/time_between_train_steps": 0.0029048919677734375, "step": 4015} {"info/global_step": 4016, "train_info/time_within_train_step": 2.755563974380493, "step": 4016} {"train_info/time_between_train_steps": 0.0028793811798095703, "step": 4016} {"info/global_step": 4017, "train_info/time_within_train_step": 2.75370192527771, "step": 4017} {"train_info/time_between_train_steps": 0.002876758575439453, "step": 4017} {"info/global_step": 4018, "train_info/time_within_train_step": 2.972623109817505, "step": 4018} {"train_info/time_between_train_steps": 0.002911806106567383, "step": 4018} {"info/global_step": 4019, "train_info/time_within_train_step": 2.7550547122955322, "step": 4019} {"train_info/time_between_train_steps": 0.00290679931640625, "step": 4019} {"info/global_step": 4020, "train_info/time_within_train_step": 2.754331588745117, "step": 4020} {"train_info/time_between_train_steps": 0.0029430389404296875, "step": 4020} {"info/global_step": 4021, "train_info/time_within_train_step": 2.7537946701049805, "step": 4021} {"train_info/time_between_train_steps": 0.0028917789459228516, "step": 4021} {"info/global_step": 4022, "train_info/time_within_train_step": 2.7541677951812744, "step": 4022} {"train_info/time_between_train_steps": 0.0029315948486328125, "step": 4022} {"info/global_step": 4023, "train_info/time_within_train_step": 2.754535675048828, "step": 4023} {"train_info/time_between_train_steps": 0.0028791427612304688, "step": 4023} {"info/global_step": 4024, "train_info/time_within_train_step": 2.7533962726593018, "step": 4024} {"train_info/time_between_train_steps": 0.002919912338256836, "step": 4024} {"info/global_step": 4025, "train_info/time_within_train_step": 2.7536933422088623, "step": 4025} {"train_info/time_between_train_steps": 0.0028867721557617188, "step": 4025} {"info/global_step": 4026, "train_info/time_within_train_step": 2.7543959617614746, "step": 4026} {"train_info/time_between_train_steps": 0.002869129180908203, "step": 4026} {"info/global_step": 4027, "train_info/time_within_train_step": 2.7548038959503174, "step": 4027} {"train_info/time_between_train_steps": 0.002898693084716797, "step": 4027} {"info/global_step": 4028, "train_info/time_within_train_step": 2.7552387714385986, "step": 4028} {"train_info/time_between_train_steps": 0.0028967857360839844, "step": 4028} {"info/global_step": 4029, "train_info/time_within_train_step": 2.7527709007263184, "step": 4029} {"train_info/time_between_train_steps": 0.0029020309448242188, "step": 4029} {"info/global_step": 4030, "train_info/time_within_train_step": 2.753619909286499, "step": 4030} {"train_info/time_between_train_steps": 0.002878427505493164, "step": 4030} {"info/global_step": 4031, "train_info/time_within_train_step": 2.7536985874176025, "step": 4031} {"train_info/time_between_train_steps": 0.002918243408203125, "step": 4031} {"info/global_step": 4032, "train_info/time_within_train_step": 2.7546792030334473, "step": 4032} {"train_info/time_between_train_steps": 0.0028870105743408203, "step": 4032} {"info/global_step": 4033, "train_info/time_within_train_step": 2.7545289993286133, "step": 4033} {"train_info/time_between_train_steps": 0.0029146671295166016, "step": 4033} {"info/global_step": 4034, "train_info/time_within_train_step": 2.7551066875457764, "step": 4034} {"train_info/time_between_train_steps": 0.0028815269470214844, "step": 4034} {"info/global_step": 4035, "train_info/time_within_train_step": 2.7560744285583496, "step": 4035} {"train_info/time_between_train_steps": 0.003042936325073242, "step": 4035} {"info/global_step": 4036, "train_info/time_within_train_step": 2.7555108070373535, "step": 4036} {"train_info/time_between_train_steps": 0.002990245819091797, "step": 4036} {"info/global_step": 4037, "train_info/time_within_train_step": 2.7543089389801025, "step": 4037} {"train_info/time_between_train_steps": 0.0028934478759765625, "step": 4037} {"info/global_step": 4038, "train_info/time_within_train_step": 2.7520320415496826, "step": 4038} {"train_info/time_between_train_steps": 0.002884387969970703, "step": 4038} {"info/global_step": 4039, "train_info/time_within_train_step": 2.7537543773651123, "step": 4039} {"train_info/time_between_train_steps": 0.002859830856323242, "step": 4039} {"info/global_step": 4040, "train_info/time_within_train_step": 2.7537729740142822, "step": 4040} {"train_info/time_between_train_steps": 0.0029501914978027344, "step": 4040} {"info/global_step": 4041, "train_info/time_within_train_step": 2.7536051273345947, "step": 4041} {"train_info/time_between_train_steps": 0.003026723861694336, "step": 4041} {"info/global_step": 4042, "train_info/time_within_train_step": 2.754467725753784, "step": 4042} {"train_info/time_between_train_steps": 0.0029718875885009766, "step": 4042} {"info/global_step": 4043, "train_info/time_within_train_step": 2.754715919494629, "step": 4043} {"train_info/time_between_train_steps": 0.0029702186584472656, "step": 4043} {"info/global_step": 4044, "train_info/time_within_train_step": 2.7563133239746094, "step": 4044} {"train_info/time_between_train_steps": 0.003018617630004883, "step": 4044} {"info/global_step": 4045, "train_info/time_within_train_step": 2.7540388107299805, "step": 4045} {"train_info/time_between_train_steps": 0.0028679370880126953, "step": 4045} {"info/global_step": 4046, "train_info/time_within_train_step": 2.753754138946533, "step": 4046} {"train_info/time_between_train_steps": 0.0028793811798095703, "step": 4046} {"info/global_step": 4047, "train_info/time_within_train_step": 2.7536394596099854, "step": 4047} {"train_info/time_between_train_steps": 0.0029015541076660156, "step": 4047} {"info/global_step": 4048, "train_info/time_within_train_step": 2.752450704574585, "step": 4048} {"train_info/time_between_train_steps": 0.002936840057373047, "step": 4048} {"info/global_step": 4049, "train_info/time_within_train_step": 2.753019332885742, "step": 4049} {"train_info/time_between_train_steps": 0.002924203872680664, "step": 4049} {"info/global_step": 4050, "train_info/time_within_train_step": 2.753645658493042, "step": 4050} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746577776, "_runtime": 11785}, "step": 4050} {"logs": {"train/loss": 3.8216, "train/learning_rate": 0.00039666666666666664, "train/epoch": 4.06, "_timestamp": 1746577776, "_runtime": 11785}, "step": 4050} {"train_info/time_between_train_steps": 0.012540102005004883, "step": 4050} {"info/global_step": 4051, "train_info/time_within_train_step": 2.753145217895508, "step": 4051} {"train_info/time_between_train_steps": 0.002846956253051758, "step": 4051} {"info/global_step": 4052, "train_info/time_within_train_step": 2.75304913520813, "step": 4052} {"train_info/time_between_train_steps": 0.0028717517852783203, "step": 4052} {"info/global_step": 4053, "train_info/time_within_train_step": 2.7532875537872314, "step": 4053} {"train_info/time_between_train_steps": 0.0028760433197021484, "step": 4053} {"info/global_step": 4054, "train_info/time_within_train_step": 2.7540831565856934, "step": 4054} {"train_info/time_between_train_steps": 0.002855062484741211, "step": 4054} {"info/global_step": 4055, "train_info/time_within_train_step": 2.7532289028167725, "step": 4055} {"train_info/time_between_train_steps": 0.002930164337158203, "step": 4055} {"info/global_step": 4056, "train_info/time_within_train_step": 2.7516520023345947, "step": 4056} {"train_info/time_between_train_steps": 0.0028963088989257812, "step": 4056} {"info/global_step": 4057, "train_info/time_within_train_step": 2.7545766830444336, "step": 4057} {"train_info/time_between_train_steps": 0.002911090850830078, "step": 4057} {"info/global_step": 4058, "train_info/time_within_train_step": 2.7525064945220947, "step": 4058} {"train_info/time_between_train_steps": 0.0028951168060302734, "step": 4058} {"info/global_step": 4059, "train_info/time_within_train_step": 2.754049301147461, "step": 4059} {"train_info/time_between_train_steps": 0.0028886795043945312, "step": 4059} {"info/global_step": 4060, "train_info/time_within_train_step": 2.753459930419922, "step": 4060} {"train_info/time_between_train_steps": 0.0028836727142333984, "step": 4060} {"info/global_step": 4061, "train_info/time_within_train_step": 2.7520806789398193, "step": 4061} {"train_info/time_between_train_steps": 0.0029213428497314453, "step": 4061} {"info/global_step": 4062, "train_info/time_within_train_step": 2.7514050006866455, "step": 4062} {"train_info/time_between_train_steps": 0.0028650760650634766, "step": 4062} {"info/global_step": 4063, "train_info/time_within_train_step": 2.7530951499938965, "step": 4063} {"train_info/time_between_train_steps": 0.0028793811798095703, "step": 4063} {"info/global_step": 4064, "train_info/time_within_train_step": 2.7518675327301025, "step": 4064} {"train_info/time_between_train_steps": 0.002924203872680664, "step": 4064} {"info/global_step": 4065, "train_info/time_within_train_step": 2.7540369033813477, "step": 4065} {"train_info/time_between_train_steps": 0.0028891563415527344, "step": 4065} {"info/global_step": 4066, "train_info/time_within_train_step": 2.7549350261688232, "step": 4066} {"train_info/time_between_train_steps": 0.0029180049896240234, "step": 4066} {"info/global_step": 4067, "train_info/time_within_train_step": 2.753185272216797, "step": 4067} {"train_info/time_between_train_steps": 0.002925395965576172, "step": 4067} {"info/global_step": 4068, "train_info/time_within_train_step": 2.7513444423675537, "step": 4068} {"train_info/time_between_train_steps": 0.002914905548095703, "step": 4068} {"info/global_step": 4069, "train_info/time_within_train_step": 2.7548413276672363, "step": 4069} {"train_info/time_between_train_steps": 0.002993345260620117, "step": 4069} {"info/global_step": 4070, "train_info/time_within_train_step": 2.7551357746124268, "step": 4070} {"train_info/time_between_train_steps": 0.0029959678649902344, "step": 4070} {"info/global_step": 4071, "train_info/time_within_train_step": 2.755450487136841, "step": 4071} {"train_info/time_between_train_steps": 0.003049135208129883, "step": 4071} {"info/global_step": 4072, "train_info/time_within_train_step": 2.754441499710083, "step": 4072} {"train_info/time_between_train_steps": 0.0029668807983398438, "step": 4072} {"info/global_step": 4073, "train_info/time_within_train_step": 2.755120277404785, "step": 4073} {"train_info/time_between_train_steps": 0.0029973983764648438, "step": 4073} {"info/global_step": 4074, "train_info/time_within_train_step": 2.7538774013519287, "step": 4074} {"train_info/time_between_train_steps": 0.0029904842376708984, "step": 4074} {"info/global_step": 4075, "train_info/time_within_train_step": 2.753662347793579, "step": 4075} {"train_info/time_between_train_steps": 0.0031769275665283203, "step": 4075} {"info/global_step": 4076, "train_info/time_within_train_step": 2.7547407150268555, "step": 4076} {"train_info/time_between_train_steps": 0.0030057430267333984, "step": 4076} {"info/global_step": 4077, "train_info/time_within_train_step": 2.7538626194000244, "step": 4077} {"train_info/time_between_train_steps": 0.002979755401611328, "step": 4077} {"info/global_step": 4078, "train_info/time_within_train_step": 2.7536747455596924, "step": 4078} {"train_info/time_between_train_steps": 0.003007173538208008, "step": 4078} {"info/global_step": 4079, "train_info/time_within_train_step": 2.754945993423462, "step": 4079} {"train_info/time_between_train_steps": 0.002954721450805664, "step": 4079} {"info/global_step": 4080, "train_info/time_within_train_step": 2.7552578449249268, "step": 4080} {"train_info/time_between_train_steps": 0.002959728240966797, "step": 4080} {"info/global_step": 4081, "train_info/time_within_train_step": 2.755255937576294, "step": 4081} {"train_info/time_between_train_steps": 0.002969503402709961, "step": 4081} {"info/global_step": 4082, "train_info/time_within_train_step": 2.754854202270508, "step": 4082} {"train_info/time_between_train_steps": 0.002997159957885742, "step": 4082} {"info/global_step": 4083, "train_info/time_within_train_step": 2.756023406982422, "step": 4083} {"train_info/time_between_train_steps": 0.003000974655151367, "step": 4083} {"info/global_step": 4084, "train_info/time_within_train_step": 2.7539520263671875, "step": 4084} {"train_info/time_between_train_steps": 0.003000497817993164, "step": 4084} {"info/global_step": 4085, "train_info/time_within_train_step": 2.754779815673828, "step": 4085} {"train_info/time_between_train_steps": 0.003021240234375, "step": 4085} {"info/global_step": 4086, "train_info/time_within_train_step": 2.7547481060028076, "step": 4086} {"train_info/time_between_train_steps": 0.0030410289764404297, "step": 4086} {"info/global_step": 4087, "train_info/time_within_train_step": 2.7546520233154297, "step": 4087} {"train_info/time_between_train_steps": 0.002992868423461914, "step": 4087} {"info/global_step": 4088, "train_info/time_within_train_step": 2.754638910293579, "step": 4088} {"train_info/time_between_train_steps": 0.0029952526092529297, "step": 4088} {"info/global_step": 4089, "train_info/time_within_train_step": 2.75454044342041, "step": 4089} {"train_info/time_between_train_steps": 0.0029599666595458984, "step": 4089} {"info/global_step": 4090, "train_info/time_within_train_step": 2.7549080848693848, "step": 4090} {"train_info/time_between_train_steps": 0.003015756607055664, "step": 4090} {"info/global_step": 4091, "train_info/time_within_train_step": 2.754303216934204, "step": 4091} {"train_info/time_between_train_steps": 0.0029900074005126953, "step": 4091} {"info/global_step": 4092, "train_info/time_within_train_step": 2.754215955734253, "step": 4092} {"train_info/time_between_train_steps": 0.003003358840942383, "step": 4092} {"info/global_step": 4093, "train_info/time_within_train_step": 2.753574848175049, "step": 4093} {"train_info/time_between_train_steps": 0.003025531768798828, "step": 4093} {"info/global_step": 4094, "train_info/time_within_train_step": 2.7555763721466064, "step": 4094} {"train_info/time_between_train_steps": 0.0029969215393066406, "step": 4094} {"info/global_step": 4095, "train_info/time_within_train_step": 2.7553911209106445, "step": 4095} {"train_info/time_between_train_steps": 0.003025054931640625, "step": 4095} {"info/global_step": 4096, "train_info/time_within_train_step": 2.756279468536377, "step": 4096} {"train_info/time_between_train_steps": 0.0029582977294921875, "step": 4096} {"info/global_step": 4097, "train_info/time_within_train_step": 2.75398850440979, "step": 4097} {"train_info/time_between_train_steps": 0.0030150413513183594, "step": 4097} {"info/global_step": 4098, "train_info/time_within_train_step": 2.754270076751709, "step": 4098} {"train_info/time_between_train_steps": 0.0029861927032470703, "step": 4098} {"info/global_step": 4099, "train_info/time_within_train_step": 2.754772424697876, "step": 4099} {"train_info/time_between_train_steps": 0.002974987030029297, "step": 4099} {"info/global_step": 4100, "train_info/time_within_train_step": 2.7538840770721436, "step": 4100} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746577914, "_runtime": 11923}, "step": 4100} {"logs": {"train/loss": 3.8116, "train/learning_rate": 0.0003933333333333333, "train/epoch": 4.07, "_timestamp": 1746577914, "_runtime": 11923}, "step": 4100} {"train_info/time_between_train_steps": 0.007383823394775391, "step": 4100} {"info/global_step": 4101, "train_info/time_within_train_step": 2.7552788257598877, "step": 4101} {"train_info/time_between_train_steps": 0.002974987030029297, "step": 4101} {"info/global_step": 4102, "train_info/time_within_train_step": 2.7536017894744873, "step": 4102} {"train_info/time_between_train_steps": 0.0029506683349609375, "step": 4102} {"info/global_step": 4103, "train_info/time_within_train_step": 2.7541866302490234, "step": 4103} {"train_info/time_between_train_steps": 0.0029773712158203125, "step": 4103} {"info/global_step": 4104, "train_info/time_within_train_step": 2.7536137104034424, "step": 4104} {"train_info/time_between_train_steps": 0.0029065608978271484, "step": 4104} {"info/global_step": 4105, "train_info/time_within_train_step": 2.7527036666870117, "step": 4105} {"train_info/time_between_train_steps": 0.002893686294555664, "step": 4105} {"info/global_step": 4106, "train_info/time_within_train_step": 2.7531042098999023, "step": 4106} {"train_info/time_between_train_steps": 0.0028913021087646484, "step": 4106} {"info/global_step": 4107, "train_info/time_within_train_step": 2.7518904209136963, "step": 4107} {"train_info/time_between_train_steps": 0.002978086471557617, "step": 4107} {"info/global_step": 4108, "train_info/time_within_train_step": 2.7538399696350098, "step": 4108} {"train_info/time_between_train_steps": 0.002970457077026367, "step": 4108} {"info/global_step": 4109, "train_info/time_within_train_step": 2.7537992000579834, "step": 4109} {"train_info/time_between_train_steps": 0.0029528141021728516, "step": 4109} {"info/global_step": 4110, "train_info/time_within_train_step": 2.7538533210754395, "step": 4110} {"train_info/time_between_train_steps": 0.003055095672607422, "step": 4110} {"info/global_step": 4111, "train_info/time_within_train_step": 2.7555010318756104, "step": 4111} {"train_info/time_between_train_steps": 0.0030078887939453125, "step": 4111} {"info/global_step": 4112, "train_info/time_within_train_step": 2.7551000118255615, "step": 4112} {"train_info/time_between_train_steps": 0.0029811859130859375, "step": 4112} {"info/global_step": 4113, "train_info/time_within_train_step": 2.754368305206299, "step": 4113} {"train_info/time_between_train_steps": 0.003028392791748047, "step": 4113} {"info/global_step": 4114, "train_info/time_within_train_step": 2.7523603439331055, "step": 4114} {"train_info/time_between_train_steps": 0.002990245819091797, "step": 4114} {"info/global_step": 4115, "train_info/time_within_train_step": 2.753441095352173, "step": 4115} {"train_info/time_between_train_steps": 0.0029647350311279297, "step": 4115} {"info/global_step": 4116, "train_info/time_within_train_step": 2.754147529602051, "step": 4116} {"train_info/time_between_train_steps": 0.0029845237731933594, "step": 4116} {"info/global_step": 4117, "train_info/time_within_train_step": 2.7537286281585693, "step": 4117} {"train_info/time_between_train_steps": 0.003017425537109375, "step": 4117} {"info/global_step": 4118, "train_info/time_within_train_step": 2.7534236907958984, "step": 4118} {"train_info/time_between_train_steps": 0.002985239028930664, "step": 4118} {"info/global_step": 4119, "train_info/time_within_train_step": 2.7547101974487305, "step": 4119} {"train_info/time_between_train_steps": 0.0029892921447753906, "step": 4119} {"info/global_step": 4120, "train_info/time_within_train_step": 2.753981828689575, "step": 4120} {"train_info/time_between_train_steps": 0.0030319690704345703, "step": 4120} {"info/global_step": 4121, "train_info/time_within_train_step": 2.7543373107910156, "step": 4121} {"train_info/time_between_train_steps": 0.003004312515258789, "step": 4121} {"info/global_step": 4122, "train_info/time_within_train_step": 2.7539048194885254, "step": 4122} {"train_info/time_between_train_steps": 0.0029990673065185547, "step": 4122} {"info/global_step": 4123, "train_info/time_within_train_step": 2.7537310123443604, "step": 4123} {"train_info/time_between_train_steps": 0.0030057430267333984, "step": 4123} {"info/global_step": 4124, "train_info/time_within_train_step": 2.8897182941436768, "step": 4124} {"train_info/time_between_train_steps": 0.0031328201293945312, "step": 4124} {"info/global_step": 4125, "train_info/time_within_train_step": 2.753497362136841, "step": 4125} {"train_info/time_between_train_steps": 0.002998828887939453, "step": 4125} {"info/global_step": 4126, "train_info/time_within_train_step": 2.7540998458862305, "step": 4126} {"train_info/time_between_train_steps": 0.0029892921447753906, "step": 4126} {"info/global_step": 4127, "train_info/time_within_train_step": 2.7545337677001953, "step": 4127} {"train_info/time_between_train_steps": 0.002950906753540039, "step": 4127} {"info/global_step": 4128, "train_info/time_within_train_step": 2.7535297870635986, "step": 4128} {"train_info/time_between_train_steps": 0.002892017364501953, "step": 4128} {"info/global_step": 4129, "train_info/time_within_train_step": 2.753249168395996, "step": 4129} {"train_info/time_between_train_steps": 0.0029058456420898438, "step": 4129} {"info/global_step": 4130, "train_info/time_within_train_step": 2.7516732215881348, "step": 4130} {"train_info/time_between_train_steps": 0.0029349327087402344, "step": 4130} {"info/global_step": 4131, "train_info/time_within_train_step": 2.7534844875335693, "step": 4131} {"train_info/time_between_train_steps": 0.0028977394104003906, "step": 4131} {"info/global_step": 4132, "train_info/time_within_train_step": 2.7536404132843018, "step": 4132} {"train_info/time_between_train_steps": 0.0029408931732177734, "step": 4132} {"info/global_step": 4133, "train_info/time_within_train_step": 2.753633499145508, "step": 4133} {"train_info/time_between_train_steps": 0.002892732620239258, "step": 4133} {"info/global_step": 4134, "train_info/time_within_train_step": 2.75309419631958, "step": 4134} {"train_info/time_between_train_steps": 0.002889394760131836, "step": 4134} {"info/global_step": 4135, "train_info/time_within_train_step": 2.753023147583008, "step": 4135} {"train_info/time_between_train_steps": 0.0028896331787109375, "step": 4135} {"info/global_step": 4136, "train_info/time_within_train_step": 2.7514686584472656, "step": 4136} {"train_info/time_between_train_steps": 0.0028901100158691406, "step": 4136} {"info/global_step": 4137, "train_info/time_within_train_step": 2.7520298957824707, "step": 4137} {"train_info/time_between_train_steps": 0.0028769969940185547, "step": 4137} {"info/global_step": 4138, "train_info/time_within_train_step": 2.7520558834075928, "step": 4138} {"train_info/time_between_train_steps": 0.0028955936431884766, "step": 4138} {"info/global_step": 4139, "train_info/time_within_train_step": 2.752868413925171, "step": 4139} {"train_info/time_between_train_steps": 0.002919435501098633, "step": 4139} {"info/global_step": 4140, "train_info/time_within_train_step": 2.7519497871398926, "step": 4140} {"train_info/time_between_train_steps": 0.002906322479248047, "step": 4140} {"info/global_step": 4141, "train_info/time_within_train_step": 2.7532706260681152, "step": 4141} {"train_info/time_between_train_steps": 0.0029344558715820312, "step": 4141} {"info/global_step": 4142, "train_info/time_within_train_step": 2.7519726753234863, "step": 4142} {"train_info/time_between_train_steps": 0.0028939247131347656, "step": 4142} {"info/global_step": 4143, "train_info/time_within_train_step": 2.752426862716675, "step": 4143} {"train_info/time_between_train_steps": 0.0028798580169677734, "step": 4143} {"info/global_step": 4144, "train_info/time_within_train_step": 2.752575635910034, "step": 4144} {"train_info/time_between_train_steps": 0.0029091835021972656, "step": 4144} {"info/global_step": 4145, "train_info/time_within_train_step": 2.752635955810547, "step": 4145} {"train_info/time_between_train_steps": 0.002892017364501953, "step": 4145} {"info/global_step": 4146, "train_info/time_within_train_step": 2.753248453140259, "step": 4146} {"train_info/time_between_train_steps": 0.002871274948120117, "step": 4146} {"info/global_step": 4147, "train_info/time_within_train_step": 2.753227949142456, "step": 4147} {"train_info/time_between_train_steps": 0.002876758575439453, "step": 4147} {"info/global_step": 4148, "train_info/time_within_train_step": 2.7523090839385986, "step": 4148} {"train_info/time_between_train_steps": 0.0028896331787109375, "step": 4148} {"info/global_step": 4149, "train_info/time_within_train_step": 2.753455877304077, "step": 4149} {"train_info/time_between_train_steps": 0.002985239028930664, "step": 4149} {"info/global_step": 4150, "train_info/time_within_train_step": 2.7547717094421387, "step": 4150} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746578053, "_runtime": 12062}, "step": 4150} {"logs": {"train/loss": 3.8049, "train/learning_rate": 0.00039, "train/epoch": 4.07, "_timestamp": 1746578053, "_runtime": 12062}, "step": 4150} {"train_info/time_between_train_steps": 0.012035608291625977, "step": 4150} {"info/global_step": 4151, "train_info/time_within_train_step": 2.7548470497131348, "step": 4151} {"train_info/time_between_train_steps": 0.002980470657348633, "step": 4151} {"info/global_step": 4152, "train_info/time_within_train_step": 2.754629611968994, "step": 4152} {"train_info/time_between_train_steps": 0.0029439926147460938, "step": 4152} {"info/global_step": 4153, "train_info/time_within_train_step": 2.7527530193328857, "step": 4153} {"train_info/time_between_train_steps": 0.0030269622802734375, "step": 4153} {"info/global_step": 4154, "train_info/time_within_train_step": 2.7544150352478027, "step": 4154} {"train_info/time_between_train_steps": 0.003038167953491211, "step": 4154} {"info/global_step": 4155, "train_info/time_within_train_step": 2.7543482780456543, "step": 4155} {"train_info/time_between_train_steps": 0.0029785633087158203, "step": 4155} {"info/global_step": 4156, "train_info/time_within_train_step": 2.753750801086426, "step": 4156} {"train_info/time_between_train_steps": 0.0029821395874023438, "step": 4156} {"info/global_step": 4157, "train_info/time_within_train_step": 2.7542831897735596, "step": 4157} {"train_info/time_between_train_steps": 0.0030188560485839844, "step": 4157} {"info/global_step": 4158, "train_info/time_within_train_step": 2.753082752227783, "step": 4158} {"train_info/time_between_train_steps": 0.0029783248901367188, "step": 4158} {"info/global_step": 4159, "train_info/time_within_train_step": 2.7548093795776367, "step": 4159} {"train_info/time_between_train_steps": 0.0030226707458496094, "step": 4159} {"info/global_step": 4160, "train_info/time_within_train_step": 2.753995656967163, "step": 4160} {"train_info/time_between_train_steps": 0.003015279769897461, "step": 4160} {"info/global_step": 4161, "train_info/time_within_train_step": 2.7540106773376465, "step": 4161} {"train_info/time_between_train_steps": 0.0030100345611572266, "step": 4161} {"info/global_step": 4162, "train_info/time_within_train_step": 2.7546322345733643, "step": 4162} {"train_info/time_between_train_steps": 0.0029435157775878906, "step": 4162} {"info/global_step": 4163, "train_info/time_within_train_step": 2.7532923221588135, "step": 4163} {"train_info/time_between_train_steps": 0.002964496612548828, "step": 4163} {"info/global_step": 4164, "train_info/time_within_train_step": 2.7544469833374023, "step": 4164} {"train_info/time_between_train_steps": 0.0029630661010742188, "step": 4164} {"info/global_step": 4165, "train_info/time_within_train_step": 2.755239725112915, "step": 4165} {"train_info/time_between_train_steps": 0.0030362606048583984, "step": 4165} {"info/global_step": 4166, "train_info/time_within_train_step": 2.7542991638183594, "step": 4166} {"train_info/time_between_train_steps": 0.0029823780059814453, "step": 4166} {"info/global_step": 4167, "train_info/time_within_train_step": 2.753631591796875, "step": 4167} {"train_info/time_between_train_steps": 0.002978801727294922, "step": 4167} {"info/global_step": 4168, "train_info/time_within_train_step": 2.7548468112945557, "step": 4168} {"train_info/time_between_train_steps": 0.0029811859130859375, "step": 4168} {"info/global_step": 4169, "train_info/time_within_train_step": 2.754025459289551, "step": 4169} {"train_info/time_between_train_steps": 0.0029439926147460938, "step": 4169} {"info/global_step": 4170, "train_info/time_within_train_step": 2.7528669834136963, "step": 4170} {"train_info/time_between_train_steps": 0.0029473304748535156, "step": 4170} {"info/global_step": 4171, "train_info/time_within_train_step": 2.7540152072906494, "step": 4171} {"train_info/time_between_train_steps": 0.0028791427612304688, "step": 4171} {"info/global_step": 4172, "train_info/time_within_train_step": 2.7525017261505127, "step": 4172} {"train_info/time_between_train_steps": 0.0028715133666992188, "step": 4172} {"info/global_step": 4173, "train_info/time_within_train_step": 2.752871036529541, "step": 4173} {"train_info/time_between_train_steps": 0.0028786659240722656, "step": 4173} {"info/global_step": 4174, "train_info/time_within_train_step": 2.7531893253326416, "step": 4174} {"train_info/time_between_train_steps": 0.0029587745666503906, "step": 4174} {"info/global_step": 4175, "train_info/time_within_train_step": 2.752624988555908, "step": 4175} {"train_info/time_between_train_steps": 0.0029027462005615234, "step": 4175} {"info/global_step": 4176, "train_info/time_within_train_step": 2.7538692951202393, "step": 4176} {"train_info/time_between_train_steps": 0.0029888153076171875, "step": 4176} {"info/global_step": 4177, "train_info/time_within_train_step": 2.7545268535614014, "step": 4177} {"train_info/time_between_train_steps": 0.003024578094482422, "step": 4177} {"info/global_step": 4178, "train_info/time_within_train_step": 2.7540299892425537, "step": 4178} {"train_info/time_between_train_steps": 0.003085613250732422, "step": 4178} {"info/global_step": 4179, "train_info/time_within_train_step": 2.7525088787078857, "step": 4179} {"train_info/time_between_train_steps": 0.0030145645141601562, "step": 4179} {"info/global_step": 4180, "train_info/time_within_train_step": 2.7542457580566406, "step": 4180} {"train_info/time_between_train_steps": 0.0029916763305664062, "step": 4180} {"info/global_step": 4181, "train_info/time_within_train_step": 2.855355978012085, "step": 4181} {"train_info/time_between_train_steps": 0.003007173538208008, "step": 4181} {"info/global_step": 4182, "train_info/time_within_train_step": 2.7548837661743164, "step": 4182} {"train_info/time_between_train_steps": 0.0030066967010498047, "step": 4182} {"info/global_step": 4183, "train_info/time_within_train_step": 2.7539689540863037, "step": 4183} {"train_info/time_between_train_steps": 0.002946615219116211, "step": 4183} {"info/global_step": 4184, "train_info/time_within_train_step": 2.755023956298828, "step": 4184} {"train_info/time_between_train_steps": 0.003116130828857422, "step": 4184} {"info/global_step": 4185, "train_info/time_within_train_step": 2.7534406185150146, "step": 4185} {"train_info/time_between_train_steps": 0.0029697418212890625, "step": 4185} {"info/global_step": 4186, "train_info/time_within_train_step": 2.7538247108459473, "step": 4186} {"train_info/time_between_train_steps": 0.0030050277709960938, "step": 4186} {"info/global_step": 4187, "train_info/time_within_train_step": 2.7535104751586914, "step": 4187} {"train_info/time_between_train_steps": 0.003034830093383789, "step": 4187} {"info/global_step": 4188, "train_info/time_within_train_step": 2.7496063709259033, "step": 4188} {"train_info/time_between_train_steps": 0.002973318099975586, "step": 4188} {"info/global_step": 4189, "train_info/time_within_train_step": 2.7544806003570557, "step": 4189} {"train_info/time_between_train_steps": 0.0029938220977783203, "step": 4189} {"info/global_step": 4190, "train_info/time_within_train_step": 2.753739595413208, "step": 4190} {"train_info/time_between_train_steps": 0.0030257701873779297, "step": 4190} {"info/global_step": 4191, "train_info/time_within_train_step": 2.754228115081787, "step": 4191} {"train_info/time_between_train_steps": 0.0029795169830322266, "step": 4191} {"info/global_step": 4192, "train_info/time_within_train_step": 2.751633405685425, "step": 4192} {"train_info/time_between_train_steps": 0.0029594898223876953, "step": 4192} {"info/global_step": 4193, "train_info/time_within_train_step": 2.7543938159942627, "step": 4193} {"train_info/time_between_train_steps": 0.0029861927032470703, "step": 4193} {"info/global_step": 4194, "train_info/time_within_train_step": 2.7543511390686035, "step": 4194} {"train_info/time_between_train_steps": 0.0029680728912353516, "step": 4194} {"info/global_step": 4195, "train_info/time_within_train_step": 2.753920555114746, "step": 4195} {"train_info/time_between_train_steps": 0.002977132797241211, "step": 4195} {"info/global_step": 4196, "train_info/time_within_train_step": 2.7535011768341064, "step": 4196} {"train_info/time_between_train_steps": 0.0030133724212646484, "step": 4196} {"info/global_step": 4197, "train_info/time_within_train_step": 2.7537693977355957, "step": 4197} {"train_info/time_between_train_steps": 0.0029828548431396484, "step": 4197} {"info/global_step": 4198, "train_info/time_within_train_step": 2.751941204071045, "step": 4198} {"train_info/time_between_train_steps": 0.003004789352416992, "step": 4198} {"info/global_step": 4199, "train_info/time_within_train_step": 2.7536096572875977, "step": 4199} {"train_info/time_between_train_steps": 0.002989530563354492, "step": 4199} {"info/global_step": 4200, "train_info/time_within_train_step": 2.7525062561035156, "step": 4200} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746578191, "_runtime": 12200}, "step": 4200} {"logs": {"train/loss": 3.7886, "train/learning_rate": 0.00038666666666666667, "train/epoch": 4.08, "_timestamp": 1746578191, "_runtime": 12200}, "step": 4200} {"train_info/time_between_train_steps": 24.61650538444519, "step": 4200} {"info/global_step": 4201, "train_info/time_within_train_step": 2.54160213470459, "step": 4201} {"train_info/time_between_train_steps": 0.0029630661010742188, "step": 4201} {"info/global_step": 4202, "train_info/time_within_train_step": 2.5847346782684326, "step": 4202} {"train_info/time_between_train_steps": 0.003031492233276367, "step": 4202} {"info/global_step": 4203, "train_info/time_within_train_step": 2.7142484188079834, "step": 4203} {"train_info/time_between_train_steps": 0.00299835205078125, "step": 4203} {"info/global_step": 4204, "train_info/time_within_train_step": 2.7188687324523926, "step": 4204} {"train_info/time_between_train_steps": 0.0029561519622802734, "step": 4204} {"info/global_step": 4205, "train_info/time_within_train_step": 2.747382164001465, "step": 4205} {"train_info/time_between_train_steps": 0.0030126571655273438, "step": 4205} {"info/global_step": 4206, "train_info/time_within_train_step": 2.754343032836914, "step": 4206} {"train_info/time_between_train_steps": 0.003026723861694336, "step": 4206} {"info/global_step": 4207, "train_info/time_within_train_step": 2.7555959224700928, "step": 4207} {"train_info/time_between_train_steps": 0.0029757022857666016, "step": 4207} {"info/global_step": 4208, "train_info/time_within_train_step": 2.7563865184783936, "step": 4208} {"train_info/time_between_train_steps": 0.002979755401611328, "step": 4208} {"info/global_step": 4209, "train_info/time_within_train_step": 2.7549633979797363, "step": 4209} {"train_info/time_between_train_steps": 0.0029845237731933594, "step": 4209} {"info/global_step": 4210, "train_info/time_within_train_step": 2.755178451538086, "step": 4210} {"train_info/time_between_train_steps": 0.002969503402709961, "step": 4210} {"info/global_step": 4211, "train_info/time_within_train_step": 2.7546143531799316, "step": 4211} {"train_info/time_between_train_steps": 0.0030562877655029297, "step": 4211} {"info/global_step": 4212, "train_info/time_within_train_step": 2.7550244331359863, "step": 4212} {"train_info/time_between_train_steps": 0.0029740333557128906, "step": 4212} {"info/global_step": 4213, "train_info/time_within_train_step": 2.755162239074707, "step": 4213} {"train_info/time_between_train_steps": 0.0029926300048828125, "step": 4213} {"info/global_step": 4214, "train_info/time_within_train_step": 2.7557904720306396, "step": 4214} {"train_info/time_between_train_steps": 0.003005504608154297, "step": 4214} {"info/global_step": 4215, "train_info/time_within_train_step": 2.7556209564208984, "step": 4215} {"train_info/time_between_train_steps": 0.0029680728912353516, "step": 4215} {"info/global_step": 4216, "train_info/time_within_train_step": 2.7559635639190674, "step": 4216} {"train_info/time_between_train_steps": 0.0029401779174804688, "step": 4216} {"info/global_step": 4217, "train_info/time_within_train_step": 2.7559471130371094, "step": 4217} {"train_info/time_between_train_steps": 0.002987384796142578, "step": 4217} {"info/global_step": 4218, "train_info/time_within_train_step": 2.756295919418335, "step": 4218} {"train_info/time_between_train_steps": 0.002969503402709961, "step": 4218} {"info/global_step": 4219, "train_info/time_within_train_step": 2.755890130996704, "step": 4219} {"train_info/time_between_train_steps": 0.002998828887939453, "step": 4219} {"info/global_step": 4220, "train_info/time_within_train_step": 2.756100654602051, "step": 4220} {"train_info/time_between_train_steps": 0.0030062198638916016, "step": 4220} {"info/global_step": 4221, "train_info/time_within_train_step": 2.756967544555664, "step": 4221} {"train_info/time_between_train_steps": 0.0029578208923339844, "step": 4221} {"info/global_step": 4222, "train_info/time_within_train_step": 2.7563588619232178, "step": 4222} {"train_info/time_between_train_steps": 0.003044605255126953, "step": 4222} {"info/global_step": 4223, "train_info/time_within_train_step": 2.7553980350494385, "step": 4223} {"train_info/time_between_train_steps": 0.003018617630004883, "step": 4223} {"info/global_step": 4224, "train_info/time_within_train_step": 2.7559890747070312, "step": 4224} {"train_info/time_between_train_steps": 0.0029861927032470703, "step": 4224} {"info/global_step": 4225, "train_info/time_within_train_step": 2.757394790649414, "step": 4225} {"train_info/time_between_train_steps": 0.003000497817993164, "step": 4225} {"info/global_step": 4226, "train_info/time_within_train_step": 2.7563908100128174, "step": 4226} {"train_info/time_between_train_steps": 0.0030035972595214844, "step": 4226} {"info/global_step": 4227, "train_info/time_within_train_step": 2.813551902770996, "step": 4227} {"train_info/time_between_train_steps": 0.0030448436737060547, "step": 4227} {"info/global_step": 4228, "train_info/time_within_train_step": 2.7573471069335938, "step": 4228} {"train_info/time_between_train_steps": 0.002995729446411133, "step": 4228} {"info/global_step": 4229, "train_info/time_within_train_step": 2.7529854774475098, "step": 4229} {"train_info/time_between_train_steps": 0.002998828887939453, "step": 4229} {"info/global_step": 4230, "train_info/time_within_train_step": 2.755610942840576, "step": 4230} {"train_info/time_between_train_steps": 0.002977132797241211, "step": 4230} {"info/global_step": 4231, "train_info/time_within_train_step": 2.7559094429016113, "step": 4231} {"train_info/time_between_train_steps": 0.0030486583709716797, "step": 4231} {"info/global_step": 4232, "train_info/time_within_train_step": 2.756479024887085, "step": 4232} {"train_info/time_between_train_steps": 0.0029573440551757812, "step": 4232} {"info/global_step": 4233, "train_info/time_within_train_step": 2.755356550216675, "step": 4233} {"train_info/time_between_train_steps": 0.003082275390625, "step": 4233} {"info/global_step": 4234, "train_info/time_within_train_step": 2.755180597305298, "step": 4234} {"train_info/time_between_train_steps": 0.0030508041381835938, "step": 4234} {"info/global_step": 4235, "train_info/time_within_train_step": 2.7558820247650146, "step": 4235} {"train_info/time_between_train_steps": 0.003068208694458008, "step": 4235} {"info/global_step": 4236, "train_info/time_within_train_step": 2.755723714828491, "step": 4236} {"train_info/time_between_train_steps": 0.003025531768798828, "step": 4236} {"info/global_step": 4237, "train_info/time_within_train_step": 2.7563424110412598, "step": 4237} {"train_info/time_between_train_steps": 0.0031273365020751953, "step": 4237} {"info/global_step": 4238, "train_info/time_within_train_step": 2.7557365894317627, "step": 4238} {"train_info/time_between_train_steps": 0.002969503402709961, "step": 4238} {"info/global_step": 4239, "train_info/time_within_train_step": 2.756024122238159, "step": 4239} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 4239} {"info/global_step": 4240, "train_info/time_within_train_step": 2.7555229663848877, "step": 4240} {"train_info/time_between_train_steps": 0.0030591487884521484, "step": 4240} {"info/global_step": 4241, "train_info/time_within_train_step": 2.7549827098846436, "step": 4241} {"train_info/time_between_train_steps": 0.003008127212524414, "step": 4241} {"info/global_step": 4242, "train_info/time_within_train_step": 2.756213665008545, "step": 4242} {"train_info/time_between_train_steps": 0.0030198097229003906, "step": 4242} {"info/global_step": 4243, "train_info/time_within_train_step": 2.7556989192962646, "step": 4243} {"train_info/time_between_train_steps": 0.003060579299926758, "step": 4243} {"info/global_step": 4244, "train_info/time_within_train_step": 2.7567074298858643, "step": 4244} {"train_info/time_between_train_steps": 0.0031461715698242188, "step": 4244} {"info/global_step": 4245, "train_info/time_within_train_step": 2.757390260696411, "step": 4245} {"train_info/time_between_train_steps": 0.0031290054321289062, "step": 4245} {"info/global_step": 4246, "train_info/time_within_train_step": 2.756455659866333, "step": 4246} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 4246} {"info/global_step": 4247, "train_info/time_within_train_step": 2.7558720111846924, "step": 4247} {"train_info/time_between_train_steps": 0.003150463104248047, "step": 4247} {"info/global_step": 4248, "train_info/time_within_train_step": 3.3636465072631836, "step": 4248} {"train_info/time_between_train_steps": 0.0030477046966552734, "step": 4248} {"info/global_step": 4249, "train_info/time_within_train_step": 2.752628803253174, "step": 4249} {"train_info/time_between_train_steps": 0.0030164718627929688, "step": 4249} {"info/global_step": 4250, "train_info/time_within_train_step": 2.7556896209716797, "step": 4250} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746578354, "_runtime": 12363}, "step": 4250} {"logs": {"train/loss": 3.7791, "train/learning_rate": 0.0003833333333333333, "train/epoch": 4.08, "_timestamp": 1746578354, "_runtime": 12363}, "step": 4250} {"train_info/time_between_train_steps": 0.012359142303466797, "step": 4250} {"info/global_step": 4251, "train_info/time_within_train_step": 2.753870725631714, "step": 4251} {"train_info/time_between_train_steps": 0.0030546188354492188, "step": 4251} {"info/global_step": 4252, "train_info/time_within_train_step": 2.754302978515625, "step": 4252} {"train_info/time_between_train_steps": 0.003301382064819336, "step": 4252} {"info/global_step": 4253, "train_info/time_within_train_step": 2.7546546459198, "step": 4253} {"train_info/time_between_train_steps": 0.003214120864868164, "step": 4253} {"info/global_step": 4254, "train_info/time_within_train_step": 2.755342483520508, "step": 4254} {"train_info/time_between_train_steps": 0.0030562877655029297, "step": 4254} {"info/global_step": 4255, "train_info/time_within_train_step": 2.7551655769348145, "step": 4255} {"train_info/time_between_train_steps": 0.0032618045806884766, "step": 4255} {"info/global_step": 4256, "train_info/time_within_train_step": 2.7549102306365967, "step": 4256} {"train_info/time_between_train_steps": 0.003270387649536133, "step": 4256} {"info/global_step": 4257, "train_info/time_within_train_step": 2.755648374557495, "step": 4257} {"train_info/time_between_train_steps": 0.003443479537963867, "step": 4257} {"info/global_step": 4258, "train_info/time_within_train_step": 2.7553389072418213, "step": 4258} {"train_info/time_between_train_steps": 0.0033113956451416016, "step": 4258} {"info/global_step": 4259, "train_info/time_within_train_step": 2.7550132274627686, "step": 4259} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 4259} {"info/global_step": 4260, "train_info/time_within_train_step": 2.7556803226470947, "step": 4260} {"train_info/time_between_train_steps": 0.003226757049560547, "step": 4260} {"info/global_step": 4261, "train_info/time_within_train_step": 2.755284070968628, "step": 4261} {"train_info/time_between_train_steps": 0.0034694671630859375, "step": 4261} {"info/global_step": 4262, "train_info/time_within_train_step": 2.7557895183563232, "step": 4262} {"train_info/time_between_train_steps": 0.0034503936767578125, "step": 4262} {"info/global_step": 4263, "train_info/time_within_train_step": 2.754564046859741, "step": 4263} {"train_info/time_between_train_steps": 0.0038776397705078125, "step": 4263} {"info/global_step": 4264, "train_info/time_within_train_step": 2.7553536891937256, "step": 4264} {"train_info/time_between_train_steps": 0.003425121307373047, "step": 4264} {"info/global_step": 4265, "train_info/time_within_train_step": 2.7858166694641113, "step": 4265} {"train_info/time_between_train_steps": 0.0038292407989501953, "step": 4265} {"train_info/time_between_train_steps": 3.0600333213806152, "step": 4265} {"info/global_step": 4266, "train_info/time_within_train_step": 2.695774555206299, "step": 4266} {"train_info/time_between_train_steps": 0.003155946731567383, "step": 4266} {"info/global_step": 4267, "train_info/time_within_train_step": 2.7544631958007812, "step": 4267} {"train_info/time_between_train_steps": 0.003135204315185547, "step": 4267} {"info/global_step": 4268, "train_info/time_within_train_step": 2.7542057037353516, "step": 4268} {"train_info/time_between_train_steps": 0.003134012222290039, "step": 4268} {"info/global_step": 4269, "train_info/time_within_train_step": 2.75441312789917, "step": 4269} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 4269} {"info/global_step": 4270, "train_info/time_within_train_step": 2.753478765487671, "step": 4270} {"train_info/time_between_train_steps": 0.003107309341430664, "step": 4270} {"info/global_step": 4271, "train_info/time_within_train_step": 2.7537167072296143, "step": 4271} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 4271} {"info/global_step": 4272, "train_info/time_within_train_step": 2.753993272781372, "step": 4272} {"train_info/time_between_train_steps": 0.0031845569610595703, "step": 4272} {"info/global_step": 4273, "train_info/time_within_train_step": 2.7539560794830322, "step": 4273} {"train_info/time_between_train_steps": 0.0031194686889648438, "step": 4273} {"info/global_step": 4274, "train_info/time_within_train_step": 2.7532241344451904, "step": 4274} {"train_info/time_between_train_steps": 0.0031387805938720703, "step": 4274} {"info/global_step": 4275, "train_info/time_within_train_step": 2.7541730403900146, "step": 4275} {"train_info/time_between_train_steps": 0.003154277801513672, "step": 4275} {"info/global_step": 4276, "train_info/time_within_train_step": 2.7538654804229736, "step": 4276} {"train_info/time_between_train_steps": 0.0031468868255615234, "step": 4276} {"info/global_step": 4277, "train_info/time_within_train_step": 2.7531421184539795, "step": 4277} {"train_info/time_between_train_steps": 0.003132343292236328, "step": 4277} {"info/global_step": 4278, "train_info/time_within_train_step": 2.964325428009033, "step": 4278} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 4278} {"info/global_step": 4279, "train_info/time_within_train_step": 2.7519583702087402, "step": 4279} {"train_info/time_between_train_steps": 0.003131389617919922, "step": 4279} {"info/global_step": 4280, "train_info/time_within_train_step": 2.7551934719085693, "step": 4280} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 4280} {"info/global_step": 4281, "train_info/time_within_train_step": 2.754103899002075, "step": 4281} {"train_info/time_between_train_steps": 0.003160715103149414, "step": 4281} {"info/global_step": 4282, "train_info/time_within_train_step": 2.7543017864227295, "step": 4282} {"train_info/time_between_train_steps": 0.003129720687866211, "step": 4282} {"info/global_step": 4283, "train_info/time_within_train_step": 2.753235340118408, "step": 4283} {"train_info/time_between_train_steps": 0.003200531005859375, "step": 4283} {"info/global_step": 4284, "train_info/time_within_train_step": 2.7544755935668945, "step": 4284} {"train_info/time_between_train_steps": 0.0031595230102539062, "step": 4284} {"info/global_step": 4285, "train_info/time_within_train_step": 2.754371404647827, "step": 4285} {"train_info/time_between_train_steps": 0.0031380653381347656, "step": 4285} {"info/global_step": 4286, "train_info/time_within_train_step": 2.7533140182495117, "step": 4286} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 4286} {"info/global_step": 4287, "train_info/time_within_train_step": 2.7540600299835205, "step": 4287} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 4287} {"info/global_step": 4288, "train_info/time_within_train_step": 2.7534263134002686, "step": 4288} {"train_info/time_between_train_steps": 0.003129243850708008, "step": 4288} {"info/global_step": 4289, "train_info/time_within_train_step": 2.7539825439453125, "step": 4289} {"train_info/time_between_train_steps": 0.0031659603118896484, "step": 4289} {"info/global_step": 4290, "train_info/time_within_train_step": 2.752336263656616, "step": 4290} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 4290} {"info/global_step": 4291, "train_info/time_within_train_step": 2.754256248474121, "step": 4291} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 4291} {"info/global_step": 4292, "train_info/time_within_train_step": 2.7548129558563232, "step": 4292} {"train_info/time_between_train_steps": 0.0032432079315185547, "step": 4292} {"info/global_step": 4293, "train_info/time_within_train_step": 2.7533764839172363, "step": 4293} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 4293} {"info/global_step": 4294, "train_info/time_within_train_step": 2.7542026042938232, "step": 4294} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 4294} {"info/global_step": 4295, "train_info/time_within_train_step": 2.753197193145752, "step": 4295} {"train_info/time_between_train_steps": 0.0031490325927734375, "step": 4295} {"info/global_step": 4296, "train_info/time_within_train_step": 2.7547526359558105, "step": 4296} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 4296} {"info/global_step": 4297, "train_info/time_within_train_step": 2.753493547439575, "step": 4297} {"train_info/time_between_train_steps": 0.0030760765075683594, "step": 4297} {"info/global_step": 4298, "train_info/time_within_train_step": 2.755030632019043, "step": 4298} {"train_info/time_between_train_steps": 0.003125429153442383, "step": 4298} {"info/global_step": 4299, "train_info/time_within_train_step": 2.754225015640259, "step": 4299} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 4299} {"info/global_step": 4300, "train_info/time_within_train_step": 2.7545018196105957, "step": 4300} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746578496, "_runtime": 12505}, "step": 4300} {"logs": {"train/loss": 3.8198, "train/learning_rate": 0.00037999999999999997, "train/epoch": 5.0, "_timestamp": 1746578496, "_runtime": 12505}, "step": 4300} {"train_info/time_between_train_steps": 0.009169578552246094, "step": 4300} {"info/global_step": 4301, "train_info/time_within_train_step": 2.754539728164673, "step": 4301} {"train_info/time_between_train_steps": 0.003121614456176758, "step": 4301} {"info/global_step": 4302, "train_info/time_within_train_step": 2.754539728164673, "step": 4302} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 4302} {"info/global_step": 4303, "train_info/time_within_train_step": 2.7547783851623535, "step": 4303} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 4303} {"info/global_step": 4304, "train_info/time_within_train_step": 2.7545228004455566, "step": 4304} {"train_info/time_between_train_steps": 0.003122091293334961, "step": 4304} {"info/global_step": 4305, "train_info/time_within_train_step": 2.754948854446411, "step": 4305} {"train_info/time_between_train_steps": 0.0031440258026123047, "step": 4305} {"info/global_step": 4306, "train_info/time_within_train_step": 2.754849910736084, "step": 4306} {"train_info/time_between_train_steps": 0.0031232833862304688, "step": 4306} {"info/global_step": 4307, "train_info/time_within_train_step": 2.753953218460083, "step": 4307} {"train_info/time_between_train_steps": 0.0031766891479492188, "step": 4307} {"info/global_step": 4308, "train_info/time_within_train_step": 2.7535715103149414, "step": 4308} {"train_info/time_between_train_steps": 0.003115415573120117, "step": 4308} {"info/global_step": 4309, "train_info/time_within_train_step": 2.7543256282806396, "step": 4309} {"train_info/time_between_train_steps": 0.00308990478515625, "step": 4309} {"info/global_step": 4310, "train_info/time_within_train_step": 2.7543935775756836, "step": 4310} {"train_info/time_between_train_steps": 0.0031347274780273438, "step": 4310} {"info/global_step": 4311, "train_info/time_within_train_step": 2.756498336791992, "step": 4311} {"train_info/time_between_train_steps": 0.003093719482421875, "step": 4311} {"info/global_step": 4312, "train_info/time_within_train_step": 2.7545342445373535, "step": 4312} {"train_info/time_between_train_steps": 0.0031363964080810547, "step": 4312} {"info/global_step": 4313, "train_info/time_within_train_step": 2.7550196647644043, "step": 4313} {"train_info/time_between_train_steps": 0.0031714439392089844, "step": 4313} {"info/global_step": 4314, "train_info/time_within_train_step": 2.7540786266326904, "step": 4314} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 4314} {"info/global_step": 4315, "train_info/time_within_train_step": 2.7546579837799072, "step": 4315} {"train_info/time_between_train_steps": 0.0031015872955322266, "step": 4315} {"info/global_step": 4316, "train_info/time_within_train_step": 2.7542874813079834, "step": 4316} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 4316} {"info/global_step": 4317, "train_info/time_within_train_step": 2.7548975944519043, "step": 4317} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 4317} {"info/global_step": 4318, "train_info/time_within_train_step": 2.9851040840148926, "step": 4318} {"train_info/time_between_train_steps": 0.0031363964080810547, "step": 4318} {"info/global_step": 4319, "train_info/time_within_train_step": 2.755173921585083, "step": 4319} {"train_info/time_between_train_steps": 0.0031054019927978516, "step": 4319} {"info/global_step": 4320, "train_info/time_within_train_step": 2.7561142444610596, "step": 4320} {"train_info/time_between_train_steps": 0.0031464099884033203, "step": 4320} {"info/global_step": 4321, "train_info/time_within_train_step": 2.7515311241149902, "step": 4321} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 4321} {"info/global_step": 4322, "train_info/time_within_train_step": 2.7539103031158447, "step": 4322} {"train_info/time_between_train_steps": 0.003088235855102539, "step": 4322} {"info/global_step": 4323, "train_info/time_within_train_step": 2.753674030303955, "step": 4323} {"train_info/time_between_train_steps": 0.0031147003173828125, "step": 4323} {"info/global_step": 4324, "train_info/time_within_train_step": 2.755279779434204, "step": 4324} {"train_info/time_between_train_steps": 0.0031402111053466797, "step": 4324} {"info/global_step": 4325, "train_info/time_within_train_step": 2.7538094520568848, "step": 4325} {"train_info/time_between_train_steps": 0.003240823745727539, "step": 4325} {"info/global_step": 4326, "train_info/time_within_train_step": 2.7526233196258545, "step": 4326} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 4326} {"info/global_step": 4327, "train_info/time_within_train_step": 2.7536816596984863, "step": 4327} {"train_info/time_between_train_steps": 0.0034940242767333984, "step": 4327} {"info/global_step": 4328, "train_info/time_within_train_step": 2.8760597705841064, "step": 4328} {"train_info/time_between_train_steps": 0.0032415390014648438, "step": 4328} {"info/global_step": 4329, "train_info/time_within_train_step": 2.7540605068206787, "step": 4329} {"train_info/time_between_train_steps": 0.0032699108123779297, "step": 4329} {"info/global_step": 4330, "train_info/time_within_train_step": 2.75520396232605, "step": 4330} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 4330} {"info/global_step": 4331, "train_info/time_within_train_step": 2.75424861907959, "step": 4331} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 4331} {"info/global_step": 4332, "train_info/time_within_train_step": 2.753969669342041, "step": 4332} {"train_info/time_between_train_steps": 0.0032138824462890625, "step": 4332} {"info/global_step": 4333, "train_info/time_within_train_step": 2.7529053688049316, "step": 4333} {"train_info/time_between_train_steps": 0.0032186508178710938, "step": 4333} {"info/global_step": 4334, "train_info/time_within_train_step": 2.754261016845703, "step": 4334} {"train_info/time_between_train_steps": 0.0032176971435546875, "step": 4334} {"info/global_step": 4335, "train_info/time_within_train_step": 2.7538766860961914, "step": 4335} {"train_info/time_between_train_steps": 0.003214120864868164, "step": 4335} {"info/global_step": 4336, "train_info/time_within_train_step": 2.754302978515625, "step": 4336} {"train_info/time_between_train_steps": 0.003150463104248047, "step": 4336} {"info/global_step": 4337, "train_info/time_within_train_step": 2.754246473312378, "step": 4337} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 4337} {"info/global_step": 4338, "train_info/time_within_train_step": 2.7788214683532715, "step": 4338} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 4338} {"info/global_step": 4339, "train_info/time_within_train_step": 2.754533529281616, "step": 4339} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 4339} {"info/global_step": 4340, "train_info/time_within_train_step": 2.754981279373169, "step": 4340} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 4340} {"info/global_step": 4341, "train_info/time_within_train_step": 2.755143642425537, "step": 4341} {"train_info/time_between_train_steps": 0.003212451934814453, "step": 4341} {"info/global_step": 4342, "train_info/time_within_train_step": 2.753878593444824, "step": 4342} {"train_info/time_between_train_steps": 0.003143787384033203, "step": 4342} {"info/global_step": 4343, "train_info/time_within_train_step": 2.7552003860473633, "step": 4343} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 4343} {"info/global_step": 4344, "train_info/time_within_train_step": 2.754743814468384, "step": 4344} {"train_info/time_between_train_steps": 0.0031991004943847656, "step": 4344} {"info/global_step": 4345, "train_info/time_within_train_step": 2.754087209701538, "step": 4345} {"train_info/time_between_train_steps": 0.003198385238647461, "step": 4345} {"info/global_step": 4346, "train_info/time_within_train_step": 2.7557690143585205, "step": 4346} {"train_info/time_between_train_steps": 0.003156423568725586, "step": 4346} {"info/global_step": 4347, "train_info/time_within_train_step": 2.7546989917755127, "step": 4347} {"train_info/time_between_train_steps": 0.0031375885009765625, "step": 4347} {"info/global_step": 4348, "train_info/time_within_train_step": 2.7557284832000732, "step": 4348} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 4348} {"info/global_step": 4349, "train_info/time_within_train_step": 2.754368782043457, "step": 4349} {"train_info/time_between_train_steps": 0.003259897232055664, "step": 4349} {"info/global_step": 4350, "train_info/time_within_train_step": 2.755039691925049, "step": 4350} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746578635, "_runtime": 12644}, "step": 4350} {"logs": {"train/loss": 3.761, "train/learning_rate": 0.00037666666666666664, "train/epoch": 5.01, "_timestamp": 1746578635, "_runtime": 12644}, "step": 4350} {"train_info/time_between_train_steps": 0.013026237487792969, "step": 4350} {"info/global_step": 4351, "train_info/time_within_train_step": 2.755638360977173, "step": 4351} {"train_info/time_between_train_steps": 0.0032258033752441406, "step": 4351} {"info/global_step": 4352, "train_info/time_within_train_step": 2.755913257598877, "step": 4352} {"train_info/time_between_train_steps": 0.0032253265380859375, "step": 4352} {"info/global_step": 4353, "train_info/time_within_train_step": 2.7550055980682373, "step": 4353} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 4353} {"info/global_step": 4354, "train_info/time_within_train_step": 2.7551989555358887, "step": 4354} {"train_info/time_between_train_steps": 0.0031125545501708984, "step": 4354} {"info/global_step": 4355, "train_info/time_within_train_step": 2.7553906440734863, "step": 4355} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 4355} {"info/global_step": 4356, "train_info/time_within_train_step": 2.754944324493408, "step": 4356} {"train_info/time_between_train_steps": 0.0031898021697998047, "step": 4356} {"info/global_step": 4357, "train_info/time_within_train_step": 2.7544240951538086, "step": 4357} {"train_info/time_between_train_steps": 0.0032281875610351562, "step": 4357} {"info/global_step": 4358, "train_info/time_within_train_step": 2.7550904750823975, "step": 4358} {"train_info/time_between_train_steps": 0.0031614303588867188, "step": 4358} {"info/global_step": 4359, "train_info/time_within_train_step": 2.7529966831207275, "step": 4359} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 4359} {"info/global_step": 4360, "train_info/time_within_train_step": 2.754483461380005, "step": 4360} {"train_info/time_between_train_steps": 0.0031664371490478516, "step": 4360} {"info/global_step": 4361, "train_info/time_within_train_step": 2.75388765335083, "step": 4361} {"train_info/time_between_train_steps": 0.0032074451446533203, "step": 4361} {"info/global_step": 4362, "train_info/time_within_train_step": 2.755330801010132, "step": 4362} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 4362} {"info/global_step": 4363, "train_info/time_within_train_step": 2.7553341388702393, "step": 4363} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 4363} {"info/global_step": 4364, "train_info/time_within_train_step": 2.753627061843872, "step": 4364} {"train_info/time_between_train_steps": 0.003272533416748047, "step": 4364} {"info/global_step": 4365, "train_info/time_within_train_step": 2.754807233810425, "step": 4365} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 4365} {"info/global_step": 4366, "train_info/time_within_train_step": 2.75567889213562, "step": 4366} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 4366} {"info/global_step": 4367, "train_info/time_within_train_step": 2.755561351776123, "step": 4367} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 4367} {"info/global_step": 4368, "train_info/time_within_train_step": 2.7559099197387695, "step": 4368} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 4368} {"info/global_step": 4369, "train_info/time_within_train_step": 2.755553960800171, "step": 4369} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 4369} {"info/global_step": 4370, "train_info/time_within_train_step": 2.7548305988311768, "step": 4370} {"train_info/time_between_train_steps": 0.003200531005859375, "step": 4370} {"info/global_step": 4371, "train_info/time_within_train_step": 2.754377841949463, "step": 4371} {"train_info/time_between_train_steps": 0.0032677650451660156, "step": 4371} {"info/global_step": 4372, "train_info/time_within_train_step": 2.7549185752868652, "step": 4372} {"train_info/time_between_train_steps": 0.003221273422241211, "step": 4372} {"info/global_step": 4373, "train_info/time_within_train_step": 2.7546603679656982, "step": 4373} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 4373} {"info/global_step": 4374, "train_info/time_within_train_step": 2.7544987201690674, "step": 4374} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 4374} {"info/global_step": 4375, "train_info/time_within_train_step": 2.754662275314331, "step": 4375} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 4375} {"info/global_step": 4376, "train_info/time_within_train_step": 2.753812313079834, "step": 4376} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 4376} {"info/global_step": 4377, "train_info/time_within_train_step": 2.7529335021972656, "step": 4377} {"train_info/time_between_train_steps": 0.0032138824462890625, "step": 4377} {"info/global_step": 4378, "train_info/time_within_train_step": 2.754983901977539, "step": 4378} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 4378} {"info/global_step": 4379, "train_info/time_within_train_step": 2.754408836364746, "step": 4379} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 4379} {"info/global_step": 4380, "train_info/time_within_train_step": 2.754704713821411, "step": 4380} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 4380} {"info/global_step": 4381, "train_info/time_within_train_step": 2.7545783519744873, "step": 4381} {"train_info/time_between_train_steps": 0.0032625198364257812, "step": 4381} {"info/global_step": 4382, "train_info/time_within_train_step": 2.7546679973602295, "step": 4382} {"train_info/time_between_train_steps": 0.0031991004943847656, "step": 4382} {"info/global_step": 4383, "train_info/time_within_train_step": 2.7533466815948486, "step": 4383} {"train_info/time_between_train_steps": 0.003132343292236328, "step": 4383} {"info/global_step": 4384, "train_info/time_within_train_step": 2.7545156478881836, "step": 4384} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 4384} {"info/global_step": 4385, "train_info/time_within_train_step": 2.7551212310791016, "step": 4385} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 4385} {"info/global_step": 4386, "train_info/time_within_train_step": 2.7547736167907715, "step": 4386} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 4386} {"info/global_step": 4387, "train_info/time_within_train_step": 2.755180597305298, "step": 4387} {"train_info/time_between_train_steps": 0.0031769275665283203, "step": 4387} {"info/global_step": 4388, "train_info/time_within_train_step": 2.752251148223877, "step": 4388} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 4388} {"info/global_step": 4389, "train_info/time_within_train_step": 2.7536351680755615, "step": 4389} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 4389} {"info/global_step": 4390, "train_info/time_within_train_step": 2.754380941390991, "step": 4390} {"train_info/time_between_train_steps": 0.1283130645751953, "step": 4390} {"info/global_step": 4391, "train_info/time_within_train_step": 2.755429983139038, "step": 4391} {"train_info/time_between_train_steps": 0.003158092498779297, "step": 4391} {"info/global_step": 4392, "train_info/time_within_train_step": 2.7549328804016113, "step": 4392} {"train_info/time_between_train_steps": 0.003181934356689453, "step": 4392} {"info/global_step": 4393, "train_info/time_within_train_step": 2.753844738006592, "step": 4393} {"train_info/time_between_train_steps": 0.0032303333282470703, "step": 4393} {"info/global_step": 4394, "train_info/time_within_train_step": 2.7541370391845703, "step": 4394} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 4394} {"info/global_step": 4395, "train_info/time_within_train_step": 2.7539467811584473, "step": 4395} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 4395} {"info/global_step": 4396, "train_info/time_within_train_step": 2.755255937576294, "step": 4396} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 4396} {"info/global_step": 4397, "train_info/time_within_train_step": 2.7552242279052734, "step": 4397} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 4397} {"info/global_step": 4398, "train_info/time_within_train_step": 2.75551438331604, "step": 4398} {"train_info/time_between_train_steps": 0.0032074451446533203, "step": 4398} {"info/global_step": 4399, "train_info/time_within_train_step": 2.7554707527160645, "step": 4399} {"train_info/time_between_train_steps": 0.0031936168670654297, "step": 4399} {"info/global_step": 4400, "train_info/time_within_train_step": 2.754561424255371, "step": 4400} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746578773, "_runtime": 12782}, "step": 4400} {"logs": {"train/loss": 3.7552, "train/learning_rate": 0.0003733333333333333, "train/epoch": 5.01, "_timestamp": 1746578773, "_runtime": 12782}, "step": 4400} {"train_info/time_between_train_steps": 17.722489595413208, "step": 4400} {"info/global_step": 4401, "train_info/time_within_train_step": 2.542628765106201, "step": 4401} {"train_info/time_between_train_steps": 0.003335237503051758, "step": 4401} {"info/global_step": 4402, "train_info/time_within_train_step": 2.570499897003174, "step": 4402} {"train_info/time_between_train_steps": 0.0033240318298339844, "step": 4402} {"info/global_step": 4403, "train_info/time_within_train_step": 2.694732904434204, "step": 4403} {"train_info/time_between_train_steps": 0.0033216476440429688, "step": 4403} {"info/global_step": 4404, "train_info/time_within_train_step": 2.749906063079834, "step": 4404} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 4404} {"info/global_step": 4405, "train_info/time_within_train_step": 2.9675040245056152, "step": 4405} {"train_info/time_between_train_steps": 0.0031480789184570312, "step": 4405} {"info/global_step": 4406, "train_info/time_within_train_step": 2.7543187141418457, "step": 4406} {"train_info/time_between_train_steps": 0.0032930374145507812, "step": 4406} {"info/global_step": 4407, "train_info/time_within_train_step": 2.756739616394043, "step": 4407} {"train_info/time_between_train_steps": 0.0034584999084472656, "step": 4407} {"info/global_step": 4408, "train_info/time_within_train_step": 2.7569494247436523, "step": 4408} {"train_info/time_between_train_steps": 0.0033152103424072266, "step": 4408} {"info/global_step": 4409, "train_info/time_within_train_step": 2.7560195922851562, "step": 4409} {"train_info/time_between_train_steps": 0.003325223922729492, "step": 4409} {"info/global_step": 4410, "train_info/time_within_train_step": 2.7577030658721924, "step": 4410} {"train_info/time_between_train_steps": 0.0032930374145507812, "step": 4410} {"info/global_step": 4411, "train_info/time_within_train_step": 2.7577614784240723, "step": 4411} {"train_info/time_between_train_steps": 0.0033485889434814453, "step": 4411} {"info/global_step": 4412, "train_info/time_within_train_step": 2.7586278915405273, "step": 4412} {"train_info/time_between_train_steps": 0.0033669471740722656, "step": 4412} {"info/global_step": 4413, "train_info/time_within_train_step": 2.7578020095825195, "step": 4413} {"train_info/time_between_train_steps": 0.003382444381713867, "step": 4413} {"info/global_step": 4414, "train_info/time_within_train_step": 2.7580387592315674, "step": 4414} {"train_info/time_between_train_steps": 0.0033464431762695312, "step": 4414} {"info/global_step": 4415, "train_info/time_within_train_step": 2.7586567401885986, "step": 4415} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 4415} {"info/global_step": 4416, "train_info/time_within_train_step": 2.7589168548583984, "step": 4416} {"train_info/time_between_train_steps": 0.0033304691314697266, "step": 4416} {"info/global_step": 4417, "train_info/time_within_train_step": 2.7598824501037598, "step": 4417} {"train_info/time_between_train_steps": 0.0033066272735595703, "step": 4417} {"info/global_step": 4418, "train_info/time_within_train_step": 2.7592296600341797, "step": 4418} {"train_info/time_between_train_steps": 0.003323793411254883, "step": 4418} {"info/global_step": 4419, "train_info/time_within_train_step": 2.758899211883545, "step": 4419} {"train_info/time_between_train_steps": 0.0035903453826904297, "step": 4419} {"info/global_step": 4420, "train_info/time_within_train_step": 2.757185220718384, "step": 4420} {"train_info/time_between_train_steps": 0.003302335739135742, "step": 4420} {"info/global_step": 4421, "train_info/time_within_train_step": 2.7569000720977783, "step": 4421} {"train_info/time_between_train_steps": 0.003292560577392578, "step": 4421} {"info/global_step": 4422, "train_info/time_within_train_step": 2.7568771839141846, "step": 4422} {"train_info/time_between_train_steps": 0.0031540393829345703, "step": 4422} {"info/global_step": 4423, "train_info/time_within_train_step": 2.7571256160736084, "step": 4423} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 4423} {"info/global_step": 4424, "train_info/time_within_train_step": 2.756126880645752, "step": 4424} {"train_info/time_between_train_steps": 0.0031490325927734375, "step": 4424} {"info/global_step": 4425, "train_info/time_within_train_step": 2.75697922706604, "step": 4425} {"train_info/time_between_train_steps": 0.003208160400390625, "step": 4425} {"info/global_step": 4426, "train_info/time_within_train_step": 2.7562766075134277, "step": 4426} {"train_info/time_between_train_steps": 0.0031442642211914062, "step": 4426} {"info/global_step": 4427, "train_info/time_within_train_step": 2.755833148956299, "step": 4427} {"train_info/time_between_train_steps": 0.0031676292419433594, "step": 4427} {"info/global_step": 4428, "train_info/time_within_train_step": 2.7566747665405273, "step": 4428} {"train_info/time_between_train_steps": 0.0031790733337402344, "step": 4428} {"info/global_step": 4429, "train_info/time_within_train_step": 2.756596326828003, "step": 4429} {"train_info/time_between_train_steps": 0.003305673599243164, "step": 4429} {"info/global_step": 4430, "train_info/time_within_train_step": 2.7579920291900635, "step": 4430} {"train_info/time_between_train_steps": 0.0033097267150878906, "step": 4430} {"info/global_step": 4431, "train_info/time_within_train_step": 2.7575738430023193, "step": 4431} {"train_info/time_between_train_steps": 0.003323078155517578, "step": 4431} {"info/global_step": 4432, "train_info/time_within_train_step": 2.7581050395965576, "step": 4432} {"train_info/time_between_train_steps": 0.003335714340209961, "step": 4432} {"info/global_step": 4433, "train_info/time_within_train_step": 2.758685827255249, "step": 4433} {"train_info/time_between_train_steps": 0.0033130645751953125, "step": 4433} {"info/global_step": 4434, "train_info/time_within_train_step": 2.7576687335968018, "step": 4434} {"train_info/time_between_train_steps": 0.0033462047576904297, "step": 4434} {"info/global_step": 4435, "train_info/time_within_train_step": 2.756654739379883, "step": 4435} {"train_info/time_between_train_steps": 0.003270387649536133, "step": 4435} {"info/global_step": 4436, "train_info/time_within_train_step": 2.75728702545166, "step": 4436} {"train_info/time_between_train_steps": 0.0034308433532714844, "step": 4436} {"info/global_step": 4437, "train_info/time_within_train_step": 2.756777286529541, "step": 4437} {"train_info/time_between_train_steps": 0.0034492015838623047, "step": 4437} {"info/global_step": 4438, "train_info/time_within_train_step": 2.7572407722473145, "step": 4438} {"train_info/time_between_train_steps": 0.003576040267944336, "step": 4438} {"info/global_step": 4439, "train_info/time_within_train_step": 2.757624626159668, "step": 4439} {"train_info/time_between_train_steps": 0.0034983158111572266, "step": 4439} {"info/global_step": 4440, "train_info/time_within_train_step": 2.7567837238311768, "step": 4440} {"train_info/time_between_train_steps": 0.0033528804779052734, "step": 4440} {"info/global_step": 4441, "train_info/time_within_train_step": 2.7567009925842285, "step": 4441} {"train_info/time_between_train_steps": 0.0033266544342041016, "step": 4441} {"info/global_step": 4442, "train_info/time_within_train_step": 2.755741834640503, "step": 4442} {"train_info/time_between_train_steps": 0.0033512115478515625, "step": 4442} {"info/global_step": 4443, "train_info/time_within_train_step": 2.7562642097473145, "step": 4443} {"train_info/time_between_train_steps": 0.003380298614501953, "step": 4443} {"info/global_step": 4444, "train_info/time_within_train_step": 2.7570688724517822, "step": 4444} {"train_info/time_between_train_steps": 0.0033485889434814453, "step": 4444} {"info/global_step": 4445, "train_info/time_within_train_step": 3.0789389610290527, "step": 4445} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 4445} {"info/global_step": 4446, "train_info/time_within_train_step": 2.757300615310669, "step": 4446} {"train_info/time_between_train_steps": 0.003412008285522461, "step": 4446} {"info/global_step": 4447, "train_info/time_within_train_step": 2.7603204250335693, "step": 4447} {"train_info/time_between_train_steps": 0.0033817291259765625, "step": 4447} {"info/global_step": 4448, "train_info/time_within_train_step": 2.758815288543701, "step": 4448} {"train_info/time_between_train_steps": 0.003448009490966797, "step": 4448} {"info/global_step": 4449, "train_info/time_within_train_step": 2.7594804763793945, "step": 4449} {"train_info/time_between_train_steps": 0.003429889678955078, "step": 4449} {"info/global_step": 4450, "train_info/time_within_train_step": 2.759849786758423, "step": 4450} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746578929, "_runtime": 12938}, "step": 4450} {"logs": {"train/loss": 3.7345, "train/learning_rate": 0.00037, "train/epoch": 5.02, "_timestamp": 1746578929, "_runtime": 12938}, "step": 4450} {"train_info/time_between_train_steps": 0.015131711959838867, "step": 4450} {"info/global_step": 4451, "train_info/time_within_train_step": 2.759335994720459, "step": 4451} {"train_info/time_between_train_steps": 0.0033740997314453125, "step": 4451} {"info/global_step": 4452, "train_info/time_within_train_step": 2.760274887084961, "step": 4452} {"train_info/time_between_train_steps": 0.003310680389404297, "step": 4452} {"info/global_step": 4453, "train_info/time_within_train_step": 2.8977627754211426, "step": 4453} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 4453} {"info/global_step": 4454, "train_info/time_within_train_step": 2.7557671070098877, "step": 4454} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 4454} {"info/global_step": 4455, "train_info/time_within_train_step": 2.755647897720337, "step": 4455} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 4455} {"info/global_step": 4456, "train_info/time_within_train_step": 2.755127191543579, "step": 4456} {"train_info/time_between_train_steps": 0.003208637237548828, "step": 4456} {"info/global_step": 4457, "train_info/time_within_train_step": 2.7548251152038574, "step": 4457} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 4457} {"info/global_step": 4458, "train_info/time_within_train_step": 2.7551801204681396, "step": 4458} {"train_info/time_between_train_steps": 0.003173828125, "step": 4458} {"info/global_step": 4459, "train_info/time_within_train_step": 2.755873680114746, "step": 4459} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 4459} {"info/global_step": 4460, "train_info/time_within_train_step": 2.754990816116333, "step": 4460} {"train_info/time_between_train_steps": 0.003171205520629883, "step": 4460} {"info/global_step": 4461, "train_info/time_within_train_step": 2.7553653717041016, "step": 4461} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 4461} {"info/global_step": 4462, "train_info/time_within_train_step": 2.755039691925049, "step": 4462} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 4462} {"info/global_step": 4463, "train_info/time_within_train_step": 2.755103826522827, "step": 4463} {"train_info/time_between_train_steps": 0.003415346145629883, "step": 4463} {"info/global_step": 4464, "train_info/time_within_train_step": 2.7577269077301025, "step": 4464} {"train_info/time_between_train_steps": 0.0035753250122070312, "step": 4464} {"info/global_step": 4465, "train_info/time_within_train_step": 2.756605625152588, "step": 4465} {"train_info/time_between_train_steps": 0.003741741180419922, "step": 4465} {"info/global_step": 4466, "train_info/time_within_train_step": 2.7585511207580566, "step": 4466} {"train_info/time_between_train_steps": 0.0039005279541015625, "step": 4466} {"info/global_step": 4467, "train_info/time_within_train_step": 2.760282278060913, "step": 4467} {"train_info/time_between_train_steps": 0.003767251968383789, "step": 4467} {"info/global_step": 4468, "train_info/time_within_train_step": 2.7603702545166016, "step": 4468} {"train_info/time_between_train_steps": 0.003652334213256836, "step": 4468} {"info/global_step": 4469, "train_info/time_within_train_step": 2.7611472606658936, "step": 4469} {"train_info/time_between_train_steps": 0.0035288333892822266, "step": 4469} {"info/global_step": 4470, "train_info/time_within_train_step": 2.758803606033325, "step": 4470} {"train_info/time_between_train_steps": 0.003716707229614258, "step": 4470} {"info/global_step": 4471, "train_info/time_within_train_step": 2.7571403980255127, "step": 4471} {"train_info/time_between_train_steps": 0.0035614967346191406, "step": 4471} {"info/global_step": 4472, "train_info/time_within_train_step": 2.7569522857666016, "step": 4472} {"train_info/time_between_train_steps": 0.003605365753173828, "step": 4472} {"info/global_step": 4473, "train_info/time_within_train_step": 2.757761001586914, "step": 4473} {"train_info/time_between_train_steps": 0.0035958290100097656, "step": 4473} {"info/global_step": 4474, "train_info/time_within_train_step": 2.7569527626037598, "step": 4474} {"train_info/time_between_train_steps": 0.003451108932495117, "step": 4474} {"info/global_step": 4475, "train_info/time_within_train_step": 2.7567403316497803, "step": 4475} {"train_info/time_between_train_steps": 0.0036687850952148438, "step": 4475} {"info/global_step": 4476, "train_info/time_within_train_step": 2.7565150260925293, "step": 4476} {"train_info/time_between_train_steps": 0.003540515899658203, "step": 4476} {"info/global_step": 4477, "train_info/time_within_train_step": 2.755995750427246, "step": 4477} {"train_info/time_between_train_steps": 0.0034494400024414062, "step": 4477} {"info/global_step": 4478, "train_info/time_within_train_step": 2.7571587562561035, "step": 4478} {"train_info/time_between_train_steps": 0.0035681724548339844, "step": 4478} {"info/global_step": 4479, "train_info/time_within_train_step": 2.757133722305298, "step": 4479} {"train_info/time_between_train_steps": 0.0034537315368652344, "step": 4479} {"info/global_step": 4480, "train_info/time_within_train_step": 2.7571184635162354, "step": 4480} {"train_info/time_between_train_steps": 0.003473520278930664, "step": 4480} {"info/global_step": 4481, "train_info/time_within_train_step": 2.756279706954956, "step": 4481} {"train_info/time_between_train_steps": 0.003427743911743164, "step": 4481} {"info/global_step": 4482, "train_info/time_within_train_step": 2.7564773559570312, "step": 4482} {"train_info/time_between_train_steps": 0.0034165382385253906, "step": 4482} {"info/global_step": 4483, "train_info/time_within_train_step": 2.7559423446655273, "step": 4483} {"train_info/time_between_train_steps": 0.003506898880004883, "step": 4483} {"info/global_step": 4484, "train_info/time_within_train_step": 2.7556557655334473, "step": 4484} {"train_info/time_between_train_steps": 0.0034770965576171875, "step": 4484} {"info/global_step": 4485, "train_info/time_within_train_step": 2.7564377784729004, "step": 4485} {"train_info/time_between_train_steps": 0.0034646987915039062, "step": 4485} {"info/global_step": 4486, "train_info/time_within_train_step": 2.756640911102295, "step": 4486} {"train_info/time_between_train_steps": 0.0034220218658447266, "step": 4486} {"info/global_step": 4487, "train_info/time_within_train_step": 2.7556817531585693, "step": 4487} {"train_info/time_between_train_steps": 0.003439188003540039, "step": 4487} {"info/global_step": 4488, "train_info/time_within_train_step": 2.75585675239563, "step": 4488} {"train_info/time_between_train_steps": 0.0034301280975341797, "step": 4488} {"info/global_step": 4489, "train_info/time_within_train_step": 2.7554831504821777, "step": 4489} {"train_info/time_between_train_steps": 0.0034987926483154297, "step": 4489} {"info/global_step": 4490, "train_info/time_within_train_step": 2.7574644088745117, "step": 4490} {"train_info/time_between_train_steps": 0.0036165714263916016, "step": 4490} {"info/global_step": 4491, "train_info/time_within_train_step": 2.757342576980591, "step": 4491} {"train_info/time_between_train_steps": 0.003548145294189453, "step": 4491} {"info/global_step": 4492, "train_info/time_within_train_step": 2.757051467895508, "step": 4492} {"train_info/time_between_train_steps": 0.0035805702209472656, "step": 4492} {"info/global_step": 4493, "train_info/time_within_train_step": 2.756931781768799, "step": 4493} {"train_info/time_between_train_steps": 0.0036296844482421875, "step": 4493} {"info/global_step": 4494, "train_info/time_within_train_step": 2.7555971145629883, "step": 4494} {"train_info/time_between_train_steps": 0.0036127567291259766, "step": 4494} {"info/global_step": 4495, "train_info/time_within_train_step": 2.7566442489624023, "step": 4495} {"train_info/time_between_train_steps": 0.003560304641723633, "step": 4495} {"info/global_step": 4496, "train_info/time_within_train_step": 2.7572898864746094, "step": 4496} {"train_info/time_between_train_steps": 0.0035550594329833984, "step": 4496} {"info/global_step": 4497, "train_info/time_within_train_step": 2.7564008235931396, "step": 4497} {"train_info/time_between_train_steps": 0.003461122512817383, "step": 4497} {"info/global_step": 4498, "train_info/time_within_train_step": 3.3467729091644287, "step": 4498} {"train_info/time_between_train_steps": 0.0038690567016601562, "step": 4498} {"info/global_step": 4499, "train_info/time_within_train_step": 2.7581217288970947, "step": 4499} {"train_info/time_between_train_steps": 0.0036001205444335938, "step": 4499} {"info/global_step": 4500, "train_info/time_within_train_step": 2.756941795349121, "step": 4500} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746579069, "_runtime": 13078}, "step": 4500} {"logs": {"train/loss": 3.7293, "train/learning_rate": 0.00036666666666666667, "train/epoch": 5.02, "_timestamp": 1746579069, "_runtime": 13078}, "step": 4500} {"train_info/time_between_train_steps": 0.01575469970703125, "step": 4500} {"info/global_step": 4501, "train_info/time_within_train_step": 2.757619857788086, "step": 4501} {"train_info/time_between_train_steps": 0.003694295883178711, "step": 4501} {"info/global_step": 4502, "train_info/time_within_train_step": 2.757465362548828, "step": 4502} {"train_info/time_between_train_steps": 0.003644704818725586, "step": 4502} {"info/global_step": 4503, "train_info/time_within_train_step": 2.7574284076690674, "step": 4503} {"train_info/time_between_train_steps": 0.0034456253051757812, "step": 4503} {"info/global_step": 4504, "train_info/time_within_train_step": 2.7563095092773438, "step": 4504} {"train_info/time_between_train_steps": 0.0036144256591796875, "step": 4504} {"info/global_step": 4505, "train_info/time_within_train_step": 2.7561025619506836, "step": 4505} {"train_info/time_between_train_steps": 0.0037300586700439453, "step": 4505} {"info/global_step": 4506, "train_info/time_within_train_step": 2.7561442852020264, "step": 4506} {"train_info/time_between_train_steps": 0.003650188446044922, "step": 4506} {"info/global_step": 4507, "train_info/time_within_train_step": 2.756864070892334, "step": 4507} {"train_info/time_between_train_steps": 0.003621816635131836, "step": 4507} {"info/global_step": 4508, "train_info/time_within_train_step": 2.7583281993865967, "step": 4508} {"train_info/time_between_train_steps": 0.003601551055908203, "step": 4508} {"info/global_step": 4509, "train_info/time_within_train_step": 2.7568843364715576, "step": 4509} {"train_info/time_between_train_steps": 0.0036191940307617188, "step": 4509} {"info/global_step": 4510, "train_info/time_within_train_step": 2.757892370223999, "step": 4510} {"train_info/time_between_train_steps": 0.00353240966796875, "step": 4510} {"info/global_step": 4511, "train_info/time_within_train_step": 2.7577121257781982, "step": 4511} {"train_info/time_between_train_steps": 0.003622293472290039, "step": 4511} {"info/global_step": 4512, "train_info/time_within_train_step": 2.758535623550415, "step": 4512} {"train_info/time_between_train_steps": 0.003597259521484375, "step": 4512} {"info/global_step": 4513, "train_info/time_within_train_step": 2.757305383682251, "step": 4513} {"train_info/time_between_train_steps": 0.0037071704864501953, "step": 4513} {"info/global_step": 4514, "train_info/time_within_train_step": 2.758258581161499, "step": 4514} {"train_info/time_between_train_steps": 0.003657102584838867, "step": 4514} {"info/global_step": 4515, "train_info/time_within_train_step": 2.7569446563720703, "step": 4515} {"train_info/time_between_train_steps": 0.14613080024719238, "step": 4515} {"info/global_step": 4516, "train_info/time_within_train_step": 2.757615089416504, "step": 4516} {"train_info/time_between_train_steps": 0.003484010696411133, "step": 4516} {"info/global_step": 4517, "train_info/time_within_train_step": 2.7560529708862305, "step": 4517} {"train_info/time_between_train_steps": 0.0033960342407226562, "step": 4517} {"info/global_step": 4518, "train_info/time_within_train_step": 2.7561028003692627, "step": 4518} {"train_info/time_between_train_steps": 0.003505229949951172, "step": 4518} {"info/global_step": 4519, "train_info/time_within_train_step": 2.755507230758667, "step": 4519} {"train_info/time_between_train_steps": 0.003398895263671875, "step": 4519} {"info/global_step": 4520, "train_info/time_within_train_step": 2.7561230659484863, "step": 4520} {"train_info/time_between_train_steps": 0.003461599349975586, "step": 4520} {"info/global_step": 4521, "train_info/time_within_train_step": 2.7569282054901123, "step": 4521} {"train_info/time_between_train_steps": 0.003451824188232422, "step": 4521} {"info/global_step": 4522, "train_info/time_within_train_step": 2.7561817169189453, "step": 4522} {"train_info/time_between_train_steps": 0.0033621788024902344, "step": 4522} {"info/global_step": 4523, "train_info/time_within_train_step": 2.7567079067230225, "step": 4523} {"train_info/time_between_train_steps": 0.0035338401794433594, "step": 4523} {"info/global_step": 4524, "train_info/time_within_train_step": 2.7565131187438965, "step": 4524} {"train_info/time_between_train_steps": 0.0033774375915527344, "step": 4524} {"info/global_step": 4525, "train_info/time_within_train_step": 2.755403518676758, "step": 4525} {"train_info/time_between_train_steps": 0.0034437179565429688, "step": 4525} {"info/global_step": 4526, "train_info/time_within_train_step": 2.755905866622925, "step": 4526} {"train_info/time_between_train_steps": 0.0033867359161376953, "step": 4526} {"info/global_step": 4527, "train_info/time_within_train_step": 2.7563507556915283, "step": 4527} {"train_info/time_between_train_steps": 0.003494739532470703, "step": 4527} {"info/global_step": 4528, "train_info/time_within_train_step": 2.75594425201416, "step": 4528} {"train_info/time_between_train_steps": 0.003422975540161133, "step": 4528} {"info/global_step": 4529, "train_info/time_within_train_step": 2.758254289627075, "step": 4529} {"train_info/time_between_train_steps": 0.0034303665161132812, "step": 4529} {"info/global_step": 4530, "train_info/time_within_train_step": 2.779850721359253, "step": 4530} {"train_info/time_between_train_steps": 0.0034971237182617188, "step": 4530} {"info/global_step": 4531, "train_info/time_within_train_step": 2.7582993507385254, "step": 4531} {"train_info/time_between_train_steps": 0.003438711166381836, "step": 4531} {"info/global_step": 4532, "train_info/time_within_train_step": 2.7554144859313965, "step": 4532} {"train_info/time_between_train_steps": 0.0035021305084228516, "step": 4532} {"info/global_step": 4533, "train_info/time_within_train_step": 2.7563467025756836, "step": 4533} {"train_info/time_between_train_steps": 0.003512859344482422, "step": 4533} {"info/global_step": 4534, "train_info/time_within_train_step": 2.7557692527770996, "step": 4534} {"train_info/time_between_train_steps": 0.003494739532470703, "step": 4534} {"info/global_step": 4535, "train_info/time_within_train_step": 2.756904125213623, "step": 4535} {"train_info/time_between_train_steps": 0.003465890884399414, "step": 4535} {"info/global_step": 4536, "train_info/time_within_train_step": 3.044475555419922, "step": 4536} {"train_info/time_between_train_steps": 0.0033867359161376953, "step": 4536} {"info/global_step": 4537, "train_info/time_within_train_step": 2.7556211948394775, "step": 4537} {"train_info/time_between_train_steps": 0.003331422805786133, "step": 4537} {"info/global_step": 4538, "train_info/time_within_train_step": 2.7560482025146484, "step": 4538} {"train_info/time_between_train_steps": 0.0033843517303466797, "step": 4538} {"info/global_step": 4539, "train_info/time_within_train_step": 2.7555878162384033, "step": 4539} {"train_info/time_between_train_steps": 0.0033369064331054688, "step": 4539} {"info/global_step": 4540, "train_info/time_within_train_step": 2.756540060043335, "step": 4540} {"train_info/time_between_train_steps": 0.003389120101928711, "step": 4540} {"info/global_step": 4541, "train_info/time_within_train_step": 2.7557358741760254, "step": 4541} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 4541} {"info/global_step": 4542, "train_info/time_within_train_step": 2.756645441055298, "step": 4542} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 4542} {"info/global_step": 4543, "train_info/time_within_train_step": 2.755476236343384, "step": 4543} {"train_info/time_between_train_steps": 0.003179788589477539, "step": 4543} {"info/global_step": 4544, "train_info/time_within_train_step": 2.7551348209381104, "step": 4544} {"train_info/time_between_train_steps": 0.003155946731567383, "step": 4544} {"info/global_step": 4545, "train_info/time_within_train_step": 2.754608392715454, "step": 4545} {"train_info/time_between_train_steps": 0.0033102035522460938, "step": 4545} {"info/global_step": 4546, "train_info/time_within_train_step": 2.755084991455078, "step": 4546} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 4546} {"info/global_step": 4547, "train_info/time_within_train_step": 2.754361391067505, "step": 4547} {"train_info/time_between_train_steps": 0.003160715103149414, "step": 4547} {"info/global_step": 4548, "train_info/time_within_train_step": 2.7542755603790283, "step": 4548} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 4548} {"info/global_step": 4549, "train_info/time_within_train_step": 2.7553064823150635, "step": 4549} {"train_info/time_between_train_steps": 0.0032417774200439453, "step": 4549} {"info/global_step": 4550, "train_info/time_within_train_step": 2.7544045448303223, "step": 4550} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746579207, "_runtime": 13216}, "step": 4550} {"logs": {"train/loss": 3.7093, "train/learning_rate": 0.0003633333333333333, "train/epoch": 5.03, "_timestamp": 1746579207, "_runtime": 13216}, "step": 4550} {"train_info/time_between_train_steps": 0.013430595397949219, "step": 4550} {"info/global_step": 4551, "train_info/time_within_train_step": 2.754977226257324, "step": 4551} {"train_info/time_between_train_steps": 0.0033025741577148438, "step": 4551} {"info/global_step": 4552, "train_info/time_within_train_step": 2.755615472793579, "step": 4552} {"train_info/time_between_train_steps": 0.003326892852783203, "step": 4552} {"info/global_step": 4553, "train_info/time_within_train_step": 2.7564687728881836, "step": 4553} {"train_info/time_between_train_steps": 0.0033817291259765625, "step": 4553} {"info/global_step": 4554, "train_info/time_within_train_step": 2.7566258907318115, "step": 4554} {"train_info/time_between_train_steps": 0.0033164024353027344, "step": 4554} {"info/global_step": 4555, "train_info/time_within_train_step": 2.7567713260650635, "step": 4555} {"train_info/time_between_train_steps": 0.003339529037475586, "step": 4555} {"info/global_step": 4556, "train_info/time_within_train_step": 2.756749153137207, "step": 4556} {"train_info/time_between_train_steps": 0.0034127235412597656, "step": 4556} {"info/global_step": 4557, "train_info/time_within_train_step": 2.756472587585449, "step": 4557} {"train_info/time_between_train_steps": 0.0033135414123535156, "step": 4557} {"info/global_step": 4558, "train_info/time_within_train_step": 2.7565579414367676, "step": 4558} {"train_info/time_between_train_steps": 0.0033032894134521484, "step": 4558} {"info/global_step": 4559, "train_info/time_within_train_step": 2.7562460899353027, "step": 4559} {"train_info/time_between_train_steps": 0.003313302993774414, "step": 4559} {"info/global_step": 4560, "train_info/time_within_train_step": 2.7570130825042725, "step": 4560} {"train_info/time_between_train_steps": 0.0033020973205566406, "step": 4560} {"info/global_step": 4561, "train_info/time_within_train_step": 2.755556106567383, "step": 4561} {"train_info/time_between_train_steps": 0.003320932388305664, "step": 4561} {"info/global_step": 4562, "train_info/time_within_train_step": 2.7556512355804443, "step": 4562} {"train_info/time_between_train_steps": 0.0032842159271240234, "step": 4562} {"info/global_step": 4563, "train_info/time_within_train_step": 2.756523370742798, "step": 4563} {"train_info/time_between_train_steps": 0.0033082962036132812, "step": 4563} {"info/global_step": 4564, "train_info/time_within_train_step": 2.7563066482543945, "step": 4564} {"train_info/time_between_train_steps": 0.0033464431762695312, "step": 4564} {"info/global_step": 4565, "train_info/time_within_train_step": 2.758270740509033, "step": 4565} {"train_info/time_between_train_steps": 0.0033135414123535156, "step": 4565} {"info/global_step": 4566, "train_info/time_within_train_step": 2.756577491760254, "step": 4566} {"train_info/time_between_train_steps": 0.00334930419921875, "step": 4566} {"info/global_step": 4567, "train_info/time_within_train_step": 2.756260395050049, "step": 4567} {"train_info/time_between_train_steps": 0.0032639503479003906, "step": 4567} {"info/global_step": 4568, "train_info/time_within_train_step": 2.7566800117492676, "step": 4568} {"train_info/time_between_train_steps": 0.003281116485595703, "step": 4568} {"info/global_step": 4569, "train_info/time_within_train_step": 2.755289077758789, "step": 4569} {"train_info/time_between_train_steps": 0.0032660961151123047, "step": 4569} {"info/global_step": 4570, "train_info/time_within_train_step": 2.756068706512451, "step": 4570} {"train_info/time_between_train_steps": 0.0034637451171875, "step": 4570} {"info/global_step": 4571, "train_info/time_within_train_step": 2.7562997341156006, "step": 4571} {"train_info/time_between_train_steps": 0.0033893585205078125, "step": 4571} {"info/global_step": 4572, "train_info/time_within_train_step": 2.755986213684082, "step": 4572} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 4572} {"info/global_step": 4573, "train_info/time_within_train_step": 2.755230188369751, "step": 4573} {"train_info/time_between_train_steps": 0.003204345703125, "step": 4573} {"info/global_step": 4574, "train_info/time_within_train_step": 2.7548611164093018, "step": 4574} {"train_info/time_between_train_steps": 0.0032036304473876953, "step": 4574} {"info/global_step": 4575, "train_info/time_within_train_step": 2.7554807662963867, "step": 4575} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 4575} {"info/global_step": 4576, "train_info/time_within_train_step": 2.7549333572387695, "step": 4576} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 4576} {"info/global_step": 4577, "train_info/time_within_train_step": 2.755258321762085, "step": 4577} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 4577} {"info/global_step": 4578, "train_info/time_within_train_step": 2.8793768882751465, "step": 4578} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 4578} {"info/global_step": 4579, "train_info/time_within_train_step": 2.754333019256592, "step": 4579} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 4579} {"info/global_step": 4580, "train_info/time_within_train_step": 2.7546112537384033, "step": 4580} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 4580} {"info/global_step": 4581, "train_info/time_within_train_step": 2.753363609313965, "step": 4581} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 4581} {"info/global_step": 4582, "train_info/time_within_train_step": 2.7545342445373535, "step": 4582} {"train_info/time_between_train_steps": 0.00328826904296875, "step": 4582} {"info/global_step": 4583, "train_info/time_within_train_step": 2.7550644874572754, "step": 4583} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 4583} {"info/global_step": 4584, "train_info/time_within_train_step": 2.7560150623321533, "step": 4584} {"train_info/time_between_train_steps": 0.003142118453979492, "step": 4584} {"info/global_step": 4585, "train_info/time_within_train_step": 2.7559821605682373, "step": 4585} {"train_info/time_between_train_steps": 0.0031843185424804688, "step": 4585} {"info/global_step": 4586, "train_info/time_within_train_step": 2.755002021789551, "step": 4586} {"train_info/time_between_train_steps": 0.003210306167602539, "step": 4586} {"info/global_step": 4587, "train_info/time_within_train_step": 2.7546682357788086, "step": 4587} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 4587} {"info/global_step": 4588, "train_info/time_within_train_step": 2.754556655883789, "step": 4588} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 4588} {"info/global_step": 4589, "train_info/time_within_train_step": 2.7546885013580322, "step": 4589} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 4589} {"info/global_step": 4590, "train_info/time_within_train_step": 2.7550606727600098, "step": 4590} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 4590} {"info/global_step": 4591, "train_info/time_within_train_step": 2.9882004261016846, "step": 4591} {"train_info/time_between_train_steps": 0.003145456314086914, "step": 4591} {"info/global_step": 4592, "train_info/time_within_train_step": 2.753103017807007, "step": 4592} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 4592} {"info/global_step": 4593, "train_info/time_within_train_step": 2.754535436630249, "step": 4593} {"train_info/time_between_train_steps": 0.0032808780670166016, "step": 4593} {"info/global_step": 4594, "train_info/time_within_train_step": 2.754446268081665, "step": 4594} {"train_info/time_between_train_steps": 0.003233671188354492, "step": 4594} {"info/global_step": 4595, "train_info/time_within_train_step": 2.760162830352783, "step": 4595} {"train_info/time_between_train_steps": 0.0031843185424804688, "step": 4595} {"info/global_step": 4596, "train_info/time_within_train_step": 2.7548892498016357, "step": 4596} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 4596} {"info/global_step": 4597, "train_info/time_within_train_step": 2.754855155944824, "step": 4597} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 4597} {"info/global_step": 4598, "train_info/time_within_train_step": 2.7535274028778076, "step": 4598} {"train_info/time_between_train_steps": 0.003151416778564453, "step": 4598} {"info/global_step": 4599, "train_info/time_within_train_step": 2.7554500102996826, "step": 4599} {"train_info/time_between_train_steps": 0.0032672882080078125, "step": 4599} {"info/global_step": 4600, "train_info/time_within_train_step": 2.756676197052002, "step": 4600} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746579346, "_runtime": 13355}, "step": 4600} {"logs": {"train/loss": 3.7088, "train/learning_rate": 0.00035999999999999997, "train/epoch": 5.03, "_timestamp": 1746579346, "_runtime": 13355}, "step": 4600} {"train_info/time_between_train_steps": 18.370896100997925, "step": 4600} {"info/global_step": 4601, "train_info/time_within_train_step": 2.5334033966064453, "step": 4601} {"train_info/time_between_train_steps": 0.0033609867095947266, "step": 4601} {"info/global_step": 4602, "train_info/time_within_train_step": 2.5812275409698486, "step": 4602} {"train_info/time_between_train_steps": 0.003415822982788086, "step": 4602} {"info/global_step": 4603, "train_info/time_within_train_step": 2.7041571140289307, "step": 4603} {"train_info/time_between_train_steps": 0.003321409225463867, "step": 4603} {"info/global_step": 4604, "train_info/time_within_train_step": 2.7463316917419434, "step": 4604} {"train_info/time_between_train_steps": 0.0033164024353027344, "step": 4604} {"info/global_step": 4605, "train_info/time_within_train_step": 2.7527689933776855, "step": 4605} {"train_info/time_between_train_steps": 0.0033121109008789062, "step": 4605} {"info/global_step": 4606, "train_info/time_within_train_step": 2.755810260772705, "step": 4606} {"train_info/time_between_train_steps": 0.0033028125762939453, "step": 4606} {"info/global_step": 4607, "train_info/time_within_train_step": 2.7562296390533447, "step": 4607} {"train_info/time_between_train_steps": 0.003307819366455078, "step": 4607} {"info/global_step": 4608, "train_info/time_within_train_step": 2.7566819190979004, "step": 4608} {"train_info/time_between_train_steps": 0.0032999515533447266, "step": 4608} {"info/global_step": 4609, "train_info/time_within_train_step": 2.756693124771118, "step": 4609} {"train_info/time_between_train_steps": 0.003309011459350586, "step": 4609} {"info/global_step": 4610, "train_info/time_within_train_step": 2.756639242172241, "step": 4610} {"train_info/time_between_train_steps": 0.003354310989379883, "step": 4610} {"info/global_step": 4611, "train_info/time_within_train_step": 2.755570650100708, "step": 4611} {"train_info/time_between_train_steps": 0.0033004283905029297, "step": 4611} {"info/global_step": 4612, "train_info/time_within_train_step": 2.7547717094421387, "step": 4612} {"train_info/time_between_train_steps": 0.0033195018768310547, "step": 4612} {"info/global_step": 4613, "train_info/time_within_train_step": 2.7569453716278076, "step": 4613} {"train_info/time_between_train_steps": 0.0033261775970458984, "step": 4613} {"info/global_step": 4614, "train_info/time_within_train_step": 2.756437301635742, "step": 4614} {"train_info/time_between_train_steps": 0.003337860107421875, "step": 4614} {"info/global_step": 4615, "train_info/time_within_train_step": 2.7569291591644287, "step": 4615} {"train_info/time_between_train_steps": 0.003289461135864258, "step": 4615} {"info/global_step": 4616, "train_info/time_within_train_step": 2.7568306922912598, "step": 4616} {"train_info/time_between_train_steps": 0.0033185482025146484, "step": 4616} {"info/global_step": 4617, "train_info/time_within_train_step": 2.7574939727783203, "step": 4617} {"train_info/time_between_train_steps": 0.003316164016723633, "step": 4617} {"info/global_step": 4618, "train_info/time_within_train_step": 2.7569119930267334, "step": 4618} {"train_info/time_between_train_steps": 0.0033020973205566406, "step": 4618} {"info/global_step": 4619, "train_info/time_within_train_step": 2.7575924396514893, "step": 4619} {"train_info/time_between_train_steps": 0.003344297409057617, "step": 4619} {"info/global_step": 4620, "train_info/time_within_train_step": 2.7565550804138184, "step": 4620} {"train_info/time_between_train_steps": 0.0031516551971435547, "step": 4620} {"info/global_step": 4621, "train_info/time_within_train_step": 2.756366491317749, "step": 4621} {"train_info/time_between_train_steps": 0.003177165985107422, "step": 4621} {"info/global_step": 4622, "train_info/time_within_train_step": 2.755504846572876, "step": 4622} {"train_info/time_between_train_steps": 0.003147125244140625, "step": 4622} {"info/global_step": 4623, "train_info/time_within_train_step": 2.7560441493988037, "step": 4623} {"train_info/time_between_train_steps": 0.003162384033203125, "step": 4623} {"info/global_step": 4624, "train_info/time_within_train_step": 2.7551307678222656, "step": 4624} {"train_info/time_between_train_steps": 0.003304004669189453, "step": 4624} {"info/global_step": 4625, "train_info/time_within_train_step": 2.7557384967803955, "step": 4625} {"train_info/time_between_train_steps": 0.0031621456146240234, "step": 4625} {"info/global_step": 4626, "train_info/time_within_train_step": 2.755133867263794, "step": 4626} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 4626} {"info/global_step": 4627, "train_info/time_within_train_step": 2.7549636363983154, "step": 4627} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 4627} {"info/global_step": 4628, "train_info/time_within_train_step": 2.7543599605560303, "step": 4628} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 4628} {"info/global_step": 4629, "train_info/time_within_train_step": 2.755596160888672, "step": 4629} {"train_info/time_between_train_steps": 0.0031461715698242188, "step": 4629} {"info/global_step": 4630, "train_info/time_within_train_step": 2.7551627159118652, "step": 4630} {"train_info/time_between_train_steps": 0.003156423568725586, "step": 4630} {"info/global_step": 4631, "train_info/time_within_train_step": 2.7555689811706543, "step": 4631} {"train_info/time_between_train_steps": 0.0031540393829345703, "step": 4631} {"info/global_step": 4632, "train_info/time_within_train_step": 2.754969596862793, "step": 4632} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 4632} {"info/global_step": 4633, "train_info/time_within_train_step": 2.7558014392852783, "step": 4633} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 4633} {"info/global_step": 4634, "train_info/time_within_train_step": 2.755242109298706, "step": 4634} {"train_info/time_between_train_steps": 0.003132343292236328, "step": 4634} {"info/global_step": 4635, "train_info/time_within_train_step": 2.756152391433716, "step": 4635} {"train_info/time_between_train_steps": 0.003187417984008789, "step": 4635} {"info/global_step": 4636, "train_info/time_within_train_step": 2.754415512084961, "step": 4636} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 4636} {"info/global_step": 4637, "train_info/time_within_train_step": 2.7544994354248047, "step": 4637} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 4637} {"info/global_step": 4638, "train_info/time_within_train_step": 2.7554948329925537, "step": 4638} {"train_info/time_between_train_steps": 0.0031375885009765625, "step": 4638} {"info/global_step": 4639, "train_info/time_within_train_step": 2.754692316055298, "step": 4639} {"train_info/time_between_train_steps": 0.003210783004760742, "step": 4639} {"info/global_step": 4640, "train_info/time_within_train_step": 2.7552788257598877, "step": 4640} {"train_info/time_between_train_steps": 0.1234440803527832, "step": 4640} {"info/global_step": 4641, "train_info/time_within_train_step": 2.7557270526885986, "step": 4641} {"train_info/time_between_train_steps": 0.0031604766845703125, "step": 4641} {"info/global_step": 4642, "train_info/time_within_train_step": 2.755070209503174, "step": 4642} {"train_info/time_between_train_steps": 0.003126859664916992, "step": 4642} {"info/global_step": 4643, "train_info/time_within_train_step": 2.7543160915374756, "step": 4643} {"train_info/time_between_train_steps": 0.003163576126098633, "step": 4643} {"info/global_step": 4644, "train_info/time_within_train_step": 2.753122568130493, "step": 4644} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 4644} {"info/global_step": 4645, "train_info/time_within_train_step": 2.7543070316314697, "step": 4645} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 4645} {"info/global_step": 4646, "train_info/time_within_train_step": 2.7540059089660645, "step": 4646} {"train_info/time_between_train_steps": 0.0032205581665039062, "step": 4646} {"info/global_step": 4647, "train_info/time_within_train_step": 2.7545340061187744, "step": 4647} {"train_info/time_between_train_steps": 0.003242015838623047, "step": 4647} {"info/global_step": 4648, "train_info/time_within_train_step": 2.752548933029175, "step": 4648} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 4648} {"info/global_step": 4649, "train_info/time_within_train_step": 2.754528284072876, "step": 4649} {"train_info/time_between_train_steps": 0.0031692981719970703, "step": 4649} {"info/global_step": 4650, "train_info/time_within_train_step": 2.754802703857422, "step": 4650} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746579502, "_runtime": 13511}, "step": 4650} {"logs": {"train/loss": 3.7089, "train/learning_rate": 0.00035666666666666664, "train/epoch": 5.04, "_timestamp": 1746579502, "_runtime": 13511}, "step": 4650} {"train_info/time_between_train_steps": 0.01410531997680664, "step": 4650} {"info/global_step": 4651, "train_info/time_within_train_step": 2.754887104034424, "step": 4651} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 4651} {"info/global_step": 4652, "train_info/time_within_train_step": 2.7547006607055664, "step": 4652} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 4652} {"info/global_step": 4653, "train_info/time_within_train_step": 2.7546563148498535, "step": 4653} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 4653} {"info/global_step": 4654, "train_info/time_within_train_step": 2.754542589187622, "step": 4654} {"train_info/time_between_train_steps": 0.0031592845916748047, "step": 4654} {"info/global_step": 4655, "train_info/time_within_train_step": 2.7542762756347656, "step": 4655} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 4655} {"info/global_step": 4656, "train_info/time_within_train_step": 2.7541611194610596, "step": 4656} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 4656} {"info/global_step": 4657, "train_info/time_within_train_step": 2.7543625831604004, "step": 4657} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 4657} {"info/global_step": 4658, "train_info/time_within_train_step": 2.7538042068481445, "step": 4658} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 4658} {"info/global_step": 4659, "train_info/time_within_train_step": 2.7537357807159424, "step": 4659} {"train_info/time_between_train_steps": 0.0031843185424804688, "step": 4659} {"info/global_step": 4660, "train_info/time_within_train_step": 2.7538864612579346, "step": 4660} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 4660} {"info/global_step": 4661, "train_info/time_within_train_step": 2.7534897327423096, "step": 4661} {"train_info/time_between_train_steps": 0.0031502246856689453, "step": 4661} {"info/global_step": 4662, "train_info/time_within_train_step": 2.754019021987915, "step": 4662} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 4662} {"info/global_step": 4663, "train_info/time_within_train_step": 2.753871440887451, "step": 4663} {"train_info/time_between_train_steps": 0.0031516551971435547, "step": 4663} {"info/global_step": 4664, "train_info/time_within_train_step": 2.7538130283355713, "step": 4664} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 4664} {"info/global_step": 4665, "train_info/time_within_train_step": 2.753190755844116, "step": 4665} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 4665} {"info/global_step": 4666, "train_info/time_within_train_step": 2.7535383701324463, "step": 4666} {"train_info/time_between_train_steps": 0.003151416778564453, "step": 4666} {"info/global_step": 4667, "train_info/time_within_train_step": 2.7545087337493896, "step": 4667} {"train_info/time_between_train_steps": 0.003192901611328125, "step": 4667} {"info/global_step": 4668, "train_info/time_within_train_step": 2.7544808387756348, "step": 4668} {"train_info/time_between_train_steps": 0.0031516551971435547, "step": 4668} {"info/global_step": 4669, "train_info/time_within_train_step": 2.754148483276367, "step": 4669} {"train_info/time_between_train_steps": 0.0031898021697998047, "step": 4669} {"info/global_step": 4670, "train_info/time_within_train_step": 2.991224765777588, "step": 4670} {"train_info/time_between_train_steps": 0.0031538009643554688, "step": 4670} {"info/global_step": 4671, "train_info/time_within_train_step": 2.7534525394439697, "step": 4671} {"train_info/time_between_train_steps": 0.0031502246856689453, "step": 4671} {"info/global_step": 4672, "train_info/time_within_train_step": 2.753779411315918, "step": 4672} {"train_info/time_between_train_steps": 0.003132343292236328, "step": 4672} {"info/global_step": 4673, "train_info/time_within_train_step": 2.7541377544403076, "step": 4673} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 4673} {"info/global_step": 4674, "train_info/time_within_train_step": 2.754629373550415, "step": 4674} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 4674} {"info/global_step": 4675, "train_info/time_within_train_step": 2.753812074661255, "step": 4675} {"train_info/time_between_train_steps": 0.003132343292236328, "step": 4675} {"info/global_step": 4676, "train_info/time_within_train_step": 2.7546849250793457, "step": 4676} {"train_info/time_between_train_steps": 0.0031981468200683594, "step": 4676} {"info/global_step": 4677, "train_info/time_within_train_step": 2.754100799560547, "step": 4677} {"train_info/time_between_train_steps": 0.0031282901763916016, "step": 4677} {"info/global_step": 4678, "train_info/time_within_train_step": 2.7541866302490234, "step": 4678} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 4678} {"info/global_step": 4679, "train_info/time_within_train_step": 2.7530758380889893, "step": 4679} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 4679} {"info/global_step": 4680, "train_info/time_within_train_step": 2.753748655319214, "step": 4680} {"train_info/time_between_train_steps": 0.0031380653381347656, "step": 4680} {"info/global_step": 4681, "train_info/time_within_train_step": 2.7545363903045654, "step": 4681} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 4681} {"info/global_step": 4682, "train_info/time_within_train_step": 2.7539408206939697, "step": 4682} {"train_info/time_between_train_steps": 0.003177165985107422, "step": 4682} {"info/global_step": 4683, "train_info/time_within_train_step": 2.754384994506836, "step": 4683} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 4683} {"info/global_step": 4684, "train_info/time_within_train_step": 2.7536659240722656, "step": 4684} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 4684} {"info/global_step": 4685, "train_info/time_within_train_step": 2.7549808025360107, "step": 4685} {"train_info/time_between_train_steps": 0.0032324790954589844, "step": 4685} {"info/global_step": 4686, "train_info/time_within_train_step": 2.7544753551483154, "step": 4686} {"train_info/time_between_train_steps": 0.003136157989501953, "step": 4686} {"info/global_step": 4687, "train_info/time_within_train_step": 2.754542350769043, "step": 4687} {"train_info/time_between_train_steps": 0.003155231475830078, "step": 4687} {"info/global_step": 4688, "train_info/time_within_train_step": 2.753648519515991, "step": 4688} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 4688} {"info/global_step": 4689, "train_info/time_within_train_step": 2.7522075176239014, "step": 4689} {"train_info/time_between_train_steps": 0.0031669139862060547, "step": 4689} {"info/global_step": 4690, "train_info/time_within_train_step": 2.753026247024536, "step": 4690} {"train_info/time_between_train_steps": 0.003190755844116211, "step": 4690} {"info/global_step": 4691, "train_info/time_within_train_step": 2.7534637451171875, "step": 4691} {"train_info/time_between_train_steps": 0.003227710723876953, "step": 4691} {"info/global_step": 4692, "train_info/time_within_train_step": 2.7540383338928223, "step": 4692} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 4692} {"info/global_step": 4693, "train_info/time_within_train_step": 2.75388503074646, "step": 4693} {"train_info/time_between_train_steps": 0.0032167434692382812, "step": 4693} {"info/global_step": 4694, "train_info/time_within_train_step": 2.7539355754852295, "step": 4694} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 4694} {"info/global_step": 4695, "train_info/time_within_train_step": 2.7544353008270264, "step": 4695} {"train_info/time_between_train_steps": 0.0032215118408203125, "step": 4695} {"info/global_step": 4696, "train_info/time_within_train_step": 2.754079580307007, "step": 4696} {"train_info/time_between_train_steps": 0.0032258033752441406, "step": 4696} {"info/global_step": 4697, "train_info/time_within_train_step": 2.753182888031006, "step": 4697} {"train_info/time_between_train_steps": 0.0031630992889404297, "step": 4697} {"info/global_step": 4698, "train_info/time_within_train_step": 2.753397226333618, "step": 4698} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 4698} {"info/global_step": 4699, "train_info/time_within_train_step": 2.7538819313049316, "step": 4699} {"train_info/time_between_train_steps": 0.0031621456146240234, "step": 4699} {"info/global_step": 4700, "train_info/time_within_train_step": 2.7540528774261475, "step": 4700} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746579641, "_runtime": 13650}, "step": 4700} {"logs": {"train/loss": 3.6861, "train/learning_rate": 0.0003533333333333333, "train/epoch": 5.04, "_timestamp": 1746579641, "_runtime": 13650}, "step": 4700} {"train_info/time_between_train_steps": 0.0092926025390625, "step": 4700} {"info/global_step": 4701, "train_info/time_within_train_step": 2.7529456615448, "step": 4701} {"train_info/time_between_train_steps": 0.003135204315185547, "step": 4701} {"info/global_step": 4702, "train_info/time_within_train_step": 2.7547810077667236, "step": 4702} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 4702} {"info/global_step": 4703, "train_info/time_within_train_step": 2.877793788909912, "step": 4703} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 4703} {"info/global_step": 4704, "train_info/time_within_train_step": 2.7546682357788086, "step": 4704} {"train_info/time_between_train_steps": 0.0031595230102539062, "step": 4704} {"info/global_step": 4705, "train_info/time_within_train_step": 2.7537951469421387, "step": 4705} {"train_info/time_between_train_steps": 0.0032320022583007812, "step": 4705} {"info/global_step": 4706, "train_info/time_within_train_step": 2.754067897796631, "step": 4706} {"train_info/time_between_train_steps": 0.0032281875610351562, "step": 4706} {"info/global_step": 4707, "train_info/time_within_train_step": 2.755805253982544, "step": 4707} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 4707} {"info/global_step": 4708, "train_info/time_within_train_step": 2.7542343139648438, "step": 4708} {"train_info/time_between_train_steps": 0.0031621456146240234, "step": 4708} {"info/global_step": 4709, "train_info/time_within_train_step": 2.7524049282073975, "step": 4709} {"train_info/time_between_train_steps": 0.003159046173095703, "step": 4709} {"info/global_step": 4710, "train_info/time_within_train_step": 2.7538392543792725, "step": 4710} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 4710} {"info/global_step": 4711, "train_info/time_within_train_step": 2.7530245780944824, "step": 4711} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 4711} {"info/global_step": 4712, "train_info/time_within_train_step": 2.7532379627227783, "step": 4712} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 4712} {"info/global_step": 4713, "train_info/time_within_train_step": 2.7534756660461426, "step": 4713} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 4713} {"info/global_step": 4714, "train_info/time_within_train_step": 2.75260329246521, "step": 4714} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 4714} {"info/global_step": 4715, "train_info/time_within_train_step": 2.753643751144409, "step": 4715} {"train_info/time_between_train_steps": 0.003187417984008789, "step": 4715} {"info/global_step": 4716, "train_info/time_within_train_step": 2.7534995079040527, "step": 4716} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 4716} {"info/global_step": 4717, "train_info/time_within_train_step": 2.7541041374206543, "step": 4717} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 4717} {"info/global_step": 4718, "train_info/time_within_train_step": 2.7536773681640625, "step": 4718} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 4718} {"info/global_step": 4719, "train_info/time_within_train_step": 2.755051851272583, "step": 4719} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 4719} {"info/global_step": 4720, "train_info/time_within_train_step": 2.7536628246307373, "step": 4720} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 4720} {"info/global_step": 4721, "train_info/time_within_train_step": 2.7553293704986572, "step": 4721} {"train_info/time_between_train_steps": 0.0031614303588867188, "step": 4721} {"info/global_step": 4722, "train_info/time_within_train_step": 2.753380298614502, "step": 4722} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 4722} {"info/global_step": 4723, "train_info/time_within_train_step": 2.754253387451172, "step": 4723} {"train_info/time_between_train_steps": 0.0031692981719970703, "step": 4723} {"info/global_step": 4724, "train_info/time_within_train_step": 2.7535533905029297, "step": 4724} {"train_info/time_between_train_steps": 0.0031464099884033203, "step": 4724} {"info/global_step": 4725, "train_info/time_within_train_step": 2.754257917404175, "step": 4725} {"train_info/time_between_train_steps": 0.0031621456146240234, "step": 4725} {"info/global_step": 4726, "train_info/time_within_train_step": 2.9920756816864014, "step": 4726} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 4726} {"info/global_step": 4727, "train_info/time_within_train_step": 2.754070520401001, "step": 4727} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 4727} {"info/global_step": 4728, "train_info/time_within_train_step": 2.7532804012298584, "step": 4728} {"train_info/time_between_train_steps": 0.0031380653381347656, "step": 4728} {"info/global_step": 4729, "train_info/time_within_train_step": 2.7539703845977783, "step": 4729} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 4729} {"info/global_step": 4730, "train_info/time_within_train_step": 2.753740072250366, "step": 4730} {"train_info/time_between_train_steps": 0.003200054168701172, "step": 4730} {"info/global_step": 4731, "train_info/time_within_train_step": 2.7529964447021484, "step": 4731} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 4731} {"info/global_step": 4732, "train_info/time_within_train_step": 2.7541656494140625, "step": 4732} {"train_info/time_between_train_steps": 0.0031571388244628906, "step": 4732} {"info/global_step": 4733, "train_info/time_within_train_step": 2.7539074420928955, "step": 4733} {"train_info/time_between_train_steps": 0.0031681060791015625, "step": 4733} {"info/global_step": 4734, "train_info/time_within_train_step": 2.754509210586548, "step": 4734} {"train_info/time_between_train_steps": 0.0031843185424804688, "step": 4734} {"info/global_step": 4735, "train_info/time_within_train_step": 2.7537074089050293, "step": 4735} {"train_info/time_between_train_steps": 0.0031795501708984375, "step": 4735} {"info/global_step": 4736, "train_info/time_within_train_step": 2.7531561851501465, "step": 4736} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 4736} {"info/global_step": 4737, "train_info/time_within_train_step": 2.7537789344787598, "step": 4737} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 4737} {"info/global_step": 4738, "train_info/time_within_train_step": 2.7536189556121826, "step": 4738} {"train_info/time_between_train_steps": 0.003151416778564453, "step": 4738} {"info/global_step": 4739, "train_info/time_within_train_step": 2.7530605792999268, "step": 4739} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 4739} {"info/global_step": 4740, "train_info/time_within_train_step": 2.7541329860687256, "step": 4740} {"train_info/time_between_train_steps": 0.0032176971435546875, "step": 4740} {"info/global_step": 4741, "train_info/time_within_train_step": 2.7529821395874023, "step": 4741} {"train_info/time_between_train_steps": 0.003102540969848633, "step": 4741} {"info/global_step": 4742, "train_info/time_within_train_step": 2.753810405731201, "step": 4742} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 4742} {"info/global_step": 4743, "train_info/time_within_train_step": 2.752825975418091, "step": 4743} {"train_info/time_between_train_steps": 0.0031540393829345703, "step": 4743} {"info/global_step": 4744, "train_info/time_within_train_step": 2.7525506019592285, "step": 4744} {"train_info/time_between_train_steps": 0.0031456947326660156, "step": 4744} {"info/global_step": 4745, "train_info/time_within_train_step": 2.753871202468872, "step": 4745} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 4745} {"info/global_step": 4746, "train_info/time_within_train_step": 2.754894733428955, "step": 4746} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 4746} {"info/global_step": 4747, "train_info/time_within_train_step": 2.754420042037964, "step": 4747} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 4747} {"info/global_step": 4748, "train_info/time_within_train_step": 3.3470585346221924, "step": 4748} {"train_info/time_between_train_steps": 0.003199338912963867, "step": 4748} {"info/global_step": 4749, "train_info/time_within_train_step": 2.754096746444702, "step": 4749} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 4749} {"info/global_step": 4750, "train_info/time_within_train_step": 2.7545361518859863, "step": 4750} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746579780, "_runtime": 13789}, "step": 4750} {"logs": {"train/loss": 3.684, "train/learning_rate": 0.00035, "train/epoch": 5.05, "_timestamp": 1746579780, "_runtime": 13789}, "step": 4750} {"train_info/time_between_train_steps": 0.006754875183105469, "step": 4750} {"info/global_step": 4751, "train_info/time_within_train_step": 2.7546403408050537, "step": 4751} {"train_info/time_between_train_steps": 0.0031311511993408203, "step": 4751} {"info/global_step": 4752, "train_info/time_within_train_step": 2.7548937797546387, "step": 4752} {"train_info/time_between_train_steps": 0.0031681060791015625, "step": 4752} {"info/global_step": 4753, "train_info/time_within_train_step": 2.755200147628784, "step": 4753} {"train_info/time_between_train_steps": 0.0031991004943847656, "step": 4753} {"info/global_step": 4754, "train_info/time_within_train_step": 2.7538864612579346, "step": 4754} {"train_info/time_between_train_steps": 0.003153085708618164, "step": 4754} {"info/global_step": 4755, "train_info/time_within_train_step": 2.7526097297668457, "step": 4755} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 4755} {"info/global_step": 4756, "train_info/time_within_train_step": 2.753258466720581, "step": 4756} {"train_info/time_between_train_steps": 0.0032095909118652344, "step": 4756} {"info/global_step": 4757, "train_info/time_within_train_step": 2.7535178661346436, "step": 4757} {"train_info/time_between_train_steps": 0.0031423568725585938, "step": 4757} {"info/global_step": 4758, "train_info/time_within_train_step": 2.7533352375030518, "step": 4758} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 4758} {"info/global_step": 4759, "train_info/time_within_train_step": 2.7532906532287598, "step": 4759} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 4759} {"info/global_step": 4760, "train_info/time_within_train_step": 2.7537357807159424, "step": 4760} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 4760} {"info/global_step": 4761, "train_info/time_within_train_step": 2.7547178268432617, "step": 4761} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 4761} {"info/global_step": 4762, "train_info/time_within_train_step": 2.753875494003296, "step": 4762} {"train_info/time_between_train_steps": 0.003134489059448242, "step": 4762} {"info/global_step": 4763, "train_info/time_within_train_step": 2.7542219161987305, "step": 4763} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 4763} {"info/global_step": 4764, "train_info/time_within_train_step": 2.7540690898895264, "step": 4764} {"train_info/time_between_train_steps": 0.003652811050415039, "step": 4764} {"info/global_step": 4765, "train_info/time_within_train_step": 2.7535784244537354, "step": 4765} {"train_info/time_between_train_steps": 0.09369087219238281, "step": 4765} {"info/global_step": 4766, "train_info/time_within_train_step": 2.9867427349090576, "step": 4766} {"train_info/time_between_train_steps": 0.003198385238647461, "step": 4766} {"info/global_step": 4767, "train_info/time_within_train_step": 2.7533936500549316, "step": 4767} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 4767} {"info/global_step": 4768, "train_info/time_within_train_step": 2.7538723945617676, "step": 4768} {"train_info/time_between_train_steps": 0.003125905990600586, "step": 4768} {"info/global_step": 4769, "train_info/time_within_train_step": 2.7541487216949463, "step": 4769} {"train_info/time_between_train_steps": 0.0034198760986328125, "step": 4769} {"info/global_step": 4770, "train_info/time_within_train_step": 2.753614664077759, "step": 4770} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 4770} {"info/global_step": 4771, "train_info/time_within_train_step": 2.7546660900115967, "step": 4771} {"train_info/time_between_train_steps": 0.0031681060791015625, "step": 4771} {"info/global_step": 4772, "train_info/time_within_train_step": 2.75370192527771, "step": 4772} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 4772} {"info/global_step": 4773, "train_info/time_within_train_step": 2.7539100646972656, "step": 4773} {"train_info/time_between_train_steps": 0.003193378448486328, "step": 4773} {"info/global_step": 4774, "train_info/time_within_train_step": 2.7535266876220703, "step": 4774} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 4774} {"info/global_step": 4775, "train_info/time_within_train_step": 2.754239797592163, "step": 4775} {"train_info/time_between_train_steps": 0.0032165050506591797, "step": 4775} {"info/global_step": 4776, "train_info/time_within_train_step": 2.7545011043548584, "step": 4776} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 4776} {"info/global_step": 4777, "train_info/time_within_train_step": 2.7521824836730957, "step": 4777} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 4777} {"info/global_step": 4778, "train_info/time_within_train_step": 2.7541680335998535, "step": 4778} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 4778} {"info/global_step": 4779, "train_info/time_within_train_step": 2.7529759407043457, "step": 4779} {"train_info/time_between_train_steps": 0.0031280517578125, "step": 4779} {"info/global_step": 4780, "train_info/time_within_train_step": 2.7538557052612305, "step": 4780} {"train_info/time_between_train_steps": 0.003215789794921875, "step": 4780} {"info/global_step": 4781, "train_info/time_within_train_step": 2.7531747817993164, "step": 4781} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 4781} {"info/global_step": 4782, "train_info/time_within_train_step": 2.754068374633789, "step": 4782} {"train_info/time_between_train_steps": 0.003147125244140625, "step": 4782} {"info/global_step": 4783, "train_info/time_within_train_step": 2.7536098957061768, "step": 4783} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 4783} {"info/global_step": 4784, "train_info/time_within_train_step": 2.7765021324157715, "step": 4784} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 4784} {"info/global_step": 4785, "train_info/time_within_train_step": 2.755297899246216, "step": 4785} {"train_info/time_between_train_steps": 0.003155946731567383, "step": 4785} {"info/global_step": 4786, "train_info/time_within_train_step": 2.7534520626068115, "step": 4786} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 4786} {"info/global_step": 4787, "train_info/time_within_train_step": 2.7533507347106934, "step": 4787} {"train_info/time_between_train_steps": 0.0031571388244628906, "step": 4787} {"info/global_step": 4788, "train_info/time_within_train_step": 2.752880334854126, "step": 4788} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 4788} {"info/global_step": 4789, "train_info/time_within_train_step": 2.7562668323516846, "step": 4789} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 4789} {"info/global_step": 4790, "train_info/time_within_train_step": 2.755007266998291, "step": 4790} {"train_info/time_between_train_steps": 0.0031728744506835938, "step": 4790} {"info/global_step": 4791, "train_info/time_within_train_step": 2.7546887397766113, "step": 4791} {"train_info/time_between_train_steps": 0.0032334327697753906, "step": 4791} {"info/global_step": 4792, "train_info/time_within_train_step": 2.7524218559265137, "step": 4792} {"train_info/time_between_train_steps": 0.0031566619873046875, "step": 4792} {"info/global_step": 4793, "train_info/time_within_train_step": 2.754112958908081, "step": 4793} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 4793} {"info/global_step": 4794, "train_info/time_within_train_step": 2.7542428970336914, "step": 4794} {"train_info/time_between_train_steps": 0.0031614303588867188, "step": 4794} {"info/global_step": 4795, "train_info/time_within_train_step": 2.754713296890259, "step": 4795} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 4795} {"info/global_step": 4796, "train_info/time_within_train_step": 2.753838539123535, "step": 4796} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 4796} {"info/global_step": 4797, "train_info/time_within_train_step": 2.7547707557678223, "step": 4797} {"train_info/time_between_train_steps": 0.003208160400390625, "step": 4797} {"info/global_step": 4798, "train_info/time_within_train_step": 2.7522876262664795, "step": 4798} {"train_info/time_between_train_steps": 0.0031549930572509766, "step": 4798} {"info/global_step": 4799, "train_info/time_within_train_step": 2.753786087036133, "step": 4799} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 4799} {"info/global_step": 4800, "train_info/time_within_train_step": 2.7528412342071533, "step": 4800} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746579918, "_runtime": 13927}, "step": 4800} {"logs": {"train/loss": 3.6728, "train/learning_rate": 0.0003466666666666666, "train/epoch": 5.05, "_timestamp": 1746579918, "_runtime": 13927}, "step": 4800} {"train_info/time_between_train_steps": 19.643611669540405, "step": 4800} {"info/global_step": 4801, "train_info/time_within_train_step": 2.534001350402832, "step": 4801} {"train_info/time_between_train_steps": 0.003318309783935547, "step": 4801} {"info/global_step": 4802, "train_info/time_within_train_step": 2.5708062648773193, "step": 4802} {"train_info/time_between_train_steps": 0.0033020973205566406, "step": 4802} {"info/global_step": 4803, "train_info/time_within_train_step": 2.7216782569885254, "step": 4803} {"train_info/time_between_train_steps": 0.0033783912658691406, "step": 4803} {"info/global_step": 4804, "train_info/time_within_train_step": 2.7496399879455566, "step": 4804} {"train_info/time_between_train_steps": 0.003336191177368164, "step": 4804} {"info/global_step": 4805, "train_info/time_within_train_step": 2.7520453929901123, "step": 4805} {"train_info/time_between_train_steps": 0.0033674240112304688, "step": 4805} {"info/global_step": 4806, "train_info/time_within_train_step": 2.755526304244995, "step": 4806} {"train_info/time_between_train_steps": 0.018598556518554688, "step": 4806} {"info/global_step": 4807, "train_info/time_within_train_step": 2.7529256343841553, "step": 4807} {"train_info/time_between_train_steps": 0.00302886962890625, "step": 4807} {"info/global_step": 4808, "train_info/time_within_train_step": 2.7538657188415527, "step": 4808} {"train_info/time_between_train_steps": 0.003376007080078125, "step": 4808} {"info/global_step": 4809, "train_info/time_within_train_step": 2.7528555393218994, "step": 4809} {"train_info/time_between_train_steps": 0.002979278564453125, "step": 4809} {"info/global_step": 4810, "train_info/time_within_train_step": 2.750803232192993, "step": 4810} {"train_info/time_between_train_steps": 0.002991914749145508, "step": 4810} {"info/global_step": 4811, "train_info/time_within_train_step": 2.754288911819458, "step": 4811} {"train_info/time_between_train_steps": 0.0029380321502685547, "step": 4811} {"info/global_step": 4812, "train_info/time_within_train_step": 2.7540271282196045, "step": 4812} {"train_info/time_between_train_steps": 0.0029573440551757812, "step": 4812} {"info/global_step": 4813, "train_info/time_within_train_step": 2.7541098594665527, "step": 4813} {"train_info/time_between_train_steps": 0.002960681915283203, "step": 4813} {"info/global_step": 4814, "train_info/time_within_train_step": 2.753837823867798, "step": 4814} {"train_info/time_between_train_steps": 0.002942323684692383, "step": 4814} {"info/global_step": 4815, "train_info/time_within_train_step": 2.754246473312378, "step": 4815} {"train_info/time_between_train_steps": 0.0029516220092773438, "step": 4815} {"info/global_step": 4816, "train_info/time_within_train_step": 2.7550208568573, "step": 4816} {"train_info/time_between_train_steps": 0.0029633045196533203, "step": 4816} {"info/global_step": 4817, "train_info/time_within_train_step": 2.755533218383789, "step": 4817} {"train_info/time_between_train_steps": 0.003030538558959961, "step": 4817} {"info/global_step": 4818, "train_info/time_within_train_step": 2.7558929920196533, "step": 4818} {"train_info/time_between_train_steps": 0.0030024051666259766, "step": 4818} {"info/global_step": 4819, "train_info/time_within_train_step": 2.755901575088501, "step": 4819} {"train_info/time_between_train_steps": 0.0029633045196533203, "step": 4819} {"info/global_step": 4820, "train_info/time_within_train_step": 2.754624843597412, "step": 4820} {"train_info/time_between_train_steps": 0.0029561519622802734, "step": 4820} {"info/global_step": 4821, "train_info/time_within_train_step": 2.751917839050293, "step": 4821} {"train_info/time_between_train_steps": 0.0029942989349365234, "step": 4821} {"info/global_step": 4822, "train_info/time_within_train_step": 2.783193826675415, "step": 4822} {"train_info/time_between_train_steps": 0.0029382705688476562, "step": 4822} {"info/global_step": 4823, "train_info/time_within_train_step": 2.7560596466064453, "step": 4823} {"train_info/time_between_train_steps": 0.002969980239868164, "step": 4823} {"info/global_step": 4824, "train_info/time_within_train_step": 2.7545735836029053, "step": 4824} {"train_info/time_between_train_steps": 0.002964496612548828, "step": 4824} {"info/global_step": 4825, "train_info/time_within_train_step": 2.754488706588745, "step": 4825} {"train_info/time_between_train_steps": 0.003002643585205078, "step": 4825} {"info/global_step": 4826, "train_info/time_within_train_step": 2.7543880939483643, "step": 4826} {"train_info/time_between_train_steps": 0.002976655960083008, "step": 4826} {"info/global_step": 4827, "train_info/time_within_train_step": 2.7552170753479004, "step": 4827} {"train_info/time_between_train_steps": 0.003020048141479492, "step": 4827} {"info/global_step": 4828, "train_info/time_within_train_step": 2.7553553581237793, "step": 4828} {"train_info/time_between_train_steps": 0.002939939498901367, "step": 4828} {"info/global_step": 4829, "train_info/time_within_train_step": 2.753803014755249, "step": 4829} {"train_info/time_between_train_steps": 0.0029213428497314453, "step": 4829} {"info/global_step": 4830, "train_info/time_within_train_step": 2.7544238567352295, "step": 4830} {"train_info/time_between_train_steps": 0.0029675960540771484, "step": 4830} {"info/global_step": 4831, "train_info/time_within_train_step": 2.753460168838501, "step": 4831} {"train_info/time_between_train_steps": 0.0029213428497314453, "step": 4831} {"info/global_step": 4832, "train_info/time_within_train_step": 2.7535455226898193, "step": 4832} {"train_info/time_between_train_steps": 0.002925395965576172, "step": 4832} {"info/global_step": 4833, "train_info/time_within_train_step": 2.7543060779571533, "step": 4833} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 4833} {"info/global_step": 4834, "train_info/time_within_train_step": 2.7538094520568848, "step": 4834} {"train_info/time_between_train_steps": 0.0028922557830810547, "step": 4834} {"info/global_step": 4835, "train_info/time_within_train_step": 2.7530550956726074, "step": 4835} {"train_info/time_between_train_steps": 0.002907991409301758, "step": 4835} {"info/global_step": 4836, "train_info/time_within_train_step": 2.7541732788085938, "step": 4836} {"train_info/time_between_train_steps": 0.0028870105743408203, "step": 4836} {"info/global_step": 4837, "train_info/time_within_train_step": 2.9543678760528564, "step": 4837} {"train_info/time_between_train_steps": 0.0029807090759277344, "step": 4837} {"info/global_step": 4838, "train_info/time_within_train_step": 2.7546498775482178, "step": 4838} {"train_info/time_between_train_steps": 0.0028896331787109375, "step": 4838} {"info/global_step": 4839, "train_info/time_within_train_step": 2.753232717514038, "step": 4839} {"train_info/time_between_train_steps": 0.0028533935546875, "step": 4839} {"info/global_step": 4840, "train_info/time_within_train_step": 2.754099130630493, "step": 4840} {"train_info/time_between_train_steps": 0.002902984619140625, "step": 4840} {"info/global_step": 4841, "train_info/time_within_train_step": 2.752488613128662, "step": 4841} {"train_info/time_between_train_steps": 0.002908945083618164, "step": 4841} {"info/global_step": 4842, "train_info/time_within_train_step": 2.7551279067993164, "step": 4842} {"train_info/time_between_train_steps": 0.0029649734497070312, "step": 4842} {"info/global_step": 4843, "train_info/time_within_train_step": 2.7551021575927734, "step": 4843} {"train_info/time_between_train_steps": 0.0029981136322021484, "step": 4843} {"info/global_step": 4844, "train_info/time_within_train_step": 2.7552337646484375, "step": 4844} {"train_info/time_between_train_steps": 0.0029878616333007812, "step": 4844} {"info/global_step": 4845, "train_info/time_within_train_step": 2.7548675537109375, "step": 4845} {"train_info/time_between_train_steps": 0.0029685497283935547, "step": 4845} {"info/global_step": 4846, "train_info/time_within_train_step": 2.7520458698272705, "step": 4846} {"train_info/time_between_train_steps": 0.002961397171020508, "step": 4846} {"info/global_step": 4847, "train_info/time_within_train_step": 2.7543399333953857, "step": 4847} {"train_info/time_between_train_steps": 0.002960681915283203, "step": 4847} {"info/global_step": 4848, "train_info/time_within_train_step": 2.755354642868042, "step": 4848} {"train_info/time_between_train_steps": 0.002946615219116211, "step": 4848} {"info/global_step": 4849, "train_info/time_within_train_step": 2.7545738220214844, "step": 4849} {"train_info/time_between_train_steps": 0.002969980239868164, "step": 4849} {"info/global_step": 4850, "train_info/time_within_train_step": 2.7548649311065674, "step": 4850} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746580076, "_runtime": 14085}, "step": 4850} {"logs": {"train/loss": 3.6697, "train/learning_rate": 0.0003433333333333333, "train/epoch": 5.06, "_timestamp": 1746580076, "_runtime": 14085}, "step": 4850} {"train_info/time_between_train_steps": 0.013627290725708008, "step": 4850} {"info/global_step": 4851, "train_info/time_within_train_step": 2.754887342453003, "step": 4851} {"train_info/time_between_train_steps": 0.0028791427612304688, "step": 4851} {"info/global_step": 4852, "train_info/time_within_train_step": 2.7526731491088867, "step": 4852} {"train_info/time_between_train_steps": 0.002885580062866211, "step": 4852} {"info/global_step": 4853, "train_info/time_within_train_step": 2.7537920475006104, "step": 4853} {"train_info/time_between_train_steps": 0.0029244422912597656, "step": 4853} {"info/global_step": 4854, "train_info/time_within_train_step": 2.752279758453369, "step": 4854} {"train_info/time_between_train_steps": 0.0028994083404541016, "step": 4854} {"info/global_step": 4855, "train_info/time_within_train_step": 2.7605857849121094, "step": 4855} {"train_info/time_between_train_steps": 0.002910137176513672, "step": 4855} {"info/global_step": 4856, "train_info/time_within_train_step": 2.7554304599761963, "step": 4856} {"train_info/time_between_train_steps": 0.0029363632202148438, "step": 4856} {"info/global_step": 4857, "train_info/time_within_train_step": 2.7550785541534424, "step": 4857} {"train_info/time_between_train_steps": 0.0029778480529785156, "step": 4857} {"info/global_step": 4858, "train_info/time_within_train_step": 2.75071382522583, "step": 4858} {"train_info/time_between_train_steps": 0.0029289722442626953, "step": 4858} {"info/global_step": 4859, "train_info/time_within_train_step": 2.7528133392333984, "step": 4859} {"train_info/time_between_train_steps": 0.0029070377349853516, "step": 4859} {"info/global_step": 4860, "train_info/time_within_train_step": 2.7519822120666504, "step": 4860} {"train_info/time_between_train_steps": 0.0029134750366210938, "step": 4860} {"info/global_step": 4861, "train_info/time_within_train_step": 2.7531983852386475, "step": 4861} {"train_info/time_between_train_steps": 0.002909421920776367, "step": 4861} {"info/global_step": 4862, "train_info/time_within_train_step": 2.7524073123931885, "step": 4862} {"train_info/time_between_train_steps": 0.002844572067260742, "step": 4862} {"info/global_step": 4863, "train_info/time_within_train_step": 2.753098487854004, "step": 4863} {"train_info/time_between_train_steps": 0.0029401779174804688, "step": 4863} {"info/global_step": 4864, "train_info/time_within_train_step": 2.7532265186309814, "step": 4864} {"train_info/time_between_train_steps": 0.0028734207153320312, "step": 4864} {"info/global_step": 4865, "train_info/time_within_train_step": 2.753774642944336, "step": 4865} {"train_info/time_between_train_steps": 0.0028564929962158203, "step": 4865} {"info/global_step": 4866, "train_info/time_within_train_step": 2.75299334526062, "step": 4866} {"train_info/time_between_train_steps": 0.002910137176513672, "step": 4866} {"info/global_step": 4867, "train_info/time_within_train_step": 2.7530088424682617, "step": 4867} {"train_info/time_between_train_steps": 0.002908945083618164, "step": 4867} {"info/global_step": 4868, "train_info/time_within_train_step": 2.752797842025757, "step": 4868} {"train_info/time_between_train_steps": 0.0028753280639648438, "step": 4868} {"info/global_step": 4869, "train_info/time_within_train_step": 2.7534377574920654, "step": 4869} {"train_info/time_between_train_steps": 0.0028886795043945312, "step": 4869} {"info/global_step": 4870, "train_info/time_within_train_step": 2.753093719482422, "step": 4870} {"train_info/time_between_train_steps": 0.003094911575317383, "step": 4870} {"info/global_step": 4871, "train_info/time_within_train_step": 2.7516708374023438, "step": 4871} {"train_info/time_between_train_steps": 0.0029006004333496094, "step": 4871} {"info/global_step": 4872, "train_info/time_within_train_step": 2.7527353763580322, "step": 4872} {"train_info/time_between_train_steps": 0.00292205810546875, "step": 4872} {"info/global_step": 4873, "train_info/time_within_train_step": 2.7522270679473877, "step": 4873} {"train_info/time_between_train_steps": 0.0028963088989257812, "step": 4873} {"info/global_step": 4874, "train_info/time_within_train_step": 2.752671718597412, "step": 4874} {"train_info/time_between_train_steps": 0.0028989315032958984, "step": 4874} {"info/global_step": 4875, "train_info/time_within_train_step": 2.752206325531006, "step": 4875} {"train_info/time_between_train_steps": 0.0028960704803466797, "step": 4875} {"info/global_step": 4876, "train_info/time_within_train_step": 2.7519760131835938, "step": 4876} {"train_info/time_between_train_steps": 0.0028944015502929688, "step": 4876} {"info/global_step": 4877, "train_info/time_within_train_step": 2.7525017261505127, "step": 4877} {"train_info/time_between_train_steps": 0.0028717517852783203, "step": 4877} {"info/global_step": 4878, "train_info/time_within_train_step": 2.7511489391326904, "step": 4878} {"train_info/time_between_train_steps": 0.002899646759033203, "step": 4878} {"info/global_step": 4879, "train_info/time_within_train_step": 2.7527382373809814, "step": 4879} {"train_info/time_between_train_steps": 0.002917766571044922, "step": 4879} {"info/global_step": 4880, "train_info/time_within_train_step": 2.7534492015838623, "step": 4880} {"train_info/time_between_train_steps": 0.0029070377349853516, "step": 4880} {"info/global_step": 4881, "train_info/time_within_train_step": 2.9243357181549072, "step": 4881} {"train_info/time_between_train_steps": 0.0029366016387939453, "step": 4881} {"info/global_step": 4882, "train_info/time_within_train_step": 2.751505136489868, "step": 4882} {"train_info/time_between_train_steps": 0.0029630661010742188, "step": 4882} {"info/global_step": 4883, "train_info/time_within_train_step": 2.752923011779785, "step": 4883} {"train_info/time_between_train_steps": 0.002913236618041992, "step": 4883} {"info/global_step": 4884, "train_info/time_within_train_step": 2.754270315170288, "step": 4884} {"train_info/time_between_train_steps": 0.002949237823486328, "step": 4884} {"info/global_step": 4885, "train_info/time_within_train_step": 2.754244327545166, "step": 4885} {"train_info/time_between_train_steps": 0.002992868423461914, "step": 4885} {"info/global_step": 4886, "train_info/time_within_train_step": 2.7548255920410156, "step": 4886} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 4886} {"info/global_step": 4887, "train_info/time_within_train_step": 2.7791521549224854, "step": 4887} {"train_info/time_between_train_steps": 0.0029456615447998047, "step": 4887} {"info/global_step": 4888, "train_info/time_within_train_step": 2.753573417663574, "step": 4888} {"train_info/time_between_train_steps": 0.0029592514038085938, "step": 4888} {"info/global_step": 4889, "train_info/time_within_train_step": 2.752699136734009, "step": 4889} {"train_info/time_between_train_steps": 0.002921581268310547, "step": 4889} {"info/global_step": 4890, "train_info/time_within_train_step": 2.752429246902466, "step": 4890} {"train_info/time_between_train_steps": 0.0028791427612304688, "step": 4890} {"info/global_step": 4891, "train_info/time_within_train_step": 2.752269744873047, "step": 4891} {"train_info/time_between_train_steps": 0.002880573272705078, "step": 4891} {"info/global_step": 4892, "train_info/time_within_train_step": 2.753053903579712, "step": 4892} {"train_info/time_between_train_steps": 0.00319671630859375, "step": 4892} {"info/global_step": 4893, "train_info/time_within_train_step": 2.752350330352783, "step": 4893} {"train_info/time_between_train_steps": 0.0030362606048583984, "step": 4893} {"info/global_step": 4894, "train_info/time_within_train_step": 2.753218650817871, "step": 4894} {"train_info/time_between_train_steps": 0.00299072265625, "step": 4894} {"info/global_step": 4895, "train_info/time_within_train_step": 2.753143310546875, "step": 4895} {"train_info/time_between_train_steps": 0.0029528141021728516, "step": 4895} {"info/global_step": 4896, "train_info/time_within_train_step": 2.7535645961761475, "step": 4896} {"train_info/time_between_train_steps": 0.0029757022857666016, "step": 4896} {"info/global_step": 4897, "train_info/time_within_train_step": 2.7522356510162354, "step": 4897} {"train_info/time_between_train_steps": 0.003500223159790039, "step": 4897} {"info/global_step": 4898, "train_info/time_within_train_step": 2.7541229724884033, "step": 4898} {"train_info/time_between_train_steps": 0.0030035972595214844, "step": 4898} {"info/global_step": 4899, "train_info/time_within_train_step": 2.757046937942505, "step": 4899} {"train_info/time_between_train_steps": 0.0029976367950439453, "step": 4899} {"info/global_step": 4900, "train_info/time_within_train_step": 2.753415107727051, "step": 4900} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746580215, "_runtime": 14224}, "step": 4900} {"logs": {"train/loss": 3.6514, "train/learning_rate": 0.00033999999999999997, "train/epoch": 5.06, "_timestamp": 1746580215, "_runtime": 14224}, "step": 4900} {"train_info/time_between_train_steps": 0.01476907730102539, "step": 4900} {"info/global_step": 4901, "train_info/time_within_train_step": 2.754847526550293, "step": 4901} {"train_info/time_between_train_steps": 0.002985715866088867, "step": 4901} {"info/global_step": 4902, "train_info/time_within_train_step": 2.754674196243286, "step": 4902} {"train_info/time_between_train_steps": 0.0029821395874023438, "step": 4902} {"info/global_step": 4903, "train_info/time_within_train_step": 2.754487991333008, "step": 4903} {"train_info/time_between_train_steps": 0.002960205078125, "step": 4903} {"info/global_step": 4904, "train_info/time_within_train_step": 2.7532553672790527, "step": 4904} {"train_info/time_between_train_steps": 0.0029218196868896484, "step": 4904} {"info/global_step": 4905, "train_info/time_within_train_step": 2.7536447048187256, "step": 4905} {"train_info/time_between_train_steps": 0.0029354095458984375, "step": 4905} {"info/global_step": 4906, "train_info/time_within_train_step": 2.7534899711608887, "step": 4906} {"train_info/time_between_train_steps": 0.002988100051879883, "step": 4906} {"info/global_step": 4907, "train_info/time_within_train_step": 2.7526066303253174, "step": 4907} {"train_info/time_between_train_steps": 0.003012418746948242, "step": 4907} {"info/global_step": 4908, "train_info/time_within_train_step": 2.7531790733337402, "step": 4908} {"train_info/time_between_train_steps": 0.0029234886169433594, "step": 4908} {"info/global_step": 4909, "train_info/time_within_train_step": 2.7530879974365234, "step": 4909} {"train_info/time_between_train_steps": 0.0029544830322265625, "step": 4909} {"info/global_step": 4910, "train_info/time_within_train_step": 2.7520298957824707, "step": 4910} {"train_info/time_between_train_steps": 0.002938508987426758, "step": 4910} {"info/global_step": 4911, "train_info/time_within_train_step": 2.7540228366851807, "step": 4911} {"train_info/time_between_train_steps": 0.003010988235473633, "step": 4911} {"info/global_step": 4912, "train_info/time_within_train_step": 2.750558614730835, "step": 4912} {"train_info/time_between_train_steps": 0.002974271774291992, "step": 4912} {"info/global_step": 4913, "train_info/time_within_train_step": 2.754911422729492, "step": 4913} {"train_info/time_between_train_steps": 0.0029642581939697266, "step": 4913} {"info/global_step": 4914, "train_info/time_within_train_step": 2.7522552013397217, "step": 4914} {"train_info/time_between_train_steps": 0.002980947494506836, "step": 4914} {"info/global_step": 4915, "train_info/time_within_train_step": 2.7554783821105957, "step": 4915} {"train_info/time_between_train_steps": 0.0029697418212890625, "step": 4915} {"info/global_step": 4916, "train_info/time_within_train_step": 2.754798173904419, "step": 4916} {"train_info/time_between_train_steps": 0.0029959678649902344, "step": 4916} {"info/global_step": 4917, "train_info/time_within_train_step": 2.7543036937713623, "step": 4917} {"train_info/time_between_train_steps": 0.0029726028442382812, "step": 4917} {"info/global_step": 4918, "train_info/time_within_train_step": 2.753636598587036, "step": 4918} {"train_info/time_between_train_steps": 0.0030341148376464844, "step": 4918} {"info/global_step": 4919, "train_info/time_within_train_step": 2.7547507286071777, "step": 4919} {"train_info/time_between_train_steps": 0.002992391586303711, "step": 4919} {"info/global_step": 4920, "train_info/time_within_train_step": 2.7551395893096924, "step": 4920} {"train_info/time_between_train_steps": 0.002978801727294922, "step": 4920} {"info/global_step": 4921, "train_info/time_within_train_step": 2.754955291748047, "step": 4921} {"train_info/time_between_train_steps": 0.003006458282470703, "step": 4921} {"info/global_step": 4922, "train_info/time_within_train_step": 2.7545969486236572, "step": 4922} {"train_info/time_between_train_steps": 0.00299072265625, "step": 4922} {"info/global_step": 4923, "train_info/time_within_train_step": 2.754089832305908, "step": 4923} {"train_info/time_between_train_steps": 0.0029680728912353516, "step": 4923} {"info/global_step": 4924, "train_info/time_within_train_step": 2.7534427642822266, "step": 4924} {"train_info/time_between_train_steps": 0.0030062198638916016, "step": 4924} {"info/global_step": 4925, "train_info/time_within_train_step": 2.7544305324554443, "step": 4925} {"train_info/time_between_train_steps": 0.003032684326171875, "step": 4925} {"info/global_step": 4926, "train_info/time_within_train_step": 2.754439353942871, "step": 4926} {"train_info/time_between_train_steps": 0.003002166748046875, "step": 4926} {"info/global_step": 4927, "train_info/time_within_train_step": 2.7543458938598633, "step": 4927} {"train_info/time_between_train_steps": 0.003006458282470703, "step": 4927} {"info/global_step": 4928, "train_info/time_within_train_step": 2.7539918422698975, "step": 4928} {"train_info/time_between_train_steps": 0.003086090087890625, "step": 4928} {"info/global_step": 4929, "train_info/time_within_train_step": 2.7524449825286865, "step": 4929} {"train_info/time_between_train_steps": 0.0030014514923095703, "step": 4929} {"info/global_step": 4930, "train_info/time_within_train_step": 2.7546253204345703, "step": 4930} {"train_info/time_between_train_steps": 0.0030062198638916016, "step": 4930} {"info/global_step": 4931, "train_info/time_within_train_step": 2.7532196044921875, "step": 4931} {"train_info/time_between_train_steps": 0.003022909164428711, "step": 4931} {"info/global_step": 4932, "train_info/time_within_train_step": 2.7543160915374756, "step": 4932} {"train_info/time_between_train_steps": 0.0030219554901123047, "step": 4932} {"info/global_step": 4933, "train_info/time_within_train_step": 2.75352144241333, "step": 4933} {"train_info/time_between_train_steps": 0.003000020980834961, "step": 4933} {"info/global_step": 4934, "train_info/time_within_train_step": 2.7546839714050293, "step": 4934} {"train_info/time_between_train_steps": 0.0030524730682373047, "step": 4934} {"info/global_step": 4935, "train_info/time_within_train_step": 2.7536792755126953, "step": 4935} {"train_info/time_between_train_steps": 0.0029931068420410156, "step": 4935} {"info/global_step": 4936, "train_info/time_within_train_step": 2.7546298503875732, "step": 4936} {"train_info/time_between_train_steps": 0.0030295848846435547, "step": 4936} {"info/global_step": 4937, "train_info/time_within_train_step": 2.7553443908691406, "step": 4937} {"train_info/time_between_train_steps": 0.002978801727294922, "step": 4937} {"info/global_step": 4938, "train_info/time_within_train_step": 2.7534983158111572, "step": 4938} {"train_info/time_between_train_steps": 0.0029859542846679688, "step": 4938} {"info/global_step": 4939, "train_info/time_within_train_step": 2.753957509994507, "step": 4939} {"train_info/time_between_train_steps": 0.003026723861694336, "step": 4939} {"info/global_step": 4940, "train_info/time_within_train_step": 2.754066228866577, "step": 4940} {"train_info/time_between_train_steps": 0.002979755401611328, "step": 4940} {"info/global_step": 4941, "train_info/time_within_train_step": 2.7537262439727783, "step": 4941} {"train_info/time_between_train_steps": 0.0034418106079101562, "step": 4941} {"info/global_step": 4942, "train_info/time_within_train_step": 2.7545931339263916, "step": 4942} {"train_info/time_between_train_steps": 0.002969026565551758, "step": 4942} {"info/global_step": 4943, "train_info/time_within_train_step": 2.754148483276367, "step": 4943} {"train_info/time_between_train_steps": 0.002959728240966797, "step": 4943} {"info/global_step": 4944, "train_info/time_within_train_step": 2.7544708251953125, "step": 4944} {"train_info/time_between_train_steps": 0.002991914749145508, "step": 4944} {"info/global_step": 4945, "train_info/time_within_train_step": 2.7539243698120117, "step": 4945} {"train_info/time_between_train_steps": 0.002928018569946289, "step": 4945} {"info/global_step": 4946, "train_info/time_within_train_step": 2.754772186279297, "step": 4946} {"train_info/time_between_train_steps": 0.0029370784759521484, "step": 4946} {"info/global_step": 4947, "train_info/time_within_train_step": 2.754101276397705, "step": 4947} {"train_info/time_between_train_steps": 0.0029785633087158203, "step": 4947} {"info/global_step": 4948, "train_info/time_within_train_step": 2.7550899982452393, "step": 4948} {"train_info/time_between_train_steps": 0.0029931068420410156, "step": 4948} {"info/global_step": 4949, "train_info/time_within_train_step": 2.7527058124542236, "step": 4949} {"train_info/time_between_train_steps": 0.002981901168823242, "step": 4949} {"info/global_step": 4950, "train_info/time_within_train_step": 2.7538468837738037, "step": 4950} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746580353, "_runtime": 14362}, "step": 4950} {"logs": {"train/loss": 3.6461, "train/learning_rate": 0.00033666666666666665, "train/epoch": 5.07, "_timestamp": 1746580353, "_runtime": 14362}, "step": 4950} {"train_info/time_between_train_steps": 0.012517452239990234, "step": 4950} {"info/global_step": 4951, "train_info/time_within_train_step": 2.7538890838623047, "step": 4951} {"train_info/time_between_train_steps": 0.0029582977294921875, "step": 4951} {"info/global_step": 4952, "train_info/time_within_train_step": 2.752976655960083, "step": 4952} {"train_info/time_between_train_steps": 0.0029799938201904297, "step": 4952} {"info/global_step": 4953, "train_info/time_within_train_step": 2.7540459632873535, "step": 4953} {"train_info/time_between_train_steps": 0.0029442310333251953, "step": 4953} {"info/global_step": 4954, "train_info/time_within_train_step": 2.754593849182129, "step": 4954} {"train_info/time_between_train_steps": 0.002961874008178711, "step": 4954} {"info/global_step": 4955, "train_info/time_within_train_step": 2.7539377212524414, "step": 4955} {"train_info/time_between_train_steps": 0.003003358840942383, "step": 4955} {"info/global_step": 4956, "train_info/time_within_train_step": 2.7539122104644775, "step": 4956} {"train_info/time_between_train_steps": 0.0029630661010742188, "step": 4956} {"info/global_step": 4957, "train_info/time_within_train_step": 2.753830671310425, "step": 4957} {"train_info/time_between_train_steps": 0.002975940704345703, "step": 4957} {"info/global_step": 4958, "train_info/time_within_train_step": 2.753647565841675, "step": 4958} {"train_info/time_between_train_steps": 0.003098011016845703, "step": 4958} {"info/global_step": 4959, "train_info/time_within_train_step": 2.754002094268799, "step": 4959} {"train_info/time_between_train_steps": 0.0029582977294921875, "step": 4959} {"info/global_step": 4960, "train_info/time_within_train_step": 2.7544965744018555, "step": 4960} {"train_info/time_between_train_steps": 0.0030312538146972656, "step": 4960} {"info/global_step": 4961, "train_info/time_within_train_step": 2.7537481784820557, "step": 4961} {"train_info/time_between_train_steps": 0.003244161605834961, "step": 4961} {"info/global_step": 4962, "train_info/time_within_train_step": 2.7540483474731445, "step": 4962} {"train_info/time_between_train_steps": 0.0030171871185302734, "step": 4962} {"info/global_step": 4963, "train_info/time_within_train_step": 2.753142833709717, "step": 4963} {"train_info/time_between_train_steps": 0.0029420852661132812, "step": 4963} {"info/global_step": 4964, "train_info/time_within_train_step": 2.7525200843811035, "step": 4964} {"train_info/time_between_train_steps": 0.00299835205078125, "step": 4964} {"info/global_step": 4965, "train_info/time_within_train_step": 2.7531473636627197, "step": 4965} {"train_info/time_between_train_steps": 0.0029630661010742188, "step": 4965} {"info/global_step": 4966, "train_info/time_within_train_step": 2.7539398670196533, "step": 4966} {"train_info/time_between_train_steps": 0.0029778480529785156, "step": 4966} {"info/global_step": 4967, "train_info/time_within_train_step": 2.753969669342041, "step": 4967} {"train_info/time_between_train_steps": 0.0029821395874023438, "step": 4967} {"info/global_step": 4968, "train_info/time_within_train_step": 2.7541844844818115, "step": 4968} {"train_info/time_between_train_steps": 0.0029969215393066406, "step": 4968} {"info/global_step": 4969, "train_info/time_within_train_step": 2.7532296180725098, "step": 4969} {"train_info/time_between_train_steps": 0.0030069351196289062, "step": 4969} {"info/global_step": 4970, "train_info/time_within_train_step": 2.7534537315368652, "step": 4970} {"train_info/time_between_train_steps": 0.0029709339141845703, "step": 4970} {"info/global_step": 4971, "train_info/time_within_train_step": 2.7534523010253906, "step": 4971} {"train_info/time_between_train_steps": 0.0029845237731933594, "step": 4971} {"info/global_step": 4972, "train_info/time_within_train_step": 2.7544021606445312, "step": 4972} {"train_info/time_between_train_steps": 0.0029289722442626953, "step": 4972} {"info/global_step": 4973, "train_info/time_within_train_step": 2.7533605098724365, "step": 4973} {"train_info/time_between_train_steps": 0.0029251575469970703, "step": 4973} {"info/global_step": 4974, "train_info/time_within_train_step": 2.7529349327087402, "step": 4974} {"train_info/time_between_train_steps": 0.0028696060180664062, "step": 4974} {"info/global_step": 4975, "train_info/time_within_train_step": 2.75331449508667, "step": 4975} {"train_info/time_between_train_steps": 0.0028696060180664062, "step": 4975} {"info/global_step": 4976, "train_info/time_within_train_step": 2.753955841064453, "step": 4976} {"train_info/time_between_train_steps": 0.0029549598693847656, "step": 4976} {"info/global_step": 4977, "train_info/time_within_train_step": 2.7523348331451416, "step": 4977} {"train_info/time_between_train_steps": 0.002902984619140625, "step": 4977} {"info/global_step": 4978, "train_info/time_within_train_step": 2.7531981468200684, "step": 4978} {"train_info/time_between_train_steps": 0.002916574478149414, "step": 4978} {"info/global_step": 4979, "train_info/time_within_train_step": 2.7514305114746094, "step": 4979} {"train_info/time_between_train_steps": 0.002943754196166992, "step": 4979} {"info/global_step": 4980, "train_info/time_within_train_step": 2.7532198429107666, "step": 4980} {"train_info/time_between_train_steps": 0.002891063690185547, "step": 4980} {"info/global_step": 4981, "train_info/time_within_train_step": 2.7531046867370605, "step": 4981} {"train_info/time_between_train_steps": 0.002923250198364258, "step": 4981} {"info/global_step": 4982, "train_info/time_within_train_step": 2.7535643577575684, "step": 4982} {"train_info/time_between_train_steps": 0.002913236618041992, "step": 4982} {"info/global_step": 4983, "train_info/time_within_train_step": 2.753011703491211, "step": 4983} {"train_info/time_between_train_steps": 0.002960205078125, "step": 4983} {"info/global_step": 4984, "train_info/time_within_train_step": 2.750340461730957, "step": 4984} {"train_info/time_between_train_steps": 0.0029473304748535156, "step": 4984} {"info/global_step": 4985, "train_info/time_within_train_step": 2.75253963470459, "step": 4985} {"train_info/time_between_train_steps": 0.0028982162475585938, "step": 4985} {"info/global_step": 4986, "train_info/time_within_train_step": 2.752819061279297, "step": 4986} {"train_info/time_between_train_steps": 0.0028982162475585938, "step": 4986} {"info/global_step": 4987, "train_info/time_within_train_step": 2.754533290863037, "step": 4987} {"train_info/time_between_train_steps": 0.0029702186584472656, "step": 4987} {"info/global_step": 4988, "train_info/time_within_train_step": 2.866421937942505, "step": 4988} {"train_info/time_between_train_steps": 0.0029282569885253906, "step": 4988} {"info/global_step": 4989, "train_info/time_within_train_step": 2.7536349296569824, "step": 4989} {"train_info/time_between_train_steps": 0.0029845237731933594, "step": 4989} {"info/global_step": 4990, "train_info/time_within_train_step": 2.7548329830169678, "step": 4990} {"train_info/time_between_train_steps": 0.0029697418212890625, "step": 4990} {"info/global_step": 4991, "train_info/time_within_train_step": 2.7538676261901855, "step": 4991} {"train_info/time_between_train_steps": 0.002954721450805664, "step": 4991} {"info/global_step": 4992, "train_info/time_within_train_step": 2.754300355911255, "step": 4992} {"train_info/time_between_train_steps": 0.0029413700103759766, "step": 4992} {"info/global_step": 4993, "train_info/time_within_train_step": 2.7533786296844482, "step": 4993} {"train_info/time_between_train_steps": 0.0029630661010742188, "step": 4993} {"info/global_step": 4994, "train_info/time_within_train_step": 2.754448890686035, "step": 4994} {"train_info/time_between_train_steps": 0.0029435157775878906, "step": 4994} {"info/global_step": 4995, "train_info/time_within_train_step": 2.7530641555786133, "step": 4995} {"train_info/time_between_train_steps": 0.0029754638671875, "step": 4995} {"info/global_step": 4996, "train_info/time_within_train_step": 2.7535347938537598, "step": 4996} {"train_info/time_between_train_steps": 0.002877950668334961, "step": 4996} {"info/global_step": 4997, "train_info/time_within_train_step": 2.7525153160095215, "step": 4997} {"train_info/time_between_train_steps": 0.0029294490814208984, "step": 4997} {"info/global_step": 4998, "train_info/time_within_train_step": 3.3587114810943604, "step": 4998} {"train_info/time_between_train_steps": 0.0028662681579589844, "step": 4998} {"info/global_step": 4999, "train_info/time_within_train_step": 2.752354621887207, "step": 4999} {"train_info/time_between_train_steps": 0.002859830856323242, "step": 4999} {"info/global_step": 5000, "train_info/time_within_train_step": 2.7528741359710693, "step": 5000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746580492, "_runtime": 14501}, "step": 5000} {"logs": {"train/loss": 3.6377, "train/learning_rate": 0.0003333333333333333, "train/epoch": 5.07, "_timestamp": 1746580492, "_runtime": 14501}, "step": 5000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746580497, "_runtime": 14506}, "step": 5000} {"logs": {"eval/loss": 4.662978649139404, "eval/runtime": 5.1245, "eval/samples_per_second": 37.077, "eval/steps_per_second": 1.171, "train/epoch": 5.07, "_timestamp": 1746580497, "_runtime": 14506}, "step": 5000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746580497, "_runtime": 14506}, "step": 5000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.662978649139404, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 105.9512040676807, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1245, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 37.077, "train/epoch": 5.07, "_timestamp": 1746580497, "_runtime": 14506}, "step": 5000} {"train_info/time_between_train_steps": 18.452239513397217, "step": 5000} {"info/global_step": 5001, "train_info/time_within_train_step": 2.5357420444488525, "step": 5001} {"train_info/time_between_train_steps": 0.0029649734497070312, "step": 5001} {"info/global_step": 5002, "train_info/time_within_train_step": 2.583010673522949, "step": 5002} {"train_info/time_between_train_steps": 0.002950906753540039, "step": 5002} {"info/global_step": 5003, "train_info/time_within_train_step": 2.731203556060791, "step": 5003} {"train_info/time_between_train_steps": 0.0030069351196289062, "step": 5003} {"info/global_step": 5004, "train_info/time_within_train_step": 2.7488644123077393, "step": 5004} {"train_info/time_between_train_steps": 0.0030007362365722656, "step": 5004} {"info/global_step": 5005, "train_info/time_within_train_step": 2.750875234603882, "step": 5005} {"train_info/time_between_train_steps": 0.0029611587524414062, "step": 5005} {"info/global_step": 5006, "train_info/time_within_train_step": 2.750793933868408, "step": 5006} {"train_info/time_between_train_steps": 0.0028426647186279297, "step": 5006} {"info/global_step": 5007, "train_info/time_within_train_step": 2.7526376247406006, "step": 5007} {"train_info/time_between_train_steps": 0.002888917922973633, "step": 5007} {"info/global_step": 5008, "train_info/time_within_train_step": 2.7508506774902344, "step": 5008} {"train_info/time_between_train_steps": 0.002879619598388672, "step": 5008} {"info/global_step": 5009, "train_info/time_within_train_step": 2.752880811691284, "step": 5009} {"train_info/time_between_train_steps": 0.0028553009033203125, "step": 5009} {"info/global_step": 5010, "train_info/time_within_train_step": 2.7524845600128174, "step": 5010} {"train_info/time_between_train_steps": 0.002844095230102539, "step": 5010} {"info/global_step": 5011, "train_info/time_within_train_step": 2.753016471862793, "step": 5011} {"train_info/time_between_train_steps": 0.0029315948486328125, "step": 5011} {"info/global_step": 5012, "train_info/time_within_train_step": 2.753129243850708, "step": 5012} {"train_info/time_between_train_steps": 0.0029256343841552734, "step": 5012} {"info/global_step": 5013, "train_info/time_within_train_step": 2.7540276050567627, "step": 5013} {"train_info/time_between_train_steps": 0.002910137176513672, "step": 5013} {"info/global_step": 5014, "train_info/time_within_train_step": 2.7543537616729736, "step": 5014} {"train_info/time_between_train_steps": 0.0029501914978027344, "step": 5014} {"info/global_step": 5015, "train_info/time_within_train_step": 2.7541663646698, "step": 5015} {"train_info/time_between_train_steps": 0.0028934478759765625, "step": 5015} {"info/global_step": 5016, "train_info/time_within_train_step": 2.7550048828125, "step": 5016} {"train_info/time_between_train_steps": 0.0030117034912109375, "step": 5016} {"info/global_step": 5017, "train_info/time_within_train_step": 2.754845142364502, "step": 5017} {"train_info/time_between_train_steps": 0.0029261112213134766, "step": 5017} {"info/global_step": 5018, "train_info/time_within_train_step": 2.75627064704895, "step": 5018} {"train_info/time_between_train_steps": 0.0028862953186035156, "step": 5018} {"info/global_step": 5019, "train_info/time_within_train_step": 2.7555859088897705, "step": 5019} {"train_info/time_between_train_steps": 0.002928018569946289, "step": 5019} {"info/global_step": 5020, "train_info/time_within_train_step": 2.7546045780181885, "step": 5020} {"train_info/time_between_train_steps": 0.0028929710388183594, "step": 5020} {"info/global_step": 5021, "train_info/time_within_train_step": 2.7542648315429688, "step": 5021} {"train_info/time_between_train_steps": 0.002933979034423828, "step": 5021} {"info/global_step": 5022, "train_info/time_within_train_step": 2.7538468837738037, "step": 5022} {"train_info/time_between_train_steps": 0.0029001235961914062, "step": 5022} {"info/global_step": 5023, "train_info/time_within_train_step": 2.7552032470703125, "step": 5023} {"train_info/time_between_train_steps": 0.002959012985229492, "step": 5023} {"info/global_step": 5024, "train_info/time_within_train_step": 2.752864360809326, "step": 5024} {"train_info/time_between_train_steps": 0.0028891563415527344, "step": 5024} {"info/global_step": 5025, "train_info/time_within_train_step": 2.7539596557617188, "step": 5025} {"train_info/time_between_train_steps": 0.0029435157775878906, "step": 5025} {"info/global_step": 5026, "train_info/time_within_train_step": 2.754478931427002, "step": 5026} {"train_info/time_between_train_steps": 0.0028738975524902344, "step": 5026} {"info/global_step": 5027, "train_info/time_within_train_step": 2.7548792362213135, "step": 5027} {"train_info/time_between_train_steps": 0.0029151439666748047, "step": 5027} {"info/global_step": 5028, "train_info/time_within_train_step": 2.7543742656707764, "step": 5028} {"train_info/time_between_train_steps": 0.002908945083618164, "step": 5028} {"info/global_step": 5029, "train_info/time_within_train_step": 2.755103826522827, "step": 5029} {"train_info/time_between_train_steps": 0.002923727035522461, "step": 5029} {"info/global_step": 5030, "train_info/time_within_train_step": 2.8419342041015625, "step": 5030} {"train_info/time_between_train_steps": 0.0028772354125976562, "step": 5030} {"info/global_step": 5031, "train_info/time_within_train_step": 2.754525899887085, "step": 5031} {"train_info/time_between_train_steps": 0.002870321273803711, "step": 5031} {"info/global_step": 5032, "train_info/time_within_train_step": 2.7532079219818115, "step": 5032} {"train_info/time_between_train_steps": 0.002873659133911133, "step": 5032} {"info/global_step": 5033, "train_info/time_within_train_step": 2.753424882888794, "step": 5033} {"train_info/time_between_train_steps": 0.0028738975524902344, "step": 5033} {"info/global_step": 5034, "train_info/time_within_train_step": 2.7543563842773438, "step": 5034} {"train_info/time_between_train_steps": 0.002874612808227539, "step": 5034} {"info/global_step": 5035, "train_info/time_within_train_step": 2.754007339477539, "step": 5035} {"train_info/time_between_train_steps": 0.002847433090209961, "step": 5035} {"info/global_step": 5036, "train_info/time_within_train_step": 2.7543787956237793, "step": 5036} {"train_info/time_between_train_steps": 0.0029137134552001953, "step": 5036} {"info/global_step": 5037, "train_info/time_within_train_step": 2.7536685466766357, "step": 5037} {"train_info/time_between_train_steps": 0.002867460250854492, "step": 5037} {"info/global_step": 5038, "train_info/time_within_train_step": 2.7549705505371094, "step": 5038} {"train_info/time_between_train_steps": 0.002913236618041992, "step": 5038} {"info/global_step": 5039, "train_info/time_within_train_step": 2.7550880908966064, "step": 5039} {"train_info/time_between_train_steps": 0.0030164718627929688, "step": 5039} {"info/global_step": 5040, "train_info/time_within_train_step": 2.7546260356903076, "step": 5040} {"train_info/time_between_train_steps": 0.003035306930541992, "step": 5040} {"info/global_step": 5041, "train_info/time_within_train_step": 2.7539491653442383, "step": 5041} {"train_info/time_between_train_steps": 0.0029582977294921875, "step": 5041} {"info/global_step": 5042, "train_info/time_within_train_step": 2.7547621726989746, "step": 5042} {"train_info/time_between_train_steps": 0.003004312515258789, "step": 5042} {"info/global_step": 5043, "train_info/time_within_train_step": 2.75447940826416, "step": 5043} {"train_info/time_between_train_steps": 0.0029878616333007812, "step": 5043} {"info/global_step": 5044, "train_info/time_within_train_step": 2.753845691680908, "step": 5044} {"train_info/time_between_train_steps": 0.002953052520751953, "step": 5044} {"info/global_step": 5045, "train_info/time_within_train_step": 2.752408027648926, "step": 5045} {"train_info/time_between_train_steps": 0.0029954910278320312, "step": 5045} {"info/global_step": 5046, "train_info/time_within_train_step": 2.754992961883545, "step": 5046} {"train_info/time_between_train_steps": 0.002963542938232422, "step": 5046} {"info/global_step": 5047, "train_info/time_within_train_step": 2.755998134613037, "step": 5047} {"train_info/time_between_train_steps": 0.0030095577239990234, "step": 5047} {"info/global_step": 5048, "train_info/time_within_train_step": 2.7546873092651367, "step": 5048} {"train_info/time_between_train_steps": 0.002961397171020508, "step": 5048} {"info/global_step": 5049, "train_info/time_within_train_step": 2.754706382751465, "step": 5049} {"train_info/time_between_train_steps": 0.0029659271240234375, "step": 5049} {"info/global_step": 5050, "train_info/time_within_train_step": 2.7541377544403076, "step": 5050} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746580648, "_runtime": 14657}, "step": 5050} {"logs": {"train/loss": 3.624, "train/learning_rate": 0.00033, "train/epoch": 5.08, "_timestamp": 1746580648, "_runtime": 14657}, "step": 5050} {"train_info/time_between_train_steps": 0.013750553131103516, "step": 5050} {"info/global_step": 5051, "train_info/time_within_train_step": 2.755307912826538, "step": 5051} {"train_info/time_between_train_steps": 0.002973318099975586, "step": 5051} {"info/global_step": 5052, "train_info/time_within_train_step": 2.754286289215088, "step": 5052} {"train_info/time_between_train_steps": 0.0029914379119873047, "step": 5052} {"info/global_step": 5053, "train_info/time_within_train_step": 2.753795623779297, "step": 5053} {"train_info/time_between_train_steps": 0.0030634403228759766, "step": 5053} {"info/global_step": 5054, "train_info/time_within_train_step": 2.7549211978912354, "step": 5054} {"train_info/time_between_train_steps": 0.0029811859130859375, "step": 5054} {"info/global_step": 5055, "train_info/time_within_train_step": 2.7541935443878174, "step": 5055} {"train_info/time_between_train_steps": 0.0029761791229248047, "step": 5055} {"info/global_step": 5056, "train_info/time_within_train_step": 2.753255844116211, "step": 5056} {"train_info/time_between_train_steps": 0.003019571304321289, "step": 5056} {"info/global_step": 5057, "train_info/time_within_train_step": 2.753458261489868, "step": 5057} {"train_info/time_between_train_steps": 0.0029761791229248047, "step": 5057} {"info/global_step": 5058, "train_info/time_within_train_step": 2.755349636077881, "step": 5058} {"train_info/time_between_train_steps": 0.003048419952392578, "step": 5058} {"info/global_step": 5059, "train_info/time_within_train_step": 2.752362012863159, "step": 5059} {"train_info/time_between_train_steps": 0.002969026565551758, "step": 5059} {"info/global_step": 5060, "train_info/time_within_train_step": 2.753988027572632, "step": 5060} {"train_info/time_between_train_steps": 0.0029807090759277344, "step": 5060} {"info/global_step": 5061, "train_info/time_within_train_step": 2.7531557083129883, "step": 5061} {"train_info/time_between_train_steps": 0.0029981136322021484, "step": 5061} {"info/global_step": 5062, "train_info/time_within_train_step": 2.7533023357391357, "step": 5062} {"train_info/time_between_train_steps": 0.0030281543731689453, "step": 5062} {"info/global_step": 5063, "train_info/time_within_train_step": 2.752983808517456, "step": 5063} {"train_info/time_between_train_steps": 0.002922534942626953, "step": 5063} {"info/global_step": 5064, "train_info/time_within_train_step": 2.753553867340088, "step": 5064} {"train_info/time_between_train_steps": 0.0029964447021484375, "step": 5064} {"info/global_step": 5065, "train_info/time_within_train_step": 2.7528305053710938, "step": 5065} {"train_info/time_between_train_steps": 0.002948284149169922, "step": 5065} {"info/global_step": 5066, "train_info/time_within_train_step": 2.753502607345581, "step": 5066} {"train_info/time_between_train_steps": 0.0029332637786865234, "step": 5066} {"info/global_step": 5067, "train_info/time_within_train_step": 2.7540512084960938, "step": 5067} {"train_info/time_between_train_steps": 0.0029604434967041016, "step": 5067} {"info/global_step": 5068, "train_info/time_within_train_step": 2.7536590099334717, "step": 5068} {"train_info/time_between_train_steps": 0.0029296875, "step": 5068} {"info/global_step": 5069, "train_info/time_within_train_step": 2.7534472942352295, "step": 5069} {"train_info/time_between_train_steps": 0.0029366016387939453, "step": 5069} {"info/global_step": 5070, "train_info/time_within_train_step": 2.753823757171631, "step": 5070} {"train_info/time_between_train_steps": 0.0029582977294921875, "step": 5070} {"info/global_step": 5071, "train_info/time_within_train_step": 2.752965211868286, "step": 5071} {"train_info/time_between_train_steps": 0.0028922557830810547, "step": 5071} {"info/global_step": 5072, "train_info/time_within_train_step": 2.7530298233032227, "step": 5072} {"train_info/time_between_train_steps": 0.0028951168060302734, "step": 5072} {"info/global_step": 5073, "train_info/time_within_train_step": 2.752742290496826, "step": 5073} {"train_info/time_between_train_steps": 0.002933502197265625, "step": 5073} {"info/global_step": 5074, "train_info/time_within_train_step": 2.752303123474121, "step": 5074} {"train_info/time_between_train_steps": 0.0028870105743408203, "step": 5074} {"info/global_step": 5075, "train_info/time_within_train_step": 2.7526652812957764, "step": 5075} {"train_info/time_between_train_steps": 0.0029306411743164062, "step": 5075} {"info/global_step": 5076, "train_info/time_within_train_step": 2.7543013095855713, "step": 5076} {"train_info/time_between_train_steps": 0.0034568309783935547, "step": 5076} {"info/global_step": 5077, "train_info/time_within_train_step": 2.7520415782928467, "step": 5077} {"train_info/time_between_train_steps": 0.002932310104370117, "step": 5077} {"info/global_step": 5078, "train_info/time_within_train_step": 2.751939296722412, "step": 5078} {"train_info/time_between_train_steps": 0.002897977828979492, "step": 5078} {"info/global_step": 5079, "train_info/time_within_train_step": 2.752617835998535, "step": 5079} {"train_info/time_between_train_steps": 0.0028862953186035156, "step": 5079} {"info/global_step": 5080, "train_info/time_within_train_step": 2.750854253768921, "step": 5080} {"train_info/time_between_train_steps": 0.0030426979064941406, "step": 5080} {"info/global_step": 5081, "train_info/time_within_train_step": 2.752638578414917, "step": 5081} {"train_info/time_between_train_steps": 0.0029587745666503906, "step": 5081} {"info/global_step": 5082, "train_info/time_within_train_step": 2.753368854522705, "step": 5082} {"train_info/time_between_train_steps": 0.0029027462005615234, "step": 5082} {"info/global_step": 5083, "train_info/time_within_train_step": 2.753455877304077, "step": 5083} {"train_info/time_between_train_steps": 0.002997159957885742, "step": 5083} {"info/global_step": 5084, "train_info/time_within_train_step": 2.7535200119018555, "step": 5084} {"train_info/time_between_train_steps": 0.002935171127319336, "step": 5084} {"info/global_step": 5085, "train_info/time_within_train_step": 2.7534234523773193, "step": 5085} {"train_info/time_between_train_steps": 0.0028963088989257812, "step": 5085} {"info/global_step": 5086, "train_info/time_within_train_step": 2.752617597579956, "step": 5086} {"train_info/time_between_train_steps": 0.0028853416442871094, "step": 5086} {"info/global_step": 5087, "train_info/time_within_train_step": 2.7530901432037354, "step": 5087} {"train_info/time_between_train_steps": 0.002924680709838867, "step": 5087} {"info/global_step": 5088, "train_info/time_within_train_step": 2.7539594173431396, "step": 5088} {"train_info/time_between_train_steps": 0.002890348434448242, "step": 5088} {"info/global_step": 5089, "train_info/time_within_train_step": 2.7529730796813965, "step": 5089} {"train_info/time_between_train_steps": 0.0029876232147216797, "step": 5089} {"info/global_step": 5090, "train_info/time_within_train_step": 2.752180337905884, "step": 5090} {"train_info/time_between_train_steps": 0.002895832061767578, "step": 5090} {"info/global_step": 5091, "train_info/time_within_train_step": 2.7521355152130127, "step": 5091} {"train_info/time_between_train_steps": 0.0030663013458251953, "step": 5091} {"info/global_step": 5092, "train_info/time_within_train_step": 2.7520713806152344, "step": 5092} {"train_info/time_between_train_steps": 0.0030269622802734375, "step": 5092} {"info/global_step": 5093, "train_info/time_within_train_step": 2.752363920211792, "step": 5093} {"train_info/time_between_train_steps": 0.0029306411743164062, "step": 5093} {"info/global_step": 5094, "train_info/time_within_train_step": 2.7528960704803467, "step": 5094} {"train_info/time_between_train_steps": 0.003036022186279297, "step": 5094} {"info/global_step": 5095, "train_info/time_within_train_step": 2.751491069793701, "step": 5095} {"train_info/time_between_train_steps": 0.0029039382934570312, "step": 5095} {"info/global_step": 5096, "train_info/time_within_train_step": 2.7504312992095947, "step": 5096} {"train_info/time_between_train_steps": 0.002948760986328125, "step": 5096} {"info/global_step": 5097, "train_info/time_within_train_step": 2.7533204555511475, "step": 5097} {"train_info/time_between_train_steps": 0.003065824508666992, "step": 5097} {"info/global_step": 5098, "train_info/time_within_train_step": 2.7696585655212402, "step": 5098} {"train_info/time_between_train_steps": 0.0030028820037841797, "step": 5098} {"info/global_step": 5099, "train_info/time_within_train_step": 2.755133628845215, "step": 5099} {"train_info/time_between_train_steps": 0.003141164779663086, "step": 5099} {"info/global_step": 5100, "train_info/time_within_train_step": 2.7551872730255127, "step": 5100} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746580786, "_runtime": 14795}, "step": 5100} {"logs": {"train/loss": 3.6167, "train/learning_rate": 0.0003266666666666666, "train/epoch": 5.08, "_timestamp": 1746580786, "_runtime": 14795}, "step": 5100} {"train_info/time_between_train_steps": 0.02398395538330078, "step": 5100} {"info/global_step": 5101, "train_info/time_within_train_step": 2.752934455871582, "step": 5101} {"train_info/time_between_train_steps": 0.0029015541076660156, "step": 5101} {"info/global_step": 5102, "train_info/time_within_train_step": 2.75386643409729, "step": 5102} {"train_info/time_between_train_steps": 0.0030198097229003906, "step": 5102} {"info/global_step": 5103, "train_info/time_within_train_step": 2.753913402557373, "step": 5103} {"train_info/time_between_train_steps": 0.002968311309814453, "step": 5103} {"info/global_step": 5104, "train_info/time_within_train_step": 2.753572463989258, "step": 5104} {"train_info/time_between_train_steps": 0.003036022186279297, "step": 5104} {"info/global_step": 5105, "train_info/time_within_train_step": 2.7530200481414795, "step": 5105} {"train_info/time_between_train_steps": 0.003262758255004883, "step": 5105} {"info/global_step": 5106, "train_info/time_within_train_step": 2.7531988620758057, "step": 5106} {"train_info/time_between_train_steps": 0.0031151771545410156, "step": 5106} {"info/global_step": 5107, "train_info/time_within_train_step": 2.7529456615448, "step": 5107} {"train_info/time_between_train_steps": 0.0029811859130859375, "step": 5107} {"info/global_step": 5108, "train_info/time_within_train_step": 2.7521071434020996, "step": 5108} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 5108} {"info/global_step": 5109, "train_info/time_within_train_step": 2.754194974899292, "step": 5109} {"train_info/time_between_train_steps": 0.0031456947326660156, "step": 5109} {"info/global_step": 5110, "train_info/time_within_train_step": 2.7533233165740967, "step": 5110} {"train_info/time_between_train_steps": 0.003119945526123047, "step": 5110} {"info/global_step": 5111, "train_info/time_within_train_step": 2.754084825515747, "step": 5111} {"train_info/time_between_train_steps": 0.0033283233642578125, "step": 5111} {"info/global_step": 5112, "train_info/time_within_train_step": 2.753904104232788, "step": 5112} {"train_info/time_between_train_steps": 0.0030884742736816406, "step": 5112} {"info/global_step": 5113, "train_info/time_within_train_step": 2.7542099952697754, "step": 5113} {"train_info/time_between_train_steps": 0.0033483505249023438, "step": 5113} {"info/global_step": 5114, "train_info/time_within_train_step": 2.754572868347168, "step": 5114} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 5114} {"info/global_step": 5115, "train_info/time_within_train_step": 2.7537972927093506, "step": 5115} {"train_info/time_between_train_steps": 0.003251791000366211, "step": 5115} {"info/global_step": 5116, "train_info/time_within_train_step": 2.754058361053467, "step": 5116} {"train_info/time_between_train_steps": 0.003246784210205078, "step": 5116} {"info/global_step": 5117, "train_info/time_within_train_step": 2.7552340030670166, "step": 5117} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 5117} {"info/global_step": 5118, "train_info/time_within_train_step": 2.753732919692993, "step": 5118} {"train_info/time_between_train_steps": 0.003401041030883789, "step": 5118} {"train_info/time_between_train_steps": 3.1940574645996094, "step": 5118} {"info/global_step": 5119, "train_info/time_within_train_step": 2.6749613285064697, "step": 5119} {"train_info/time_between_train_steps": 0.0031561851501464844, "step": 5119} {"info/global_step": 5120, "train_info/time_within_train_step": 2.753103017807007, "step": 5120} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 5120} {"info/global_step": 5121, "train_info/time_within_train_step": 2.754270076751709, "step": 5121} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 5121} {"info/global_step": 5122, "train_info/time_within_train_step": 2.7537553310394287, "step": 5122} {"train_info/time_between_train_steps": 0.003112316131591797, "step": 5122} {"info/global_step": 5123, "train_info/time_within_train_step": 2.754389762878418, "step": 5123} {"train_info/time_between_train_steps": 0.0031213760375976562, "step": 5123} {"info/global_step": 5124, "train_info/time_within_train_step": 2.7526605129241943, "step": 5124} {"train_info/time_between_train_steps": 0.003131866455078125, "step": 5124} {"info/global_step": 5125, "train_info/time_within_train_step": 2.754199743270874, "step": 5125} {"train_info/time_between_train_steps": 0.003113985061645508, "step": 5125} {"info/global_step": 5126, "train_info/time_within_train_step": 2.753567695617676, "step": 5126} {"train_info/time_between_train_steps": 0.0035822391510009766, "step": 5126} {"info/global_step": 5127, "train_info/time_within_train_step": 2.754687786102295, "step": 5127} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 5127} {"info/global_step": 5128, "train_info/time_within_train_step": 2.754218339920044, "step": 5128} {"train_info/time_between_train_steps": 0.0032188892364501953, "step": 5128} {"info/global_step": 5129, "train_info/time_within_train_step": 2.7552545070648193, "step": 5129} {"train_info/time_between_train_steps": 0.003128528594970703, "step": 5129} {"info/global_step": 5130, "train_info/time_within_train_step": 2.7548961639404297, "step": 5130} {"train_info/time_between_train_steps": 0.003307342529296875, "step": 5130} {"info/global_step": 5131, "train_info/time_within_train_step": 2.755126953125, "step": 5131} {"train_info/time_between_train_steps": 0.003263235092163086, "step": 5131} {"info/global_step": 5132, "train_info/time_within_train_step": 2.7536814212799072, "step": 5132} {"train_info/time_between_train_steps": 0.003265857696533203, "step": 5132} {"info/global_step": 5133, "train_info/time_within_train_step": 2.7546539306640625, "step": 5133} {"train_info/time_between_train_steps": 0.0033092498779296875, "step": 5133} {"info/global_step": 5134, "train_info/time_within_train_step": 2.7551634311676025, "step": 5134} {"train_info/time_between_train_steps": 0.0033082962036132812, "step": 5134} {"info/global_step": 5135, "train_info/time_within_train_step": 2.754742383956909, "step": 5135} {"train_info/time_between_train_steps": 0.0032727718353271484, "step": 5135} {"info/global_step": 5136, "train_info/time_within_train_step": 2.965426445007324, "step": 5136} {"train_info/time_between_train_steps": 0.0033838748931884766, "step": 5136} {"info/global_step": 5137, "train_info/time_within_train_step": 2.7542316913604736, "step": 5137} {"train_info/time_between_train_steps": 0.003282785415649414, "step": 5137} {"info/global_step": 5138, "train_info/time_within_train_step": 2.7552919387817383, "step": 5138} {"train_info/time_between_train_steps": 0.003297090530395508, "step": 5138} {"info/global_step": 5139, "train_info/time_within_train_step": 2.7541892528533936, "step": 5139} {"train_info/time_between_train_steps": 0.0032634735107421875, "step": 5139} {"info/global_step": 5140, "train_info/time_within_train_step": 2.7535512447357178, "step": 5140} {"train_info/time_between_train_steps": 0.003248453140258789, "step": 5140} {"info/global_step": 5141, "train_info/time_within_train_step": 2.7548604011535645, "step": 5141} {"train_info/time_between_train_steps": 0.0038712024688720703, "step": 5141} {"info/global_step": 5142, "train_info/time_within_train_step": 2.755110263824463, "step": 5142} {"train_info/time_between_train_steps": 0.0032753944396972656, "step": 5142} {"info/global_step": 5143, "train_info/time_within_train_step": 2.7552435398101807, "step": 5143} {"train_info/time_between_train_steps": 0.0032999515533447266, "step": 5143} {"info/global_step": 5144, "train_info/time_within_train_step": 2.75533390045166, "step": 5144} {"train_info/time_between_train_steps": 0.0032956600189208984, "step": 5144} {"info/global_step": 5145, "train_info/time_within_train_step": 2.7552714347839355, "step": 5145} {"train_info/time_between_train_steps": 0.003277301788330078, "step": 5145} {"info/global_step": 5146, "train_info/time_within_train_step": 2.7550230026245117, "step": 5146} {"train_info/time_between_train_steps": 0.0032455921173095703, "step": 5146} {"info/global_step": 5147, "train_info/time_within_train_step": 2.7551658153533936, "step": 5147} {"train_info/time_between_train_steps": 0.003278970718383789, "step": 5147} {"info/global_step": 5148, "train_info/time_within_train_step": 2.7549102306365967, "step": 5148} {"train_info/time_between_train_steps": 0.0032656192779541016, "step": 5148} {"info/global_step": 5149, "train_info/time_within_train_step": 2.753734827041626, "step": 5149} {"train_info/time_between_train_steps": 0.0030961036682128906, "step": 5149} {"info/global_step": 5150, "train_info/time_within_train_step": 2.754706859588623, "step": 5150} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746580928, "_runtime": 14937}, "step": 5150} {"logs": {"train/loss": 3.6528, "train/learning_rate": 0.0003233333333333333, "train/epoch": 6.0, "_timestamp": 1746580928, "_runtime": 14937}, "step": 5150} {"train_info/time_between_train_steps": 0.011349201202392578, "step": 5150} {"info/global_step": 5151, "train_info/time_within_train_step": 2.754678726196289, "step": 5151} {"train_info/time_between_train_steps": 0.0031120777130126953, "step": 5151} {"info/global_step": 5152, "train_info/time_within_train_step": 2.754549503326416, "step": 5152} {"train_info/time_between_train_steps": 0.003199338912963867, "step": 5152} {"info/global_step": 5153, "train_info/time_within_train_step": 2.7540316581726074, "step": 5153} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 5153} {"info/global_step": 5154, "train_info/time_within_train_step": 2.7549800872802734, "step": 5154} {"train_info/time_between_train_steps": 0.003154277801513672, "step": 5154} {"info/global_step": 5155, "train_info/time_within_train_step": 2.7555181980133057, "step": 5155} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 5155} {"info/global_step": 5156, "train_info/time_within_train_step": 2.7545154094696045, "step": 5156} {"train_info/time_between_train_steps": 0.0031638145446777344, "step": 5156} {"info/global_step": 5157, "train_info/time_within_train_step": 2.754546880722046, "step": 5157} {"train_info/time_between_train_steps": 0.003208160400390625, "step": 5157} {"info/global_step": 5158, "train_info/time_within_train_step": 2.755411386489868, "step": 5158} {"train_info/time_between_train_steps": 0.0033779144287109375, "step": 5158} {"info/global_step": 5159, "train_info/time_within_train_step": 2.755582094192505, "step": 5159} {"train_info/time_between_train_steps": 0.003289937973022461, "step": 5159} {"info/global_step": 5160, "train_info/time_within_train_step": 2.7549898624420166, "step": 5160} {"train_info/time_between_train_steps": 0.0032737255096435547, "step": 5160} {"info/global_step": 5161, "train_info/time_within_train_step": 2.755997896194458, "step": 5161} {"train_info/time_between_train_steps": 0.0032885074615478516, "step": 5161} {"info/global_step": 5162, "train_info/time_within_train_step": 2.7560300827026367, "step": 5162} {"train_info/time_between_train_steps": 0.0032601356506347656, "step": 5162} {"info/global_step": 5163, "train_info/time_within_train_step": 2.7557013034820557, "step": 5163} {"train_info/time_between_train_steps": 0.0033104419708251953, "step": 5163} {"info/global_step": 5164, "train_info/time_within_train_step": 2.7565958499908447, "step": 5164} {"train_info/time_between_train_steps": 0.003303050994873047, "step": 5164} {"info/global_step": 5165, "train_info/time_within_train_step": 2.757089376449585, "step": 5165} {"train_info/time_between_train_steps": 0.0032918453216552734, "step": 5165} {"info/global_step": 5166, "train_info/time_within_train_step": 2.7551984786987305, "step": 5166} {"train_info/time_between_train_steps": 0.003210783004760742, "step": 5166} {"info/global_step": 5167, "train_info/time_within_train_step": 2.755478620529175, "step": 5167} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 5167} {"info/global_step": 5168, "train_info/time_within_train_step": 2.7557268142700195, "step": 5168} {"train_info/time_between_train_steps": 0.0031142234802246094, "step": 5168} {"info/global_step": 5169, "train_info/time_within_train_step": 2.755378484725952, "step": 5169} {"train_info/time_between_train_steps": 0.0031080245971679688, "step": 5169} {"info/global_step": 5170, "train_info/time_within_train_step": 2.754589796066284, "step": 5170} {"train_info/time_between_train_steps": 0.0032117366790771484, "step": 5170} {"info/global_step": 5171, "train_info/time_within_train_step": 2.754368782043457, "step": 5171} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 5171} {"info/global_step": 5172, "train_info/time_within_train_step": 2.75361967086792, "step": 5172} {"train_info/time_between_train_steps": 0.0031502246856689453, "step": 5172} {"info/global_step": 5173, "train_info/time_within_train_step": 2.7555413246154785, "step": 5173} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 5173} {"info/global_step": 5174, "train_info/time_within_train_step": 2.7563138008117676, "step": 5174} {"train_info/time_between_train_steps": 0.0032248497009277344, "step": 5174} {"info/global_step": 5175, "train_info/time_within_train_step": 2.7539608478546143, "step": 5175} {"train_info/time_between_train_steps": 0.003130674362182617, "step": 5175} {"info/global_step": 5176, "train_info/time_within_train_step": 2.753788948059082, "step": 5176} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 5176} {"info/global_step": 5177, "train_info/time_within_train_step": 2.7542426586151123, "step": 5177} {"train_info/time_between_train_steps": 0.0032453536987304688, "step": 5177} {"info/global_step": 5178, "train_info/time_within_train_step": 2.75303053855896, "step": 5178} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 5178} {"info/global_step": 5179, "train_info/time_within_train_step": 2.7554397583007812, "step": 5179} {"train_info/time_between_train_steps": 0.003271818161010742, "step": 5179} {"info/global_step": 5180, "train_info/time_within_train_step": 2.7534825801849365, "step": 5180} {"train_info/time_between_train_steps": 0.0032432079315185547, "step": 5180} {"info/global_step": 5181, "train_info/time_within_train_step": 2.8797550201416016, "step": 5181} {"train_info/time_between_train_steps": 0.0032155513763427734, "step": 5181} {"info/global_step": 5182, "train_info/time_within_train_step": 2.756047010421753, "step": 5182} {"train_info/time_between_train_steps": 0.0032205581665039062, "step": 5182} {"info/global_step": 5183, "train_info/time_within_train_step": 2.7546744346618652, "step": 5183} {"train_info/time_between_train_steps": 0.003206014633178711, "step": 5183} {"info/global_step": 5184, "train_info/time_within_train_step": 2.7551748752593994, "step": 5184} {"train_info/time_between_train_steps": 0.0032987594604492188, "step": 5184} {"info/global_step": 5185, "train_info/time_within_train_step": 2.755878210067749, "step": 5185} {"train_info/time_between_train_steps": 0.0032796859741210938, "step": 5185} {"info/global_step": 5186, "train_info/time_within_train_step": 2.7556934356689453, "step": 5186} {"train_info/time_between_train_steps": 0.0032973289489746094, "step": 5186} {"info/global_step": 5187, "train_info/time_within_train_step": 2.755328893661499, "step": 5187} {"train_info/time_between_train_steps": 0.0033800601959228516, "step": 5187} {"info/global_step": 5188, "train_info/time_within_train_step": 2.755044937133789, "step": 5188} {"train_info/time_between_train_steps": 0.003408193588256836, "step": 5188} {"info/global_step": 5189, "train_info/time_within_train_step": 2.7546379566192627, "step": 5189} {"train_info/time_between_train_steps": 0.003515481948852539, "step": 5189} {"info/global_step": 5190, "train_info/time_within_train_step": 2.7547531127929688, "step": 5190} {"train_info/time_between_train_steps": 0.0033702850341796875, "step": 5190} {"info/global_step": 5191, "train_info/time_within_train_step": 2.7547316551208496, "step": 5191} {"train_info/time_between_train_steps": 0.003317117691040039, "step": 5191} {"info/global_step": 5192, "train_info/time_within_train_step": 2.7552852630615234, "step": 5192} {"train_info/time_between_train_steps": 0.0033388137817382812, "step": 5192} {"info/global_step": 5193, "train_info/time_within_train_step": 2.755525588989258, "step": 5193} {"train_info/time_between_train_steps": 0.0033478736877441406, "step": 5193} {"info/global_step": 5194, "train_info/time_within_train_step": 2.7561748027801514, "step": 5194} {"train_info/time_between_train_steps": 0.0033349990844726562, "step": 5194} {"info/global_step": 5195, "train_info/time_within_train_step": 2.7564406394958496, "step": 5195} {"train_info/time_between_train_steps": 0.0032949447631835938, "step": 5195} {"info/global_step": 5196, "train_info/time_within_train_step": 2.755758762359619, "step": 5196} {"train_info/time_between_train_steps": 0.0034208297729492188, "step": 5196} {"info/global_step": 5197, "train_info/time_within_train_step": 2.755044460296631, "step": 5197} {"train_info/time_between_train_steps": 0.0034532546997070312, "step": 5197} {"info/global_step": 5198, "train_info/time_within_train_step": 2.7565078735351562, "step": 5198} {"train_info/time_between_train_steps": 0.0033578872680664062, "step": 5198} {"info/global_step": 5199, "train_info/time_within_train_step": 2.755964994430542, "step": 5199} {"train_info/time_between_train_steps": 0.003372669219970703, "step": 5199} {"info/global_step": 5200, "train_info/time_within_train_step": 2.756633996963501, "step": 5200} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746581066, "_runtime": 15075}, "step": 5200} {"logs": {"train/loss": 3.5993, "train/learning_rate": 0.00031999999999999997, "train/epoch": 6.01, "_timestamp": 1746581066, "_runtime": 15075}, "step": 5200} {"train_info/time_between_train_steps": 36.38124918937683, "step": 5200} {"info/global_step": 5201, "train_info/time_within_train_step": 2.535177230834961, "step": 5201} {"train_info/time_between_train_steps": 0.003365755081176758, "step": 5201} {"info/global_step": 5202, "train_info/time_within_train_step": 2.5532023906707764, "step": 5202} {"train_info/time_between_train_steps": 0.0033178329467773438, "step": 5202} {"info/global_step": 5203, "train_info/time_within_train_step": 2.6726136207580566, "step": 5203} {"train_info/time_between_train_steps": 0.0033724308013916016, "step": 5203} {"info/global_step": 5204, "train_info/time_within_train_step": 2.684063673019409, "step": 5204} {"train_info/time_between_train_steps": 0.0033392906188964844, "step": 5204} {"info/global_step": 5205, "train_info/time_within_train_step": 2.7031123638153076, "step": 5205} {"train_info/time_between_train_steps": 0.0033905506134033203, "step": 5205} {"info/global_step": 5206, "train_info/time_within_train_step": 2.720311164855957, "step": 5206} {"train_info/time_between_train_steps": 0.0034186840057373047, "step": 5206} {"info/global_step": 5207, "train_info/time_within_train_step": 2.7528905868530273, "step": 5207} {"train_info/time_between_train_steps": 0.0033731460571289062, "step": 5207} {"info/global_step": 5208, "train_info/time_within_train_step": 2.7553133964538574, "step": 5208} {"train_info/time_between_train_steps": 0.0033702850341796875, "step": 5208} {"info/global_step": 5209, "train_info/time_within_train_step": 2.7562673091888428, "step": 5209} {"train_info/time_between_train_steps": 0.003420114517211914, "step": 5209} {"info/global_step": 5210, "train_info/time_within_train_step": 2.7572221755981445, "step": 5210} {"train_info/time_between_train_steps": 0.003364086151123047, "step": 5210} {"info/global_step": 5211, "train_info/time_within_train_step": 2.756126642227173, "step": 5211} {"train_info/time_between_train_steps": 0.0033447742462158203, "step": 5211} {"info/global_step": 5212, "train_info/time_within_train_step": 2.755880117416382, "step": 5212} {"train_info/time_between_train_steps": 0.0033185482025146484, "step": 5212} {"info/global_step": 5213, "train_info/time_within_train_step": 2.7565019130706787, "step": 5213} {"train_info/time_between_train_steps": 0.0033414363861083984, "step": 5213} {"info/global_step": 5214, "train_info/time_within_train_step": 2.756525754928589, "step": 5214} {"train_info/time_between_train_steps": 0.0033197402954101562, "step": 5214} {"info/global_step": 5215, "train_info/time_within_train_step": 2.7576262950897217, "step": 5215} {"train_info/time_between_train_steps": 0.003342151641845703, "step": 5215} {"info/global_step": 5216, "train_info/time_within_train_step": 2.9980437755584717, "step": 5216} {"train_info/time_between_train_steps": 0.0034155845642089844, "step": 5216} {"info/global_step": 5217, "train_info/time_within_train_step": 2.7557127475738525, "step": 5217} {"train_info/time_between_train_steps": 0.0031845569610595703, "step": 5217} {"info/global_step": 5218, "train_info/time_within_train_step": 2.7579269409179688, "step": 5218} {"train_info/time_between_train_steps": 0.0032181739807128906, "step": 5218} {"info/global_step": 5219, "train_info/time_within_train_step": 2.7553141117095947, "step": 5219} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 5219} {"info/global_step": 5220, "train_info/time_within_train_step": 2.754633903503418, "step": 5220} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 5220} {"info/global_step": 5221, "train_info/time_within_train_step": 2.7556076049804688, "step": 5221} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 5221} {"info/global_step": 5222, "train_info/time_within_train_step": 2.7547919750213623, "step": 5222} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 5222} {"info/global_step": 5223, "train_info/time_within_train_step": 2.754568338394165, "step": 5223} {"train_info/time_between_train_steps": 0.003162384033203125, "step": 5223} {"info/global_step": 5224, "train_info/time_within_train_step": 2.7532198429107666, "step": 5224} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 5224} {"info/global_step": 5225, "train_info/time_within_train_step": 2.7565643787384033, "step": 5225} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 5225} {"info/global_step": 5226, "train_info/time_within_train_step": 2.7562220096588135, "step": 5226} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 5226} {"info/global_step": 5227, "train_info/time_within_train_step": 2.755490303039551, "step": 5227} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 5227} {"info/global_step": 5228, "train_info/time_within_train_step": 2.756317377090454, "step": 5228} {"train_info/time_between_train_steps": 0.003137826919555664, "step": 5228} {"info/global_step": 5229, "train_info/time_within_train_step": 2.7559502124786377, "step": 5229} {"train_info/time_between_train_steps": 0.003200531005859375, "step": 5229} {"info/global_step": 5230, "train_info/time_within_train_step": 2.754997968673706, "step": 5230} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 5230} {"info/global_step": 5231, "train_info/time_within_train_step": 2.755491018295288, "step": 5231} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 5231} {"info/global_step": 5232, "train_info/time_within_train_step": 2.7566254138946533, "step": 5232} {"train_info/time_between_train_steps": 0.003140687942504883, "step": 5232} {"info/global_step": 5233, "train_info/time_within_train_step": 2.7562170028686523, "step": 5233} {"train_info/time_between_train_steps": 0.003158092498779297, "step": 5233} {"info/global_step": 5234, "train_info/time_within_train_step": 2.755312442779541, "step": 5234} {"train_info/time_between_train_steps": 0.003285646438598633, "step": 5234} {"info/global_step": 5235, "train_info/time_within_train_step": 2.7561702728271484, "step": 5235} {"train_info/time_between_train_steps": 0.0032143592834472656, "step": 5235} {"info/global_step": 5236, "train_info/time_within_train_step": 2.7558646202087402, "step": 5236} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 5236} {"info/global_step": 5237, "train_info/time_within_train_step": 2.7553486824035645, "step": 5237} {"train_info/time_between_train_steps": 0.0032529830932617188, "step": 5237} {"info/global_step": 5238, "train_info/time_within_train_step": 2.754704236984253, "step": 5238} {"train_info/time_between_train_steps": 0.003239154815673828, "step": 5238} {"info/global_step": 5239, "train_info/time_within_train_step": 2.7558889389038086, "step": 5239} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 5239} {"info/global_step": 5240, "train_info/time_within_train_step": 2.7569212913513184, "step": 5240} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 5240} {"info/global_step": 5241, "train_info/time_within_train_step": 2.7556447982788086, "step": 5241} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 5241} {"info/global_step": 5242, "train_info/time_within_train_step": 2.7544853687286377, "step": 5242} {"train_info/time_between_train_steps": 0.0032410621643066406, "step": 5242} {"info/global_step": 5243, "train_info/time_within_train_step": 2.755584239959717, "step": 5243} {"train_info/time_between_train_steps": 0.1365795135498047, "step": 5243} {"info/global_step": 5244, "train_info/time_within_train_step": 2.756957769393921, "step": 5244} {"train_info/time_between_train_steps": 0.003202199935913086, "step": 5244} {"info/global_step": 5245, "train_info/time_within_train_step": 2.7557520866394043, "step": 5245} {"train_info/time_between_train_steps": 0.003246307373046875, "step": 5245} {"info/global_step": 5246, "train_info/time_within_train_step": 2.755441427230835, "step": 5246} {"train_info/time_between_train_steps": 0.0032334327697753906, "step": 5246} {"info/global_step": 5247, "train_info/time_within_train_step": 3.3517844676971436, "step": 5247} {"train_info/time_between_train_steps": 0.003221750259399414, "step": 5247} {"info/global_step": 5248, "train_info/time_within_train_step": 2.7559385299682617, "step": 5248} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 5248} {"info/global_step": 5249, "train_info/time_within_train_step": 2.754255533218384, "step": 5249} {"train_info/time_between_train_steps": 0.003230571746826172, "step": 5249} {"info/global_step": 5250, "train_info/time_within_train_step": 2.755082368850708, "step": 5250} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746581241, "_runtime": 15250}, "step": 5250} {"logs": {"train/loss": 3.5914, "train/learning_rate": 0.00031666666666666665, "train/epoch": 6.01, "_timestamp": 1746581241, "_runtime": 15250}, "step": 5250} {"train_info/time_between_train_steps": 0.01326298713684082, "step": 5250} {"info/global_step": 5251, "train_info/time_within_train_step": 2.7545714378356934, "step": 5251} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 5251} {"info/global_step": 5252, "train_info/time_within_train_step": 2.7537503242492676, "step": 5252} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 5252} {"info/global_step": 5253, "train_info/time_within_train_step": 2.75376558303833, "step": 5253} {"train_info/time_between_train_steps": 0.0036025047302246094, "step": 5253} {"info/global_step": 5254, "train_info/time_within_train_step": 2.7549946308135986, "step": 5254} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 5254} {"info/global_step": 5255, "train_info/time_within_train_step": 2.754382371902466, "step": 5255} {"train_info/time_between_train_steps": 0.003137826919555664, "step": 5255} {"info/global_step": 5256, "train_info/time_within_train_step": 2.993567943572998, "step": 5256} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 5256} {"info/global_step": 5257, "train_info/time_within_train_step": 2.7527542114257812, "step": 5257} {"train_info/time_between_train_steps": 0.003136873245239258, "step": 5257} {"info/global_step": 5258, "train_info/time_within_train_step": 2.7531285285949707, "step": 5258} {"train_info/time_between_train_steps": 0.0031549930572509766, "step": 5258} {"info/global_step": 5259, "train_info/time_within_train_step": 2.753784656524658, "step": 5259} {"train_info/time_between_train_steps": 0.0031249523162841797, "step": 5259} {"info/global_step": 5260, "train_info/time_within_train_step": 2.7561113834381104, "step": 5260} {"train_info/time_between_train_steps": 0.0031287670135498047, "step": 5260} {"info/global_step": 5261, "train_info/time_within_train_step": 2.7551474571228027, "step": 5261} {"train_info/time_between_train_steps": 0.0031566619873046875, "step": 5261} {"info/global_step": 5262, "train_info/time_within_train_step": 2.756627082824707, "step": 5262} {"train_info/time_between_train_steps": 0.003160715103149414, "step": 5262} {"info/global_step": 5263, "train_info/time_within_train_step": 2.75484299659729, "step": 5263} {"train_info/time_between_train_steps": 0.0031502246856689453, "step": 5263} {"info/global_step": 5264, "train_info/time_within_train_step": 2.756265878677368, "step": 5264} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 5264} {"info/global_step": 5265, "train_info/time_within_train_step": 2.7795865535736084, "step": 5265} {"train_info/time_between_train_steps": 0.0031685829162597656, "step": 5265} {"info/global_step": 5266, "train_info/time_within_train_step": 2.7547290325164795, "step": 5266} {"train_info/time_between_train_steps": 0.003139019012451172, "step": 5266} {"info/global_step": 5267, "train_info/time_within_train_step": 2.7549877166748047, "step": 5267} {"train_info/time_between_train_steps": 0.003177165985107422, "step": 5267} {"info/global_step": 5268, "train_info/time_within_train_step": 2.753654956817627, "step": 5268} {"train_info/time_between_train_steps": 0.0031490325927734375, "step": 5268} {"info/global_step": 5269, "train_info/time_within_train_step": 2.754619836807251, "step": 5269} {"train_info/time_between_train_steps": 0.0031690597534179688, "step": 5269} {"info/global_step": 5270, "train_info/time_within_train_step": 2.7541048526763916, "step": 5270} {"train_info/time_between_train_steps": 0.003106832504272461, "step": 5270} {"info/global_step": 5271, "train_info/time_within_train_step": 2.7541918754577637, "step": 5271} {"train_info/time_between_train_steps": 0.003151416778564453, "step": 5271} {"info/global_step": 5272, "train_info/time_within_train_step": 2.7542247772216797, "step": 5272} {"train_info/time_between_train_steps": 0.0031180381774902344, "step": 5272} {"info/global_step": 5273, "train_info/time_within_train_step": 2.754530668258667, "step": 5273} {"train_info/time_between_train_steps": 0.0031011104583740234, "step": 5273} {"info/global_step": 5274, "train_info/time_within_train_step": 2.7549664974212646, "step": 5274} {"train_info/time_between_train_steps": 0.003134489059448242, "step": 5274} {"info/global_step": 5275, "train_info/time_within_train_step": 2.7523133754730225, "step": 5275} {"train_info/time_between_train_steps": 0.003122568130493164, "step": 5275} {"info/global_step": 5276, "train_info/time_within_train_step": 2.754201889038086, "step": 5276} {"train_info/time_between_train_steps": 0.0031290054321289062, "step": 5276} {"info/global_step": 5277, "train_info/time_within_train_step": 2.755681037902832, "step": 5277} {"train_info/time_between_train_steps": 0.003150463104248047, "step": 5277} {"info/global_step": 5278, "train_info/time_within_train_step": 2.754852056503296, "step": 5278} {"train_info/time_between_train_steps": 0.0031707286834716797, "step": 5278} {"info/global_step": 5279, "train_info/time_within_train_step": 2.7553651332855225, "step": 5279} {"train_info/time_between_train_steps": 0.0031290054321289062, "step": 5279} {"info/global_step": 5280, "train_info/time_within_train_step": 2.7557730674743652, "step": 5280} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 5280} {"info/global_step": 5281, "train_info/time_within_train_step": 2.754709243774414, "step": 5281} {"train_info/time_between_train_steps": 0.0031690597534179688, "step": 5281} {"info/global_step": 5282, "train_info/time_within_train_step": 2.756103277206421, "step": 5282} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 5282} {"info/global_step": 5283, "train_info/time_within_train_step": 2.7550034523010254, "step": 5283} {"train_info/time_between_train_steps": 0.0031769275665283203, "step": 5283} {"info/global_step": 5284, "train_info/time_within_train_step": 2.7555325031280518, "step": 5284} {"train_info/time_between_train_steps": 0.0031588077545166016, "step": 5284} {"info/global_step": 5285, "train_info/time_within_train_step": 2.7543952465057373, "step": 5285} {"train_info/time_between_train_steps": 0.003185272216796875, "step": 5285} {"info/global_step": 5286, "train_info/time_within_train_step": 2.754558563232422, "step": 5286} {"train_info/time_between_train_steps": 0.003216266632080078, "step": 5286} {"info/global_step": 5287, "train_info/time_within_train_step": 2.7545392513275146, "step": 5287} {"train_info/time_between_train_steps": 0.0031430721282958984, "step": 5287} {"info/global_step": 5288, "train_info/time_within_train_step": 2.75423002243042, "step": 5288} {"train_info/time_between_train_steps": 0.0031740665435791016, "step": 5288} {"info/global_step": 5289, "train_info/time_within_train_step": 2.7538645267486572, "step": 5289} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 5289} {"info/global_step": 5290, "train_info/time_within_train_step": 2.7541606426239014, "step": 5290} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 5290} {"info/global_step": 5291, "train_info/time_within_train_step": 2.7544138431549072, "step": 5291} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 5291} {"info/global_step": 5292, "train_info/time_within_train_step": 2.753822088241577, "step": 5292} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 5292} {"info/global_step": 5293, "train_info/time_within_train_step": 2.7548563480377197, "step": 5293} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 5293} {"info/global_step": 5294, "train_info/time_within_train_step": 2.7553815841674805, "step": 5294} {"train_info/time_between_train_steps": 0.0031592845916748047, "step": 5294} {"info/global_step": 5295, "train_info/time_within_train_step": 2.753146171569824, "step": 5295} {"train_info/time_between_train_steps": 0.0031473636627197266, "step": 5295} {"info/global_step": 5296, "train_info/time_within_train_step": 2.755464792251587, "step": 5296} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 5296} {"info/global_step": 5297, "train_info/time_within_train_step": 2.7550179958343506, "step": 5297} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 5297} {"info/global_step": 5298, "train_info/time_within_train_step": 2.755234479904175, "step": 5298} {"train_info/time_between_train_steps": 0.0031490325927734375, "step": 5298} {"info/global_step": 5299, "train_info/time_within_train_step": 2.75478458404541, "step": 5299} {"train_info/time_between_train_steps": 0.003118753433227539, "step": 5299} {"info/global_step": 5300, "train_info/time_within_train_step": 2.75540828704834, "step": 5300} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746581380, "_runtime": 15389}, "step": 5300} {"logs": {"train/loss": 3.5723, "train/learning_rate": 0.0003133333333333333, "train/epoch": 6.02, "_timestamp": 1746581380, "_runtime": 15389}, "step": 5300} {"train_info/time_between_train_steps": 0.013881921768188477, "step": 5300} {"info/global_step": 5301, "train_info/time_within_train_step": 2.7538511753082275, "step": 5301} {"train_info/time_between_train_steps": 0.003140687942504883, "step": 5301} {"info/global_step": 5302, "train_info/time_within_train_step": 2.75545334815979, "step": 5302} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 5302} {"info/global_step": 5303, "train_info/time_within_train_step": 2.754680871963501, "step": 5303} {"train_info/time_between_train_steps": 0.003117084503173828, "step": 5303} {"info/global_step": 5304, "train_info/time_within_train_step": 2.755082368850708, "step": 5304} {"train_info/time_between_train_steps": 0.0031409263610839844, "step": 5304} {"info/global_step": 5305, "train_info/time_within_train_step": 2.755974531173706, "step": 5305} {"train_info/time_between_train_steps": 0.0031304359436035156, "step": 5305} {"info/global_step": 5306, "train_info/time_within_train_step": 2.8778181076049805, "step": 5306} {"train_info/time_between_train_steps": 0.0031311511993408203, "step": 5306} {"info/global_step": 5307, "train_info/time_within_train_step": 2.754204511642456, "step": 5307} {"train_info/time_between_train_steps": 0.0031397342681884766, "step": 5307} {"info/global_step": 5308, "train_info/time_within_train_step": 2.755338668823242, "step": 5308} {"train_info/time_between_train_steps": 0.003159046173095703, "step": 5308} {"info/global_step": 5309, "train_info/time_within_train_step": 2.7547879219055176, "step": 5309} {"train_info/time_between_train_steps": 0.003175973892211914, "step": 5309} {"info/global_step": 5310, "train_info/time_within_train_step": 2.755380868911743, "step": 5310} {"train_info/time_between_train_steps": 0.003183126449584961, "step": 5310} {"info/global_step": 5311, "train_info/time_within_train_step": 2.7556896209716797, "step": 5311} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 5311} {"info/global_step": 5312, "train_info/time_within_train_step": 2.7561306953430176, "step": 5312} {"train_info/time_between_train_steps": 0.0032117366790771484, "step": 5312} {"info/global_step": 5313, "train_info/time_within_train_step": 2.755777359008789, "step": 5313} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 5313} {"info/global_step": 5314, "train_info/time_within_train_step": 2.755037307739258, "step": 5314} {"train_info/time_between_train_steps": 0.0032052993774414062, "step": 5314} {"info/global_step": 5315, "train_info/time_within_train_step": 2.7558059692382812, "step": 5315} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 5315} {"info/global_step": 5316, "train_info/time_within_train_step": 2.7550582885742188, "step": 5316} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 5316} {"info/global_step": 5317, "train_info/time_within_train_step": 2.756072521209717, "step": 5317} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 5317} {"info/global_step": 5318, "train_info/time_within_train_step": 2.755056619644165, "step": 5318} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 5318} {"info/global_step": 5319, "train_info/time_within_train_step": 2.7534091472625732, "step": 5319} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 5319} {"info/global_step": 5320, "train_info/time_within_train_step": 2.7549350261688232, "step": 5320} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 5320} {"info/global_step": 5321, "train_info/time_within_train_step": 2.7541143894195557, "step": 5321} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 5321} {"info/global_step": 5322, "train_info/time_within_train_step": 2.7532968521118164, "step": 5322} {"train_info/time_between_train_steps": 0.0031588077545166016, "step": 5322} {"info/global_step": 5323, "train_info/time_within_train_step": 2.754045248031616, "step": 5323} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 5323} {"info/global_step": 5324, "train_info/time_within_train_step": 2.7542147636413574, "step": 5324} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 5324} {"info/global_step": 5325, "train_info/time_within_train_step": 2.755521297454834, "step": 5325} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 5325} {"info/global_step": 5326, "train_info/time_within_train_step": 2.7548582553863525, "step": 5326} {"train_info/time_between_train_steps": 0.0031495094299316406, "step": 5326} {"info/global_step": 5327, "train_info/time_within_train_step": 2.755415678024292, "step": 5327} {"train_info/time_between_train_steps": 0.003179788589477539, "step": 5327} {"info/global_step": 5328, "train_info/time_within_train_step": 2.7552521228790283, "step": 5328} {"train_info/time_between_train_steps": 0.003158092498779297, "step": 5328} {"info/global_step": 5329, "train_info/time_within_train_step": 2.754739999771118, "step": 5329} {"train_info/time_between_train_steps": 0.0031571388244628906, "step": 5329} {"info/global_step": 5330, "train_info/time_within_train_step": 2.7532846927642822, "step": 5330} {"train_info/time_between_train_steps": 0.0036308765411376953, "step": 5330} {"info/global_step": 5331, "train_info/time_within_train_step": 2.754704475402832, "step": 5331} {"train_info/time_between_train_steps": 0.003236532211303711, "step": 5331} {"info/global_step": 5332, "train_info/time_within_train_step": 2.7538204193115234, "step": 5332} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 5332} {"info/global_step": 5333, "train_info/time_within_train_step": 2.754943370819092, "step": 5333} {"train_info/time_between_train_steps": 0.0031824111938476562, "step": 5333} {"info/global_step": 5334, "train_info/time_within_train_step": 2.754875421524048, "step": 5334} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 5334} {"info/global_step": 5335, "train_info/time_within_train_step": 2.75514554977417, "step": 5335} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 5335} {"info/global_step": 5336, "train_info/time_within_train_step": 2.7550783157348633, "step": 5336} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 5336} {"info/global_step": 5337, "train_info/time_within_train_step": 2.753422737121582, "step": 5337} {"train_info/time_between_train_steps": 0.003167390823364258, "step": 5337} {"info/global_step": 5338, "train_info/time_within_train_step": 2.7550220489501953, "step": 5338} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 5338} {"info/global_step": 5339, "train_info/time_within_train_step": 2.7536051273345947, "step": 5339} {"train_info/time_between_train_steps": 0.0031702518463134766, "step": 5339} {"info/global_step": 5340, "train_info/time_within_train_step": 2.754722833633423, "step": 5340} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 5340} {"info/global_step": 5341, "train_info/time_within_train_step": 2.75400447845459, "step": 5341} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 5341} {"info/global_step": 5342, "train_info/time_within_train_step": 2.7545113563537598, "step": 5342} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 5342} {"info/global_step": 5343, "train_info/time_within_train_step": 2.7537930011749268, "step": 5343} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 5343} {"info/global_step": 5344, "train_info/time_within_train_step": 2.7538812160491943, "step": 5344} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 5344} {"info/global_step": 5345, "train_info/time_within_train_step": 2.7547833919525146, "step": 5345} {"train_info/time_between_train_steps": 0.003135204315185547, "step": 5345} {"info/global_step": 5346, "train_info/time_within_train_step": 2.7541236877441406, "step": 5346} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 5346} {"info/global_step": 5347, "train_info/time_within_train_step": 2.9984469413757324, "step": 5347} {"train_info/time_between_train_steps": 0.003130197525024414, "step": 5347} {"info/global_step": 5348, "train_info/time_within_train_step": 2.754301071166992, "step": 5348} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 5348} {"info/global_step": 5349, "train_info/time_within_train_step": 2.753960132598877, "step": 5349} {"train_info/time_between_train_steps": 0.003129243850708008, "step": 5349} {"info/global_step": 5350, "train_info/time_within_train_step": 2.754664182662964, "step": 5350} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746581519, "_runtime": 15528}, "step": 5350} {"logs": {"train/loss": 3.5695, "train/learning_rate": 0.00031, "train/epoch": 6.02, "_timestamp": 1746581519, "_runtime": 15528}, "step": 5350} {"train_info/time_between_train_steps": 0.013803720474243164, "step": 5350} {"info/global_step": 5351, "train_info/time_within_train_step": 2.7545719146728516, "step": 5351} {"train_info/time_between_train_steps": 0.00321197509765625, "step": 5351} {"info/global_step": 5352, "train_info/time_within_train_step": 2.7809956073760986, "step": 5352} {"train_info/time_between_train_steps": 0.0031387805938720703, "step": 5352} {"info/global_step": 5353, "train_info/time_within_train_step": 2.753702402114868, "step": 5353} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 5353} {"info/global_step": 5354, "train_info/time_within_train_step": 2.7546744346618652, "step": 5354} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 5354} {"info/global_step": 5355, "train_info/time_within_train_step": 2.755056619644165, "step": 5355} {"train_info/time_between_train_steps": 0.003150463104248047, "step": 5355} {"info/global_step": 5356, "train_info/time_within_train_step": 2.7535226345062256, "step": 5356} {"train_info/time_between_train_steps": 0.0030965805053710938, "step": 5356} {"info/global_step": 5357, "train_info/time_within_train_step": 2.755409002304077, "step": 5357} {"train_info/time_between_train_steps": 0.003130674362182617, "step": 5357} {"info/global_step": 5358, "train_info/time_within_train_step": 2.753561019897461, "step": 5358} {"train_info/time_between_train_steps": 0.0031316280364990234, "step": 5358} {"info/global_step": 5359, "train_info/time_within_train_step": 2.7540037631988525, "step": 5359} {"train_info/time_between_train_steps": 0.0031125545501708984, "step": 5359} {"info/global_step": 5360, "train_info/time_within_train_step": 2.7551114559173584, "step": 5360} {"train_info/time_between_train_steps": 0.0031304359436035156, "step": 5360} {"info/global_step": 5361, "train_info/time_within_train_step": 2.7539641857147217, "step": 5361} {"train_info/time_between_train_steps": 0.0031206607818603516, "step": 5361} {"info/global_step": 5362, "train_info/time_within_train_step": 2.7544538974761963, "step": 5362} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 5362} {"info/global_step": 5363, "train_info/time_within_train_step": 2.75488018989563, "step": 5363} {"train_info/time_between_train_steps": 0.003128528594970703, "step": 5363} {"info/global_step": 5364, "train_info/time_within_train_step": 2.7553317546844482, "step": 5364} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 5364} {"info/global_step": 5365, "train_info/time_within_train_step": 2.7544198036193848, "step": 5365} {"train_info/time_between_train_steps": 0.0039675235748291016, "step": 5365} {"info/global_step": 5366, "train_info/time_within_train_step": 2.7541182041168213, "step": 5366} {"train_info/time_between_train_steps": 0.003129720687866211, "step": 5366} {"info/global_step": 5367, "train_info/time_within_train_step": 2.754474639892578, "step": 5367} {"train_info/time_between_train_steps": 0.0031194686889648438, "step": 5367} {"info/global_step": 5368, "train_info/time_within_train_step": 2.754183530807495, "step": 5368} {"train_info/time_between_train_steps": 0.12743353843688965, "step": 5368} {"info/global_step": 5369, "train_info/time_within_train_step": 2.7550811767578125, "step": 5369} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 5369} {"info/global_step": 5370, "train_info/time_within_train_step": 2.7542197704315186, "step": 5370} {"train_info/time_between_train_steps": 0.0031256675720214844, "step": 5370} {"info/global_step": 5371, "train_info/time_within_train_step": 2.75517201423645, "step": 5371} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 5371} {"info/global_step": 5372, "train_info/time_within_train_step": 2.754246473312378, "step": 5372} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 5372} {"info/global_step": 5373, "train_info/time_within_train_step": 2.7539000511169434, "step": 5373} {"train_info/time_between_train_steps": 0.003130674362182617, "step": 5373} {"info/global_step": 5374, "train_info/time_within_train_step": 2.7545852661132812, "step": 5374} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 5374} {"info/global_step": 5375, "train_info/time_within_train_step": 2.7535834312438965, "step": 5375} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 5375} {"info/global_step": 5376, "train_info/time_within_train_step": 2.75461483001709, "step": 5376} {"train_info/time_between_train_steps": 0.0031538009643554688, "step": 5376} {"info/global_step": 5377, "train_info/time_within_train_step": 2.7545557022094727, "step": 5377} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 5377} {"info/global_step": 5378, "train_info/time_within_train_step": 2.7544052600860596, "step": 5378} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 5378} {"info/global_step": 5379, "train_info/time_within_train_step": 2.7550950050354004, "step": 5379} {"train_info/time_between_train_steps": 0.003117799758911133, "step": 5379} {"info/global_step": 5380, "train_info/time_within_train_step": 2.7548677921295166, "step": 5380} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 5380} {"info/global_step": 5381, "train_info/time_within_train_step": 2.754443883895874, "step": 5381} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 5381} {"info/global_step": 5382, "train_info/time_within_train_step": 2.755338191986084, "step": 5382} {"train_info/time_between_train_steps": 0.0031337738037109375, "step": 5382} {"info/global_step": 5383, "train_info/time_within_train_step": 2.7539830207824707, "step": 5383} {"train_info/time_between_train_steps": 0.003203868865966797, "step": 5383} {"info/global_step": 5384, "train_info/time_within_train_step": 2.755082607269287, "step": 5384} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 5384} {"info/global_step": 5385, "train_info/time_within_train_step": 2.755465507507324, "step": 5385} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 5385} {"info/global_step": 5386, "train_info/time_within_train_step": 2.7539772987365723, "step": 5386} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 5386} {"info/global_step": 5387, "train_info/time_within_train_step": 2.7545053958892822, "step": 5387} {"train_info/time_between_train_steps": 0.0031125545501708984, "step": 5387} {"info/global_step": 5388, "train_info/time_within_train_step": 2.756373405456543, "step": 5388} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 5388} {"info/global_step": 5389, "train_info/time_within_train_step": 2.7554361820220947, "step": 5389} {"train_info/time_between_train_steps": 0.0031287670135498047, "step": 5389} {"info/global_step": 5390, "train_info/time_within_train_step": 2.754657030105591, "step": 5390} {"train_info/time_between_train_steps": 0.0031690597534179688, "step": 5390} {"info/global_step": 5391, "train_info/time_within_train_step": 2.755415916442871, "step": 5391} {"train_info/time_between_train_steps": 0.0032091140747070312, "step": 5391} {"info/global_step": 5392, "train_info/time_within_train_step": 2.754941940307617, "step": 5392} {"train_info/time_between_train_steps": 0.003139019012451172, "step": 5392} {"info/global_step": 5393, "train_info/time_within_train_step": 2.754817247390747, "step": 5393} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 5393} {"info/global_step": 5394, "train_info/time_within_train_step": 2.7549877166748047, "step": 5394} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 5394} {"info/global_step": 5395, "train_info/time_within_train_step": 2.754715919494629, "step": 5395} {"train_info/time_between_train_steps": 0.003171205520629883, "step": 5395} {"info/global_step": 5396, "train_info/time_within_train_step": 2.7547919750213623, "step": 5396} {"train_info/time_between_train_steps": 0.0031261444091796875, "step": 5396} {"info/global_step": 5397, "train_info/time_within_train_step": 2.7552990913391113, "step": 5397} {"train_info/time_between_train_steps": 0.0032062530517578125, "step": 5397} {"info/global_step": 5398, "train_info/time_within_train_step": 2.7546045780181885, "step": 5398} {"train_info/time_between_train_steps": 0.003149271011352539, "step": 5398} {"info/global_step": 5399, "train_info/time_within_train_step": 2.75540828704834, "step": 5399} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 5399} {"info/global_step": 5400, "train_info/time_within_train_step": 2.7538273334503174, "step": 5400} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746581657, "_runtime": 15666}, "step": 5400} {"logs": {"train/loss": 3.5457, "train/learning_rate": 0.0003066666666666666, "train/epoch": 6.03, "_timestamp": 1746581657, "_runtime": 15666}, "step": 5400} {"train_info/time_between_train_steps": 27.702954053878784, "step": 5400} {"info/global_step": 5401, "train_info/time_within_train_step": 2.536698818206787, "step": 5401} {"train_info/time_between_train_steps": 0.0031592845916748047, "step": 5401} {"info/global_step": 5402, "train_info/time_within_train_step": 2.5932819843292236, "step": 5402} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 5402} {"info/global_step": 5403, "train_info/time_within_train_step": 2.933873414993286, "step": 5403} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 5403} {"info/global_step": 5404, "train_info/time_within_train_step": 2.6904633045196533, "step": 5404} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 5404} {"info/global_step": 5405, "train_info/time_within_train_step": 2.717542886734009, "step": 5405} {"train_info/time_between_train_steps": 0.0032083988189697266, "step": 5405} {"info/global_step": 5406, "train_info/time_within_train_step": 2.7528533935546875, "step": 5406} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 5406} {"info/global_step": 5407, "train_info/time_within_train_step": 2.75551438331604, "step": 5407} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 5407} {"info/global_step": 5408, "train_info/time_within_train_step": 2.7554962635040283, "step": 5408} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 5408} {"info/global_step": 5409, "train_info/time_within_train_step": 2.7557477951049805, "step": 5409} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 5409} {"info/global_step": 5410, "train_info/time_within_train_step": 2.755913496017456, "step": 5410} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 5410} {"info/global_step": 5411, "train_info/time_within_train_step": 2.757005453109741, "step": 5411} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 5411} {"info/global_step": 5412, "train_info/time_within_train_step": 2.7557668685913086, "step": 5412} {"train_info/time_between_train_steps": 0.003198862075805664, "step": 5412} {"info/global_step": 5413, "train_info/time_within_train_step": 2.7553164958953857, "step": 5413} {"train_info/time_between_train_steps": 0.0031936168670654297, "step": 5413} {"info/global_step": 5414, "train_info/time_within_train_step": 2.754401206970215, "step": 5414} {"train_info/time_between_train_steps": 0.0031740665435791016, "step": 5414} {"info/global_step": 5415, "train_info/time_within_train_step": 2.754520893096924, "step": 5415} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 5415} {"info/global_step": 5416, "train_info/time_within_train_step": 2.7542827129364014, "step": 5416} {"train_info/time_between_train_steps": 0.0032062530517578125, "step": 5416} {"info/global_step": 5417, "train_info/time_within_train_step": 2.7558231353759766, "step": 5417} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 5417} {"info/global_step": 5418, "train_info/time_within_train_step": 2.7548773288726807, "step": 5418} {"train_info/time_between_train_steps": 0.003216266632080078, "step": 5418} {"info/global_step": 5419, "train_info/time_within_train_step": 2.755317449569702, "step": 5419} {"train_info/time_between_train_steps": 0.003198385238647461, "step": 5419} {"info/global_step": 5420, "train_info/time_within_train_step": 2.7551369667053223, "step": 5420} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 5420} {"info/global_step": 5421, "train_info/time_within_train_step": 2.752622604370117, "step": 5421} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 5421} {"info/global_step": 5422, "train_info/time_within_train_step": 2.754403829574585, "step": 5422} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 5422} {"info/global_step": 5423, "train_info/time_within_train_step": 2.7563648223876953, "step": 5423} {"train_info/time_between_train_steps": 0.0031871795654296875, "step": 5423} {"info/global_step": 5424, "train_info/time_within_train_step": 2.754875421524048, "step": 5424} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 5424} {"info/global_step": 5425, "train_info/time_within_train_step": 2.7557244300842285, "step": 5425} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 5425} {"info/global_step": 5426, "train_info/time_within_train_step": 2.755568265914917, "step": 5426} {"train_info/time_between_train_steps": 0.0031464099884033203, "step": 5426} {"info/global_step": 5427, "train_info/time_within_train_step": 2.7560033798217773, "step": 5427} {"train_info/time_between_train_steps": 0.003177165985107422, "step": 5427} {"info/global_step": 5428, "train_info/time_within_train_step": 2.7556803226470947, "step": 5428} {"train_info/time_between_train_steps": 0.0032274723052978516, "step": 5428} {"info/global_step": 5429, "train_info/time_within_train_step": 2.7555181980133057, "step": 5429} {"train_info/time_between_train_steps": 0.0031936168670654297, "step": 5429} {"info/global_step": 5430, "train_info/time_within_train_step": 2.754521608352661, "step": 5430} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 5430} {"info/global_step": 5431, "train_info/time_within_train_step": 2.8822193145751953, "step": 5431} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 5431} {"info/global_step": 5432, "train_info/time_within_train_step": 2.7562713623046875, "step": 5432} {"train_info/time_between_train_steps": 0.003155946731567383, "step": 5432} {"info/global_step": 5433, "train_info/time_within_train_step": 2.755826234817505, "step": 5433} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 5433} {"info/global_step": 5434, "train_info/time_within_train_step": 2.755218744277954, "step": 5434} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 5434} {"info/global_step": 5435, "train_info/time_within_train_step": 2.7566335201263428, "step": 5435} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 5435} {"info/global_step": 5436, "train_info/time_within_train_step": 2.754558801651001, "step": 5436} {"train_info/time_between_train_steps": 0.003214597702026367, "step": 5436} {"info/global_step": 5437, "train_info/time_within_train_step": 2.75537109375, "step": 5437} {"train_info/time_between_train_steps": 0.0031638145446777344, "step": 5437} {"info/global_step": 5438, "train_info/time_within_train_step": 2.7548129558563232, "step": 5438} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 5438} {"info/global_step": 5439, "train_info/time_within_train_step": 2.7553956508636475, "step": 5439} {"train_info/time_between_train_steps": 0.003194093704223633, "step": 5439} {"info/global_step": 5440, "train_info/time_within_train_step": 2.755460739135742, "step": 5440} {"train_info/time_between_train_steps": 0.0032415390014648438, "step": 5440} {"info/global_step": 5441, "train_info/time_within_train_step": 2.756032943725586, "step": 5441} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 5441} {"info/global_step": 5442, "train_info/time_within_train_step": 2.7548043727874756, "step": 5442} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 5442} {"info/global_step": 5443, "train_info/time_within_train_step": 2.7558021545410156, "step": 5443} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 5443} {"info/global_step": 5444, "train_info/time_within_train_step": 2.755980968475342, "step": 5444} {"train_info/time_between_train_steps": 0.0031495094299316406, "step": 5444} {"info/global_step": 5445, "train_info/time_within_train_step": 2.7551517486572266, "step": 5445} {"train_info/time_between_train_steps": 0.003179788589477539, "step": 5445} {"info/global_step": 5446, "train_info/time_within_train_step": 2.755443572998047, "step": 5446} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 5446} {"info/global_step": 5447, "train_info/time_within_train_step": 2.755398988723755, "step": 5447} {"train_info/time_between_train_steps": 0.0031244754791259766, "step": 5447} {"info/global_step": 5448, "train_info/time_within_train_step": 2.7533750534057617, "step": 5448} {"train_info/time_between_train_steps": 0.0031375885009765625, "step": 5448} {"info/global_step": 5449, "train_info/time_within_train_step": 2.7547097206115723, "step": 5449} {"train_info/time_between_train_steps": 0.003138303756713867, "step": 5449} {"info/global_step": 5450, "train_info/time_within_train_step": 2.7538604736328125, "step": 5450} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746581823, "_runtime": 15832}, "step": 5450} {"logs": {"train/loss": 3.5432, "train/learning_rate": 0.0003033333333333333, "train/epoch": 6.03, "_timestamp": 1746581823, "_runtime": 15832}, "step": 5450} {"train_info/time_between_train_steps": 0.006932735443115234, "step": 5450} {"info/global_step": 5451, "train_info/time_within_train_step": 2.753462553024292, "step": 5451} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 5451} {"info/global_step": 5452, "train_info/time_within_train_step": 2.7551677227020264, "step": 5452} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 5452} {"info/global_step": 5453, "train_info/time_within_train_step": 2.754368305206299, "step": 5453} {"train_info/time_between_train_steps": 0.0031638145446777344, "step": 5453} {"info/global_step": 5454, "train_info/time_within_train_step": 2.754260301589966, "step": 5454} {"train_info/time_between_train_steps": 0.0031638145446777344, "step": 5454} {"info/global_step": 5455, "train_info/time_within_train_step": 2.7539122104644775, "step": 5455} {"train_info/time_between_train_steps": 0.003117799758911133, "step": 5455} {"info/global_step": 5456, "train_info/time_within_train_step": 2.754869222640991, "step": 5456} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 5456} {"info/global_step": 5457, "train_info/time_within_train_step": 2.753929853439331, "step": 5457} {"train_info/time_between_train_steps": 0.0031404495239257812, "step": 5457} {"info/global_step": 5458, "train_info/time_within_train_step": 2.7545807361602783, "step": 5458} {"train_info/time_between_train_steps": 0.0031490325927734375, "step": 5458} {"info/global_step": 5459, "train_info/time_within_train_step": 2.7549517154693604, "step": 5459} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 5459} {"info/global_step": 5460, "train_info/time_within_train_step": 2.755817413330078, "step": 5460} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 5460} {"info/global_step": 5461, "train_info/time_within_train_step": 2.7545177936553955, "step": 5461} {"train_info/time_between_train_steps": 0.0031347274780273438, "step": 5461} {"info/global_step": 5462, "train_info/time_within_train_step": 2.7541098594665527, "step": 5462} {"train_info/time_between_train_steps": 0.0031728744506835938, "step": 5462} {"info/global_step": 5463, "train_info/time_within_train_step": 2.754640579223633, "step": 5463} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 5463} {"info/global_step": 5464, "train_info/time_within_train_step": 2.7542264461517334, "step": 5464} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 5464} {"info/global_step": 5465, "train_info/time_within_train_step": 2.7543814182281494, "step": 5465} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 5465} {"info/global_step": 5466, "train_info/time_within_train_step": 2.754791259765625, "step": 5466} {"train_info/time_between_train_steps": 0.0031714439392089844, "step": 5466} {"info/global_step": 5467, "train_info/time_within_train_step": 2.754331588745117, "step": 5467} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 5467} {"info/global_step": 5468, "train_info/time_within_train_step": 2.753377914428711, "step": 5468} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 5468} {"info/global_step": 5469, "train_info/time_within_train_step": 2.7544000148773193, "step": 5469} {"train_info/time_between_train_steps": 0.003128528594970703, "step": 5469} {"info/global_step": 5470, "train_info/time_within_train_step": 2.7540242671966553, "step": 5470} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 5470} {"info/global_step": 5471, "train_info/time_within_train_step": 2.7536332607269287, "step": 5471} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 5471} {"info/global_step": 5472, "train_info/time_within_train_step": 2.7553017139434814, "step": 5472} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 5472} {"info/global_step": 5473, "train_info/time_within_train_step": 2.7626633644104004, "step": 5473} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 5473} {"info/global_step": 5474, "train_info/time_within_train_step": 2.7546279430389404, "step": 5474} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 5474} {"info/global_step": 5475, "train_info/time_within_train_step": 2.7560386657714844, "step": 5475} {"train_info/time_between_train_steps": 0.0031816959381103516, "step": 5475} {"info/global_step": 5476, "train_info/time_within_train_step": 2.755376100540161, "step": 5476} {"train_info/time_between_train_steps": 0.0032012462615966797, "step": 5476} {"info/global_step": 5477, "train_info/time_within_train_step": 2.755800724029541, "step": 5477} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 5477} {"info/global_step": 5478, "train_info/time_within_train_step": 2.7546863555908203, "step": 5478} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 5478} {"info/global_step": 5479, "train_info/time_within_train_step": 2.754498243331909, "step": 5479} {"train_info/time_between_train_steps": 0.003179788589477539, "step": 5479} {"info/global_step": 5480, "train_info/time_within_train_step": 2.754582166671753, "step": 5480} {"train_info/time_between_train_steps": 0.003228425979614258, "step": 5480} {"info/global_step": 5481, "train_info/time_within_train_step": 2.7551538944244385, "step": 5481} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 5481} {"info/global_step": 5482, "train_info/time_within_train_step": 2.7526285648345947, "step": 5482} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 5482} {"info/global_step": 5483, "train_info/time_within_train_step": 2.7546427249908447, "step": 5483} {"train_info/time_between_train_steps": 0.0032205581665039062, "step": 5483} {"info/global_step": 5484, "train_info/time_within_train_step": 2.753783702850342, "step": 5484} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 5484} {"info/global_step": 5485, "train_info/time_within_train_step": 2.754453659057617, "step": 5485} {"train_info/time_between_train_steps": 0.003187417984008789, "step": 5485} {"info/global_step": 5486, "train_info/time_within_train_step": 2.75410795211792, "step": 5486} {"train_info/time_between_train_steps": 0.0031375885009765625, "step": 5486} {"info/global_step": 5487, "train_info/time_within_train_step": 2.7535181045532227, "step": 5487} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 5487} {"info/global_step": 5488, "train_info/time_within_train_step": 2.7540810108184814, "step": 5488} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 5488} {"info/global_step": 5489, "train_info/time_within_train_step": 2.754133701324463, "step": 5489} {"train_info/time_between_train_steps": 0.00313568115234375, "step": 5489} {"info/global_step": 5490, "train_info/time_within_train_step": 2.754671096801758, "step": 5490} {"train_info/time_between_train_steps": 0.0031337738037109375, "step": 5490} {"info/global_step": 5491, "train_info/time_within_train_step": 2.755269765853882, "step": 5491} {"train_info/time_between_train_steps": 0.0031440258026123047, "step": 5491} {"info/global_step": 5492, "train_info/time_within_train_step": 2.7554807662963867, "step": 5492} {"train_info/time_between_train_steps": 0.0031235218048095703, "step": 5492} {"info/global_step": 5493, "train_info/time_within_train_step": 2.754671335220337, "step": 5493} {"train_info/time_between_train_steps": 0.1327204704284668, "step": 5493} {"info/global_step": 5494, "train_info/time_within_train_step": 3.04429030418396, "step": 5494} {"train_info/time_between_train_steps": 0.0031468868255615234, "step": 5494} {"info/global_step": 5495, "train_info/time_within_train_step": 2.7528703212738037, "step": 5495} {"train_info/time_between_train_steps": 0.0031156539916992188, "step": 5495} {"info/global_step": 5496, "train_info/time_within_train_step": 2.754230260848999, "step": 5496} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 5496} {"info/global_step": 5497, "train_info/time_within_train_step": 3.351685047149658, "step": 5497} {"train_info/time_between_train_steps": 0.0032079219818115234, "step": 5497} {"info/global_step": 5498, "train_info/time_within_train_step": 2.750932455062866, "step": 5498} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 5498} {"info/global_step": 5499, "train_info/time_within_train_step": 2.753592014312744, "step": 5499} {"train_info/time_between_train_steps": 0.0031442642211914062, "step": 5499} {"info/global_step": 5500, "train_info/time_within_train_step": 2.754206657409668, "step": 5500} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746581962, "_runtime": 15971}, "step": 5500} {"logs": {"train/loss": 3.5476, "train/learning_rate": 0.0003, "train/epoch": 6.04, "_timestamp": 1746581962, "_runtime": 15971}, "step": 5500} {"train_info/time_between_train_steps": 0.0063631534576416016, "step": 5500} {"info/global_step": 5501, "train_info/time_within_train_step": 2.753995895385742, "step": 5501} {"train_info/time_between_train_steps": 0.0031278133392333984, "step": 5501} {"info/global_step": 5502, "train_info/time_within_train_step": 2.7539870738983154, "step": 5502} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 5502} {"info/global_step": 5503, "train_info/time_within_train_step": 2.7537457942962646, "step": 5503} {"train_info/time_between_train_steps": 0.003142118453979492, "step": 5503} {"info/global_step": 5504, "train_info/time_within_train_step": 2.754373550415039, "step": 5504} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 5504} {"info/global_step": 5505, "train_info/time_within_train_step": 2.753884792327881, "step": 5505} {"train_info/time_between_train_steps": 0.003175973892211914, "step": 5505} {"info/global_step": 5506, "train_info/time_within_train_step": 2.754861831665039, "step": 5506} {"train_info/time_between_train_steps": 0.003162384033203125, "step": 5506} {"info/global_step": 5507, "train_info/time_within_train_step": 2.755190372467041, "step": 5507} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 5507} {"info/global_step": 5508, "train_info/time_within_train_step": 2.754034996032715, "step": 5508} {"train_info/time_between_train_steps": 0.0031638145446777344, "step": 5508} {"info/global_step": 5509, "train_info/time_within_train_step": 2.7536208629608154, "step": 5509} {"train_info/time_between_train_steps": 0.003175973892211914, "step": 5509} {"info/global_step": 5510, "train_info/time_within_train_step": 2.7548365592956543, "step": 5510} {"train_info/time_between_train_steps": 0.0031440258026123047, "step": 5510} {"info/global_step": 5511, "train_info/time_within_train_step": 2.7548716068267822, "step": 5511} {"train_info/time_between_train_steps": 0.0031638145446777344, "step": 5511} {"info/global_step": 5512, "train_info/time_within_train_step": 2.7553670406341553, "step": 5512} {"train_info/time_between_train_steps": 0.003139972686767578, "step": 5512} {"info/global_step": 5513, "train_info/time_within_train_step": 2.7548723220825195, "step": 5513} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 5513} {"info/global_step": 5514, "train_info/time_within_train_step": 2.7541286945343018, "step": 5514} {"train_info/time_between_train_steps": 0.003146648406982422, "step": 5514} {"info/global_step": 5515, "train_info/time_within_train_step": 2.7538459300994873, "step": 5515} {"train_info/time_between_train_steps": 0.003140687942504883, "step": 5515} {"info/global_step": 5516, "train_info/time_within_train_step": 2.754115343093872, "step": 5516} {"train_info/time_between_train_steps": 0.003151416778564453, "step": 5516} {"info/global_step": 5517, "train_info/time_within_train_step": 2.7543227672576904, "step": 5517} {"train_info/time_between_train_steps": 0.003200054168701172, "step": 5517} {"info/global_step": 5518, "train_info/time_within_train_step": 2.7545087337493896, "step": 5518} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 5518} {"info/global_step": 5519, "train_info/time_within_train_step": 2.7539443969726562, "step": 5519} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 5519} {"info/global_step": 5520, "train_info/time_within_train_step": 2.7547550201416016, "step": 5520} {"train_info/time_between_train_steps": 0.0031566619873046875, "step": 5520} {"info/global_step": 5521, "train_info/time_within_train_step": 2.754730701446533, "step": 5521} {"train_info/time_between_train_steps": 0.003173828125, "step": 5521} {"info/global_step": 5522, "train_info/time_within_train_step": 2.753486394882202, "step": 5522} {"train_info/time_between_train_steps": 0.0031414031982421875, "step": 5522} {"info/global_step": 5523, "train_info/time_within_train_step": 2.7551181316375732, "step": 5523} {"train_info/time_between_train_steps": 0.0031380653381347656, "step": 5523} {"info/global_step": 5524, "train_info/time_within_train_step": 2.7547521591186523, "step": 5524} {"train_info/time_between_train_steps": 0.003121614456176758, "step": 5524} {"info/global_step": 5525, "train_info/time_within_train_step": 2.7552857398986816, "step": 5525} {"train_info/time_between_train_steps": 0.003148794174194336, "step": 5525} {"info/global_step": 5526, "train_info/time_within_train_step": 2.75451397895813, "step": 5526} {"train_info/time_between_train_steps": 0.0031392574310302734, "step": 5526} {"info/global_step": 5527, "train_info/time_within_train_step": 2.7542529106140137, "step": 5527} {"train_info/time_between_train_steps": 0.0031211376190185547, "step": 5527} {"info/global_step": 5528, "train_info/time_within_train_step": 2.7547669410705566, "step": 5528} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 5528} {"info/global_step": 5529, "train_info/time_within_train_step": 2.7539384365081787, "step": 5529} {"train_info/time_between_train_steps": 0.0031359195709228516, "step": 5529} {"info/global_step": 5530, "train_info/time_within_train_step": 2.7540769577026367, "step": 5530} {"train_info/time_between_train_steps": 0.0031354427337646484, "step": 5530} {"info/global_step": 5531, "train_info/time_within_train_step": 2.7524092197418213, "step": 5531} {"train_info/time_between_train_steps": 0.0031402111053466797, "step": 5531} {"info/global_step": 5532, "train_info/time_within_train_step": 2.753730058670044, "step": 5532} {"train_info/time_between_train_steps": 0.0031311511993408203, "step": 5532} {"info/global_step": 5533, "train_info/time_within_train_step": 2.753934383392334, "step": 5533} {"train_info/time_between_train_steps": 0.0031180381774902344, "step": 5533} {"info/global_step": 5534, "train_info/time_within_train_step": 2.7535502910614014, "step": 5534} {"train_info/time_between_train_steps": 0.003139019012451172, "step": 5534} {"info/global_step": 5535, "train_info/time_within_train_step": 2.753394603729248, "step": 5535} {"train_info/time_between_train_steps": 0.003123044967651367, "step": 5535} {"info/global_step": 5536, "train_info/time_within_train_step": 2.753676414489746, "step": 5536} {"train_info/time_between_train_steps": 0.0031380653381347656, "step": 5536} {"info/global_step": 5537, "train_info/time_within_train_step": 2.754204273223877, "step": 5537} {"train_info/time_between_train_steps": 0.003213644027709961, "step": 5537} {"info/global_step": 5538, "train_info/time_within_train_step": 2.7534866333007812, "step": 5538} {"train_info/time_between_train_steps": 0.003143787384033203, "step": 5538} {"info/global_step": 5539, "train_info/time_within_train_step": 2.7539401054382324, "step": 5539} {"train_info/time_between_train_steps": 0.0031540393829345703, "step": 5539} {"info/global_step": 5540, "train_info/time_within_train_step": 2.7539854049682617, "step": 5540} {"train_info/time_between_train_steps": 0.0032351016998291016, "step": 5540} {"info/global_step": 5541, "train_info/time_within_train_step": 2.7550127506256104, "step": 5541} {"train_info/time_between_train_steps": 0.003150463104248047, "step": 5541} {"info/global_step": 5542, "train_info/time_within_train_step": 2.7528750896453857, "step": 5542} {"train_info/time_between_train_steps": 0.003153085708618164, "step": 5542} {"info/global_step": 5543, "train_info/time_within_train_step": 2.755451202392578, "step": 5543} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 5543} {"info/global_step": 5544, "train_info/time_within_train_step": 2.751086711883545, "step": 5544} {"train_info/time_between_train_steps": 0.0031375885009765625, "step": 5544} {"info/global_step": 5545, "train_info/time_within_train_step": 2.7548415660858154, "step": 5545} {"train_info/time_between_train_steps": 0.0031387805938720703, "step": 5545} {"info/global_step": 5546, "train_info/time_within_train_step": 2.7541306018829346, "step": 5546} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 5546} {"info/global_step": 5547, "train_info/time_within_train_step": 2.754403829574585, "step": 5547} {"train_info/time_between_train_steps": 0.003133058547973633, "step": 5547} {"info/global_step": 5548, "train_info/time_within_train_step": 2.753448724746704, "step": 5548} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 5548} {"info/global_step": 5549, "train_info/time_within_train_step": 2.7545177936553955, "step": 5549} {"train_info/time_between_train_steps": 0.0031311511993408203, "step": 5549} {"info/global_step": 5550, "train_info/time_within_train_step": 3.0152485370635986, "step": 5550} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746582100, "_runtime": 16109}, "step": 5550} {"logs": {"train/loss": 3.5277, "train/learning_rate": 0.00029666666666666665, "train/epoch": 6.04, "_timestamp": 1746582100, "_runtime": 16109}, "step": 5550} {"train_info/time_between_train_steps": 0.006803274154663086, "step": 5550} {"info/global_step": 5551, "train_info/time_within_train_step": 2.750955820083618, "step": 5551} {"train_info/time_between_train_steps": 0.0031311511993408203, "step": 5551} {"info/global_step": 5552, "train_info/time_within_train_step": 2.7546539306640625, "step": 5552} {"train_info/time_between_train_steps": 0.0031280517578125, "step": 5552} {"info/global_step": 5553, "train_info/time_within_train_step": 2.7549331188201904, "step": 5553} {"train_info/time_between_train_steps": 0.0031359195709228516, "step": 5553} {"info/global_step": 5554, "train_info/time_within_train_step": 2.7544665336608887, "step": 5554} {"train_info/time_between_train_steps": 0.003155231475830078, "step": 5554} {"info/global_step": 5555, "train_info/time_within_train_step": 2.7539093494415283, "step": 5555} {"train_info/time_between_train_steps": 0.003132343292236328, "step": 5555} {"info/global_step": 5556, "train_info/time_within_train_step": 2.881091833114624, "step": 5556} {"train_info/time_between_train_steps": 0.0031588077545166016, "step": 5556} {"info/global_step": 5557, "train_info/time_within_train_step": 2.7526755332946777, "step": 5557} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 5557} {"info/global_step": 5558, "train_info/time_within_train_step": 2.754540205001831, "step": 5558} {"train_info/time_between_train_steps": 0.003136157989501953, "step": 5558} {"info/global_step": 5559, "train_info/time_within_train_step": 2.7541146278381348, "step": 5559} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 5559} {"info/global_step": 5560, "train_info/time_within_train_step": 2.7524971961975098, "step": 5560} {"train_info/time_between_train_steps": 0.0031540393829345703, "step": 5560} {"info/global_step": 5561, "train_info/time_within_train_step": 2.7537827491760254, "step": 5561} {"train_info/time_between_train_steps": 0.0031943321228027344, "step": 5561} {"info/global_step": 5562, "train_info/time_within_train_step": 2.753444194793701, "step": 5562} {"train_info/time_between_train_steps": 0.003142118453979492, "step": 5562} {"info/global_step": 5563, "train_info/time_within_train_step": 2.7530293464660645, "step": 5563} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 5563} {"info/global_step": 5564, "train_info/time_within_train_step": 2.7532482147216797, "step": 5564} {"train_info/time_between_train_steps": 0.0031354427337646484, "step": 5564} {"info/global_step": 5565, "train_info/time_within_train_step": 2.754798173904419, "step": 5565} {"train_info/time_between_train_steps": 0.0031728744506835938, "step": 5565} {"info/global_step": 5566, "train_info/time_within_train_step": 2.7551229000091553, "step": 5566} {"train_info/time_between_train_steps": 0.0031571388244628906, "step": 5566} {"info/global_step": 5567, "train_info/time_within_train_step": 2.7535183429718018, "step": 5567} {"train_info/time_between_train_steps": 0.003144502639770508, "step": 5567} {"info/global_step": 5568, "train_info/time_within_train_step": 2.754793882369995, "step": 5568} {"train_info/time_between_train_steps": 0.0031621456146240234, "step": 5568} {"info/global_step": 5569, "train_info/time_within_train_step": 2.7552618980407715, "step": 5569} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 5569} {"info/global_step": 5570, "train_info/time_within_train_step": 2.7545788288116455, "step": 5570} {"train_info/time_between_train_steps": 0.0031201839447021484, "step": 5570} {"info/global_step": 5571, "train_info/time_within_train_step": 2.7549479007720947, "step": 5571} {"train_info/time_between_train_steps": 0.0031480789184570312, "step": 5571} {"info/global_step": 5572, "train_info/time_within_train_step": 2.7551097869873047, "step": 5572} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 5572} {"info/global_step": 5573, "train_info/time_within_train_step": 2.754971742630005, "step": 5573} {"train_info/time_between_train_steps": 0.0031256675720214844, "step": 5573} {"info/global_step": 5574, "train_info/time_within_train_step": 2.754671812057495, "step": 5574} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 5574} {"info/global_step": 5575, "train_info/time_within_train_step": 2.7538840770721436, "step": 5575} {"train_info/time_between_train_steps": 0.0031566619873046875, "step": 5575} {"info/global_step": 5576, "train_info/time_within_train_step": 2.754807472229004, "step": 5576} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 5576} {"info/global_step": 5577, "train_info/time_within_train_step": 2.7550108432769775, "step": 5577} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 5577} {"info/global_step": 5578, "train_info/time_within_train_step": 2.755354881286621, "step": 5578} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 5578} {"info/global_step": 5579, "train_info/time_within_train_step": 2.7538251876831055, "step": 5579} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 5579} {"info/global_step": 5580, "train_info/time_within_train_step": 2.755295753479004, "step": 5580} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 5580} {"info/global_step": 5581, "train_info/time_within_train_step": 2.755359649658203, "step": 5581} {"train_info/time_between_train_steps": 0.0032358169555664062, "step": 5581} {"info/global_step": 5582, "train_info/time_within_train_step": 2.7551422119140625, "step": 5582} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 5582} {"info/global_step": 5583, "train_info/time_within_train_step": 2.7559385299682617, "step": 5583} {"train_info/time_between_train_steps": 0.0032300949096679688, "step": 5583} {"info/global_step": 5584, "train_info/time_within_train_step": 2.7546427249908447, "step": 5584} {"train_info/time_between_train_steps": 0.00319671630859375, "step": 5584} {"info/global_step": 5585, "train_info/time_within_train_step": 2.753716468811035, "step": 5585} {"train_info/time_between_train_steps": 0.0031599998474121094, "step": 5585} {"info/global_step": 5586, "train_info/time_within_train_step": 2.754513740539551, "step": 5586} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 5586} {"info/global_step": 5587, "train_info/time_within_train_step": 2.755326509475708, "step": 5587} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 5587} {"info/global_step": 5588, "train_info/time_within_train_step": 2.754818916320801, "step": 5588} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 5588} {"info/global_step": 5589, "train_info/time_within_train_step": 2.7548367977142334, "step": 5589} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 5589} {"info/global_step": 5590, "train_info/time_within_train_step": 2.755300998687744, "step": 5590} {"train_info/time_between_train_steps": 0.0031740665435791016, "step": 5590} {"info/global_step": 5591, "train_info/time_within_train_step": 2.7558796405792236, "step": 5591} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 5591} {"info/global_step": 5592, "train_info/time_within_train_step": 2.7559280395507812, "step": 5592} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 5592} {"info/global_step": 5593, "train_info/time_within_train_step": 2.75457763671875, "step": 5593} {"train_info/time_between_train_steps": 0.0031435489654541016, "step": 5593} {"info/global_step": 5594, "train_info/time_within_train_step": 2.7554399967193604, "step": 5594} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 5594} {"info/global_step": 5595, "train_info/time_within_train_step": 2.755990743637085, "step": 5595} {"train_info/time_between_train_steps": 0.0031604766845703125, "step": 5595} {"info/global_step": 5596, "train_info/time_within_train_step": 2.7559518814086914, "step": 5596} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 5596} {"info/global_step": 5597, "train_info/time_within_train_step": 2.755326271057129, "step": 5597} {"train_info/time_between_train_steps": 0.0031669139862060547, "step": 5597} {"info/global_step": 5598, "train_info/time_within_train_step": 2.7554752826690674, "step": 5598} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 5598} {"info/global_step": 5599, "train_info/time_within_train_step": 2.754777431488037, "step": 5599} {"train_info/time_between_train_steps": 0.0032095909118652344, "step": 5599} {"info/global_step": 5600, "train_info/time_within_train_step": 2.7556591033935547, "step": 5600} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746582238, "_runtime": 16247}, "step": 5600} {"logs": {"train/loss": 3.5224, "train/learning_rate": 0.00029333333333333327, "train/epoch": 6.05, "_timestamp": 1746582238, "_runtime": 16247}, "step": 5600} {"train_info/time_between_train_steps": 14.411120176315308, "step": 5600} {"info/global_step": 5601, "train_info/time_within_train_step": 2.5344173908233643, "step": 5601} {"train_info/time_between_train_steps": 0.0033266544342041016, "step": 5601} {"info/global_step": 5602, "train_info/time_within_train_step": 2.5708253383636475, "step": 5602} {"train_info/time_between_train_steps": 0.003324270248413086, "step": 5602} {"info/global_step": 5603, "train_info/time_within_train_step": 2.6944360733032227, "step": 5603} {"train_info/time_between_train_steps": 0.0033402442932128906, "step": 5603} {"info/global_step": 5604, "train_info/time_within_train_step": 2.75114369392395, "step": 5604} {"train_info/time_between_train_steps": 0.003393888473510742, "step": 5604} {"info/global_step": 5605, "train_info/time_within_train_step": 3.019752025604248, "step": 5605} {"train_info/time_between_train_steps": 0.003293752670288086, "step": 5605} {"info/global_step": 5606, "train_info/time_within_train_step": 2.7560980319976807, "step": 5606} {"train_info/time_between_train_steps": 0.0033223628997802734, "step": 5606} {"info/global_step": 5607, "train_info/time_within_train_step": 2.7573206424713135, "step": 5607} {"train_info/time_between_train_steps": 0.0033118724822998047, "step": 5607} {"info/global_step": 5608, "train_info/time_within_train_step": 2.756317138671875, "step": 5608} {"train_info/time_between_train_steps": 0.003309011459350586, "step": 5608} {"info/global_step": 5609, "train_info/time_within_train_step": 2.7566089630126953, "step": 5609} {"train_info/time_between_train_steps": 0.003371715545654297, "step": 5609} {"info/global_step": 5610, "train_info/time_within_train_step": 2.755953311920166, "step": 5610} {"train_info/time_between_train_steps": 0.0032999515533447266, "step": 5610} {"info/global_step": 5611, "train_info/time_within_train_step": 2.7562155723571777, "step": 5611} {"train_info/time_between_train_steps": 0.003334522247314453, "step": 5611} {"info/global_step": 5612, "train_info/time_within_train_step": 2.756915807723999, "step": 5612} {"train_info/time_between_train_steps": 0.0033216476440429688, "step": 5612} {"info/global_step": 5613, "train_info/time_within_train_step": 2.7569386959075928, "step": 5613} {"train_info/time_between_train_steps": 0.0033025741577148438, "step": 5613} {"info/global_step": 5614, "train_info/time_within_train_step": 2.757737874984741, "step": 5614} {"train_info/time_between_train_steps": 0.003282785415649414, "step": 5614} {"info/global_step": 5615, "train_info/time_within_train_step": 2.7581167221069336, "step": 5615} {"train_info/time_between_train_steps": 0.0033245086669921875, "step": 5615} {"info/global_step": 5616, "train_info/time_within_train_step": 2.7573132514953613, "step": 5616} {"train_info/time_between_train_steps": 0.0033588409423828125, "step": 5616} {"info/global_step": 5617, "train_info/time_within_train_step": 2.757347583770752, "step": 5617} {"train_info/time_between_train_steps": 0.0033195018768310547, "step": 5617} {"info/global_step": 5618, "train_info/time_within_train_step": 2.757755994796753, "step": 5618} {"train_info/time_between_train_steps": 0.09653186798095703, "step": 5618} {"info/global_step": 5619, "train_info/time_within_train_step": 2.758615016937256, "step": 5619} {"train_info/time_between_train_steps": 0.0034291744232177734, "step": 5619} {"info/global_step": 5620, "train_info/time_within_train_step": 2.756636381149292, "step": 5620} {"train_info/time_between_train_steps": 0.003370523452758789, "step": 5620} {"info/global_step": 5621, "train_info/time_within_train_step": 2.7564635276794434, "step": 5621} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 5621} {"info/global_step": 5622, "train_info/time_within_train_step": 2.7561380863189697, "step": 5622} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 5622} {"info/global_step": 5623, "train_info/time_within_train_step": 2.755842447280884, "step": 5623} {"train_info/time_between_train_steps": 0.003214120864868164, "step": 5623} {"info/global_step": 5624, "train_info/time_within_train_step": 2.755444288253784, "step": 5624} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 5624} {"info/global_step": 5625, "train_info/time_within_train_step": 2.755506992340088, "step": 5625} {"train_info/time_between_train_steps": 0.0032389163970947266, "step": 5625} {"info/global_step": 5626, "train_info/time_within_train_step": 2.754878044128418, "step": 5626} {"train_info/time_between_train_steps": 0.003237485885620117, "step": 5626} {"info/global_step": 5627, "train_info/time_within_train_step": 2.757314443588257, "step": 5627} {"train_info/time_between_train_steps": 0.003349781036376953, "step": 5627} {"info/global_step": 5628, "train_info/time_within_train_step": 2.7564525604248047, "step": 5628} {"train_info/time_between_train_steps": 0.003314971923828125, "step": 5628} {"info/global_step": 5629, "train_info/time_within_train_step": 2.7570693492889404, "step": 5629} {"train_info/time_between_train_steps": 0.0034804344177246094, "step": 5629} {"info/global_step": 5630, "train_info/time_within_train_step": 2.7574048042297363, "step": 5630} {"train_info/time_between_train_steps": 0.0033614635467529297, "step": 5630} {"info/global_step": 5631, "train_info/time_within_train_step": 2.757575273513794, "step": 5631} {"train_info/time_between_train_steps": 0.003392457962036133, "step": 5631} {"info/global_step": 5632, "train_info/time_within_train_step": 2.757350206375122, "step": 5632} {"train_info/time_between_train_steps": 0.0033812522888183594, "step": 5632} {"info/global_step": 5633, "train_info/time_within_train_step": 2.7559797763824463, "step": 5633} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 5633} {"info/global_step": 5634, "train_info/time_within_train_step": 2.7567965984344482, "step": 5634} {"train_info/time_between_train_steps": 0.0032520294189453125, "step": 5634} {"info/global_step": 5635, "train_info/time_within_train_step": 2.755970001220703, "step": 5635} {"train_info/time_between_train_steps": 0.0032770633697509766, "step": 5635} {"info/global_step": 5636, "train_info/time_within_train_step": 2.7558205127716064, "step": 5636} {"train_info/time_between_train_steps": 0.0032470226287841797, "step": 5636} {"info/global_step": 5637, "train_info/time_within_train_step": 2.756153106689453, "step": 5637} {"train_info/time_between_train_steps": 0.003198385238647461, "step": 5637} {"info/global_step": 5638, "train_info/time_within_train_step": 2.7556307315826416, "step": 5638} {"train_info/time_between_train_steps": 0.0033617019653320312, "step": 5638} {"info/global_step": 5639, "train_info/time_within_train_step": 2.756395101547241, "step": 5639} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 5639} {"info/global_step": 5640, "train_info/time_within_train_step": 2.7548563480377197, "step": 5640} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 5640} {"info/global_step": 5641, "train_info/time_within_train_step": 2.7553491592407227, "step": 5641} {"train_info/time_between_train_steps": 0.0032258033752441406, "step": 5641} {"info/global_step": 5642, "train_info/time_within_train_step": 2.7556827068328857, "step": 5642} {"train_info/time_between_train_steps": 0.0033109188079833984, "step": 5642} {"info/global_step": 5643, "train_info/time_within_train_step": 2.7555854320526123, "step": 5643} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 5643} {"info/global_step": 5644, "train_info/time_within_train_step": 2.7554945945739746, "step": 5644} {"train_info/time_between_train_steps": 0.0032732486724853516, "step": 5644} {"info/global_step": 5645, "train_info/time_within_train_step": 2.756624698638916, "step": 5645} {"train_info/time_between_train_steps": 0.0032231807708740234, "step": 5645} {"info/global_step": 5646, "train_info/time_within_train_step": 2.7563114166259766, "step": 5646} {"train_info/time_between_train_steps": 0.0032396316528320312, "step": 5646} {"info/global_step": 5647, "train_info/time_within_train_step": 2.7558796405792236, "step": 5647} {"train_info/time_between_train_steps": 0.0032215118408203125, "step": 5647} {"info/global_step": 5648, "train_info/time_within_train_step": 2.7562313079833984, "step": 5648} {"train_info/time_between_train_steps": 0.003214120864868164, "step": 5648} {"info/global_step": 5649, "train_info/time_within_train_step": 2.7552785873413086, "step": 5649} {"train_info/time_between_train_steps": 0.00328826904296875, "step": 5649} {"info/global_step": 5650, "train_info/time_within_train_step": 2.7553579807281494, "step": 5650} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746582391, "_runtime": 16400}, "step": 5650} {"logs": {"train/loss": 3.5131, "train/learning_rate": 0.00029, "train/epoch": 6.05, "_timestamp": 1746582391, "_runtime": 16400}, "step": 5650} {"train_info/time_between_train_steps": 0.007718801498413086, "step": 5650} {"info/global_step": 5651, "train_info/time_within_train_step": 2.7542548179626465, "step": 5651} {"train_info/time_between_train_steps": 0.0032417774200439453, "step": 5651} {"info/global_step": 5652, "train_info/time_within_train_step": 2.756551504135132, "step": 5652} {"train_info/time_between_train_steps": 0.003244638442993164, "step": 5652} {"info/global_step": 5653, "train_info/time_within_train_step": 2.7553188800811768, "step": 5653} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 5653} {"info/global_step": 5654, "train_info/time_within_train_step": 2.755039691925049, "step": 5654} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 5654} {"info/global_step": 5655, "train_info/time_within_train_step": 2.7558956146240234, "step": 5655} {"train_info/time_between_train_steps": 0.003235340118408203, "step": 5655} {"info/global_step": 5656, "train_info/time_within_train_step": 2.753854751586914, "step": 5656} {"train_info/time_between_train_steps": 0.003238201141357422, "step": 5656} {"info/global_step": 5657, "train_info/time_within_train_step": 2.7555601596832275, "step": 5657} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 5657} {"info/global_step": 5658, "train_info/time_within_train_step": 2.7550978660583496, "step": 5658} {"train_info/time_between_train_steps": 0.0032732486724853516, "step": 5658} {"info/global_step": 5659, "train_info/time_within_train_step": 2.7564103603363037, "step": 5659} {"train_info/time_between_train_steps": 0.02055215835571289, "step": 5659} {"info/global_step": 5660, "train_info/time_within_train_step": 2.755006790161133, "step": 5660} {"train_info/time_between_train_steps": 0.0029265880584716797, "step": 5660} {"info/global_step": 5661, "train_info/time_within_train_step": 2.7535817623138428, "step": 5661} {"train_info/time_between_train_steps": 0.0029206275939941406, "step": 5661} {"info/global_step": 5662, "train_info/time_within_train_step": 2.75445818901062, "step": 5662} {"train_info/time_between_train_steps": 0.0029468536376953125, "step": 5662} {"info/global_step": 5663, "train_info/time_within_train_step": 2.753969192504883, "step": 5663} {"train_info/time_between_train_steps": 0.0028836727142333984, "step": 5663} {"info/global_step": 5664, "train_info/time_within_train_step": 2.753755569458008, "step": 5664} {"train_info/time_between_train_steps": 0.0028994083404541016, "step": 5664} {"info/global_step": 5665, "train_info/time_within_train_step": 2.7528462409973145, "step": 5665} {"train_info/time_between_train_steps": 0.0029327869415283203, "step": 5665} {"info/global_step": 5666, "train_info/time_within_train_step": 2.7534544467926025, "step": 5666} {"train_info/time_between_train_steps": 0.0028791427612304688, "step": 5666} {"info/global_step": 5667, "train_info/time_within_train_step": 2.7540500164031982, "step": 5667} {"train_info/time_between_train_steps": 0.0029115676879882812, "step": 5667} {"info/global_step": 5668, "train_info/time_within_train_step": 2.7538657188415527, "step": 5668} {"train_info/time_between_train_steps": 0.002905607223510742, "step": 5668} {"info/global_step": 5669, "train_info/time_within_train_step": 2.7543208599090576, "step": 5669} {"train_info/time_between_train_steps": 0.002871990203857422, "step": 5669} {"info/global_step": 5670, "train_info/time_within_train_step": 2.7527949810028076, "step": 5670} {"train_info/time_between_train_steps": 0.002897977828979492, "step": 5670} {"info/global_step": 5671, "train_info/time_within_train_step": 2.753788471221924, "step": 5671} {"train_info/time_between_train_steps": 0.002917051315307617, "step": 5671} {"info/global_step": 5672, "train_info/time_within_train_step": 2.752906560897827, "step": 5672} {"train_info/time_between_train_steps": 0.0029277801513671875, "step": 5672} {"info/global_step": 5673, "train_info/time_within_train_step": 2.75374174118042, "step": 5673} {"train_info/time_between_train_steps": 0.002871274948120117, "step": 5673} {"info/global_step": 5674, "train_info/time_within_train_step": 2.7550175189971924, "step": 5674} {"train_info/time_between_train_steps": 0.0028607845306396484, "step": 5674} {"info/global_step": 5675, "train_info/time_within_train_step": 2.7543485164642334, "step": 5675} {"train_info/time_between_train_steps": 0.002891063690185547, "step": 5675} {"info/global_step": 5676, "train_info/time_within_train_step": 2.7525737285614014, "step": 5676} {"train_info/time_between_train_steps": 0.0029146671295166016, "step": 5676} {"info/global_step": 5677, "train_info/time_within_train_step": 2.755342483520508, "step": 5677} {"train_info/time_between_train_steps": 0.0028743743896484375, "step": 5677} {"info/global_step": 5678, "train_info/time_within_train_step": 2.754361629486084, "step": 5678} {"train_info/time_between_train_steps": 0.002936124801635742, "step": 5678} {"info/global_step": 5679, "train_info/time_within_train_step": 2.7540767192840576, "step": 5679} {"train_info/time_between_train_steps": 0.002938508987426758, "step": 5679} {"info/global_step": 5680, "train_info/time_within_train_step": 2.754457473754883, "step": 5680} {"train_info/time_between_train_steps": 0.002905130386352539, "step": 5680} {"info/global_step": 5681, "train_info/time_within_train_step": 2.753490447998047, "step": 5681} {"train_info/time_between_train_steps": 0.002909421920776367, "step": 5681} {"info/global_step": 5682, "train_info/time_within_train_step": 2.753404140472412, "step": 5682} {"train_info/time_between_train_steps": 0.002947092056274414, "step": 5682} {"info/global_step": 5683, "train_info/time_within_train_step": 2.753746509552002, "step": 5683} {"train_info/time_between_train_steps": 0.0029435157775878906, "step": 5683} {"info/global_step": 5684, "train_info/time_within_train_step": 2.752300262451172, "step": 5684} {"train_info/time_between_train_steps": 0.0029227733612060547, "step": 5684} {"info/global_step": 5685, "train_info/time_within_train_step": 2.754180669784546, "step": 5685} {"train_info/time_between_train_steps": 0.0028967857360839844, "step": 5685} {"info/global_step": 5686, "train_info/time_within_train_step": 2.7541873455047607, "step": 5686} {"train_info/time_between_train_steps": 0.0029392242431640625, "step": 5686} {"info/global_step": 5687, "train_info/time_within_train_step": 2.755319118499756, "step": 5687} {"train_info/time_between_train_steps": 0.002879619598388672, "step": 5687} {"info/global_step": 5688, "train_info/time_within_train_step": 2.7544775009155273, "step": 5688} {"train_info/time_between_train_steps": 0.0029098987579345703, "step": 5688} {"info/global_step": 5689, "train_info/time_within_train_step": 2.7528903484344482, "step": 5689} {"train_info/time_between_train_steps": 0.002878427505493164, "step": 5689} {"info/global_step": 5690, "train_info/time_within_train_step": 2.7543184757232666, "step": 5690} {"train_info/time_between_train_steps": 0.0028717517852783203, "step": 5690} {"info/global_step": 5691, "train_info/time_within_train_step": 2.753133773803711, "step": 5691} {"train_info/time_between_train_steps": 0.002875804901123047, "step": 5691} {"info/global_step": 5692, "train_info/time_within_train_step": 2.75372052192688, "step": 5692} {"train_info/time_between_train_steps": 0.002846240997314453, "step": 5692} {"info/global_step": 5693, "train_info/time_within_train_step": 2.754422426223755, "step": 5693} {"train_info/time_between_train_steps": 0.0029380321502685547, "step": 5693} {"info/global_step": 5694, "train_info/time_within_train_step": 2.754122734069824, "step": 5694} {"train_info/time_between_train_steps": 0.0028929710388183594, "step": 5694} {"info/global_step": 5695, "train_info/time_within_train_step": 2.753223419189453, "step": 5695} {"train_info/time_between_train_steps": 0.002887248992919922, "step": 5695} {"info/global_step": 5696, "train_info/time_within_train_step": 2.753868579864502, "step": 5696} {"train_info/time_between_train_steps": 0.0029022693634033203, "step": 5696} {"info/global_step": 5697, "train_info/time_within_train_step": 2.753101348876953, "step": 5697} {"train_info/time_between_train_steps": 0.0029506683349609375, "step": 5697} {"info/global_step": 5698, "train_info/time_within_train_step": 2.7522783279418945, "step": 5698} {"train_info/time_between_train_steps": 0.002910614013671875, "step": 5698} {"info/global_step": 5699, "train_info/time_within_train_step": 2.7524092197418213, "step": 5699} {"train_info/time_between_train_steps": 0.002894878387451172, "step": 5699} {"info/global_step": 5700, "train_info/time_within_train_step": 2.753790855407715, "step": 5700} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746582529, "_runtime": 16538}, "step": 5700} {"logs": {"train/loss": 3.5132, "train/learning_rate": 0.0002866666666666667, "train/epoch": 6.06, "_timestamp": 1746582529, "_runtime": 16538}, "step": 5700} {"train_info/time_between_train_steps": 0.00885152816772461, "step": 5700} {"info/global_step": 5701, "train_info/time_within_train_step": 2.7542247772216797, "step": 5701} {"train_info/time_between_train_steps": 0.0029103755950927734, "step": 5701} {"info/global_step": 5702, "train_info/time_within_train_step": 2.7535738945007324, "step": 5702} {"train_info/time_between_train_steps": 0.00287628173828125, "step": 5702} {"info/global_step": 5703, "train_info/time_within_train_step": 2.7550933361053467, "step": 5703} {"train_info/time_between_train_steps": 0.0028977394104003906, "step": 5703} {"info/global_step": 5704, "train_info/time_within_train_step": 2.7557296752929688, "step": 5704} {"train_info/time_between_train_steps": 0.002916097640991211, "step": 5704} {"info/global_step": 5705, "train_info/time_within_train_step": 2.9831631183624268, "step": 5705} {"train_info/time_between_train_steps": 0.0028619766235351562, "step": 5705} {"info/global_step": 5706, "train_info/time_within_train_step": 2.7541375160217285, "step": 5706} {"train_info/time_between_train_steps": 0.0028374195098876953, "step": 5706} {"info/global_step": 5707, "train_info/time_within_train_step": 2.754049301147461, "step": 5707} {"train_info/time_between_train_steps": 0.002876758575439453, "step": 5707} {"info/global_step": 5708, "train_info/time_within_train_step": 2.7538814544677734, "step": 5708} {"train_info/time_between_train_steps": 0.0029206275939941406, "step": 5708} {"info/global_step": 5709, "train_info/time_within_train_step": 2.75411057472229, "step": 5709} {"train_info/time_between_train_steps": 0.0028696060180664062, "step": 5709} {"info/global_step": 5710, "train_info/time_within_train_step": 2.7535183429718018, "step": 5710} {"train_info/time_between_train_steps": 0.0033125877380371094, "step": 5710} {"info/global_step": 5711, "train_info/time_within_train_step": 2.7530863285064697, "step": 5711} {"train_info/time_between_train_steps": 0.002860546112060547, "step": 5711} {"info/global_step": 5712, "train_info/time_within_train_step": 2.7539265155792236, "step": 5712} {"train_info/time_between_train_steps": 0.002851724624633789, "step": 5712} {"info/global_step": 5713, "train_info/time_within_train_step": 2.7537503242492676, "step": 5713} {"train_info/time_between_train_steps": 0.0029180049896240234, "step": 5713} {"info/global_step": 5714, "train_info/time_within_train_step": 2.7526979446411133, "step": 5714} {"train_info/time_between_train_steps": 0.0028612613677978516, "step": 5714} {"info/global_step": 5715, "train_info/time_within_train_step": 2.753413677215576, "step": 5715} {"train_info/time_between_train_steps": 0.002906322479248047, "step": 5715} {"info/global_step": 5716, "train_info/time_within_train_step": 2.75439190864563, "step": 5716} {"train_info/time_between_train_steps": 0.002893686294555664, "step": 5716} {"info/global_step": 5717, "train_info/time_within_train_step": 2.7546863555908203, "step": 5717} {"train_info/time_between_train_steps": 0.0029115676879882812, "step": 5717} {"info/global_step": 5718, "train_info/time_within_train_step": 2.7546586990356445, "step": 5718} {"train_info/time_between_train_steps": 0.0028874874114990234, "step": 5718} {"info/global_step": 5719, "train_info/time_within_train_step": 2.754678726196289, "step": 5719} {"train_info/time_between_train_steps": 0.0029230117797851562, "step": 5719} {"info/global_step": 5720, "train_info/time_within_train_step": 2.753551483154297, "step": 5720} {"train_info/time_between_train_steps": 0.0028984546661376953, "step": 5720} {"info/global_step": 5721, "train_info/time_within_train_step": 2.755021572113037, "step": 5721} {"train_info/time_between_train_steps": 0.0029287338256835938, "step": 5721} {"info/global_step": 5722, "train_info/time_within_train_step": 2.7547128200531006, "step": 5722} {"train_info/time_between_train_steps": 0.002913951873779297, "step": 5722} {"info/global_step": 5723, "train_info/time_within_train_step": 2.754063129425049, "step": 5723} {"train_info/time_between_train_steps": 0.002928018569946289, "step": 5723} {"info/global_step": 5724, "train_info/time_within_train_step": 2.755402088165283, "step": 5724} {"train_info/time_between_train_steps": 0.002923250198364258, "step": 5724} {"info/global_step": 5725, "train_info/time_within_train_step": 2.7554738521575928, "step": 5725} {"train_info/time_between_train_steps": 0.0028934478759765625, "step": 5725} {"info/global_step": 5726, "train_info/time_within_train_step": 2.7541911602020264, "step": 5726} {"train_info/time_between_train_steps": 0.0029022693634033203, "step": 5726} {"info/global_step": 5727, "train_info/time_within_train_step": 2.7540762424468994, "step": 5727} {"train_info/time_between_train_steps": 0.002904653549194336, "step": 5727} {"info/global_step": 5728, "train_info/time_within_train_step": 2.7540464401245117, "step": 5728} {"train_info/time_between_train_steps": 0.002885580062866211, "step": 5728} {"info/global_step": 5729, "train_info/time_within_train_step": 2.754957914352417, "step": 5729} {"train_info/time_between_train_steps": 0.0028879642486572266, "step": 5729} {"info/global_step": 5730, "train_info/time_within_train_step": 2.7545368671417236, "step": 5730} {"train_info/time_between_train_steps": 0.0029909610748291016, "step": 5730} {"info/global_step": 5731, "train_info/time_within_train_step": 2.7563045024871826, "step": 5731} {"train_info/time_between_train_steps": 0.0028994083404541016, "step": 5731} {"info/global_step": 5732, "train_info/time_within_train_step": 2.754603862762451, "step": 5732} {"train_info/time_between_train_steps": 0.002901792526245117, "step": 5732} {"info/global_step": 5733, "train_info/time_within_train_step": 2.7542505264282227, "step": 5733} {"train_info/time_between_train_steps": 0.002920389175415039, "step": 5733} {"info/global_step": 5734, "train_info/time_within_train_step": 2.7564499378204346, "step": 5734} {"train_info/time_between_train_steps": 0.002928018569946289, "step": 5734} {"info/global_step": 5735, "train_info/time_within_train_step": 2.75333833694458, "step": 5735} {"train_info/time_between_train_steps": 0.0028886795043945312, "step": 5735} {"info/global_step": 5736, "train_info/time_within_train_step": 2.7554311752319336, "step": 5736} {"train_info/time_between_train_steps": 0.0029392242431640625, "step": 5736} {"info/global_step": 5737, "train_info/time_within_train_step": 2.755882501602173, "step": 5737} {"train_info/time_between_train_steps": 0.0029387474060058594, "step": 5737} {"info/global_step": 5738, "train_info/time_within_train_step": 2.753962755203247, "step": 5738} {"train_info/time_between_train_steps": 0.0028934478759765625, "step": 5738} {"info/global_step": 5739, "train_info/time_within_train_step": 2.7539751529693604, "step": 5739} {"train_info/time_between_train_steps": 0.0029277801513671875, "step": 5739} {"info/global_step": 5740, "train_info/time_within_train_step": 2.75350284576416, "step": 5740} {"train_info/time_between_train_steps": 0.0028984546661376953, "step": 5740} {"info/global_step": 5741, "train_info/time_within_train_step": 2.7537286281585693, "step": 5741} {"train_info/time_between_train_steps": 0.0029382705688476562, "step": 5741} {"info/global_step": 5742, "train_info/time_within_train_step": 2.7537848949432373, "step": 5742} {"train_info/time_between_train_steps": 0.002949953079223633, "step": 5742} {"info/global_step": 5743, "train_info/time_within_train_step": 2.7533085346221924, "step": 5743} {"train_info/time_between_train_steps": 0.002923250198364258, "step": 5743} {"info/global_step": 5744, "train_info/time_within_train_step": 2.752619504928589, "step": 5744} {"train_info/time_between_train_steps": 0.0029311180114746094, "step": 5744} {"info/global_step": 5745, "train_info/time_within_train_step": 2.7542130947113037, "step": 5745} {"train_info/time_between_train_steps": 0.0029058456420898438, "step": 5745} {"info/global_step": 5746, "train_info/time_within_train_step": 2.754028558731079, "step": 5746} {"train_info/time_between_train_steps": 0.0029153823852539062, "step": 5746} {"info/global_step": 5747, "train_info/time_within_train_step": 3.340405225753784, "step": 5747} {"train_info/time_between_train_steps": 0.002910614013671875, "step": 5747} {"info/global_step": 5748, "train_info/time_within_train_step": 2.7530176639556885, "step": 5748} {"train_info/time_between_train_steps": 0.0029113292694091797, "step": 5748} {"info/global_step": 5749, "train_info/time_within_train_step": 2.7546067237854004, "step": 5749} {"train_info/time_between_train_steps": 0.0029091835021972656, "step": 5749} {"info/global_step": 5750, "train_info/time_within_train_step": 2.753756046295166, "step": 5750} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746582668, "_runtime": 16677}, "step": 5750} {"logs": {"train/loss": 3.4923, "train/learning_rate": 0.0002833333333333333, "train/epoch": 6.06, "_timestamp": 1746582668, "_runtime": 16677}, "step": 5750} {"train_info/time_between_train_steps": 0.007852792739868164, "step": 5750} {"info/global_step": 5751, "train_info/time_within_train_step": 2.754678726196289, "step": 5751} {"train_info/time_between_train_steps": 0.002931833267211914, "step": 5751} {"info/global_step": 5752, "train_info/time_within_train_step": 2.754180431365967, "step": 5752} {"train_info/time_between_train_steps": 0.002899646759033203, "step": 5752} {"info/global_step": 5753, "train_info/time_within_train_step": 2.754284620285034, "step": 5753} {"train_info/time_between_train_steps": 0.002916574478149414, "step": 5753} {"info/global_step": 5754, "train_info/time_within_train_step": 2.754183769226074, "step": 5754} {"train_info/time_between_train_steps": 0.0028765201568603516, "step": 5754} {"info/global_step": 5755, "train_info/time_within_train_step": 2.754176378250122, "step": 5755} {"train_info/time_between_train_steps": 0.0029244422912597656, "step": 5755} {"info/global_step": 5756, "train_info/time_within_train_step": 2.753135919570923, "step": 5756} {"train_info/time_between_train_steps": 0.0033986568450927734, "step": 5756} {"info/global_step": 5757, "train_info/time_within_train_step": 2.7541322708129883, "step": 5757} {"train_info/time_between_train_steps": 0.002942323684692383, "step": 5757} {"info/global_step": 5758, "train_info/time_within_train_step": 2.75549578666687, "step": 5758} {"train_info/time_between_train_steps": 0.0029435157775878906, "step": 5758} {"info/global_step": 5759, "train_info/time_within_train_step": 2.7536394596099854, "step": 5759} {"train_info/time_between_train_steps": 0.003011941909790039, "step": 5759} {"info/global_step": 5760, "train_info/time_within_train_step": 2.7537007331848145, "step": 5760} {"train_info/time_between_train_steps": 0.0028963088989257812, "step": 5760} {"info/global_step": 5761, "train_info/time_within_train_step": 2.7542812824249268, "step": 5761} {"train_info/time_between_train_steps": 0.0029172897338867188, "step": 5761} {"info/global_step": 5762, "train_info/time_within_train_step": 2.7549123764038086, "step": 5762} {"train_info/time_between_train_steps": 0.002905130386352539, "step": 5762} {"info/global_step": 5763, "train_info/time_within_train_step": 2.7539825439453125, "step": 5763} {"train_info/time_between_train_steps": 0.0028803348541259766, "step": 5763} {"info/global_step": 5764, "train_info/time_within_train_step": 2.753521680831909, "step": 5764} {"train_info/time_between_train_steps": 0.002883434295654297, "step": 5764} {"info/global_step": 5765, "train_info/time_within_train_step": 2.753108501434326, "step": 5765} {"train_info/time_between_train_steps": 0.0029840469360351562, "step": 5765} {"info/global_step": 5766, "train_info/time_within_train_step": 2.942250967025757, "step": 5766} {"train_info/time_between_train_steps": 0.0028777122497558594, "step": 5766} {"info/global_step": 5767, "train_info/time_within_train_step": 2.7543554306030273, "step": 5767} {"train_info/time_between_train_steps": 0.0028917789459228516, "step": 5767} {"info/global_step": 5768, "train_info/time_within_train_step": 2.753995418548584, "step": 5768} {"train_info/time_between_train_steps": 0.0028438568115234375, "step": 5768} {"info/global_step": 5769, "train_info/time_within_train_step": 2.7543742656707764, "step": 5769} {"train_info/time_between_train_steps": 0.0028989315032958984, "step": 5769} {"info/global_step": 5770, "train_info/time_within_train_step": 2.754366159439087, "step": 5770} {"train_info/time_between_train_steps": 0.0029053688049316406, "step": 5770} {"info/global_step": 5771, "train_info/time_within_train_step": 2.7541611194610596, "step": 5771} {"train_info/time_between_train_steps": 0.002880573272705078, "step": 5771} {"info/global_step": 5772, "train_info/time_within_train_step": 2.7541685104370117, "step": 5772} {"train_info/time_between_train_steps": 0.0028839111328125, "step": 5772} {"info/global_step": 5773, "train_info/time_within_train_step": 2.754117727279663, "step": 5773} {"train_info/time_between_train_steps": 0.0029044151306152344, "step": 5773} {"info/global_step": 5774, "train_info/time_within_train_step": 2.7539052963256836, "step": 5774} {"train_info/time_between_train_steps": 0.002879619598388672, "step": 5774} {"info/global_step": 5775, "train_info/time_within_train_step": 2.754089832305908, "step": 5775} {"train_info/time_between_train_steps": 0.0028531551361083984, "step": 5775} {"info/global_step": 5776, "train_info/time_within_train_step": 2.7548611164093018, "step": 5776} {"train_info/time_between_train_steps": 0.002866506576538086, "step": 5776} {"info/global_step": 5777, "train_info/time_within_train_step": 2.754666328430176, "step": 5777} {"train_info/time_between_train_steps": 0.0028715133666992188, "step": 5777} {"info/global_step": 5778, "train_info/time_within_train_step": 2.754589796066284, "step": 5778} {"train_info/time_between_train_steps": 0.002874612808227539, "step": 5778} {"info/global_step": 5779, "train_info/time_within_train_step": 2.7546474933624268, "step": 5779} {"train_info/time_between_train_steps": 0.0029294490814208984, "step": 5779} {"info/global_step": 5780, "train_info/time_within_train_step": 2.754807949066162, "step": 5780} {"train_info/time_between_train_steps": 0.0029141902923583984, "step": 5780} {"info/global_step": 5781, "train_info/time_within_train_step": 2.755182981491089, "step": 5781} {"train_info/time_between_train_steps": 0.0029218196868896484, "step": 5781} {"info/global_step": 5782, "train_info/time_within_train_step": 2.7541584968566895, "step": 5782} {"train_info/time_between_train_steps": 0.0029075145721435547, "step": 5782} {"info/global_step": 5783, "train_info/time_within_train_step": 2.755136013031006, "step": 5783} {"train_info/time_between_train_steps": 0.002880096435546875, "step": 5783} {"info/global_step": 5784, "train_info/time_within_train_step": 2.7543578147888184, "step": 5784} {"train_info/time_between_train_steps": 0.0028696060180664062, "step": 5784} {"info/global_step": 5785, "train_info/time_within_train_step": 2.7551145553588867, "step": 5785} {"train_info/time_between_train_steps": 0.0028858184814453125, "step": 5785} {"info/global_step": 5786, "train_info/time_within_train_step": 2.7551050186157227, "step": 5786} {"train_info/time_between_train_steps": 0.002884387969970703, "step": 5786} {"info/global_step": 5787, "train_info/time_within_train_step": 2.753708600997925, "step": 5787} {"train_info/time_between_train_steps": 0.0028951168060302734, "step": 5787} {"info/global_step": 5788, "train_info/time_within_train_step": 2.7532804012298584, "step": 5788} {"train_info/time_between_train_steps": 0.0029180049896240234, "step": 5788} {"info/global_step": 5789, "train_info/time_within_train_step": 2.7518930435180664, "step": 5789} {"train_info/time_between_train_steps": 0.002904176712036133, "step": 5789} {"info/global_step": 5790, "train_info/time_within_train_step": 2.7541632652282715, "step": 5790} {"train_info/time_between_train_steps": 0.002928495407104492, "step": 5790} {"info/global_step": 5791, "train_info/time_within_train_step": 2.7544784545898438, "step": 5791} {"train_info/time_between_train_steps": 0.002894163131713867, "step": 5791} {"info/global_step": 5792, "train_info/time_within_train_step": 2.754297971725464, "step": 5792} {"train_info/time_between_train_steps": 0.002876758575439453, "step": 5792} {"info/global_step": 5793, "train_info/time_within_train_step": 2.752007246017456, "step": 5793} {"train_info/time_between_train_steps": 0.00289154052734375, "step": 5793} {"info/global_step": 5794, "train_info/time_within_train_step": 2.753215789794922, "step": 5794} {"train_info/time_between_train_steps": 0.0029401779174804688, "step": 5794} {"info/global_step": 5795, "train_info/time_within_train_step": 2.7520949840545654, "step": 5795} {"train_info/time_between_train_steps": 0.002861499786376953, "step": 5795} {"info/global_step": 5796, "train_info/time_within_train_step": 2.754472255706787, "step": 5796} {"train_info/time_between_train_steps": 0.002930164337158203, "step": 5796} {"info/global_step": 5797, "train_info/time_within_train_step": 2.753739595413208, "step": 5797} {"train_info/time_between_train_steps": 0.0028946399688720703, "step": 5797} {"info/global_step": 5798, "train_info/time_within_train_step": 2.7538819313049316, "step": 5798} {"train_info/time_between_train_steps": 0.002872467041015625, "step": 5798} {"info/global_step": 5799, "train_info/time_within_train_step": 2.754340648651123, "step": 5799} {"train_info/time_between_train_steps": 0.0029449462890625, "step": 5799} {"info/global_step": 5800, "train_info/time_within_train_step": 2.754504442214966, "step": 5800} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746582806, "_runtime": 16815}, "step": 5800} {"logs": {"train/loss": 3.488, "train/learning_rate": 0.00028, "train/epoch": 6.07, "_timestamp": 1746582806, "_runtime": 16815}, "step": 5800} {"train_info/time_between_train_steps": 13.36277437210083, "step": 5800} {"info/global_step": 5801, "train_info/time_within_train_step": 2.5335612297058105, "step": 5801} {"train_info/time_between_train_steps": 0.0030455589294433594, "step": 5801} {"info/global_step": 5802, "train_info/time_within_train_step": 2.5803534984588623, "step": 5802} {"train_info/time_between_train_steps": 0.002948760986328125, "step": 5802} {"info/global_step": 5803, "train_info/time_within_train_step": 2.7294657230377197, "step": 5803} {"train_info/time_between_train_steps": 0.0029821395874023438, "step": 5803} {"info/global_step": 5804, "train_info/time_within_train_step": 2.7488598823547363, "step": 5804} {"train_info/time_between_train_steps": 0.002959012985229492, "step": 5804} {"info/global_step": 5805, "train_info/time_within_train_step": 2.7510123252868652, "step": 5805} {"train_info/time_between_train_steps": 0.0028839111328125, "step": 5805} {"info/global_step": 5806, "train_info/time_within_train_step": 2.7533044815063477, "step": 5806} {"train_info/time_between_train_steps": 0.0028901100158691406, "step": 5806} {"info/global_step": 5807, "train_info/time_within_train_step": 2.753784418106079, "step": 5807} {"train_info/time_between_train_steps": 0.002924680709838867, "step": 5807} {"info/global_step": 5808, "train_info/time_within_train_step": 2.912522554397583, "step": 5808} {"train_info/time_between_train_steps": 0.0029065608978271484, "step": 5808} {"info/global_step": 5809, "train_info/time_within_train_step": 2.7540314197540283, "step": 5809} {"train_info/time_between_train_steps": 0.0029144287109375, "step": 5809} {"info/global_step": 5810, "train_info/time_within_train_step": 2.753095865249634, "step": 5810} {"train_info/time_between_train_steps": 0.002889394760131836, "step": 5810} {"info/global_step": 5811, "train_info/time_within_train_step": 2.7545559406280518, "step": 5811} {"train_info/time_between_train_steps": 0.002893209457397461, "step": 5811} {"info/global_step": 5812, "train_info/time_within_train_step": 2.7543914318084717, "step": 5812} {"train_info/time_between_train_steps": 0.0028891563415527344, "step": 5812} {"info/global_step": 5813, "train_info/time_within_train_step": 2.753039836883545, "step": 5813} {"train_info/time_between_train_steps": 0.0028793811798095703, "step": 5813} {"info/global_step": 5814, "train_info/time_within_train_step": 2.753831386566162, "step": 5814} {"train_info/time_between_train_steps": 0.0028810501098632812, "step": 5814} {"info/global_step": 5815, "train_info/time_within_train_step": 2.7545087337493896, "step": 5815} {"train_info/time_between_train_steps": 0.0029234886169433594, "step": 5815} {"info/global_step": 5816, "train_info/time_within_train_step": 2.7541298866271973, "step": 5816} {"train_info/time_between_train_steps": 0.002897024154663086, "step": 5816} {"info/global_step": 5817, "train_info/time_within_train_step": 2.7542035579681396, "step": 5817} {"train_info/time_between_train_steps": 0.0029125213623046875, "step": 5817} {"info/global_step": 5818, "train_info/time_within_train_step": 2.7545790672302246, "step": 5818} {"train_info/time_between_train_steps": 0.0028793811798095703, "step": 5818} {"info/global_step": 5819, "train_info/time_within_train_step": 2.7548112869262695, "step": 5819} {"train_info/time_between_train_steps": 0.0029535293579101562, "step": 5819} {"info/global_step": 5820, "train_info/time_within_train_step": 2.7537829875946045, "step": 5820} {"train_info/time_between_train_steps": 0.0029015541076660156, "step": 5820} {"info/global_step": 5821, "train_info/time_within_train_step": 2.7546627521514893, "step": 5821} {"train_info/time_between_train_steps": 0.0028922557830810547, "step": 5821} {"info/global_step": 5822, "train_info/time_within_train_step": 2.7554855346679688, "step": 5822} {"train_info/time_between_train_steps": 0.002894163131713867, "step": 5822} {"info/global_step": 5823, "train_info/time_within_train_step": 2.7549219131469727, "step": 5823} {"train_info/time_between_train_steps": 0.002904653549194336, "step": 5823} {"info/global_step": 5824, "train_info/time_within_train_step": 2.7540500164031982, "step": 5824} {"train_info/time_between_train_steps": 0.0030024051666259766, "step": 5824} {"info/global_step": 5825, "train_info/time_within_train_step": 2.7544240951538086, "step": 5825} {"train_info/time_between_train_steps": 0.002960681915283203, "step": 5825} {"info/global_step": 5826, "train_info/time_within_train_step": 2.7534101009368896, "step": 5826} {"train_info/time_between_train_steps": 0.002938508987426758, "step": 5826} {"info/global_step": 5827, "train_info/time_within_train_step": 2.7529516220092773, "step": 5827} {"train_info/time_between_train_steps": 0.002882242202758789, "step": 5827} {"info/global_step": 5828, "train_info/time_within_train_step": 2.7550437450408936, "step": 5828} {"train_info/time_between_train_steps": 0.002908945083618164, "step": 5828} {"info/global_step": 5829, "train_info/time_within_train_step": 2.7556629180908203, "step": 5829} {"train_info/time_between_train_steps": 0.002930879592895508, "step": 5829} {"info/global_step": 5830, "train_info/time_within_train_step": 2.754793167114258, "step": 5830} {"train_info/time_between_train_steps": 0.0029163360595703125, "step": 5830} {"info/global_step": 5831, "train_info/time_within_train_step": 2.7553224563598633, "step": 5831} {"train_info/time_between_train_steps": 0.0029306411743164062, "step": 5831} {"info/global_step": 5832, "train_info/time_within_train_step": 2.753453254699707, "step": 5832} {"train_info/time_between_train_steps": 0.002935647964477539, "step": 5832} {"info/global_step": 5833, "train_info/time_within_train_step": 2.7545535564422607, "step": 5833} {"train_info/time_between_train_steps": 0.0029709339141845703, "step": 5833} {"info/global_step": 5834, "train_info/time_within_train_step": 2.7540104389190674, "step": 5834} {"train_info/time_between_train_steps": 0.002924680709838867, "step": 5834} {"info/global_step": 5835, "train_info/time_within_train_step": 2.7543845176696777, "step": 5835} {"train_info/time_between_train_steps": 0.0029294490814208984, "step": 5835} {"info/global_step": 5836, "train_info/time_within_train_step": 2.7556440830230713, "step": 5836} {"train_info/time_between_train_steps": 0.0030889511108398438, "step": 5836} {"info/global_step": 5837, "train_info/time_within_train_step": 2.755889654159546, "step": 5837} {"train_info/time_between_train_steps": 0.003031015396118164, "step": 5837} {"info/global_step": 5838, "train_info/time_within_train_step": 2.756293535232544, "step": 5838} {"train_info/time_between_train_steps": 0.003023386001586914, "step": 5838} {"info/global_step": 5839, "train_info/time_within_train_step": 2.75565242767334, "step": 5839} {"train_info/time_between_train_steps": 0.0030264854431152344, "step": 5839} {"info/global_step": 5840, "train_info/time_within_train_step": 2.7556958198547363, "step": 5840} {"train_info/time_between_train_steps": 0.0029938220977783203, "step": 5840} {"info/global_step": 5841, "train_info/time_within_train_step": 2.756071090698242, "step": 5841} {"train_info/time_between_train_steps": 0.0030508041381835938, "step": 5841} {"info/global_step": 5842, "train_info/time_within_train_step": 2.755655527114868, "step": 5842} {"train_info/time_between_train_steps": 0.002976655960083008, "step": 5842} {"info/global_step": 5843, "train_info/time_within_train_step": 2.756251335144043, "step": 5843} {"train_info/time_between_train_steps": 0.0029828548431396484, "step": 5843} {"info/global_step": 5844, "train_info/time_within_train_step": 2.7553303241729736, "step": 5844} {"train_info/time_between_train_steps": 0.0030035972595214844, "step": 5844} {"info/global_step": 5845, "train_info/time_within_train_step": 2.7568790912628174, "step": 5845} {"train_info/time_between_train_steps": 0.0029981136322021484, "step": 5845} {"info/global_step": 5846, "train_info/time_within_train_step": 2.756115674972534, "step": 5846} {"train_info/time_between_train_steps": 0.0030641555786132812, "step": 5846} {"info/global_step": 5847, "train_info/time_within_train_step": 2.7550976276397705, "step": 5847} {"train_info/time_between_train_steps": 0.0031206607818603516, "step": 5847} {"info/global_step": 5848, "train_info/time_within_train_step": 2.755978584289551, "step": 5848} {"train_info/time_between_train_steps": 0.0031282901763916016, "step": 5848} {"info/global_step": 5849, "train_info/time_within_train_step": 2.7533271312713623, "step": 5849} {"train_info/time_between_train_steps": 0.0030095577239990234, "step": 5849} {"info/global_step": 5850, "train_info/time_within_train_step": 2.7563862800598145, "step": 5850} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746582957, "_runtime": 16966}, "step": 5850} {"logs": {"train/loss": 3.4803, "train/learning_rate": 0.00027666666666666665, "train/epoch": 6.07, "_timestamp": 1746582957, "_runtime": 16966}, "step": 5850} {"train_info/time_between_train_steps": 0.008408308029174805, "step": 5850} {"info/global_step": 5851, "train_info/time_within_train_step": 2.756498098373413, "step": 5851} {"train_info/time_between_train_steps": 0.0029761791229248047, "step": 5851} {"info/global_step": 5852, "train_info/time_within_train_step": 2.756748914718628, "step": 5852} {"train_info/time_between_train_steps": 0.0029938220977783203, "step": 5852} {"info/global_step": 5853, "train_info/time_within_train_step": 2.7557015419006348, "step": 5853} {"train_info/time_between_train_steps": 0.003029346466064453, "step": 5853} {"info/global_step": 5854, "train_info/time_within_train_step": 2.756063938140869, "step": 5854} {"train_info/time_between_train_steps": 0.003039121627807617, "step": 5854} {"info/global_step": 5855, "train_info/time_within_train_step": 2.7556395530700684, "step": 5855} {"train_info/time_between_train_steps": 0.002996206283569336, "step": 5855} {"info/global_step": 5856, "train_info/time_within_train_step": 2.7574565410614014, "step": 5856} {"train_info/time_between_train_steps": 0.003040313720703125, "step": 5856} {"info/global_step": 5857, "train_info/time_within_train_step": 2.7553985118865967, "step": 5857} {"train_info/time_between_train_steps": 0.002997159957885742, "step": 5857} {"info/global_step": 5858, "train_info/time_within_train_step": 2.7534971237182617, "step": 5858} {"train_info/time_between_train_steps": 0.0029006004333496094, "step": 5858} {"info/global_step": 5859, "train_info/time_within_train_step": 2.7546801567077637, "step": 5859} {"train_info/time_between_train_steps": 0.0030183792114257812, "step": 5859} {"info/global_step": 5860, "train_info/time_within_train_step": 2.7536561489105225, "step": 5860} {"train_info/time_between_train_steps": 0.002904176712036133, "step": 5860} {"info/global_step": 5861, "train_info/time_within_train_step": 2.753126621246338, "step": 5861} {"train_info/time_between_train_steps": 0.002945423126220703, "step": 5861} {"info/global_step": 5862, "train_info/time_within_train_step": 2.753976821899414, "step": 5862} {"train_info/time_between_train_steps": 0.002924680709838867, "step": 5862} {"info/global_step": 5863, "train_info/time_within_train_step": 2.754544973373413, "step": 5863} {"train_info/time_between_train_steps": 0.002928018569946289, "step": 5863} {"info/global_step": 5864, "train_info/time_within_train_step": 2.7545006275177, "step": 5864} {"train_info/time_between_train_steps": 0.002901792526245117, "step": 5864} {"info/global_step": 5865, "train_info/time_within_train_step": 2.7560434341430664, "step": 5865} {"train_info/time_between_train_steps": 0.002985715866088867, "step": 5865} {"info/global_step": 5866, "train_info/time_within_train_step": 2.7548696994781494, "step": 5866} {"train_info/time_between_train_steps": 0.0029277801513671875, "step": 5866} {"info/global_step": 5867, "train_info/time_within_train_step": 2.754615306854248, "step": 5867} {"train_info/time_between_train_steps": 0.0030100345611572266, "step": 5867} {"info/global_step": 5868, "train_info/time_within_train_step": 2.7526743412017822, "step": 5868} {"train_info/time_between_train_steps": 0.0028929710388183594, "step": 5868} {"info/global_step": 5869, "train_info/time_within_train_step": 2.7544116973876953, "step": 5869} {"train_info/time_between_train_steps": 0.002916097640991211, "step": 5869} {"info/global_step": 5870, "train_info/time_within_train_step": 2.754232168197632, "step": 5870} {"train_info/time_between_train_steps": 0.0029239654541015625, "step": 5870} {"info/global_step": 5871, "train_info/time_within_train_step": 2.7548675537109375, "step": 5871} {"train_info/time_between_train_steps": 0.002928495407104492, "step": 5871} {"info/global_step": 5872, "train_info/time_within_train_step": 2.754868745803833, "step": 5872} {"train_info/time_between_train_steps": 0.002969503402709961, "step": 5872} {"info/global_step": 5873, "train_info/time_within_train_step": 2.7540037631988525, "step": 5873} {"train_info/time_between_train_steps": 0.0029189586639404297, "step": 5873} {"info/global_step": 5874, "train_info/time_within_train_step": 2.754854917526245, "step": 5874} {"train_info/time_between_train_steps": 0.0030143260955810547, "step": 5874} {"info/global_step": 5875, "train_info/time_within_train_step": 2.754314422607422, "step": 5875} {"train_info/time_between_train_steps": 0.0029540061950683594, "step": 5875} {"info/global_step": 5876, "train_info/time_within_train_step": 2.7546944618225098, "step": 5876} {"train_info/time_between_train_steps": 0.002933025360107422, "step": 5876} {"info/global_step": 5877, "train_info/time_within_train_step": 2.754869222640991, "step": 5877} {"train_info/time_between_train_steps": 0.0029268264770507812, "step": 5877} {"info/global_step": 5878, "train_info/time_within_train_step": 2.755607843399048, "step": 5878} {"train_info/time_between_train_steps": 0.0029201507568359375, "step": 5878} {"info/global_step": 5879, "train_info/time_within_train_step": 2.7539045810699463, "step": 5879} {"train_info/time_between_train_steps": 0.002932310104370117, "step": 5879} {"info/global_step": 5880, "train_info/time_within_train_step": 2.753277063369751, "step": 5880} {"train_info/time_between_train_steps": 0.002923250198364258, "step": 5880} {"info/global_step": 5881, "train_info/time_within_train_step": 2.7544972896575928, "step": 5881} {"train_info/time_between_train_steps": 0.002905130386352539, "step": 5881} {"info/global_step": 5882, "train_info/time_within_train_step": 2.7543277740478516, "step": 5882} {"train_info/time_between_train_steps": 0.0029659271240234375, "step": 5882} {"info/global_step": 5883, "train_info/time_within_train_step": 2.7533419132232666, "step": 5883} {"train_info/time_between_train_steps": 0.00295257568359375, "step": 5883} {"info/global_step": 5884, "train_info/time_within_train_step": 2.753782272338867, "step": 5884} {"train_info/time_between_train_steps": 0.002874135971069336, "step": 5884} {"info/global_step": 5885, "train_info/time_within_train_step": 2.7543935775756836, "step": 5885} {"train_info/time_between_train_steps": 0.002973794937133789, "step": 5885} {"info/global_step": 5886, "train_info/time_within_train_step": 2.754487991333008, "step": 5886} {"train_info/time_between_train_steps": 0.002884387969970703, "step": 5886} {"info/global_step": 5887, "train_info/time_within_train_step": 2.753696918487549, "step": 5887} {"train_info/time_between_train_steps": 0.0029430389404296875, "step": 5887} {"info/global_step": 5888, "train_info/time_within_train_step": 2.754664421081543, "step": 5888} {"train_info/time_between_train_steps": 0.002912282943725586, "step": 5888} {"info/global_step": 5889, "train_info/time_within_train_step": 2.7549374103546143, "step": 5889} {"train_info/time_between_train_steps": 0.002942323684692383, "step": 5889} {"info/global_step": 5890, "train_info/time_within_train_step": 2.754570484161377, "step": 5890} {"train_info/time_between_train_steps": 0.0028870105743408203, "step": 5890} {"info/global_step": 5891, "train_info/time_within_train_step": 2.7543563842773438, "step": 5891} {"train_info/time_between_train_steps": 0.002897024154663086, "step": 5891} {"info/global_step": 5892, "train_info/time_within_train_step": 2.7549171447753906, "step": 5892} {"train_info/time_between_train_steps": 0.0028688907623291016, "step": 5892} {"info/global_step": 5893, "train_info/time_within_train_step": 2.755451202392578, "step": 5893} {"train_info/time_between_train_steps": 0.002907276153564453, "step": 5893} {"info/global_step": 5894, "train_info/time_within_train_step": 2.754601240158081, "step": 5894} {"train_info/time_between_train_steps": 0.0029332637786865234, "step": 5894} {"info/global_step": 5895, "train_info/time_within_train_step": 2.752614974975586, "step": 5895} {"train_info/time_between_train_steps": 0.0029366016387939453, "step": 5895} {"info/global_step": 5896, "train_info/time_within_train_step": 2.753647565841675, "step": 5896} {"train_info/time_between_train_steps": 0.0031120777130126953, "step": 5896} {"info/global_step": 5897, "train_info/time_within_train_step": 2.7534990310668945, "step": 5897} {"train_info/time_between_train_steps": 0.0029234886169433594, "step": 5897} {"info/global_step": 5898, "train_info/time_within_train_step": 2.7532730102539062, "step": 5898} {"train_info/time_between_train_steps": 0.0029158592224121094, "step": 5898} {"info/global_step": 5899, "train_info/time_within_train_step": 2.7536916732788086, "step": 5899} {"train_info/time_between_train_steps": 0.0029289722442626953, "step": 5899} {"info/global_step": 5900, "train_info/time_within_train_step": 2.754073143005371, "step": 5900} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746583096, "_runtime": 17105}, "step": 5900} {"logs": {"train/loss": 3.4664, "train/learning_rate": 0.00027333333333333333, "train/epoch": 6.08, "_timestamp": 1746583096, "_runtime": 17105}, "step": 5900} {"train_info/time_between_train_steps": 0.014088153839111328, "step": 5900} {"info/global_step": 5901, "train_info/time_within_train_step": 2.7532312870025635, "step": 5901} {"train_info/time_between_train_steps": 0.002897977828979492, "step": 5901} {"info/global_step": 5902, "train_info/time_within_train_step": 2.754659414291382, "step": 5902} {"train_info/time_between_train_steps": 0.002933979034423828, "step": 5902} {"info/global_step": 5903, "train_info/time_within_train_step": 2.7551333904266357, "step": 5903} {"train_info/time_between_train_steps": 0.00298309326171875, "step": 5903} {"info/global_step": 5904, "train_info/time_within_train_step": 2.7543718814849854, "step": 5904} {"train_info/time_between_train_steps": 0.0029299259185791016, "step": 5904} {"info/global_step": 5905, "train_info/time_within_train_step": 2.754100799560547, "step": 5905} {"train_info/time_between_train_steps": 0.0029604434967041016, "step": 5905} {"info/global_step": 5906, "train_info/time_within_train_step": 2.75376033782959, "step": 5906} {"train_info/time_between_train_steps": 0.0029594898223876953, "step": 5906} {"info/global_step": 5907, "train_info/time_within_train_step": 2.7551159858703613, "step": 5907} {"train_info/time_between_train_steps": 0.0029244422912597656, "step": 5907} {"info/global_step": 5908, "train_info/time_within_train_step": 2.754753589630127, "step": 5908} {"train_info/time_between_train_steps": 0.002935647964477539, "step": 5908} {"info/global_step": 5909, "train_info/time_within_train_step": 2.754504919052124, "step": 5909} {"train_info/time_between_train_steps": 0.002952098846435547, "step": 5909} {"info/global_step": 5910, "train_info/time_within_train_step": 2.753948926925659, "step": 5910} {"train_info/time_between_train_steps": 0.0033767223358154297, "step": 5910} {"info/global_step": 5911, "train_info/time_within_train_step": 2.8359129428863525, "step": 5911} {"train_info/time_between_train_steps": 0.002974987030029297, "step": 5911} {"info/global_step": 5912, "train_info/time_within_train_step": 2.754210948944092, "step": 5912} {"train_info/time_between_train_steps": 0.002868175506591797, "step": 5912} {"info/global_step": 5913, "train_info/time_within_train_step": 2.753530979156494, "step": 5913} {"train_info/time_between_train_steps": 0.0028531551361083984, "step": 5913} {"info/global_step": 5914, "train_info/time_within_train_step": 2.7536089420318604, "step": 5914} {"train_info/time_between_train_steps": 0.0028798580169677734, "step": 5914} {"info/global_step": 5915, "train_info/time_within_train_step": 2.7552452087402344, "step": 5915} {"train_info/time_between_train_steps": 0.002882719039916992, "step": 5915} {"info/global_step": 5916, "train_info/time_within_train_step": 2.7540323734283447, "step": 5916} {"train_info/time_between_train_steps": 0.0028994083404541016, "step": 5916} {"info/global_step": 5917, "train_info/time_within_train_step": 2.7541279792785645, "step": 5917} {"train_info/time_between_train_steps": 0.002880573272705078, "step": 5917} {"info/global_step": 5918, "train_info/time_within_train_step": 2.752763271331787, "step": 5918} {"train_info/time_between_train_steps": 0.002862215042114258, "step": 5918} {"info/global_step": 5919, "train_info/time_within_train_step": 2.7554943561553955, "step": 5919} {"train_info/time_between_train_steps": 0.002876758575439453, "step": 5919} {"info/global_step": 5920, "train_info/time_within_train_step": 2.7525644302368164, "step": 5920} {"train_info/time_between_train_steps": 0.0028848648071289062, "step": 5920} {"info/global_step": 5921, "train_info/time_within_train_step": 2.7548744678497314, "step": 5921} {"train_info/time_between_train_steps": 0.002841949462890625, "step": 5921} {"info/global_step": 5922, "train_info/time_within_train_step": 2.7556357383728027, "step": 5922} {"train_info/time_between_train_steps": 0.0029871463775634766, "step": 5922} {"info/global_step": 5923, "train_info/time_within_train_step": 2.75447154045105, "step": 5923} {"train_info/time_between_train_steps": 0.0028624534606933594, "step": 5923} {"info/global_step": 5924, "train_info/time_within_train_step": 2.7538912296295166, "step": 5924} {"train_info/time_between_train_steps": 0.0028471946716308594, "step": 5924} {"info/global_step": 5925, "train_info/time_within_train_step": 2.753061056137085, "step": 5925} {"train_info/time_between_train_steps": 0.002901315689086914, "step": 5925} {"info/global_step": 5926, "train_info/time_within_train_step": 2.755202054977417, "step": 5926} {"train_info/time_between_train_steps": 0.002874612808227539, "step": 5926} {"info/global_step": 5927, "train_info/time_within_train_step": 2.7529687881469727, "step": 5927} {"train_info/time_between_train_steps": 0.0028448104858398438, "step": 5927} {"info/global_step": 5928, "train_info/time_within_train_step": 2.7533137798309326, "step": 5928} {"train_info/time_between_train_steps": 0.002877473831176758, "step": 5928} {"info/global_step": 5929, "train_info/time_within_train_step": 2.752769947052002, "step": 5929} {"train_info/time_between_train_steps": 0.0029239654541015625, "step": 5929} {"info/global_step": 5930, "train_info/time_within_train_step": 2.7541699409484863, "step": 5930} {"train_info/time_between_train_steps": 0.0029306411743164062, "step": 5930} {"info/global_step": 5931, "train_info/time_within_train_step": 2.753432273864746, "step": 5931} {"train_info/time_between_train_steps": 0.0028734207153320312, "step": 5931} {"info/global_step": 5932, "train_info/time_within_train_step": 2.7545180320739746, "step": 5932} {"train_info/time_between_train_steps": 0.0028460025787353516, "step": 5932} {"info/global_step": 5933, "train_info/time_within_train_step": 2.7548911571502686, "step": 5933} {"train_info/time_between_train_steps": 0.003064870834350586, "step": 5933} {"info/global_step": 5934, "train_info/time_within_train_step": 2.755124807357788, "step": 5934} {"train_info/time_between_train_steps": 0.0029311180114746094, "step": 5934} {"info/global_step": 5935, "train_info/time_within_train_step": 2.755356788635254, "step": 5935} {"train_info/time_between_train_steps": 0.0029692649841308594, "step": 5935} {"info/global_step": 5936, "train_info/time_within_train_step": 2.7558815479278564, "step": 5936} {"train_info/time_between_train_steps": 0.0029404163360595703, "step": 5936} {"info/global_step": 5937, "train_info/time_within_train_step": 2.754897356033325, "step": 5937} {"train_info/time_between_train_steps": 0.0030498504638671875, "step": 5937} {"info/global_step": 5938, "train_info/time_within_train_step": 2.7551310062408447, "step": 5938} {"train_info/time_between_train_steps": 0.003061056137084961, "step": 5938} {"info/global_step": 5939, "train_info/time_within_train_step": 2.7563493251800537, "step": 5939} {"train_info/time_between_train_steps": 0.002965688705444336, "step": 5939} {"info/global_step": 5940, "train_info/time_within_train_step": 2.7555735111236572, "step": 5940} {"train_info/time_between_train_steps": 0.0029485225677490234, "step": 5940} {"info/global_step": 5941, "train_info/time_within_train_step": 2.755491018295288, "step": 5941} {"train_info/time_between_train_steps": 0.0029549598693847656, "step": 5941} {"info/global_step": 5942, "train_info/time_within_train_step": 2.7548301219940186, "step": 5942} {"train_info/time_between_train_steps": 0.0029511451721191406, "step": 5942} {"info/global_step": 5943, "train_info/time_within_train_step": 2.7546777725219727, "step": 5943} {"train_info/time_between_train_steps": 0.002960205078125, "step": 5943} {"info/global_step": 5944, "train_info/time_within_train_step": 2.754467725753784, "step": 5944} {"train_info/time_between_train_steps": 0.0031135082244873047, "step": 5944} {"info/global_step": 5945, "train_info/time_within_train_step": 2.755485773086548, "step": 5945} {"train_info/time_between_train_steps": 0.0030677318572998047, "step": 5945} {"info/global_step": 5946, "train_info/time_within_train_step": 2.7560415267944336, "step": 5946} {"train_info/time_between_train_steps": 0.002968311309814453, "step": 5946} {"info/global_step": 5947, "train_info/time_within_train_step": 2.7560741901397705, "step": 5947} {"train_info/time_between_train_steps": 0.003027200698852539, "step": 5947} {"info/global_step": 5948, "train_info/time_within_train_step": 2.755993604660034, "step": 5948} {"train_info/time_between_train_steps": 0.0031614303588867188, "step": 5948} {"info/global_step": 5949, "train_info/time_within_train_step": 2.755657434463501, "step": 5949} {"train_info/time_between_train_steps": 0.0031011104583740234, "step": 5949} {"info/global_step": 5950, "train_info/time_within_train_step": 2.755458354949951, "step": 5950} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746583234, "_runtime": 17243}, "step": 5950} {"logs": {"train/loss": 3.4592, "train/learning_rate": 0.00027, "train/epoch": 6.08, "_timestamp": 1746583234, "_runtime": 17243}, "step": 5950} {"train_info/time_between_train_steps": 0.013049840927124023, "step": 5950} {"info/global_step": 5951, "train_info/time_within_train_step": 2.7565155029296875, "step": 5951} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 5951} {"info/global_step": 5952, "train_info/time_within_train_step": 2.7553939819335938, "step": 5952} {"train_info/time_between_train_steps": 0.003135204315185547, "step": 5952} {"info/global_step": 5953, "train_info/time_within_train_step": 2.755876064300537, "step": 5953} {"train_info/time_between_train_steps": 0.0031070709228515625, "step": 5953} {"info/global_step": 5954, "train_info/time_within_train_step": 2.7552542686462402, "step": 5954} {"train_info/time_between_train_steps": 0.0030698776245117188, "step": 5954} {"info/global_step": 5955, "train_info/time_within_train_step": 2.7557613849639893, "step": 5955} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 5955} {"info/global_step": 5956, "train_info/time_within_train_step": 2.756491184234619, "step": 5956} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 5956} {"info/global_step": 5957, "train_info/time_within_train_step": 2.755622386932373, "step": 5957} {"train_info/time_between_train_steps": 0.003156423568725586, "step": 5957} {"info/global_step": 5958, "train_info/time_within_train_step": 2.755514621734619, "step": 5958} {"train_info/time_between_train_steps": 0.003427743911743164, "step": 5958} {"info/global_step": 5959, "train_info/time_within_train_step": 2.7552669048309326, "step": 5959} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 5959} {"info/global_step": 5960, "train_info/time_within_train_step": 2.754401683807373, "step": 5960} {"train_info/time_between_train_steps": 0.0032279491424560547, "step": 5960} {"info/global_step": 5961, "train_info/time_within_train_step": 2.755868434906006, "step": 5961} {"train_info/time_between_train_steps": 0.0032548904418945312, "step": 5961} {"info/global_step": 5962, "train_info/time_within_train_step": 2.7560651302337646, "step": 5962} {"train_info/time_between_train_steps": 0.0035827159881591797, "step": 5962} {"info/global_step": 5963, "train_info/time_within_train_step": 2.7560954093933105, "step": 5963} {"train_info/time_between_train_steps": 0.003059864044189453, "step": 5963} {"info/global_step": 5964, "train_info/time_within_train_step": 2.757108688354492, "step": 5964} {"train_info/time_between_train_steps": 0.003373384475708008, "step": 5964} {"info/global_step": 5965, "train_info/time_within_train_step": 2.7573344707489014, "step": 5965} {"train_info/time_between_train_steps": 0.0032663345336914062, "step": 5965} {"info/global_step": 5966, "train_info/time_within_train_step": 2.793712615966797, "step": 5966} {"train_info/time_between_train_steps": 0.0032501220703125, "step": 5966} {"info/global_step": 5967, "train_info/time_within_train_step": 2.7575480937957764, "step": 5967} {"train_info/time_between_train_steps": 0.0032587051391601562, "step": 5967} {"info/global_step": 5968, "train_info/time_within_train_step": 2.7572662830352783, "step": 5968} {"train_info/time_between_train_steps": 0.003362417221069336, "step": 5968} {"info/global_step": 5969, "train_info/time_within_train_step": 2.7562713623046875, "step": 5969} {"train_info/time_between_train_steps": 0.0034537315368652344, "step": 5969} {"info/global_step": 5970, "train_info/time_within_train_step": 2.756453514099121, "step": 5970} {"train_info/time_between_train_steps": 0.003306865692138672, "step": 5970} {"info/global_step": 5971, "train_info/time_within_train_step": 2.756361961364746, "step": 5971} {"train_info/time_between_train_steps": 0.0035827159881591797, "step": 5971} {"train_info/time_between_train_steps": 3.1521718502044678, "step": 5971} {"info/global_step": 5972, "train_info/time_within_train_step": 2.689974308013916, "step": 5972} {"train_info/time_between_train_steps": 0.0033125877380371094, "step": 5972} {"info/global_step": 5973, "train_info/time_within_train_step": 2.755557060241699, "step": 5973} {"train_info/time_between_train_steps": 0.0031461715698242188, "step": 5973} {"info/global_step": 5974, "train_info/time_within_train_step": 2.7558553218841553, "step": 5974} {"train_info/time_between_train_steps": 0.003096342086791992, "step": 5974} {"info/global_step": 5975, "train_info/time_within_train_step": 2.7543811798095703, "step": 5975} {"train_info/time_between_train_steps": 0.0031011104583740234, "step": 5975} {"info/global_step": 5976, "train_info/time_within_train_step": 2.755676746368408, "step": 5976} {"train_info/time_between_train_steps": 0.003088235855102539, "step": 5976} {"info/global_step": 5977, "train_info/time_within_train_step": 2.7549238204956055, "step": 5977} {"train_info/time_between_train_steps": 0.003088712692260742, "step": 5977} {"info/global_step": 5978, "train_info/time_within_train_step": 2.754523515701294, "step": 5978} {"train_info/time_between_train_steps": 0.00310516357421875, "step": 5978} {"info/global_step": 5979, "train_info/time_within_train_step": 2.754396438598633, "step": 5979} {"train_info/time_between_train_steps": 0.003124237060546875, "step": 5979} {"info/global_step": 5980, "train_info/time_within_train_step": 2.753546953201294, "step": 5980} {"train_info/time_between_train_steps": 0.0030956268310546875, "step": 5980} {"info/global_step": 5981, "train_info/time_within_train_step": 2.9646756649017334, "step": 5981} {"train_info/time_between_train_steps": 0.003115415573120117, "step": 5981} {"info/global_step": 5982, "train_info/time_within_train_step": 2.754908323287964, "step": 5982} {"train_info/time_between_train_steps": 0.0030798912048339844, "step": 5982} {"info/global_step": 5983, "train_info/time_within_train_step": 2.753739356994629, "step": 5983} {"train_info/time_between_train_steps": 0.003110647201538086, "step": 5983} {"info/global_step": 5984, "train_info/time_within_train_step": 2.754430055618286, "step": 5984} {"train_info/time_between_train_steps": 0.0031540393829345703, "step": 5984} {"info/global_step": 5985, "train_info/time_within_train_step": 2.754568576812744, "step": 5985} {"train_info/time_between_train_steps": 0.0031070709228515625, "step": 5985} {"info/global_step": 5986, "train_info/time_within_train_step": 2.7553985118865967, "step": 5986} {"train_info/time_between_train_steps": 0.003086566925048828, "step": 5986} {"info/global_step": 5987, "train_info/time_within_train_step": 2.755497932434082, "step": 5987} {"train_info/time_between_train_steps": 0.003218412399291992, "step": 5987} {"info/global_step": 5988, "train_info/time_within_train_step": 2.754072666168213, "step": 5988} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 5988} {"info/global_step": 5989, "train_info/time_within_train_step": 2.7544384002685547, "step": 5989} {"train_info/time_between_train_steps": 0.0031044483184814453, "step": 5989} {"info/global_step": 5990, "train_info/time_within_train_step": 2.7544453144073486, "step": 5990} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 5990} {"info/global_step": 5991, "train_info/time_within_train_step": 2.7545669078826904, "step": 5991} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 5991} {"info/global_step": 5992, "train_info/time_within_train_step": 2.7544498443603516, "step": 5992} {"train_info/time_between_train_steps": 0.003210783004760742, "step": 5992} {"info/global_step": 5993, "train_info/time_within_train_step": 2.753725528717041, "step": 5993} {"train_info/time_between_train_steps": 0.003137826919555664, "step": 5993} {"info/global_step": 5994, "train_info/time_within_train_step": 2.7547619342803955, "step": 5994} {"train_info/time_between_train_steps": 0.0031096935272216797, "step": 5994} {"info/global_step": 5995, "train_info/time_within_train_step": 2.7556724548339844, "step": 5995} {"train_info/time_between_train_steps": 0.003208160400390625, "step": 5995} {"info/global_step": 5996, "train_info/time_within_train_step": 2.7558743953704834, "step": 5996} {"train_info/time_between_train_steps": 0.0031197071075439453, "step": 5996} {"info/global_step": 5997, "train_info/time_within_train_step": 3.332702875137329, "step": 5997} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 5997} {"info/global_step": 5998, "train_info/time_within_train_step": 2.7537269592285156, "step": 5998} {"train_info/time_between_train_steps": 0.0031104087829589844, "step": 5998} {"info/global_step": 5999, "train_info/time_within_train_step": 2.754310369491577, "step": 5999} {"train_info/time_between_train_steps": 0.0034360885620117188, "step": 5999} {"info/global_step": 6000, "train_info/time_within_train_step": 2.7522473335266113, "step": 6000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746583376, "_runtime": 17385}, "step": 6000} {"logs": {"train/loss": 3.4935, "train/learning_rate": 0.0002666666666666666, "train/epoch": 7.0, "_timestamp": 1746583376, "_runtime": 17385}, "step": 6000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746583381, "_runtime": 17390}, "step": 6000} {"logs": {"eval/loss": 4.690811634063721, "eval/runtime": 5.1622, "eval/samples_per_second": 36.806, "eval/steps_per_second": 1.162, "train/epoch": 7.0, "_timestamp": 1746583381, "_runtime": 17390}, "step": 6000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746583381, "_runtime": 17390}, "step": 6000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.690811634063721, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 108.94156461930206, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1622, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 36.806, "train/epoch": 7.0, "_timestamp": 1746583381, "_runtime": 17390}, "step": 6000} {"train_info/time_between_train_steps": 18.52056908607483, "step": 6000} {"info/global_step": 6001, "train_info/time_within_train_step": 2.5355336666107178, "step": 6001} {"train_info/time_between_train_steps": 0.0034737586975097656, "step": 6001} {"info/global_step": 6002, "train_info/time_within_train_step": 2.6017510890960693, "step": 6002} {"train_info/time_between_train_steps": 0.003264188766479492, "step": 6002} {"info/global_step": 6003, "train_info/time_within_train_step": 2.728752851486206, "step": 6003} {"train_info/time_between_train_steps": 0.003268718719482422, "step": 6003} {"info/global_step": 6004, "train_info/time_within_train_step": 2.7500154972076416, "step": 6004} {"train_info/time_between_train_steps": 0.0032799243927001953, "step": 6004} {"info/global_step": 6005, "train_info/time_within_train_step": 2.7529780864715576, "step": 6005} {"train_info/time_between_train_steps": 0.003303050994873047, "step": 6005} {"info/global_step": 6006, "train_info/time_within_train_step": 2.755849599838257, "step": 6006} {"train_info/time_between_train_steps": 0.0032956600189208984, "step": 6006} {"info/global_step": 6007, "train_info/time_within_train_step": 2.7551794052124023, "step": 6007} {"train_info/time_between_train_steps": 0.0033130645751953125, "step": 6007} {"info/global_step": 6008, "train_info/time_within_train_step": 2.757441997528076, "step": 6008} {"train_info/time_between_train_steps": 0.003317117691040039, "step": 6008} {"info/global_step": 6009, "train_info/time_within_train_step": 2.7556631565093994, "step": 6009} {"train_info/time_between_train_steps": 0.003294229507446289, "step": 6009} {"info/global_step": 6010, "train_info/time_within_train_step": 2.756131649017334, "step": 6010} {"train_info/time_between_train_steps": 0.0033974647521972656, "step": 6010} {"info/global_step": 6011, "train_info/time_within_train_step": 2.7569732666015625, "step": 6011} {"train_info/time_between_train_steps": 0.00330352783203125, "step": 6011} {"info/global_step": 6012, "train_info/time_within_train_step": 2.7560172080993652, "step": 6012} {"train_info/time_between_train_steps": 0.003261089324951172, "step": 6012} {"info/global_step": 6013, "train_info/time_within_train_step": 2.7579469680786133, "step": 6013} {"train_info/time_between_train_steps": 0.0032956600189208984, "step": 6013} {"info/global_step": 6014, "train_info/time_within_train_step": 2.7578284740448, "step": 6014} {"train_info/time_between_train_steps": 0.0033965110778808594, "step": 6014} {"info/global_step": 6015, "train_info/time_within_train_step": 2.7568321228027344, "step": 6015} {"train_info/time_between_train_steps": 0.0032799243927001953, "step": 6015} {"info/global_step": 6016, "train_info/time_within_train_step": 2.7570910453796387, "step": 6016} {"train_info/time_between_train_steps": 0.0033638477325439453, "step": 6016} {"info/global_step": 6017, "train_info/time_within_train_step": 2.7569568157196045, "step": 6017} {"train_info/time_between_train_steps": 0.0032765865325927734, "step": 6017} {"info/global_step": 6018, "train_info/time_within_train_step": 2.757403612136841, "step": 6018} {"train_info/time_between_train_steps": 0.003313302993774414, "step": 6018} {"info/global_step": 6019, "train_info/time_within_train_step": 2.7575957775115967, "step": 6019} {"train_info/time_between_train_steps": 0.003442525863647461, "step": 6019} {"info/global_step": 6020, "train_info/time_within_train_step": 2.7575433254241943, "step": 6020} {"train_info/time_between_train_steps": 0.0033562183380126953, "step": 6020} {"info/global_step": 6021, "train_info/time_within_train_step": 2.7577478885650635, "step": 6021} {"train_info/time_between_train_steps": 0.0033125877380371094, "step": 6021} {"info/global_step": 6022, "train_info/time_within_train_step": 2.7557075023651123, "step": 6022} {"train_info/time_between_train_steps": 0.0031375885009765625, "step": 6022} {"info/global_step": 6023, "train_info/time_within_train_step": 2.755897283554077, "step": 6023} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 6023} {"info/global_step": 6024, "train_info/time_within_train_step": 2.756923198699951, "step": 6024} {"train_info/time_between_train_steps": 0.003243684768676758, "step": 6024} {"info/global_step": 6025, "train_info/time_within_train_step": 2.9835805892944336, "step": 6025} {"train_info/time_between_train_steps": 0.0031566619873046875, "step": 6025} {"info/global_step": 6026, "train_info/time_within_train_step": 2.756305694580078, "step": 6026} {"train_info/time_between_train_steps": 0.0030913352966308594, "step": 6026} {"info/global_step": 6027, "train_info/time_within_train_step": 2.7553818225860596, "step": 6027} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 6027} {"info/global_step": 6028, "train_info/time_within_train_step": 2.755136013031006, "step": 6028} {"train_info/time_between_train_steps": 0.003101348876953125, "step": 6028} {"info/global_step": 6029, "train_info/time_within_train_step": 2.7558562755584717, "step": 6029} {"train_info/time_between_train_steps": 0.0031578540802001953, "step": 6029} {"info/global_step": 6030, "train_info/time_within_train_step": 2.7541964054107666, "step": 6030} {"train_info/time_between_train_steps": 0.0031278133392333984, "step": 6030} {"info/global_step": 6031, "train_info/time_within_train_step": 2.756171703338623, "step": 6031} {"train_info/time_between_train_steps": 0.0031065940856933594, "step": 6031} {"info/global_step": 6032, "train_info/time_within_train_step": 2.755574941635132, "step": 6032} {"train_info/time_between_train_steps": 0.0031385421752929688, "step": 6032} {"info/global_step": 6033, "train_info/time_within_train_step": 2.756260871887207, "step": 6033} {"train_info/time_between_train_steps": 0.003131389617919922, "step": 6033} {"info/global_step": 6034, "train_info/time_within_train_step": 2.879697322845459, "step": 6034} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 6034} {"info/global_step": 6035, "train_info/time_within_train_step": 2.7557766437530518, "step": 6035} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 6035} {"info/global_step": 6036, "train_info/time_within_train_step": 2.755262613296509, "step": 6036} {"train_info/time_between_train_steps": 0.003102540969848633, "step": 6036} {"info/global_step": 6037, "train_info/time_within_train_step": 2.755183219909668, "step": 6037} {"train_info/time_between_train_steps": 0.0031044483184814453, "step": 6037} {"info/global_step": 6038, "train_info/time_within_train_step": 2.7550015449523926, "step": 6038} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 6038} {"info/global_step": 6039, "train_info/time_within_train_step": 2.756047010421753, "step": 6039} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 6039} {"info/global_step": 6040, "train_info/time_within_train_step": 2.7545599937438965, "step": 6040} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 6040} {"info/global_step": 6041, "train_info/time_within_train_step": 2.7549164295196533, "step": 6041} {"train_info/time_between_train_steps": 0.003139019012451172, "step": 6041} {"info/global_step": 6042, "train_info/time_within_train_step": 2.7539329528808594, "step": 6042} {"train_info/time_between_train_steps": 0.003137350082397461, "step": 6042} {"info/global_step": 6043, "train_info/time_within_train_step": 2.7549257278442383, "step": 6043} {"train_info/time_between_train_steps": 0.0031299591064453125, "step": 6043} {"info/global_step": 6044, "train_info/time_within_train_step": 2.763796329498291, "step": 6044} {"train_info/time_between_train_steps": 0.0031380653381347656, "step": 6044} {"info/global_step": 6045, "train_info/time_within_train_step": 2.7547688484191895, "step": 6045} {"train_info/time_between_train_steps": 0.003122568130493164, "step": 6045} {"info/global_step": 6046, "train_info/time_within_train_step": 2.754176616668701, "step": 6046} {"train_info/time_between_train_steps": 0.0031228065490722656, "step": 6046} {"info/global_step": 6047, "train_info/time_within_train_step": 2.7543718814849854, "step": 6047} {"train_info/time_between_train_steps": 0.0033020973205566406, "step": 6047} {"info/global_step": 6048, "train_info/time_within_train_step": 2.757439613342285, "step": 6048} {"train_info/time_between_train_steps": 0.0032956600189208984, "step": 6048} {"info/global_step": 6049, "train_info/time_within_train_step": 2.7565982341766357, "step": 6049} {"train_info/time_between_train_steps": 0.0033419132232666016, "step": 6049} {"info/global_step": 6050, "train_info/time_within_train_step": 2.755007743835449, "step": 6050} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746583533, "_runtime": 17542}, "step": 6050} {"logs": {"train/loss": 3.442, "train/learning_rate": 0.0002633333333333333, "train/epoch": 7.01, "_timestamp": 1746583533, "_runtime": 17542}, "step": 6050} {"train_info/time_between_train_steps": 0.009618997573852539, "step": 6050} {"info/global_step": 6051, "train_info/time_within_train_step": 2.75705623626709, "step": 6051} {"train_info/time_between_train_steps": 0.003293752670288086, "step": 6051} {"info/global_step": 6052, "train_info/time_within_train_step": 2.7574448585510254, "step": 6052} {"train_info/time_between_train_steps": 0.003309965133666992, "step": 6052} {"info/global_step": 6053, "train_info/time_within_train_step": 2.7545478343963623, "step": 6053} {"train_info/time_between_train_steps": 0.0032968521118164062, "step": 6053} {"info/global_step": 6054, "train_info/time_within_train_step": 2.756910800933838, "step": 6054} {"train_info/time_between_train_steps": 0.0032682418823242188, "step": 6054} {"info/global_step": 6055, "train_info/time_within_train_step": 2.754493236541748, "step": 6055} {"train_info/time_between_train_steps": 0.0032815933227539062, "step": 6055} {"info/global_step": 6056, "train_info/time_within_train_step": 2.755932092666626, "step": 6056} {"train_info/time_between_train_steps": 0.003284454345703125, "step": 6056} {"info/global_step": 6057, "train_info/time_within_train_step": 2.754955291748047, "step": 6057} {"train_info/time_between_train_steps": 0.0033032894134521484, "step": 6057} {"info/global_step": 6058, "train_info/time_within_train_step": 2.7556984424591064, "step": 6058} {"train_info/time_between_train_steps": 0.0033147335052490234, "step": 6058} {"info/global_step": 6059, "train_info/time_within_train_step": 2.7554500102996826, "step": 6059} {"train_info/time_between_train_steps": 0.0033464431762695312, "step": 6059} {"info/global_step": 6060, "train_info/time_within_train_step": 2.7551040649414062, "step": 6060} {"train_info/time_between_train_steps": 0.003334522247314453, "step": 6060} {"info/global_step": 6061, "train_info/time_within_train_step": 2.755341053009033, "step": 6061} {"train_info/time_between_train_steps": 0.003325223922729492, "step": 6061} {"info/global_step": 6062, "train_info/time_within_train_step": 2.7561147212982178, "step": 6062} {"train_info/time_between_train_steps": 0.0033588409423828125, "step": 6062} {"info/global_step": 6063, "train_info/time_within_train_step": 2.7566730976104736, "step": 6063} {"train_info/time_between_train_steps": 0.0032677650451660156, "step": 6063} {"info/global_step": 6064, "train_info/time_within_train_step": 2.755871295928955, "step": 6064} {"train_info/time_between_train_steps": 0.0033261775970458984, "step": 6064} {"info/global_step": 6065, "train_info/time_within_train_step": 2.7563533782958984, "step": 6065} {"train_info/time_between_train_steps": 0.0032851696014404297, "step": 6065} {"info/global_step": 6066, "train_info/time_within_train_step": 2.7574682235717773, "step": 6066} {"train_info/time_between_train_steps": 0.003293752670288086, "step": 6066} {"info/global_step": 6067, "train_info/time_within_train_step": 2.757608652114868, "step": 6067} {"train_info/time_between_train_steps": 0.0033991336822509766, "step": 6067} {"info/global_step": 6068, "train_info/time_within_train_step": 2.7557153701782227, "step": 6068} {"train_info/time_between_train_steps": 0.003312826156616211, "step": 6068} {"info/global_step": 6069, "train_info/time_within_train_step": 2.7566885948181152, "step": 6069} {"train_info/time_between_train_steps": 0.003302335739135742, "step": 6069} {"info/global_step": 6070, "train_info/time_within_train_step": 2.7550806999206543, "step": 6070} {"train_info/time_between_train_steps": 0.0033266544342041016, "step": 6070} {"info/global_step": 6071, "train_info/time_within_train_step": 2.7561917304992676, "step": 6071} {"train_info/time_between_train_steps": 0.0033376216888427734, "step": 6071} {"info/global_step": 6072, "train_info/time_within_train_step": 2.7545535564422607, "step": 6072} {"train_info/time_between_train_steps": 0.0032694339752197266, "step": 6072} {"info/global_step": 6073, "train_info/time_within_train_step": 2.755066156387329, "step": 6073} {"train_info/time_between_train_steps": 0.003289937973022461, "step": 6073} {"info/global_step": 6074, "train_info/time_within_train_step": 2.755239486694336, "step": 6074} {"train_info/time_between_train_steps": 0.0032873153686523438, "step": 6074} {"info/global_step": 6075, "train_info/time_within_train_step": 2.7548089027404785, "step": 6075} {"train_info/time_between_train_steps": 0.0033006668090820312, "step": 6075} {"info/global_step": 6076, "train_info/time_within_train_step": 2.754760503768921, "step": 6076} {"train_info/time_between_train_steps": 0.003283262252807617, "step": 6076} {"info/global_step": 6077, "train_info/time_within_train_step": 2.7556874752044678, "step": 6077} {"train_info/time_between_train_steps": 0.0032949447631835938, "step": 6077} {"info/global_step": 6078, "train_info/time_within_train_step": 2.756810188293457, "step": 6078} {"train_info/time_between_train_steps": 0.003351926803588867, "step": 6078} {"info/global_step": 6079, "train_info/time_within_train_step": 2.7561213970184326, "step": 6079} {"train_info/time_between_train_steps": 0.003293752670288086, "step": 6079} {"info/global_step": 6080, "train_info/time_within_train_step": 2.756695508956909, "step": 6080} {"train_info/time_between_train_steps": 0.0033087730407714844, "step": 6080} {"info/global_step": 6081, "train_info/time_within_train_step": 2.7569820880889893, "step": 6081} {"train_info/time_between_train_steps": 0.003317117691040039, "step": 6081} {"info/global_step": 6082, "train_info/time_within_train_step": 2.7556354999542236, "step": 6082} {"train_info/time_between_train_steps": 0.003278017044067383, "step": 6082} {"info/global_step": 6083, "train_info/time_within_train_step": 2.7551896572113037, "step": 6083} {"train_info/time_between_train_steps": 0.003266572952270508, "step": 6083} {"info/global_step": 6084, "train_info/time_within_train_step": 2.7565290927886963, "step": 6084} {"train_info/time_between_train_steps": 0.0032923221588134766, "step": 6084} {"info/global_step": 6085, "train_info/time_within_train_step": 2.7558155059814453, "step": 6085} {"train_info/time_between_train_steps": 0.003320455551147461, "step": 6085} {"info/global_step": 6086, "train_info/time_within_train_step": 2.7555012702941895, "step": 6086} {"train_info/time_between_train_steps": 0.003322601318359375, "step": 6086} {"info/global_step": 6087, "train_info/time_within_train_step": 2.755357265472412, "step": 6087} {"train_info/time_between_train_steps": 0.0033266544342041016, "step": 6087} {"info/global_step": 6088, "train_info/time_within_train_step": 2.75604248046875, "step": 6088} {"train_info/time_between_train_steps": 0.0032956600189208984, "step": 6088} {"info/global_step": 6089, "train_info/time_within_train_step": 2.754762887954712, "step": 6089} {"train_info/time_between_train_steps": 0.003280162811279297, "step": 6089} {"info/global_step": 6090, "train_info/time_within_train_step": 2.75434947013855, "step": 6090} {"train_info/time_between_train_steps": 0.0033354759216308594, "step": 6090} {"info/global_step": 6091, "train_info/time_within_train_step": 2.7543108463287354, "step": 6091} {"train_info/time_between_train_steps": 0.0032951831817626953, "step": 6091} {"info/global_step": 6092, "train_info/time_within_train_step": 2.7551188468933105, "step": 6092} {"train_info/time_between_train_steps": 0.003315448760986328, "step": 6092} {"info/global_step": 6093, "train_info/time_within_train_step": 2.7551634311676025, "step": 6093} {"train_info/time_between_train_steps": 0.0033397674560546875, "step": 6093} {"info/global_step": 6094, "train_info/time_within_train_step": 2.754899263381958, "step": 6094} {"train_info/time_between_train_steps": 0.003288745880126953, "step": 6094} {"info/global_step": 6095, "train_info/time_within_train_step": 2.7544703483581543, "step": 6095} {"train_info/time_between_train_steps": 0.0032775402069091797, "step": 6095} {"info/global_step": 6096, "train_info/time_within_train_step": 2.75630259513855, "step": 6096} {"train_info/time_between_train_steps": 0.12721490859985352, "step": 6096} {"info/global_step": 6097, "train_info/time_within_train_step": 2.7553813457489014, "step": 6097} {"train_info/time_between_train_steps": 0.00322723388671875, "step": 6097} {"info/global_step": 6098, "train_info/time_within_train_step": 2.7556450366973877, "step": 6098} {"train_info/time_between_train_steps": 0.0031020641326904297, "step": 6098} {"info/global_step": 6099, "train_info/time_within_train_step": 2.7553365230560303, "step": 6099} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 6099} {"info/global_step": 6100, "train_info/time_within_train_step": 2.7551021575927734, "step": 6100} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746583671, "_runtime": 17680}, "step": 6100} {"logs": {"train/loss": 3.4359, "train/learning_rate": 0.00026, "train/epoch": 7.01, "_timestamp": 1746583671, "_runtime": 17680}, "step": 6100} {"train_info/time_between_train_steps": 0.0067958831787109375, "step": 6100} {"info/global_step": 6101, "train_info/time_within_train_step": 2.7557594776153564, "step": 6101} {"train_info/time_between_train_steps": 0.003154277801513672, "step": 6101} {"info/global_step": 6102, "train_info/time_within_train_step": 2.754153251647949, "step": 6102} {"train_info/time_between_train_steps": 0.003143310546875, "step": 6102} {"info/global_step": 6103, "train_info/time_within_train_step": 2.7536873817443848, "step": 6103} {"train_info/time_between_train_steps": 0.0031366348266601562, "step": 6103} {"info/global_step": 6104, "train_info/time_within_train_step": 2.7538201808929443, "step": 6104} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 6104} {"info/global_step": 6105, "train_info/time_within_train_step": 2.753466844558716, "step": 6105} {"train_info/time_between_train_steps": 0.003137350082397461, "step": 6105} {"info/global_step": 6106, "train_info/time_within_train_step": 2.753891944885254, "step": 6106} {"train_info/time_between_train_steps": 0.0032448768615722656, "step": 6106} {"info/global_step": 6107, "train_info/time_within_train_step": 2.7539961338043213, "step": 6107} {"train_info/time_between_train_steps": 0.003147125244140625, "step": 6107} {"info/global_step": 6108, "train_info/time_within_train_step": 2.7540557384490967, "step": 6108} {"train_info/time_between_train_steps": 0.0031371116638183594, "step": 6108} {"info/global_step": 6109, "train_info/time_within_train_step": 2.7544667720794678, "step": 6109} {"train_info/time_between_train_steps": 0.003125429153442383, "step": 6109} {"info/global_step": 6110, "train_info/time_within_train_step": 2.755018711090088, "step": 6110} {"train_info/time_between_train_steps": 0.0031402111053466797, "step": 6110} {"info/global_step": 6111, "train_info/time_within_train_step": 2.756730318069458, "step": 6111} {"train_info/time_between_train_steps": 0.0033071041107177734, "step": 6111} {"info/global_step": 6112, "train_info/time_within_train_step": 2.7572731971740723, "step": 6112} {"train_info/time_between_train_steps": 0.003281831741333008, "step": 6112} {"info/global_step": 6113, "train_info/time_within_train_step": 2.757094144821167, "step": 6113} {"train_info/time_between_train_steps": 0.0033164024353027344, "step": 6113} {"info/global_step": 6114, "train_info/time_within_train_step": 2.7570717334747314, "step": 6114} {"train_info/time_between_train_steps": 0.0032923221588134766, "step": 6114} {"info/global_step": 6115, "train_info/time_within_train_step": 2.7562835216522217, "step": 6115} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 6115} {"info/global_step": 6116, "train_info/time_within_train_step": 2.754401683807373, "step": 6116} {"train_info/time_between_train_steps": 0.003149271011352539, "step": 6116} {"info/global_step": 6117, "train_info/time_within_train_step": 2.988421678543091, "step": 6117} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 6117} {"info/global_step": 6118, "train_info/time_within_train_step": 2.756330728530884, "step": 6118} {"train_info/time_between_train_steps": 0.003156423568725586, "step": 6118} {"info/global_step": 6119, "train_info/time_within_train_step": 2.754040002822876, "step": 6119} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 6119} {"info/global_step": 6120, "train_info/time_within_train_step": 2.7544515132904053, "step": 6120} {"train_info/time_between_train_steps": 0.003128528594970703, "step": 6120} {"info/global_step": 6121, "train_info/time_within_train_step": 2.7548274993896484, "step": 6121} {"train_info/time_between_train_steps": 0.003143787384033203, "step": 6121} {"info/global_step": 6122, "train_info/time_within_train_step": 2.7551119327545166, "step": 6122} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 6122} {"info/global_step": 6123, "train_info/time_within_train_step": 2.75531005859375, "step": 6123} {"train_info/time_between_train_steps": 0.0031232833862304688, "step": 6123} {"info/global_step": 6124, "train_info/time_within_train_step": 2.7546558380126953, "step": 6124} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 6124} {"info/global_step": 6125, "train_info/time_within_train_step": 2.7564220428466797, "step": 6125} {"train_info/time_between_train_steps": 0.0033016204833984375, "step": 6125} {"info/global_step": 6126, "train_info/time_within_train_step": 2.757702589035034, "step": 6126} {"train_info/time_between_train_steps": 0.0033447742462158203, "step": 6126} {"info/global_step": 6127, "train_info/time_within_train_step": 2.7567832469940186, "step": 6127} {"train_info/time_between_train_steps": 0.0033121109008789062, "step": 6127} {"info/global_step": 6128, "train_info/time_within_train_step": 2.757612705230713, "step": 6128} {"train_info/time_between_train_steps": 0.003316640853881836, "step": 6128} {"info/global_step": 6129, "train_info/time_within_train_step": 2.756519079208374, "step": 6129} {"train_info/time_between_train_steps": 0.003300189971923828, "step": 6129} {"info/global_step": 6130, "train_info/time_within_train_step": 2.7568864822387695, "step": 6130} {"train_info/time_between_train_steps": 0.003366708755493164, "step": 6130} {"info/global_step": 6131, "train_info/time_within_train_step": 2.761653423309326, "step": 6131} {"train_info/time_between_train_steps": 0.003325939178466797, "step": 6131} {"info/global_step": 6132, "train_info/time_within_train_step": 2.7573978900909424, "step": 6132} {"train_info/time_between_train_steps": 0.0032813549041748047, "step": 6132} {"info/global_step": 6133, "train_info/time_within_train_step": 2.756927013397217, "step": 6133} {"train_info/time_between_train_steps": 0.0033288002014160156, "step": 6133} {"info/global_step": 6134, "train_info/time_within_train_step": 2.7560219764709473, "step": 6134} {"train_info/time_between_train_steps": 0.0033097267150878906, "step": 6134} {"info/global_step": 6135, "train_info/time_within_train_step": 2.7562096118927, "step": 6135} {"train_info/time_between_train_steps": 0.0033257007598876953, "step": 6135} {"info/global_step": 6136, "train_info/time_within_train_step": 2.756349802017212, "step": 6136} {"train_info/time_between_train_steps": 0.003345966339111328, "step": 6136} {"info/global_step": 6137, "train_info/time_within_train_step": 2.7557244300842285, "step": 6137} {"train_info/time_between_train_steps": 0.003289937973022461, "step": 6137} {"info/global_step": 6138, "train_info/time_within_train_step": 2.75641131401062, "step": 6138} {"train_info/time_between_train_steps": 0.0032889842987060547, "step": 6138} {"info/global_step": 6139, "train_info/time_within_train_step": 2.7556262016296387, "step": 6139} {"train_info/time_between_train_steps": 0.0033032894134521484, "step": 6139} {"info/global_step": 6140, "train_info/time_within_train_step": 2.7565908432006836, "step": 6140} {"train_info/time_between_train_steps": 0.0032863616943359375, "step": 6140} {"info/global_step": 6141, "train_info/time_within_train_step": 2.7568936347961426, "step": 6141} {"train_info/time_between_train_steps": 0.0033617019653320312, "step": 6141} {"info/global_step": 6142, "train_info/time_within_train_step": 2.7564430236816406, "step": 6142} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 6142} {"info/global_step": 6143, "train_info/time_within_train_step": 2.75471568107605, "step": 6143} {"train_info/time_between_train_steps": 0.0031137466430664062, "step": 6143} {"info/global_step": 6144, "train_info/time_within_train_step": 2.7535834312438965, "step": 6144} {"train_info/time_between_train_steps": 0.003146648406982422, "step": 6144} {"info/global_step": 6145, "train_info/time_within_train_step": 2.7557830810546875, "step": 6145} {"train_info/time_between_train_steps": 0.0031342506408691406, "step": 6145} {"info/global_step": 6146, "train_info/time_within_train_step": 2.7552361488342285, "step": 6146} {"train_info/time_between_train_steps": 0.003123760223388672, "step": 6146} {"info/global_step": 6147, "train_info/time_within_train_step": 2.755733013153076, "step": 6147} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 6147} {"info/global_step": 6148, "train_info/time_within_train_step": 2.755368947982788, "step": 6148} {"train_info/time_between_train_steps": 0.003139019012451172, "step": 6148} {"info/global_step": 6149, "train_info/time_within_train_step": 2.755150318145752, "step": 6149} {"train_info/time_between_train_steps": 0.0031304359436035156, "step": 6149} {"info/global_step": 6150, "train_info/time_within_train_step": 2.75447154045105, "step": 6150} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746583810, "_runtime": 17819}, "step": 6150} {"logs": {"train/loss": 3.4185, "train/learning_rate": 0.00025666666666666665, "train/epoch": 7.02, "_timestamp": 1746583810, "_runtime": 17819}, "step": 6150} {"train_info/time_between_train_steps": 0.006979942321777344, "step": 6150} {"info/global_step": 6151, "train_info/time_within_train_step": 2.755336046218872, "step": 6151} {"train_info/time_between_train_steps": 0.00312042236328125, "step": 6151} {"info/global_step": 6152, "train_info/time_within_train_step": 2.755718231201172, "step": 6152} {"train_info/time_between_train_steps": 0.0031156539916992188, "step": 6152} {"info/global_step": 6153, "train_info/time_within_train_step": 2.7557246685028076, "step": 6153} {"train_info/time_between_train_steps": 0.0031321048736572266, "step": 6153} {"info/global_step": 6154, "train_info/time_within_train_step": 2.7550888061523438, "step": 6154} {"train_info/time_between_train_steps": 0.003118276596069336, "step": 6154} {"info/global_step": 6155, "train_info/time_within_train_step": 2.7547388076782227, "step": 6155} {"train_info/time_between_train_steps": 0.0031070709228515625, "step": 6155} {"info/global_step": 6156, "train_info/time_within_train_step": 2.755371570587158, "step": 6156} {"train_info/time_between_train_steps": 0.0031337738037109375, "step": 6156} {"info/global_step": 6157, "train_info/time_within_train_step": 2.755303382873535, "step": 6157} {"train_info/time_between_train_steps": 0.0031332969665527344, "step": 6157} {"info/global_step": 6158, "train_info/time_within_train_step": 2.7551350593566895, "step": 6158} {"train_info/time_between_train_steps": 0.003109455108642578, "step": 6158} {"info/global_step": 6159, "train_info/time_within_train_step": 2.8785955905914307, "step": 6159} {"train_info/time_between_train_steps": 0.0032439231872558594, "step": 6159} {"info/global_step": 6160, "train_info/time_within_train_step": 2.7543752193450928, "step": 6160} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 6160} {"info/global_step": 6161, "train_info/time_within_train_step": 2.754176378250122, "step": 6161} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 6161} {"info/global_step": 6162, "train_info/time_within_train_step": 2.7535881996154785, "step": 6162} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 6162} {"info/global_step": 6163, "train_info/time_within_train_step": 2.75437593460083, "step": 6163} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 6163} {"info/global_step": 6164, "train_info/time_within_train_step": 2.754152297973633, "step": 6164} {"train_info/time_between_train_steps": 0.003149747848510742, "step": 6164} {"info/global_step": 6165, "train_info/time_within_train_step": 2.7540433406829834, "step": 6165} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 6165} {"info/global_step": 6166, "train_info/time_within_train_step": 2.753389596939087, "step": 6166} {"train_info/time_between_train_steps": 0.003121614456176758, "step": 6166} {"info/global_step": 6167, "train_info/time_within_train_step": 2.755032539367676, "step": 6167} {"train_info/time_between_train_steps": 0.0031516551971435547, "step": 6167} {"info/global_step": 6168, "train_info/time_within_train_step": 2.75748348236084, "step": 6168} {"train_info/time_between_train_steps": 0.0032236576080322266, "step": 6168} {"info/global_step": 6169, "train_info/time_within_train_step": 2.7561516761779785, "step": 6169} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 6169} {"info/global_step": 6170, "train_info/time_within_train_step": 2.755225658416748, "step": 6170} {"train_info/time_between_train_steps": 0.003223419189453125, "step": 6170} {"info/global_step": 6171, "train_info/time_within_train_step": 2.7547407150268555, "step": 6171} {"train_info/time_between_train_steps": 0.0031561851501464844, "step": 6171} {"info/global_step": 6172, "train_info/time_within_train_step": 2.754138708114624, "step": 6172} {"train_info/time_between_train_steps": 0.003117799758911133, "step": 6172} {"info/global_step": 6173, "train_info/time_within_train_step": 2.9940779209136963, "step": 6173} {"train_info/time_between_train_steps": 0.0032036304473876953, "step": 6173} {"info/global_step": 6174, "train_info/time_within_train_step": 2.7543222904205322, "step": 6174} {"train_info/time_between_train_steps": 0.0031461715698242188, "step": 6174} {"info/global_step": 6175, "train_info/time_within_train_step": 2.7544193267822266, "step": 6175} {"train_info/time_between_train_steps": 0.0033004283905029297, "step": 6175} {"info/global_step": 6176, "train_info/time_within_train_step": 2.7551398277282715, "step": 6176} {"train_info/time_between_train_steps": 0.0034389495849609375, "step": 6176} {"info/global_step": 6177, "train_info/time_within_train_step": 2.7558834552764893, "step": 6177} {"train_info/time_between_train_steps": 0.0033566951751708984, "step": 6177} {"info/global_step": 6178, "train_info/time_within_train_step": 2.7552490234375, "step": 6178} {"train_info/time_between_train_steps": 0.0033261775970458984, "step": 6178} {"info/global_step": 6179, "train_info/time_within_train_step": 2.7559397220611572, "step": 6179} {"train_info/time_between_train_steps": 0.0033562183380126953, "step": 6179} {"info/global_step": 6180, "train_info/time_within_train_step": 2.756429433822632, "step": 6180} {"train_info/time_between_train_steps": 0.0033292770385742188, "step": 6180} {"info/global_step": 6181, "train_info/time_within_train_step": 2.7554662227630615, "step": 6181} {"train_info/time_between_train_steps": 0.0031685829162597656, "step": 6181} {"info/global_step": 6182, "train_info/time_within_train_step": 2.7566304206848145, "step": 6182} {"train_info/time_between_train_steps": 0.003331422805786133, "step": 6182} {"info/global_step": 6183, "train_info/time_within_train_step": 2.7567813396453857, "step": 6183} {"train_info/time_between_train_steps": 0.003319263458251953, "step": 6183} {"info/global_step": 6184, "train_info/time_within_train_step": 2.756922721862793, "step": 6184} {"train_info/time_between_train_steps": 0.003328561782836914, "step": 6184} {"info/global_step": 6185, "train_info/time_within_train_step": 2.757540225982666, "step": 6185} {"train_info/time_between_train_steps": 0.0033283233642578125, "step": 6185} {"info/global_step": 6186, "train_info/time_within_train_step": 2.7555437088012695, "step": 6186} {"train_info/time_between_train_steps": 0.0033452510833740234, "step": 6186} {"info/global_step": 6187, "train_info/time_within_train_step": 2.7568576335906982, "step": 6187} {"train_info/time_between_train_steps": 0.0033125877380371094, "step": 6187} {"info/global_step": 6188, "train_info/time_within_train_step": 2.757528781890869, "step": 6188} {"train_info/time_between_train_steps": 0.003285646438598633, "step": 6188} {"info/global_step": 6189, "train_info/time_within_train_step": 2.7557389736175537, "step": 6189} {"train_info/time_between_train_steps": 0.0032777786254882812, "step": 6189} {"info/global_step": 6190, "train_info/time_within_train_step": 2.754849910736084, "step": 6190} {"train_info/time_between_train_steps": 0.0033113956451416016, "step": 6190} {"info/global_step": 6191, "train_info/time_within_train_step": 2.755744218826294, "step": 6191} {"train_info/time_between_train_steps": 0.003409147262573242, "step": 6191} {"info/global_step": 6192, "train_info/time_within_train_step": 2.754793167114258, "step": 6192} {"train_info/time_between_train_steps": 0.0033364295959472656, "step": 6192} {"info/global_step": 6193, "train_info/time_within_train_step": 2.7552802562713623, "step": 6193} {"train_info/time_between_train_steps": 0.003323793411254883, "step": 6193} {"info/global_step": 6194, "train_info/time_within_train_step": 2.7559869289398193, "step": 6194} {"train_info/time_between_train_steps": 0.003290891647338867, "step": 6194} {"info/global_step": 6195, "train_info/time_within_train_step": 2.75632905960083, "step": 6195} {"train_info/time_between_train_steps": 0.003317117691040039, "step": 6195} {"info/global_step": 6196, "train_info/time_within_train_step": 2.7554380893707275, "step": 6196} {"train_info/time_between_train_steps": 0.0033364295959472656, "step": 6196} {"info/global_step": 6197, "train_info/time_within_train_step": 2.7566184997558594, "step": 6197} {"train_info/time_between_train_steps": 0.0032873153686523438, "step": 6197} {"info/global_step": 6198, "train_info/time_within_train_step": 2.7573130130767822, "step": 6198} {"train_info/time_between_train_steps": 0.003293752670288086, "step": 6198} {"info/global_step": 6199, "train_info/time_within_train_step": 2.7564144134521484, "step": 6199} {"train_info/time_between_train_steps": 0.003142118453979492, "step": 6199} {"info/global_step": 6200, "train_info/time_within_train_step": 2.755509614944458, "step": 6200} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746583948, "_runtime": 17957}, "step": 6200} {"logs": {"train/loss": 3.4103, "train/learning_rate": 0.00025333333333333333, "train/epoch": 7.02, "_timestamp": 1746583948, "_runtime": 17957}, "step": 6200} {"train_info/time_between_train_steps": 18.990411043167114, "step": 6200} {"info/global_step": 6201, "train_info/time_within_train_step": 2.528958797454834, "step": 6201} {"train_info/time_between_train_steps": 0.0033447742462158203, "step": 6201} {"info/global_step": 6202, "train_info/time_within_train_step": 2.572566509246826, "step": 6202} {"train_info/time_between_train_steps": 0.0033342838287353516, "step": 6202} {"info/global_step": 6203, "train_info/time_within_train_step": 2.699373722076416, "step": 6203} {"train_info/time_between_train_steps": 0.0033044815063476562, "step": 6203} {"info/global_step": 6204, "train_info/time_within_train_step": 2.7469825744628906, "step": 6204} {"train_info/time_between_train_steps": 0.003298521041870117, "step": 6204} {"info/global_step": 6205, "train_info/time_within_train_step": 2.751995801925659, "step": 6205} {"train_info/time_between_train_steps": 0.003330230712890625, "step": 6205} {"info/global_step": 6206, "train_info/time_within_train_step": 2.7575113773345947, "step": 6206} {"train_info/time_between_train_steps": 0.0032956600189208984, "step": 6206} {"info/global_step": 6207, "train_info/time_within_train_step": 2.75608229637146, "step": 6207} {"train_info/time_between_train_steps": 0.0032806396484375, "step": 6207} {"info/global_step": 6208, "train_info/time_within_train_step": 2.7567901611328125, "step": 6208} {"train_info/time_between_train_steps": 0.003337860107421875, "step": 6208} {"info/global_step": 6209, "train_info/time_within_train_step": 2.7571661472320557, "step": 6209} {"train_info/time_between_train_steps": 0.0032973289489746094, "step": 6209} {"info/global_step": 6210, "train_info/time_within_train_step": 2.7576076984405518, "step": 6210} {"train_info/time_between_train_steps": 0.0033020973205566406, "step": 6210} {"info/global_step": 6211, "train_info/time_within_train_step": 2.7562341690063477, "step": 6211} {"train_info/time_between_train_steps": 0.003338336944580078, "step": 6211} {"info/global_step": 6212, "train_info/time_within_train_step": 2.7564213275909424, "step": 6212} {"train_info/time_between_train_steps": 0.003298521041870117, "step": 6212} {"info/global_step": 6213, "train_info/time_within_train_step": 2.7573094367980957, "step": 6213} {"train_info/time_between_train_steps": 0.0033218860626220703, "step": 6213} {"info/global_step": 6214, "train_info/time_within_train_step": 2.7571797370910645, "step": 6214} {"train_info/time_between_train_steps": 0.0033295154571533203, "step": 6214} {"info/global_step": 6215, "train_info/time_within_train_step": 2.756770133972168, "step": 6215} {"train_info/time_between_train_steps": 0.0032999515533447266, "step": 6215} {"info/global_step": 6216, "train_info/time_within_train_step": 2.7570443153381348, "step": 6216} {"train_info/time_between_train_steps": 0.0033473968505859375, "step": 6216} {"info/global_step": 6217, "train_info/time_within_train_step": 2.7572789192199707, "step": 6217} {"train_info/time_between_train_steps": 0.003307819366455078, "step": 6217} {"info/global_step": 6218, "train_info/time_within_train_step": 2.7551162242889404, "step": 6218} {"train_info/time_between_train_steps": 0.0032799243927001953, "step": 6218} {"info/global_step": 6219, "train_info/time_within_train_step": 2.7565395832061768, "step": 6219} {"train_info/time_between_train_steps": 0.0033578872680664062, "step": 6219} {"info/global_step": 6220, "train_info/time_within_train_step": 2.757864236831665, "step": 6220} {"train_info/time_between_train_steps": 0.0033190250396728516, "step": 6220} {"info/global_step": 6221, "train_info/time_within_train_step": 2.756901502609253, "step": 6221} {"train_info/time_between_train_steps": 0.12693071365356445, "step": 6221} {"info/global_step": 6222, "train_info/time_within_train_step": 2.7563986778259277, "step": 6222} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 6222} {"info/global_step": 6223, "train_info/time_within_train_step": 2.756584882736206, "step": 6223} {"train_info/time_between_train_steps": 0.003117799758911133, "step": 6223} {"info/global_step": 6224, "train_info/time_within_train_step": 2.7562716007232666, "step": 6224} {"train_info/time_between_train_steps": 0.003350973129272461, "step": 6224} {"info/global_step": 6225, "train_info/time_within_train_step": 2.755441427230835, "step": 6225} {"train_info/time_between_train_steps": 0.003145456314086914, "step": 6225} {"info/global_step": 6226, "train_info/time_within_train_step": 2.7561111450195312, "step": 6226} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 6226} {"info/global_step": 6227, "train_info/time_within_train_step": 2.7547199726104736, "step": 6227} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 6227} {"info/global_step": 6228, "train_info/time_within_train_step": 2.7535533905029297, "step": 6228} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 6228} {"info/global_step": 6229, "train_info/time_within_train_step": 2.755018949508667, "step": 6229} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 6229} {"info/global_step": 6230, "train_info/time_within_train_step": 2.999150514602661, "step": 6230} {"train_info/time_between_train_steps": 0.0031592845916748047, "step": 6230} {"info/global_step": 6231, "train_info/time_within_train_step": 2.7540853023529053, "step": 6231} {"train_info/time_between_train_steps": 0.0031385421752929688, "step": 6231} {"info/global_step": 6232, "train_info/time_within_train_step": 2.755199909210205, "step": 6232} {"train_info/time_between_train_steps": 0.003153085708618164, "step": 6232} {"info/global_step": 6233, "train_info/time_within_train_step": 2.754079818725586, "step": 6233} {"train_info/time_between_train_steps": 0.0032088756561279297, "step": 6233} {"info/global_step": 6234, "train_info/time_within_train_step": 2.7554190158843994, "step": 6234} {"train_info/time_between_train_steps": 0.0031294822692871094, "step": 6234} {"info/global_step": 6235, "train_info/time_within_train_step": 2.7541277408599854, "step": 6235} {"train_info/time_between_train_steps": 0.003110170364379883, "step": 6235} {"info/global_step": 6236, "train_info/time_within_train_step": 2.7552857398986816, "step": 6236} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 6236} {"info/global_step": 6237, "train_info/time_within_train_step": 2.7558488845825195, "step": 6237} {"train_info/time_between_train_steps": 0.0031287670135498047, "step": 6237} {"info/global_step": 6238, "train_info/time_within_train_step": 2.7556307315826416, "step": 6238} {"train_info/time_between_train_steps": 0.0031266212463378906, "step": 6238} {"info/global_step": 6239, "train_info/time_within_train_step": 2.7558889389038086, "step": 6239} {"train_info/time_between_train_steps": 0.003148317337036133, "step": 6239} {"info/global_step": 6240, "train_info/time_within_train_step": 2.755035400390625, "step": 6240} {"train_info/time_between_train_steps": 0.0030999183654785156, "step": 6240} {"info/global_step": 6241, "train_info/time_within_train_step": 2.7552456855773926, "step": 6241} {"train_info/time_between_train_steps": 0.003131389617919922, "step": 6241} {"info/global_step": 6242, "train_info/time_within_train_step": 2.755267858505249, "step": 6242} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 6242} {"info/global_step": 6243, "train_info/time_within_train_step": 2.7553577423095703, "step": 6243} {"train_info/time_between_train_steps": 0.0031523704528808594, "step": 6243} {"info/global_step": 6244, "train_info/time_within_train_step": 2.754359483718872, "step": 6244} {"train_info/time_between_train_steps": 0.003122568130493164, "step": 6244} {"info/global_step": 6245, "train_info/time_within_train_step": 2.7557361125946045, "step": 6245} {"train_info/time_between_train_steps": 0.0031888484954833984, "step": 6245} {"info/global_step": 6246, "train_info/time_within_train_step": 2.7552692890167236, "step": 6246} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 6246} {"info/global_step": 6247, "train_info/time_within_train_step": 3.3182008266448975, "step": 6247} {"train_info/time_between_train_steps": 0.003141641616821289, "step": 6247} {"info/global_step": 6248, "train_info/time_within_train_step": 2.7543888092041016, "step": 6248} {"train_info/time_between_train_steps": 0.0031151771545410156, "step": 6248} {"info/global_step": 6249, "train_info/time_within_train_step": 2.754122018814087, "step": 6249} {"train_info/time_between_train_steps": 0.003125905990600586, "step": 6249} {"info/global_step": 6250, "train_info/time_within_train_step": 2.754103899002075, "step": 6250} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746584106, "_runtime": 18115}, "step": 6250} {"logs": {"train/loss": 3.3922, "train/learning_rate": 0.00025, "train/epoch": 7.03, "_timestamp": 1746584106, "_runtime": 18115}, "step": 6250} {"train_info/time_between_train_steps": 0.0066945552825927734, "step": 6250} {"info/global_step": 6251, "train_info/time_within_train_step": 2.754901170730591, "step": 6251} {"train_info/time_between_train_steps": 0.003153085708618164, "step": 6251} {"info/global_step": 6252, "train_info/time_within_train_step": 2.7537689208984375, "step": 6252} {"train_info/time_between_train_steps": 0.003127574920654297, "step": 6252} {"info/global_step": 6253, "train_info/time_within_train_step": 2.7537808418273926, "step": 6253} {"train_info/time_between_train_steps": 0.0032088756561279297, "step": 6253} {"info/global_step": 6254, "train_info/time_within_train_step": 2.7540132999420166, "step": 6254} {"train_info/time_between_train_steps": 0.0031685829162597656, "step": 6254} {"info/global_step": 6255, "train_info/time_within_train_step": 2.7773118019104004, "step": 6255} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 6255} {"info/global_step": 6256, "train_info/time_within_train_step": 2.7546918392181396, "step": 6256} {"train_info/time_between_train_steps": 0.0031287670135498047, "step": 6256} {"info/global_step": 6257, "train_info/time_within_train_step": 2.7549500465393066, "step": 6257} {"train_info/time_between_train_steps": 0.0031337738037109375, "step": 6257} {"info/global_step": 6258, "train_info/time_within_train_step": 2.75520658493042, "step": 6258} {"train_info/time_between_train_steps": 0.0031273365020751953, "step": 6258} {"info/global_step": 6259, "train_info/time_within_train_step": 2.75468373298645, "step": 6259} {"train_info/time_between_train_steps": 0.0031244754791259766, "step": 6259} {"info/global_step": 6260, "train_info/time_within_train_step": 2.7550461292266846, "step": 6260} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 6260} {"info/global_step": 6261, "train_info/time_within_train_step": 2.7551023960113525, "step": 6261} {"train_info/time_between_train_steps": 0.0031325817108154297, "step": 6261} {"info/global_step": 6262, "train_info/time_within_train_step": 2.7536325454711914, "step": 6262} {"train_info/time_between_train_steps": 0.0031490325927734375, "step": 6262} {"info/global_step": 6263, "train_info/time_within_train_step": 2.7540123462677, "step": 6263} {"train_info/time_between_train_steps": 0.003149747848510742, "step": 6263} {"info/global_step": 6264, "train_info/time_within_train_step": 2.753873348236084, "step": 6264} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 6264} {"info/global_step": 6265, "train_info/time_within_train_step": 2.7537248134613037, "step": 6265} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 6265} {"info/global_step": 6266, "train_info/time_within_train_step": 2.7544710636138916, "step": 6266} {"train_info/time_between_train_steps": 0.003144502639770508, "step": 6266} {"info/global_step": 6267, "train_info/time_within_train_step": 2.7545840740203857, "step": 6267} {"train_info/time_between_train_steps": 0.0031278133392333984, "step": 6267} {"info/global_step": 6268, "train_info/time_within_train_step": 2.7547011375427246, "step": 6268} {"train_info/time_between_train_steps": 0.0031244754791259766, "step": 6268} {"info/global_step": 6269, "train_info/time_within_train_step": 2.7544336318969727, "step": 6269} {"train_info/time_between_train_steps": 0.0031173229217529297, "step": 6269} {"info/global_step": 6270, "train_info/time_within_train_step": 2.7531790733337402, "step": 6270} {"train_info/time_between_train_steps": 0.003163576126098633, "step": 6270} {"info/global_step": 6271, "train_info/time_within_train_step": 2.755263328552246, "step": 6271} {"train_info/time_between_train_steps": 0.0031404495239257812, "step": 6271} {"info/global_step": 6272, "train_info/time_within_train_step": 2.755894899368286, "step": 6272} {"train_info/time_between_train_steps": 0.0031311511993408203, "step": 6272} {"info/global_step": 6273, "train_info/time_within_train_step": 2.7544469833374023, "step": 6273} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 6273} {"info/global_step": 6274, "train_info/time_within_train_step": 2.756145715713501, "step": 6274} {"train_info/time_between_train_steps": 0.003323793411254883, "step": 6274} {"info/global_step": 6275, "train_info/time_within_train_step": 2.756836175918579, "step": 6275} {"train_info/time_between_train_steps": 0.0033042430877685547, "step": 6275} {"info/global_step": 6276, "train_info/time_within_train_step": 2.7556283473968506, "step": 6276} {"train_info/time_between_train_steps": 0.0033164024353027344, "step": 6276} {"info/global_step": 6277, "train_info/time_within_train_step": 2.757270574569702, "step": 6277} {"train_info/time_between_train_steps": 0.0033195018768310547, "step": 6277} {"info/global_step": 6278, "train_info/time_within_train_step": 2.756915330886841, "step": 6278} {"train_info/time_between_train_steps": 0.0032968521118164062, "step": 6278} {"info/global_step": 6279, "train_info/time_within_train_step": 2.7565066814422607, "step": 6279} {"train_info/time_between_train_steps": 0.0032966136932373047, "step": 6279} {"info/global_step": 6280, "train_info/time_within_train_step": 2.7551767826080322, "step": 6280} {"train_info/time_between_train_steps": 0.0032911300659179688, "step": 6280} {"info/global_step": 6281, "train_info/time_within_train_step": 2.7557642459869385, "step": 6281} {"train_info/time_between_train_steps": 0.0033159255981445312, "step": 6281} {"info/global_step": 6282, "train_info/time_within_train_step": 2.756044864654541, "step": 6282} {"train_info/time_between_train_steps": 0.0033156871795654297, "step": 6282} {"info/global_step": 6283, "train_info/time_within_train_step": 2.7571022510528564, "step": 6283} {"train_info/time_between_train_steps": 0.0032875537872314453, "step": 6283} {"info/global_step": 6284, "train_info/time_within_train_step": 2.909762144088745, "step": 6284} {"train_info/time_between_train_steps": 0.0033388137817382812, "step": 6284} {"info/global_step": 6285, "train_info/time_within_train_step": 2.7562386989593506, "step": 6285} {"train_info/time_between_train_steps": 0.0033104419708251953, "step": 6285} {"info/global_step": 6286, "train_info/time_within_train_step": 3.008718490600586, "step": 6286} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 6286} {"info/global_step": 6287, "train_info/time_within_train_step": 2.7559518814086914, "step": 6287} {"train_info/time_between_train_steps": 0.0031480789184570312, "step": 6287} {"info/global_step": 6288, "train_info/time_within_train_step": 2.7552683353424072, "step": 6288} {"train_info/time_between_train_steps": 0.003221750259399414, "step": 6288} {"info/global_step": 6289, "train_info/time_within_train_step": 2.7549662590026855, "step": 6289} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 6289} {"info/global_step": 6290, "train_info/time_within_train_step": 2.755333662033081, "step": 6290} {"train_info/time_between_train_steps": 0.0031409263610839844, "step": 6290} {"info/global_step": 6291, "train_info/time_within_train_step": 2.755048990249634, "step": 6291} {"train_info/time_between_train_steps": 0.003138303756713867, "step": 6291} {"info/global_step": 6292, "train_info/time_within_train_step": 2.754932403564453, "step": 6292} {"train_info/time_between_train_steps": 0.003120899200439453, "step": 6292} {"info/global_step": 6293, "train_info/time_within_train_step": 2.7549097537994385, "step": 6293} {"train_info/time_between_train_steps": 0.003160238265991211, "step": 6293} {"info/global_step": 6294, "train_info/time_within_train_step": 2.7541534900665283, "step": 6294} {"train_info/time_between_train_steps": 0.0031375885009765625, "step": 6294} {"info/global_step": 6295, "train_info/time_within_train_step": 2.7544174194335938, "step": 6295} {"train_info/time_between_train_steps": 0.0031881332397460938, "step": 6295} {"info/global_step": 6296, "train_info/time_within_train_step": 2.754641056060791, "step": 6296} {"train_info/time_between_train_steps": 0.0031538009643554688, "step": 6296} {"info/global_step": 6297, "train_info/time_within_train_step": 2.755467176437378, "step": 6297} {"train_info/time_between_train_steps": 0.003139495849609375, "step": 6297} {"info/global_step": 6298, "train_info/time_within_train_step": 2.7548632621765137, "step": 6298} {"train_info/time_between_train_steps": 0.003134489059448242, "step": 6298} {"info/global_step": 6299, "train_info/time_within_train_step": 2.7556815147399902, "step": 6299} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 6299} {"info/global_step": 6300, "train_info/time_within_train_step": 2.7560126781463623, "step": 6300} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746584244, "_runtime": 18253}, "step": 6300} {"logs": {"train/loss": 3.3881, "train/learning_rate": 0.0002466666666666666, "train/epoch": 7.03, "_timestamp": 1746584244, "_runtime": 18253}, "step": 6300} {"train_info/time_between_train_steps": 0.00677943229675293, "step": 6300} {"info/global_step": 6301, "train_info/time_within_train_step": 2.755711555480957, "step": 6301} {"train_info/time_between_train_steps": 0.003148794174194336, "step": 6301} {"info/global_step": 6302, "train_info/time_within_train_step": 2.7544748783111572, "step": 6302} {"train_info/time_between_train_steps": 0.0031435489654541016, "step": 6302} {"info/global_step": 6303, "train_info/time_within_train_step": 2.7563486099243164, "step": 6303} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 6303} {"info/global_step": 6304, "train_info/time_within_train_step": 2.7554261684417725, "step": 6304} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 6304} {"info/global_step": 6305, "train_info/time_within_train_step": 2.7565746307373047, "step": 6305} {"train_info/time_between_train_steps": 0.006436586380004883, "step": 6305} {"info/global_step": 6306, "train_info/time_within_train_step": 2.7589733600616455, "step": 6306} {"train_info/time_between_train_steps": 0.006456851959228516, "step": 6306} {"info/global_step": 6307, "train_info/time_within_train_step": 2.7589597702026367, "step": 6307} {"train_info/time_between_train_steps": 0.006482601165771484, "step": 6307} {"info/global_step": 6308, "train_info/time_within_train_step": 2.759505271911621, "step": 6308} {"train_info/time_between_train_steps": 0.006433725357055664, "step": 6308} {"info/global_step": 6309, "train_info/time_within_train_step": 2.757863998413086, "step": 6309} {"train_info/time_between_train_steps": 0.006394624710083008, "step": 6309} {"info/global_step": 6310, "train_info/time_within_train_step": 2.7580654621124268, "step": 6310} {"train_info/time_between_train_steps": 0.0031251907348632812, "step": 6310} {"info/global_step": 6311, "train_info/time_within_train_step": 2.753600597381592, "step": 6311} {"train_info/time_between_train_steps": 0.003138303756713867, "step": 6311} {"info/global_step": 6312, "train_info/time_within_train_step": 2.7554397583007812, "step": 6312} {"train_info/time_between_train_steps": 0.0031347274780273438, "step": 6312} {"info/global_step": 6313, "train_info/time_within_train_step": 2.754408359527588, "step": 6313} {"train_info/time_between_train_steps": 0.0031502246856689453, "step": 6313} {"info/global_step": 6314, "train_info/time_within_train_step": 2.754709005355835, "step": 6314} {"train_info/time_between_train_steps": 0.0031354427337646484, "step": 6314} {"info/global_step": 6315, "train_info/time_within_train_step": 2.7544522285461426, "step": 6315} {"train_info/time_between_train_steps": 0.0031342506408691406, "step": 6315} {"info/global_step": 6316, "train_info/time_within_train_step": 2.7546794414520264, "step": 6316} {"train_info/time_between_train_steps": 0.0031588077545166016, "step": 6316} {"info/global_step": 6317, "train_info/time_within_train_step": 2.754621982574463, "step": 6317} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 6317} {"info/global_step": 6318, "train_info/time_within_train_step": 2.7544755935668945, "step": 6318} {"train_info/time_between_train_steps": 0.0031294822692871094, "step": 6318} {"info/global_step": 6319, "train_info/time_within_train_step": 2.7537875175476074, "step": 6319} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 6319} {"info/global_step": 6320, "train_info/time_within_train_step": 2.755657434463501, "step": 6320} {"train_info/time_between_train_steps": 0.003140687942504883, "step": 6320} {"info/global_step": 6321, "train_info/time_within_train_step": 2.7536280155181885, "step": 6321} {"train_info/time_between_train_steps": 0.003119230270385742, "step": 6321} {"info/global_step": 6322, "train_info/time_within_train_step": 2.7539408206939697, "step": 6322} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 6322} {"info/global_step": 6323, "train_info/time_within_train_step": 2.7534866333007812, "step": 6323} {"train_info/time_between_train_steps": 0.003141641616821289, "step": 6323} {"info/global_step": 6324, "train_info/time_within_train_step": 2.754833221435547, "step": 6324} {"train_info/time_between_train_steps": 0.0031523704528808594, "step": 6324} {"info/global_step": 6325, "train_info/time_within_train_step": 2.75404691696167, "step": 6325} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 6325} {"info/global_step": 6326, "train_info/time_within_train_step": 3.007972478866577, "step": 6326} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 6326} {"info/global_step": 6327, "train_info/time_within_train_step": 2.7545909881591797, "step": 6327} {"train_info/time_between_train_steps": 0.0031523704528808594, "step": 6327} {"info/global_step": 6328, "train_info/time_within_train_step": 2.754551410675049, "step": 6328} {"train_info/time_between_train_steps": 0.0031495094299316406, "step": 6328} {"info/global_step": 6329, "train_info/time_within_train_step": 2.7556610107421875, "step": 6329} {"train_info/time_between_train_steps": 0.0031464099884033203, "step": 6329} {"info/global_step": 6330, "train_info/time_within_train_step": 2.75496506690979, "step": 6330} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 6330} {"info/global_step": 6331, "train_info/time_within_train_step": 2.755380630493164, "step": 6331} {"train_info/time_between_train_steps": 0.0031375885009765625, "step": 6331} {"info/global_step": 6332, "train_info/time_within_train_step": 2.7552826404571533, "step": 6332} {"train_info/time_between_train_steps": 0.003146648406982422, "step": 6332} {"info/global_step": 6333, "train_info/time_within_train_step": 2.7554664611816406, "step": 6333} {"train_info/time_between_train_steps": 0.003217935562133789, "step": 6333} {"info/global_step": 6334, "train_info/time_within_train_step": 2.75532603263855, "step": 6334} {"train_info/time_between_train_steps": 0.0031349658966064453, "step": 6334} {"info/global_step": 6335, "train_info/time_within_train_step": 2.7551162242889404, "step": 6335} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 6335} {"info/global_step": 6336, "train_info/time_within_train_step": 2.7546513080596924, "step": 6336} {"train_info/time_between_train_steps": 0.003151416778564453, "step": 6336} {"info/global_step": 6337, "train_info/time_within_train_step": 2.7544164657592773, "step": 6337} {"train_info/time_between_train_steps": 0.0031397342681884766, "step": 6337} {"info/global_step": 6338, "train_info/time_within_train_step": 2.7549400329589844, "step": 6338} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 6338} {"info/global_step": 6339, "train_info/time_within_train_step": 2.75419020652771, "step": 6339} {"train_info/time_between_train_steps": 0.0031435489654541016, "step": 6339} {"info/global_step": 6340, "train_info/time_within_train_step": 2.752554178237915, "step": 6340} {"train_info/time_between_train_steps": 0.003107309341430664, "step": 6340} {"info/global_step": 6341, "train_info/time_within_train_step": 2.7546005249023438, "step": 6341} {"train_info/time_between_train_steps": 0.0032019615173339844, "step": 6341} {"info/global_step": 6342, "train_info/time_within_train_step": 2.7547032833099365, "step": 6342} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 6342} {"info/global_step": 6343, "train_info/time_within_train_step": 2.7547876834869385, "step": 6343} {"train_info/time_between_train_steps": 0.003137350082397461, "step": 6343} {"info/global_step": 6344, "train_info/time_within_train_step": 2.7524681091308594, "step": 6344} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 6344} {"info/global_step": 6345, "train_info/time_within_train_step": 2.7550594806671143, "step": 6345} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 6345} {"info/global_step": 6346, "train_info/time_within_train_step": 2.7553939819335938, "step": 6346} {"train_info/time_between_train_steps": 0.1286182403564453, "step": 6346} {"info/global_step": 6347, "train_info/time_within_train_step": 2.757373094558716, "step": 6347} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 6347} {"info/global_step": 6348, "train_info/time_within_train_step": 2.753757953643799, "step": 6348} {"train_info/time_between_train_steps": 0.003121614456176758, "step": 6348} {"info/global_step": 6349, "train_info/time_within_train_step": 2.755218505859375, "step": 6349} {"train_info/time_between_train_steps": 0.0031461715698242188, "step": 6349} {"info/global_step": 6350, "train_info/time_within_train_step": 2.7543652057647705, "step": 6350} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746584383, "_runtime": 18392}, "step": 6350} {"logs": {"train/loss": 3.3928, "train/learning_rate": 0.0002433333333333333, "train/epoch": 7.04, "_timestamp": 1746584383, "_runtime": 18392}, "step": 6350} {"train_info/time_between_train_steps": 0.006896257400512695, "step": 6350} {"info/global_step": 6351, "train_info/time_within_train_step": 2.7552378177642822, "step": 6351} {"train_info/time_between_train_steps": 0.003137350082397461, "step": 6351} {"info/global_step": 6352, "train_info/time_within_train_step": 2.7550289630889893, "step": 6352} {"train_info/time_between_train_steps": 0.003120899200439453, "step": 6352} {"info/global_step": 6353, "train_info/time_within_train_step": 2.754054546356201, "step": 6353} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 6353} {"info/global_step": 6354, "train_info/time_within_train_step": 2.754533529281616, "step": 6354} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 6354} {"info/global_step": 6355, "train_info/time_within_train_step": 2.7566699981689453, "step": 6355} {"train_info/time_between_train_steps": 0.0031332969665527344, "step": 6355} {"info/global_step": 6356, "train_info/time_within_train_step": 2.7555150985717773, "step": 6356} {"train_info/time_between_train_steps": 0.003322124481201172, "step": 6356} {"info/global_step": 6357, "train_info/time_within_train_step": 2.756518840789795, "step": 6357} {"train_info/time_between_train_steps": 0.003331899642944336, "step": 6357} {"info/global_step": 6358, "train_info/time_within_train_step": 2.7565550804138184, "step": 6358} {"train_info/time_between_train_steps": 0.0033066272735595703, "step": 6358} {"info/global_step": 6359, "train_info/time_within_train_step": 2.754246234893799, "step": 6359} {"train_info/time_between_train_steps": 0.0031409263610839844, "step": 6359} {"info/global_step": 6360, "train_info/time_within_train_step": 2.7536001205444336, "step": 6360} {"train_info/time_between_train_steps": 0.0031328201293945312, "step": 6360} {"info/global_step": 6361, "train_info/time_within_train_step": 2.7544302940368652, "step": 6361} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 6361} {"info/global_step": 6362, "train_info/time_within_train_step": 2.7553961277008057, "step": 6362} {"train_info/time_between_train_steps": 0.0031566619873046875, "step": 6362} {"info/global_step": 6363, "train_info/time_within_train_step": 2.755262851715088, "step": 6363} {"train_info/time_between_train_steps": 0.0031251907348632812, "step": 6363} {"info/global_step": 6364, "train_info/time_within_train_step": 2.7550573348999023, "step": 6364} {"train_info/time_between_train_steps": 0.003115415573120117, "step": 6364} {"info/global_step": 6365, "train_info/time_within_train_step": 2.7541069984436035, "step": 6365} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 6365} {"info/global_step": 6366, "train_info/time_within_train_step": 2.75544810295105, "step": 6366} {"train_info/time_between_train_steps": 0.003284931182861328, "step": 6366} {"info/global_step": 6367, "train_info/time_within_train_step": 2.7561700344085693, "step": 6367} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 6367} {"info/global_step": 6368, "train_info/time_within_train_step": 2.7543094158172607, "step": 6368} {"train_info/time_between_train_steps": 0.0031599998474121094, "step": 6368} {"info/global_step": 6369, "train_info/time_within_train_step": 2.7559659481048584, "step": 6369} {"train_info/time_between_train_steps": 0.0031440258026123047, "step": 6369} {"info/global_step": 6370, "train_info/time_within_train_step": 2.755002737045288, "step": 6370} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 6370} {"info/global_step": 6371, "train_info/time_within_train_step": 2.7553768157958984, "step": 6371} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 6371} {"info/global_step": 6372, "train_info/time_within_train_step": 2.7553787231445312, "step": 6372} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 6372} {"info/global_step": 6373, "train_info/time_within_train_step": 2.7556698322296143, "step": 6373} {"train_info/time_between_train_steps": 0.0031855106353759766, "step": 6373} {"info/global_step": 6374, "train_info/time_within_train_step": 2.7544143199920654, "step": 6374} {"train_info/time_between_train_steps": 0.0031845569610595703, "step": 6374} {"info/global_step": 6375, "train_info/time_within_train_step": 2.7552714347839355, "step": 6375} {"train_info/time_between_train_steps": 0.0031173229217529297, "step": 6375} {"info/global_step": 6376, "train_info/time_within_train_step": 2.755053758621216, "step": 6376} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 6376} {"info/global_step": 6377, "train_info/time_within_train_step": 2.7556135654449463, "step": 6377} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 6377} {"info/global_step": 6378, "train_info/time_within_train_step": 2.7554211616516113, "step": 6378} {"train_info/time_between_train_steps": 0.003146648406982422, "step": 6378} {"info/global_step": 6379, "train_info/time_within_train_step": 2.755681276321411, "step": 6379} {"train_info/time_between_train_steps": 0.0032057762145996094, "step": 6379} {"info/global_step": 6380, "train_info/time_within_train_step": 2.7552335262298584, "step": 6380} {"train_info/time_between_train_steps": 0.0031766891479492188, "step": 6380} {"info/global_step": 6381, "train_info/time_within_train_step": 2.7538061141967773, "step": 6381} {"train_info/time_between_train_steps": 0.003139019012451172, "step": 6381} {"info/global_step": 6382, "train_info/time_within_train_step": 2.753676652908325, "step": 6382} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 6382} {"info/global_step": 6383, "train_info/time_within_train_step": 2.7552592754364014, "step": 6383} {"train_info/time_between_train_steps": 0.0036096572875976562, "step": 6383} {"info/global_step": 6384, "train_info/time_within_train_step": 2.7548723220825195, "step": 6384} {"train_info/time_between_train_steps": 0.003203868865966797, "step": 6384} {"info/global_step": 6385, "train_info/time_within_train_step": 2.755079746246338, "step": 6385} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 6385} {"info/global_step": 6386, "train_info/time_within_train_step": 2.75425124168396, "step": 6386} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 6386} {"info/global_step": 6387, "train_info/time_within_train_step": 2.7548558712005615, "step": 6387} {"train_info/time_between_train_steps": 0.0031304359436035156, "step": 6387} {"info/global_step": 6388, "train_info/time_within_train_step": 2.7549097537994385, "step": 6388} {"train_info/time_between_train_steps": 0.0032851696014404297, "step": 6388} {"info/global_step": 6389, "train_info/time_within_train_step": 2.755131959915161, "step": 6389} {"train_info/time_between_train_steps": 0.003355741500854492, "step": 6389} {"info/global_step": 6390, "train_info/time_within_train_step": 2.7564492225646973, "step": 6390} {"train_info/time_between_train_steps": 0.003386974334716797, "step": 6390} {"info/global_step": 6391, "train_info/time_within_train_step": 2.755922555923462, "step": 6391} {"train_info/time_between_train_steps": 0.0033926963806152344, "step": 6391} {"info/global_step": 6392, "train_info/time_within_train_step": 2.756639003753662, "step": 6392} {"train_info/time_between_train_steps": 0.003340482711791992, "step": 6392} {"info/global_step": 6393, "train_info/time_within_train_step": 2.7552907466888428, "step": 6393} {"train_info/time_between_train_steps": 0.003431558609008789, "step": 6393} {"info/global_step": 6394, "train_info/time_within_train_step": 2.7542293071746826, "step": 6394} {"train_info/time_between_train_steps": 0.003414154052734375, "step": 6394} {"info/global_step": 6395, "train_info/time_within_train_step": 2.7558975219726562, "step": 6395} {"train_info/time_between_train_steps": 0.003358602523803711, "step": 6395} {"info/global_step": 6396, "train_info/time_within_train_step": 2.7563116550445557, "step": 6396} {"train_info/time_between_train_steps": 0.003416776657104492, "step": 6396} {"info/global_step": 6397, "train_info/time_within_train_step": 2.7562105655670166, "step": 6397} {"train_info/time_between_train_steps": 0.003355741500854492, "step": 6397} {"info/global_step": 6398, "train_info/time_within_train_step": 2.755845069885254, "step": 6398} {"train_info/time_between_train_steps": 0.0033063888549804688, "step": 6398} {"info/global_step": 6399, "train_info/time_within_train_step": 2.7548153400421143, "step": 6399} {"train_info/time_between_train_steps": 0.0033295154571533203, "step": 6399} {"info/global_step": 6400, "train_info/time_within_train_step": 2.7550971508026123, "step": 6400} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746584521, "_runtime": 18530}, "step": 6400} {"logs": {"train/loss": 3.3766, "train/learning_rate": 0.00023999999999999998, "train/epoch": 7.04, "_timestamp": 1746584521, "_runtime": 18530}, "step": 6400} {"train_info/time_between_train_steps": 26.06648898124695, "step": 6400} {"info/global_step": 6401, "train_info/time_within_train_step": 2.5427870750427246, "step": 6401} {"train_info/time_between_train_steps": 0.0034737586975097656, "step": 6401} {"info/global_step": 6402, "train_info/time_within_train_step": 2.5808355808258057, "step": 6402} {"train_info/time_between_train_steps": 0.0035338401794433594, "step": 6402} {"info/global_step": 6403, "train_info/time_within_train_step": 2.711674690246582, "step": 6403} {"train_info/time_between_train_steps": 0.0035588741302490234, "step": 6403} {"info/global_step": 6404, "train_info/time_within_train_step": 2.7244131565093994, "step": 6404} {"train_info/time_between_train_steps": 0.0034673213958740234, "step": 6404} {"info/global_step": 6405, "train_info/time_within_train_step": 2.7445075511932373, "step": 6405} {"train_info/time_between_train_steps": 0.0034897327423095703, "step": 6405} {"info/global_step": 6406, "train_info/time_within_train_step": 2.7582337856292725, "step": 6406} {"train_info/time_between_train_steps": 0.003502368927001953, "step": 6406} {"info/global_step": 6407, "train_info/time_within_train_step": 2.7574102878570557, "step": 6407} {"train_info/time_between_train_steps": 0.0035102367401123047, "step": 6407} {"info/global_step": 6408, "train_info/time_within_train_step": 2.758209228515625, "step": 6408} {"train_info/time_between_train_steps": 0.0034580230712890625, "step": 6408} {"info/global_step": 6409, "train_info/time_within_train_step": 2.9112443923950195, "step": 6409} {"train_info/time_between_train_steps": 0.003462553024291992, "step": 6409} {"info/global_step": 6410, "train_info/time_within_train_step": 2.758945941925049, "step": 6410} {"train_info/time_between_train_steps": 0.003434896469116211, "step": 6410} {"info/global_step": 6411, "train_info/time_within_train_step": 3.061316728591919, "step": 6411} {"train_info/time_between_train_steps": 0.003327608108520508, "step": 6411} {"info/global_step": 6412, "train_info/time_within_train_step": 2.7573161125183105, "step": 6412} {"train_info/time_between_train_steps": 0.0033409595489501953, "step": 6412} {"info/global_step": 6413, "train_info/time_within_train_step": 2.757371187210083, "step": 6413} {"train_info/time_between_train_steps": 0.0033349990844726562, "step": 6413} {"info/global_step": 6414, "train_info/time_within_train_step": 2.7578353881835938, "step": 6414} {"train_info/time_between_train_steps": 0.0033500194549560547, "step": 6414} {"info/global_step": 6415, "train_info/time_within_train_step": 2.758533000946045, "step": 6415} {"train_info/time_between_train_steps": 0.0033490657806396484, "step": 6415} {"info/global_step": 6416, "train_info/time_within_train_step": 2.7580699920654297, "step": 6416} {"train_info/time_between_train_steps": 0.0034024715423583984, "step": 6416} {"info/global_step": 6417, "train_info/time_within_train_step": 2.759456157684326, "step": 6417} {"train_info/time_between_train_steps": 0.0033550262451171875, "step": 6417} {"info/global_step": 6418, "train_info/time_within_train_step": 2.7580811977386475, "step": 6418} {"train_info/time_between_train_steps": 0.0033540725708007812, "step": 6418} {"info/global_step": 6419, "train_info/time_within_train_step": 2.7585906982421875, "step": 6419} {"train_info/time_between_train_steps": 0.003330707550048828, "step": 6419} {"info/global_step": 6420, "train_info/time_within_train_step": 2.757676362991333, "step": 6420} {"train_info/time_between_train_steps": 0.0033664703369140625, "step": 6420} {"info/global_step": 6421, "train_info/time_within_train_step": 2.758200168609619, "step": 6421} {"train_info/time_between_train_steps": 0.0033965110778808594, "step": 6421} {"info/global_step": 6422, "train_info/time_within_train_step": 2.7577147483825684, "step": 6422} {"train_info/time_between_train_steps": 0.0033152103424072266, "step": 6422} {"info/global_step": 6423, "train_info/time_within_train_step": 2.758683919906616, "step": 6423} {"train_info/time_between_train_steps": 0.003360271453857422, "step": 6423} {"info/global_step": 6424, "train_info/time_within_train_step": 2.7588491439819336, "step": 6424} {"train_info/time_between_train_steps": 0.0033500194549560547, "step": 6424} {"info/global_step": 6425, "train_info/time_within_train_step": 2.7581515312194824, "step": 6425} {"train_info/time_between_train_steps": 0.0033037662506103516, "step": 6425} {"info/global_step": 6426, "train_info/time_within_train_step": 2.758646011352539, "step": 6426} {"train_info/time_between_train_steps": 0.0033435821533203125, "step": 6426} {"info/global_step": 6427, "train_info/time_within_train_step": 2.758812665939331, "step": 6427} {"train_info/time_between_train_steps": 0.0033888816833496094, "step": 6427} {"info/global_step": 6428, "train_info/time_within_train_step": 2.75775146484375, "step": 6428} {"train_info/time_between_train_steps": 0.0033397674560546875, "step": 6428} {"info/global_step": 6429, "train_info/time_within_train_step": 2.757680892944336, "step": 6429} {"train_info/time_between_train_steps": 0.003354310989379883, "step": 6429} {"info/global_step": 6430, "train_info/time_within_train_step": 2.759037494659424, "step": 6430} {"train_info/time_between_train_steps": 0.003339529037475586, "step": 6430} {"info/global_step": 6431, "train_info/time_within_train_step": 2.75838041305542, "step": 6431} {"train_info/time_between_train_steps": 0.003463268280029297, "step": 6431} {"info/global_step": 6432, "train_info/time_within_train_step": 2.7585511207580566, "step": 6432} {"train_info/time_between_train_steps": 0.0033791065216064453, "step": 6432} {"info/global_step": 6433, "train_info/time_within_train_step": 2.7585535049438477, "step": 6433} {"train_info/time_between_train_steps": 0.003326892852783203, "step": 6433} {"info/global_step": 6434, "train_info/time_within_train_step": 2.7599024772644043, "step": 6434} {"train_info/time_between_train_steps": 0.0033206939697265625, "step": 6434} {"info/global_step": 6435, "train_info/time_within_train_step": 2.7578177452087402, "step": 6435} {"train_info/time_between_train_steps": 0.003343343734741211, "step": 6435} {"info/global_step": 6436, "train_info/time_within_train_step": 2.7566921710968018, "step": 6436} {"train_info/time_between_train_steps": 0.0033347606658935547, "step": 6436} {"info/global_step": 6437, "train_info/time_within_train_step": 2.7576687335968018, "step": 6437} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 6437} {"info/global_step": 6438, "train_info/time_within_train_step": 2.7573256492614746, "step": 6438} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 6438} {"info/global_step": 6439, "train_info/time_within_train_step": 2.7570371627807617, "step": 6439} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 6439} {"info/global_step": 6440, "train_info/time_within_train_step": 2.756517171859741, "step": 6440} {"train_info/time_between_train_steps": 0.0031538009643554688, "step": 6440} {"info/global_step": 6441, "train_info/time_within_train_step": 2.756183385848999, "step": 6441} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 6441} {"info/global_step": 6442, "train_info/time_within_train_step": 2.7549147605895996, "step": 6442} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 6442} {"info/global_step": 6443, "train_info/time_within_train_step": 2.7557148933410645, "step": 6443} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 6443} {"info/global_step": 6444, "train_info/time_within_train_step": 2.7566394805908203, "step": 6444} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 6444} {"info/global_step": 6445, "train_info/time_within_train_step": 2.756084680557251, "step": 6445} {"train_info/time_between_train_steps": 0.0032052993774414062, "step": 6445} {"info/global_step": 6446, "train_info/time_within_train_step": 2.755598783493042, "step": 6446} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 6446} {"info/global_step": 6447, "train_info/time_within_train_step": 2.7561378479003906, "step": 6447} {"train_info/time_between_train_steps": 0.0031576156616210938, "step": 6447} {"info/global_step": 6448, "train_info/time_within_train_step": 2.7559666633605957, "step": 6448} {"train_info/time_between_train_steps": 0.003142118453979492, "step": 6448} {"info/global_step": 6449, "train_info/time_within_train_step": 2.756500482559204, "step": 6449} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 6449} {"info/global_step": 6450, "train_info/time_within_train_step": 2.7562265396118164, "step": 6450} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746584686, "_runtime": 18695}, "step": 6450} {"logs": {"train/loss": 3.3656, "train/learning_rate": 0.00023666666666666663, "train/epoch": 7.05, "_timestamp": 1746584686, "_runtime": 18695}, "step": 6450} {"train_info/time_between_train_steps": 0.012886524200439453, "step": 6450} {"info/global_step": 6451, "train_info/time_within_train_step": 2.756988763809204, "step": 6451} {"train_info/time_between_train_steps": 0.003129243850708008, "step": 6451} {"info/global_step": 6452, "train_info/time_within_train_step": 3.0178070068359375, "step": 6452} {"train_info/time_between_train_steps": 0.0031592845916748047, "step": 6452} {"info/global_step": 6453, "train_info/time_within_train_step": 2.7552616596221924, "step": 6453} {"train_info/time_between_train_steps": 0.0031266212463378906, "step": 6453} {"info/global_step": 6454, "train_info/time_within_train_step": 2.754936933517456, "step": 6454} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 6454} {"info/global_step": 6455, "train_info/time_within_train_step": 2.7555484771728516, "step": 6455} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 6455} {"info/global_step": 6456, "train_info/time_within_train_step": 2.7561607360839844, "step": 6456} {"train_info/time_between_train_steps": 0.0031790733337402344, "step": 6456} {"info/global_step": 6457, "train_info/time_within_train_step": 2.7554714679718018, "step": 6457} {"train_info/time_between_train_steps": 0.003134489059448242, "step": 6457} {"info/global_step": 6458, "train_info/time_within_train_step": 2.756685972213745, "step": 6458} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 6458} {"info/global_step": 6459, "train_info/time_within_train_step": 2.7560439109802246, "step": 6459} {"train_info/time_between_train_steps": 0.003146648406982422, "step": 6459} {"info/global_step": 6460, "train_info/time_within_train_step": 2.756364345550537, "step": 6460} {"train_info/time_between_train_steps": 0.0032215118408203125, "step": 6460} {"info/global_step": 6461, "train_info/time_within_train_step": 2.7558133602142334, "step": 6461} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 6461} {"info/global_step": 6462, "train_info/time_within_train_step": 2.75443696975708, "step": 6462} {"train_info/time_between_train_steps": 0.0031213760375976562, "step": 6462} {"info/global_step": 6463, "train_info/time_within_train_step": 2.7559902667999268, "step": 6463} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 6463} {"info/global_step": 6464, "train_info/time_within_train_step": 2.756281852722168, "step": 6464} {"train_info/time_between_train_steps": 0.0031404495239257812, "step": 6464} {"info/global_step": 6465, "train_info/time_within_train_step": 2.755740165710449, "step": 6465} {"train_info/time_between_train_steps": 0.003185272216796875, "step": 6465} {"info/global_step": 6466, "train_info/time_within_train_step": 2.7554452419281006, "step": 6466} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 6466} {"info/global_step": 6467, "train_info/time_within_train_step": 2.7563464641571045, "step": 6467} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 6467} {"info/global_step": 6468, "train_info/time_within_train_step": 2.755815029144287, "step": 6468} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 6468} {"info/global_step": 6469, "train_info/time_within_train_step": 2.7548375129699707, "step": 6469} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 6469} {"info/global_step": 6470, "train_info/time_within_train_step": 2.7553868293762207, "step": 6470} {"train_info/time_between_train_steps": 0.0031595230102539062, "step": 6470} {"info/global_step": 6471, "train_info/time_within_train_step": 2.755465269088745, "step": 6471} {"train_info/time_between_train_steps": 0.09493255615234375, "step": 6471} {"info/global_step": 6472, "train_info/time_within_train_step": 2.7570009231567383, "step": 6472} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 6472} {"info/global_step": 6473, "train_info/time_within_train_step": 2.7555408477783203, "step": 6473} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 6473} {"info/global_step": 6474, "train_info/time_within_train_step": 2.7552359104156494, "step": 6474} {"train_info/time_between_train_steps": 0.003190755844116211, "step": 6474} {"info/global_step": 6475, "train_info/time_within_train_step": 2.7546017169952393, "step": 6475} {"train_info/time_between_train_steps": 0.003171205520629883, "step": 6475} {"info/global_step": 6476, "train_info/time_within_train_step": 2.7565886974334717, "step": 6476} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 6476} {"info/global_step": 6477, "train_info/time_within_train_step": 2.7557647228240967, "step": 6477} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 6477} {"info/global_step": 6478, "train_info/time_within_train_step": 2.7562882900238037, "step": 6478} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 6478} {"info/global_step": 6479, "train_info/time_within_train_step": 2.755065441131592, "step": 6479} {"train_info/time_between_train_steps": 0.0031561851501464844, "step": 6479} {"info/global_step": 6480, "train_info/time_within_train_step": 2.755732297897339, "step": 6480} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 6480} {"info/global_step": 6481, "train_info/time_within_train_step": 2.7566473484039307, "step": 6481} {"train_info/time_between_train_steps": 0.003170490264892578, "step": 6481} {"info/global_step": 6482, "train_info/time_within_train_step": 2.755740165710449, "step": 6482} {"train_info/time_between_train_steps": 0.003195524215698242, "step": 6482} {"info/global_step": 6483, "train_info/time_within_train_step": 2.7547922134399414, "step": 6483} {"train_info/time_between_train_steps": 0.003242015838623047, "step": 6483} {"info/global_step": 6484, "train_info/time_within_train_step": 2.756077527999878, "step": 6484} {"train_info/time_between_train_steps": 0.0031888484954833984, "step": 6484} {"info/global_step": 6485, "train_info/time_within_train_step": 2.755427598953247, "step": 6485} {"train_info/time_between_train_steps": 0.003172159194946289, "step": 6485} {"info/global_step": 6486, "train_info/time_within_train_step": 2.75276255607605, "step": 6486} {"train_info/time_between_train_steps": 0.00321197509765625, "step": 6486} {"info/global_step": 6487, "train_info/time_within_train_step": 2.7797861099243164, "step": 6487} {"train_info/time_between_train_steps": 0.003202199935913086, "step": 6487} {"info/global_step": 6488, "train_info/time_within_train_step": 2.7555453777313232, "step": 6488} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 6488} {"info/global_step": 6489, "train_info/time_within_train_step": 2.755955696105957, "step": 6489} {"train_info/time_between_train_steps": 0.003239154815673828, "step": 6489} {"info/global_step": 6490, "train_info/time_within_train_step": 2.7559452056884766, "step": 6490} {"train_info/time_between_train_steps": 0.0031669139862060547, "step": 6490} {"info/global_step": 6491, "train_info/time_within_train_step": 2.7551937103271484, "step": 6491} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 6491} {"info/global_step": 6492, "train_info/time_within_train_step": 2.756152868270874, "step": 6492} {"train_info/time_between_train_steps": 0.003209829330444336, "step": 6492} {"info/global_step": 6493, "train_info/time_within_train_step": 2.757167100906372, "step": 6493} {"train_info/time_between_train_steps": 0.0031495094299316406, "step": 6493} {"info/global_step": 6494, "train_info/time_within_train_step": 2.755641460418701, "step": 6494} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 6494} {"info/global_step": 6495, "train_info/time_within_train_step": 2.75586199760437, "step": 6495} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 6495} {"info/global_step": 6496, "train_info/time_within_train_step": 2.7552473545074463, "step": 6496} {"train_info/time_between_train_steps": 0.0031270980834960938, "step": 6496} {"info/global_step": 6497, "train_info/time_within_train_step": 3.3633010387420654, "step": 6497} {"train_info/time_between_train_steps": 0.0034630298614501953, "step": 6497} {"info/global_step": 6498, "train_info/time_within_train_step": 2.75649356842041, "step": 6498} {"train_info/time_between_train_steps": 0.003337383270263672, "step": 6498} {"info/global_step": 6499, "train_info/time_within_train_step": 2.7565112113952637, "step": 6499} {"train_info/time_between_train_steps": 0.003377199172973633, "step": 6499} {"info/global_step": 6500, "train_info/time_within_train_step": 2.7560043334960938, "step": 6500} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746584825, "_runtime": 18834}, "step": 6500} {"logs": {"train/loss": 3.3584, "train/learning_rate": 0.0002333333333333333, "train/epoch": 7.05, "_timestamp": 1746584825, "_runtime": 18834}, "step": 6500} {"train_info/time_between_train_steps": 0.01527094841003418, "step": 6500} {"info/global_step": 6501, "train_info/time_within_train_step": 2.7570860385894775, "step": 6501} {"train_info/time_between_train_steps": 0.0033576488494873047, "step": 6501} {"info/global_step": 6502, "train_info/time_within_train_step": 2.7568840980529785, "step": 6502} {"train_info/time_between_train_steps": 0.0033791065216064453, "step": 6502} {"info/global_step": 6503, "train_info/time_within_train_step": 2.757112741470337, "step": 6503} {"train_info/time_between_train_steps": 0.0033762454986572266, "step": 6503} {"info/global_step": 6504, "train_info/time_within_train_step": 2.756683588027954, "step": 6504} {"train_info/time_between_train_steps": 0.003336668014526367, "step": 6504} {"info/global_step": 6505, "train_info/time_within_train_step": 2.757521867752075, "step": 6505} {"train_info/time_between_train_steps": 0.003370046615600586, "step": 6505} {"info/global_step": 6506, "train_info/time_within_train_step": 2.7561802864074707, "step": 6506} {"train_info/time_between_train_steps": 0.0033779144287109375, "step": 6506} {"info/global_step": 6507, "train_info/time_within_train_step": 2.7560343742370605, "step": 6507} {"train_info/time_between_train_steps": 0.0034432411193847656, "step": 6507} {"info/global_step": 6508, "train_info/time_within_train_step": 2.756592035293579, "step": 6508} {"train_info/time_between_train_steps": 0.003362894058227539, "step": 6508} {"info/global_step": 6509, "train_info/time_within_train_step": 2.7569994926452637, "step": 6509} {"train_info/time_between_train_steps": 0.003365039825439453, "step": 6509} {"info/global_step": 6510, "train_info/time_within_train_step": 2.7553911209106445, "step": 6510} {"train_info/time_between_train_steps": 0.0033147335052490234, "step": 6510} {"info/global_step": 6511, "train_info/time_within_train_step": 2.7575888633728027, "step": 6511} {"train_info/time_between_train_steps": 0.0033521652221679688, "step": 6511} {"info/global_step": 6512, "train_info/time_within_train_step": 2.757032632827759, "step": 6512} {"train_info/time_between_train_steps": 0.020213603973388672, "step": 6512} {"info/global_step": 6513, "train_info/time_within_train_step": 2.7568068504333496, "step": 6513} {"train_info/time_between_train_steps": 0.0029973983764648438, "step": 6513} {"info/global_step": 6514, "train_info/time_within_train_step": 2.7563986778259277, "step": 6514} {"train_info/time_between_train_steps": 0.0030298233032226562, "step": 6514} {"info/global_step": 6515, "train_info/time_within_train_step": 2.756284475326538, "step": 6515} {"train_info/time_between_train_steps": 0.002978801727294922, "step": 6515} {"info/global_step": 6516, "train_info/time_within_train_step": 2.7576630115509033, "step": 6516} {"train_info/time_between_train_steps": 0.0030219554901123047, "step": 6516} {"info/global_step": 6517, "train_info/time_within_train_step": 2.756442070007324, "step": 6517} {"train_info/time_between_train_steps": 0.002988576889038086, "step": 6517} {"info/global_step": 6518, "train_info/time_within_train_step": 2.7559657096862793, "step": 6518} {"train_info/time_between_train_steps": 0.0029478073120117188, "step": 6518} {"info/global_step": 6519, "train_info/time_within_train_step": 2.756007194519043, "step": 6519} {"train_info/time_between_train_steps": 0.0029697418212890625, "step": 6519} {"info/global_step": 6520, "train_info/time_within_train_step": 2.7563254833221436, "step": 6520} {"train_info/time_between_train_steps": 0.00301361083984375, "step": 6520} {"info/global_step": 6521, "train_info/time_within_train_step": 2.7547154426574707, "step": 6521} {"train_info/time_between_train_steps": 0.002956390380859375, "step": 6521} {"info/global_step": 6522, "train_info/time_within_train_step": 2.755537986755371, "step": 6522} {"train_info/time_between_train_steps": 0.002974987030029297, "step": 6522} {"info/global_step": 6523, "train_info/time_within_train_step": 2.755805253982544, "step": 6523} {"train_info/time_between_train_steps": 0.003027677536010742, "step": 6523} {"info/global_step": 6524, "train_info/time_within_train_step": 2.7548327445983887, "step": 6524} {"train_info/time_between_train_steps": 0.002966642379760742, "step": 6524} {"info/global_step": 6525, "train_info/time_within_train_step": 2.756251811981201, "step": 6525} {"train_info/time_between_train_steps": 0.003015756607055664, "step": 6525} {"info/global_step": 6526, "train_info/time_within_train_step": 2.756223440170288, "step": 6526} {"train_info/time_between_train_steps": 0.002976655960083008, "step": 6526} {"info/global_step": 6527, "train_info/time_within_train_step": 2.756317138671875, "step": 6527} {"train_info/time_between_train_steps": 0.0030045509338378906, "step": 6527} {"info/global_step": 6528, "train_info/time_within_train_step": 2.755981922149658, "step": 6528} {"train_info/time_between_train_steps": 0.0030059814453125, "step": 6528} {"info/global_step": 6529, "train_info/time_within_train_step": 2.756835460662842, "step": 6529} {"train_info/time_between_train_steps": 0.0029897689819335938, "step": 6529} {"info/global_step": 6530, "train_info/time_within_train_step": 2.756533622741699, "step": 6530} {"train_info/time_between_train_steps": 0.0029981136322021484, "step": 6530} {"info/global_step": 6531, "train_info/time_within_train_step": 2.7570085525512695, "step": 6531} {"train_info/time_between_train_steps": 0.002993345260620117, "step": 6531} {"info/global_step": 6532, "train_info/time_within_train_step": 2.7560739517211914, "step": 6532} {"train_info/time_between_train_steps": 0.002973318099975586, "step": 6532} {"info/global_step": 6533, "train_info/time_within_train_step": 2.7552244663238525, "step": 6533} {"train_info/time_between_train_steps": 0.0029456615447998047, "step": 6533} {"info/global_step": 6534, "train_info/time_within_train_step": 2.7569706439971924, "step": 6534} {"train_info/time_between_train_steps": 0.0029735565185546875, "step": 6534} {"info/global_step": 6535, "train_info/time_within_train_step": 2.75614070892334, "step": 6535} {"train_info/time_between_train_steps": 0.0029959678649902344, "step": 6535} {"info/global_step": 6536, "train_info/time_within_train_step": 2.755638599395752, "step": 6536} {"train_info/time_between_train_steps": 0.0029783248901367188, "step": 6536} {"info/global_step": 6537, "train_info/time_within_train_step": 2.754640817642212, "step": 6537} {"train_info/time_between_train_steps": 0.00301361083984375, "step": 6537} {"info/global_step": 6538, "train_info/time_within_train_step": 2.755289316177368, "step": 6538} {"train_info/time_between_train_steps": 0.0030019283294677734, "step": 6538} {"info/global_step": 6539, "train_info/time_within_train_step": 2.7555606365203857, "step": 6539} {"train_info/time_between_train_steps": 0.002973318099975586, "step": 6539} {"info/global_step": 6540, "train_info/time_within_train_step": 2.7552449703216553, "step": 6540} {"train_info/time_between_train_steps": 0.0029714107513427734, "step": 6540} {"info/global_step": 6541, "train_info/time_within_train_step": 2.7627432346343994, "step": 6541} {"train_info/time_between_train_steps": 0.0029358863830566406, "step": 6541} {"info/global_step": 6542, "train_info/time_within_train_step": 2.760218381881714, "step": 6542} {"train_info/time_between_train_steps": 0.002985239028930664, "step": 6542} {"info/global_step": 6543, "train_info/time_within_train_step": 2.7560019493103027, "step": 6543} {"train_info/time_between_train_steps": 0.002992868423461914, "step": 6543} {"info/global_step": 6544, "train_info/time_within_train_step": 2.756592035293579, "step": 6544} {"train_info/time_between_train_steps": 0.0030260086059570312, "step": 6544} {"info/global_step": 6545, "train_info/time_within_train_step": 2.7562954425811768, "step": 6545} {"train_info/time_between_train_steps": 0.0029664039611816406, "step": 6545} {"info/global_step": 6546, "train_info/time_within_train_step": 2.7565042972564697, "step": 6546} {"train_info/time_between_train_steps": 0.0029599666595458984, "step": 6546} {"info/global_step": 6547, "train_info/time_within_train_step": 2.7557952404022217, "step": 6547} {"train_info/time_between_train_steps": 0.002964019775390625, "step": 6547} {"info/global_step": 6548, "train_info/time_within_train_step": 2.7567737102508545, "step": 6548} {"train_info/time_between_train_steps": 0.002997159957885742, "step": 6548} {"info/global_step": 6549, "train_info/time_within_train_step": 2.756709337234497, "step": 6549} {"train_info/time_between_train_steps": 0.002956867218017578, "step": 6549} {"info/global_step": 6550, "train_info/time_within_train_step": 2.9714272022247314, "step": 6550} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746584964, "_runtime": 18973}, "step": 6550} {"logs": {"train/loss": 3.3588, "train/learning_rate": 0.00023, "train/epoch": 7.06, "_timestamp": 1746584964, "_runtime": 18973}, "step": 6550} {"train_info/time_between_train_steps": 0.00654149055480957, "step": 6550} {"info/global_step": 6551, "train_info/time_within_train_step": 2.754005193710327, "step": 6551} {"train_info/time_between_train_steps": 0.0028874874114990234, "step": 6551} {"info/global_step": 6552, "train_info/time_within_train_step": 2.7608277797698975, "step": 6552} {"train_info/time_between_train_steps": 0.0028662681579589844, "step": 6552} {"info/global_step": 6553, "train_info/time_within_train_step": 2.7539689540863037, "step": 6553} {"train_info/time_between_train_steps": 0.002887248992919922, "step": 6553} {"info/global_step": 6554, "train_info/time_within_train_step": 2.753910779953003, "step": 6554} {"train_info/time_between_train_steps": 0.0028810501098632812, "step": 6554} {"info/global_step": 6555, "train_info/time_within_train_step": 2.754441261291504, "step": 6555} {"train_info/time_between_train_steps": 0.002874135971069336, "step": 6555} {"info/global_step": 6556, "train_info/time_within_train_step": 2.75382661819458, "step": 6556} {"train_info/time_between_train_steps": 0.0028624534606933594, "step": 6556} {"info/global_step": 6557, "train_info/time_within_train_step": 2.754595994949341, "step": 6557} {"train_info/time_between_train_steps": 0.0029022693634033203, "step": 6557} {"info/global_step": 6558, "train_info/time_within_train_step": 2.754617929458618, "step": 6558} {"train_info/time_between_train_steps": 0.0029480457305908203, "step": 6558} {"info/global_step": 6559, "train_info/time_within_train_step": 2.754506826400757, "step": 6559} {"train_info/time_between_train_steps": 0.002859354019165039, "step": 6559} {"info/global_step": 6560, "train_info/time_within_train_step": 2.755253314971924, "step": 6560} {"train_info/time_between_train_steps": 0.002936840057373047, "step": 6560} {"info/global_step": 6561, "train_info/time_within_train_step": 2.7557876110076904, "step": 6561} {"train_info/time_between_train_steps": 0.0028564929962158203, "step": 6561} {"info/global_step": 6562, "train_info/time_within_train_step": 2.7551920413970947, "step": 6562} {"train_info/time_between_train_steps": 0.002861499786376953, "step": 6562} {"info/global_step": 6563, "train_info/time_within_train_step": 2.7562496662139893, "step": 6563} {"train_info/time_between_train_steps": 0.0029268264770507812, "step": 6563} {"info/global_step": 6564, "train_info/time_within_train_step": 2.7559027671813965, "step": 6564} {"train_info/time_between_train_steps": 0.0028760433197021484, "step": 6564} {"info/global_step": 6565, "train_info/time_within_train_step": 2.7543604373931885, "step": 6565} {"train_info/time_between_train_steps": 0.0028824806213378906, "step": 6565} {"info/global_step": 6566, "train_info/time_within_train_step": 2.7549757957458496, "step": 6566} {"train_info/time_between_train_steps": 0.0028884410858154297, "step": 6566} {"info/global_step": 6567, "train_info/time_within_train_step": 2.754389762878418, "step": 6567} {"train_info/time_between_train_steps": 0.002847433090209961, "step": 6567} {"info/global_step": 6568, "train_info/time_within_train_step": 2.7545864582061768, "step": 6568} {"train_info/time_between_train_steps": 0.002875089645385742, "step": 6568} {"info/global_step": 6569, "train_info/time_within_train_step": 2.7543370723724365, "step": 6569} {"train_info/time_between_train_steps": 0.00293731689453125, "step": 6569} {"info/global_step": 6570, "train_info/time_within_train_step": 2.753859519958496, "step": 6570} {"train_info/time_between_train_steps": 0.0028486251831054688, "step": 6570} {"info/global_step": 6571, "train_info/time_within_train_step": 2.7534005641937256, "step": 6571} {"train_info/time_between_train_steps": 0.0029001235961914062, "step": 6571} {"info/global_step": 6572, "train_info/time_within_train_step": 2.754479169845581, "step": 6572} {"train_info/time_between_train_steps": 0.0028710365295410156, "step": 6572} {"info/global_step": 6573, "train_info/time_within_train_step": 2.754585027694702, "step": 6573} {"train_info/time_between_train_steps": 0.0029175281524658203, "step": 6573} {"info/global_step": 6574, "train_info/time_within_train_step": 2.754093647003174, "step": 6574} {"train_info/time_between_train_steps": 0.0028748512268066406, "step": 6574} {"info/global_step": 6575, "train_info/time_within_train_step": 2.7536637783050537, "step": 6575} {"train_info/time_between_train_steps": 0.0028765201568603516, "step": 6575} {"info/global_step": 6576, "train_info/time_within_train_step": 2.7549526691436768, "step": 6576} {"train_info/time_between_train_steps": 0.0028700828552246094, "step": 6576} {"info/global_step": 6577, "train_info/time_within_train_step": 2.7529919147491455, "step": 6577} {"train_info/time_between_train_steps": 0.002892017364501953, "step": 6577} {"info/global_step": 6578, "train_info/time_within_train_step": 2.754153251647949, "step": 6578} {"train_info/time_between_train_steps": 0.00287628173828125, "step": 6578} {"info/global_step": 6579, "train_info/time_within_train_step": 2.754396915435791, "step": 6579} {"train_info/time_between_train_steps": 0.0029151439666748047, "step": 6579} {"info/global_step": 6580, "train_info/time_within_train_step": 2.7543299198150635, "step": 6580} {"train_info/time_between_train_steps": 0.0028657913208007812, "step": 6580} {"info/global_step": 6581, "train_info/time_within_train_step": 2.7549307346343994, "step": 6581} {"train_info/time_between_train_steps": 0.0028760433197021484, "step": 6581} {"info/global_step": 6582, "train_info/time_within_train_step": 2.7546205520629883, "step": 6582} {"train_info/time_between_train_steps": 0.0029070377349853516, "step": 6582} {"info/global_step": 6583, "train_info/time_within_train_step": 2.753906726837158, "step": 6583} {"train_info/time_between_train_steps": 0.0028934478759765625, "step": 6583} {"info/global_step": 6584, "train_info/time_within_train_step": 2.753779172897339, "step": 6584} {"train_info/time_between_train_steps": 0.0028963088989257812, "step": 6584} {"info/global_step": 6585, "train_info/time_within_train_step": 2.754110097885132, "step": 6585} {"train_info/time_between_train_steps": 0.0028493404388427734, "step": 6585} {"info/global_step": 6586, "train_info/time_within_train_step": 2.7548763751983643, "step": 6586} {"train_info/time_between_train_steps": 0.002895355224609375, "step": 6586} {"info/global_step": 6587, "train_info/time_within_train_step": 2.753981590270996, "step": 6587} {"train_info/time_between_train_steps": 0.0028908252716064453, "step": 6587} {"info/global_step": 6588, "train_info/time_within_train_step": 2.753383159637451, "step": 6588} {"train_info/time_between_train_steps": 0.0028679370880126953, "step": 6588} {"info/global_step": 6589, "train_info/time_within_train_step": 2.7537119388580322, "step": 6589} {"train_info/time_between_train_steps": 0.002884387969970703, "step": 6589} {"info/global_step": 6590, "train_info/time_within_train_step": 2.7528131008148193, "step": 6590} {"train_info/time_between_train_steps": 0.002889394760131836, "step": 6590} {"info/global_step": 6591, "train_info/time_within_train_step": 2.7547922134399414, "step": 6591} {"train_info/time_between_train_steps": 0.002908945083618164, "step": 6591} {"info/global_step": 6592, "train_info/time_within_train_step": 2.7528345584869385, "step": 6592} {"train_info/time_between_train_steps": 0.002891063690185547, "step": 6592} {"info/global_step": 6593, "train_info/time_within_train_step": 2.7545006275177, "step": 6593} {"train_info/time_between_train_steps": 0.0028667449951171875, "step": 6593} {"info/global_step": 6594, "train_info/time_within_train_step": 2.755096673965454, "step": 6594} {"train_info/time_between_train_steps": 0.002880096435546875, "step": 6594} {"info/global_step": 6595, "train_info/time_within_train_step": 2.755004405975342, "step": 6595} {"train_info/time_between_train_steps": 0.0028839111328125, "step": 6595} {"info/global_step": 6596, "train_info/time_within_train_step": 2.753962278366089, "step": 6596} {"train_info/time_between_train_steps": 0.002872467041015625, "step": 6596} {"info/global_step": 6597, "train_info/time_within_train_step": 2.7525057792663574, "step": 6597} {"train_info/time_between_train_steps": 0.002922534942626953, "step": 6597} {"info/global_step": 6598, "train_info/time_within_train_step": 2.7544212341308594, "step": 6598} {"train_info/time_between_train_steps": 0.002872467041015625, "step": 6598} {"info/global_step": 6599, "train_info/time_within_train_step": 2.7554590702056885, "step": 6599} {"train_info/time_between_train_steps": 0.0029020309448242188, "step": 6599} {"info/global_step": 6600, "train_info/time_within_train_step": 2.753722906112671, "step": 6600} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746585102, "_runtime": 19111}, "step": 6600} {"logs": {"train/loss": 3.3414, "train/learning_rate": 0.00022666666666666663, "train/epoch": 7.06, "_timestamp": 1746585102, "_runtime": 19111}, "step": 6600} {"train_info/time_between_train_steps": 13.22065258026123, "step": 6600} {"info/global_step": 6601, "train_info/time_within_train_step": 2.528189182281494, "step": 6601} {"train_info/time_between_train_steps": 0.002989053726196289, "step": 6601} {"info/global_step": 6602, "train_info/time_within_train_step": 2.5869300365448, "step": 6602} {"train_info/time_between_train_steps": 0.0029942989349365234, "step": 6602} {"info/global_step": 6603, "train_info/time_within_train_step": 2.7321507930755615, "step": 6603} {"train_info/time_between_train_steps": 0.0030100345611572266, "step": 6603} {"info/global_step": 6604, "train_info/time_within_train_step": 2.7511374950408936, "step": 6604} {"train_info/time_between_train_steps": 0.0029823780059814453, "step": 6604} {"info/global_step": 6605, "train_info/time_within_train_step": 2.752751350402832, "step": 6605} {"train_info/time_between_train_steps": 0.0030319690704345703, "step": 6605} {"info/global_step": 6606, "train_info/time_within_train_step": 2.7560949325561523, "step": 6606} {"train_info/time_between_train_steps": 0.0029730796813964844, "step": 6606} {"info/global_step": 6607, "train_info/time_within_train_step": 2.7551066875457764, "step": 6607} {"train_info/time_between_train_steps": 0.0030062198638916016, "step": 6607} {"info/global_step": 6608, "train_info/time_within_train_step": 2.7555007934570312, "step": 6608} {"train_info/time_between_train_steps": 0.003106832504272461, "step": 6608} {"info/global_step": 6609, "train_info/time_within_train_step": 2.7560746669769287, "step": 6609} {"train_info/time_between_train_steps": 0.002961874008178711, "step": 6609} {"info/global_step": 6610, "train_info/time_within_train_step": 2.755948066711426, "step": 6610} {"train_info/time_between_train_steps": 0.0029485225677490234, "step": 6610} {"info/global_step": 6611, "train_info/time_within_train_step": 2.7561991214752197, "step": 6611} {"train_info/time_between_train_steps": 0.0028743743896484375, "step": 6611} {"info/global_step": 6612, "train_info/time_within_train_step": 2.7558488845825195, "step": 6612} {"train_info/time_between_train_steps": 0.002861499786376953, "step": 6612} {"info/global_step": 6613, "train_info/time_within_train_step": 2.7554006576538086, "step": 6613} {"train_info/time_between_train_steps": 0.002881288528442383, "step": 6613} {"info/global_step": 6614, "train_info/time_within_train_step": 2.755859375, "step": 6614} {"train_info/time_between_train_steps": 0.002930164337158203, "step": 6614} {"info/global_step": 6615, "train_info/time_within_train_step": 2.7559685707092285, "step": 6615} {"train_info/time_between_train_steps": 0.002951383590698242, "step": 6615} {"info/global_step": 6616, "train_info/time_within_train_step": 2.756772994995117, "step": 6616} {"train_info/time_between_train_steps": 0.0029878616333007812, "step": 6616} {"info/global_step": 6617, "train_info/time_within_train_step": 2.757012128829956, "step": 6617} {"train_info/time_between_train_steps": 0.0029616355895996094, "step": 6617} {"info/global_step": 6618, "train_info/time_within_train_step": 2.755948543548584, "step": 6618} {"train_info/time_between_train_steps": 0.0029027462005615234, "step": 6618} {"info/global_step": 6619, "train_info/time_within_train_step": 2.754373550415039, "step": 6619} {"train_info/time_between_train_steps": 0.0028493404388427734, "step": 6619} {"info/global_step": 6620, "train_info/time_within_train_step": 2.7548086643218994, "step": 6620} {"train_info/time_between_train_steps": 0.0028924942016601562, "step": 6620} {"info/global_step": 6621, "train_info/time_within_train_step": 2.755513906478882, "step": 6621} {"train_info/time_between_train_steps": 0.002900838851928711, "step": 6621} {"info/global_step": 6622, "train_info/time_within_train_step": 2.755070686340332, "step": 6622} {"train_info/time_between_train_steps": 0.002882242202758789, "step": 6622} {"info/global_step": 6623, "train_info/time_within_train_step": 2.7546489238739014, "step": 6623} {"train_info/time_between_train_steps": 0.0028781890869140625, "step": 6623} {"info/global_step": 6624, "train_info/time_within_train_step": 2.754363775253296, "step": 6624} {"train_info/time_between_train_steps": 0.0029191970825195312, "step": 6624} {"info/global_step": 6625, "train_info/time_within_train_step": 2.754265069961548, "step": 6625} {"train_info/time_between_train_steps": 0.002933025360107422, "step": 6625} {"info/global_step": 6626, "train_info/time_within_train_step": 2.7553775310516357, "step": 6626} {"train_info/time_between_train_steps": 0.002901315689086914, "step": 6626} {"info/global_step": 6627, "train_info/time_within_train_step": 2.755018711090088, "step": 6627} {"train_info/time_between_train_steps": 0.002885580062866211, "step": 6627} {"info/global_step": 6628, "train_info/time_within_train_step": 2.7556395530700684, "step": 6628} {"train_info/time_between_train_steps": 0.0029249191284179688, "step": 6628} {"info/global_step": 6629, "train_info/time_within_train_step": 2.755967855453491, "step": 6629} {"train_info/time_between_train_steps": 0.00296783447265625, "step": 6629} {"info/global_step": 6630, "train_info/time_within_train_step": 2.756166696548462, "step": 6630} {"train_info/time_between_train_steps": 0.0028791427612304688, "step": 6630} {"info/global_step": 6631, "train_info/time_within_train_step": 2.756946325302124, "step": 6631} {"train_info/time_between_train_steps": 0.0028922557830810547, "step": 6631} {"info/global_step": 6632, "train_info/time_within_train_step": 2.755382776260376, "step": 6632} {"train_info/time_between_train_steps": 0.0028901100158691406, "step": 6632} {"info/global_step": 6633, "train_info/time_within_train_step": 2.7561795711517334, "step": 6633} {"train_info/time_between_train_steps": 0.0028810501098632812, "step": 6633} {"info/global_step": 6634, "train_info/time_within_train_step": 2.7546958923339844, "step": 6634} {"train_info/time_between_train_steps": 0.0028929710388183594, "step": 6634} {"info/global_step": 6635, "train_info/time_within_train_step": 2.7542777061462402, "step": 6635} {"train_info/time_between_train_steps": 0.0029425621032714844, "step": 6635} {"info/global_step": 6636, "train_info/time_within_train_step": 2.7559032440185547, "step": 6636} {"train_info/time_between_train_steps": 0.002881765365600586, "step": 6636} {"info/global_step": 6637, "train_info/time_within_train_step": 2.7546846866607666, "step": 6637} {"train_info/time_between_train_steps": 0.0028753280639648438, "step": 6637} {"info/global_step": 6638, "train_info/time_within_train_step": 2.7547080516815186, "step": 6638} {"train_info/time_between_train_steps": 0.0028715133666992188, "step": 6638} {"info/global_step": 6639, "train_info/time_within_train_step": 2.754542350769043, "step": 6639} {"train_info/time_between_train_steps": 0.0028815269470214844, "step": 6639} {"info/global_step": 6640, "train_info/time_within_train_step": 2.7523815631866455, "step": 6640} {"train_info/time_between_train_steps": 0.00295257568359375, "step": 6640} {"info/global_step": 6641, "train_info/time_within_train_step": 2.754188299179077, "step": 6641} {"train_info/time_between_train_steps": 0.002890348434448242, "step": 6641} {"info/global_step": 6642, "train_info/time_within_train_step": 2.7554755210876465, "step": 6642} {"train_info/time_between_train_steps": 0.0028862953186035156, "step": 6642} {"info/global_step": 6643, "train_info/time_within_train_step": 2.753497838973999, "step": 6643} {"train_info/time_between_train_steps": 0.002905607223510742, "step": 6643} {"info/global_step": 6644, "train_info/time_within_train_step": 2.7543747425079346, "step": 6644} {"train_info/time_between_train_steps": 0.002888917922973633, "step": 6644} {"info/global_step": 6645, "train_info/time_within_train_step": 2.7544267177581787, "step": 6645} {"train_info/time_between_train_steps": 0.0028810501098632812, "step": 6645} {"info/global_step": 6646, "train_info/time_within_train_step": 2.7546608448028564, "step": 6646} {"train_info/time_between_train_steps": 0.002886056900024414, "step": 6646} {"info/global_step": 6647, "train_info/time_within_train_step": 2.7554023265838623, "step": 6647} {"train_info/time_between_train_steps": 0.00289154052734375, "step": 6647} {"info/global_step": 6648, "train_info/time_within_train_step": 2.754272699356079, "step": 6648} {"train_info/time_between_train_steps": 0.0028655529022216797, "step": 6648} {"info/global_step": 6649, "train_info/time_within_train_step": 2.7543153762817383, "step": 6649} {"train_info/time_between_train_steps": 0.0028808116912841797, "step": 6649} {"info/global_step": 6650, "train_info/time_within_train_step": 2.75358247756958, "step": 6650} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746585253, "_runtime": 19262}, "step": 6650} {"logs": {"train/loss": 3.3343, "train/learning_rate": 0.00022333333333333333, "train/epoch": 7.07, "_timestamp": 1746585253, "_runtime": 19262}, "step": 6650} {"train_info/time_between_train_steps": 0.00658416748046875, "step": 6650} {"info/global_step": 6651, "train_info/time_within_train_step": 2.7540411949157715, "step": 6651} {"train_info/time_between_train_steps": 0.0028634071350097656, "step": 6651} {"info/global_step": 6652, "train_info/time_within_train_step": 2.7540767192840576, "step": 6652} {"train_info/time_between_train_steps": 0.002869129180908203, "step": 6652} {"info/global_step": 6653, "train_info/time_within_train_step": 2.7540476322174072, "step": 6653} {"train_info/time_between_train_steps": 0.002905607223510742, "step": 6653} {"info/global_step": 6654, "train_info/time_within_train_step": 2.7532546520233154, "step": 6654} {"train_info/time_between_train_steps": 0.00290679931640625, "step": 6654} {"info/global_step": 6655, "train_info/time_within_train_step": 2.753460645675659, "step": 6655} {"train_info/time_between_train_steps": 0.002895355224609375, "step": 6655} {"info/global_step": 6656, "train_info/time_within_train_step": 2.753657341003418, "step": 6656} {"train_info/time_between_train_steps": 0.0029144287109375, "step": 6656} {"info/global_step": 6657, "train_info/time_within_train_step": 2.75254487991333, "step": 6657} {"train_info/time_between_train_steps": 0.0028777122497558594, "step": 6657} {"info/global_step": 6658, "train_info/time_within_train_step": 2.753763198852539, "step": 6658} {"train_info/time_between_train_steps": 0.0029134750366210938, "step": 6658} {"info/global_step": 6659, "train_info/time_within_train_step": 2.9007937908172607, "step": 6659} {"train_info/time_between_train_steps": 0.0028700828552246094, "step": 6659} {"info/global_step": 6660, "train_info/time_within_train_step": 2.754497528076172, "step": 6660} {"train_info/time_between_train_steps": 0.0028853416442871094, "step": 6660} {"info/global_step": 6661, "train_info/time_within_train_step": 2.7541658878326416, "step": 6661} {"train_info/time_between_train_steps": 0.002858400344848633, "step": 6661} {"info/global_step": 6662, "train_info/time_within_train_step": 2.7536256313323975, "step": 6662} {"train_info/time_between_train_steps": 0.002901792526245117, "step": 6662} {"info/global_step": 6663, "train_info/time_within_train_step": 2.7528371810913086, "step": 6663} {"train_info/time_between_train_steps": 0.002948284149169922, "step": 6663} {"info/global_step": 6664, "train_info/time_within_train_step": 2.754152536392212, "step": 6664} {"train_info/time_between_train_steps": 0.0028998851776123047, "step": 6664} {"info/global_step": 6665, "train_info/time_within_train_step": 2.7536661624908447, "step": 6665} {"train_info/time_between_train_steps": 0.0028645992279052734, "step": 6665} {"info/global_step": 6666, "train_info/time_within_train_step": 2.754361867904663, "step": 6666} {"train_info/time_between_train_steps": 0.0029175281524658203, "step": 6666} {"info/global_step": 6667, "train_info/time_within_train_step": 2.754573106765747, "step": 6667} {"train_info/time_between_train_steps": 0.0028641223907470703, "step": 6667} {"info/global_step": 6668, "train_info/time_within_train_step": 2.7542407512664795, "step": 6668} {"train_info/time_between_train_steps": 0.002847433090209961, "step": 6668} {"info/global_step": 6669, "train_info/time_within_train_step": 2.753514051437378, "step": 6669} {"train_info/time_between_train_steps": 0.0028929710388183594, "step": 6669} {"info/global_step": 6670, "train_info/time_within_train_step": 2.753883123397827, "step": 6670} {"train_info/time_between_train_steps": 0.002869129180908203, "step": 6670} {"info/global_step": 6671, "train_info/time_within_train_step": 2.75400710105896, "step": 6671} {"train_info/time_between_train_steps": 0.002883434295654297, "step": 6671} {"info/global_step": 6672, "train_info/time_within_train_step": 2.7531917095184326, "step": 6672} {"train_info/time_between_train_steps": 0.0028829574584960938, "step": 6672} {"info/global_step": 6673, "train_info/time_within_train_step": 2.753549098968506, "step": 6673} {"train_info/time_between_train_steps": 0.0029189586639404297, "step": 6673} {"info/global_step": 6674, "train_info/time_within_train_step": 2.75431227684021, "step": 6674} {"train_info/time_between_train_steps": 0.002856731414794922, "step": 6674} {"info/global_step": 6675, "train_info/time_within_train_step": 2.7540249824523926, "step": 6675} {"train_info/time_between_train_steps": 0.002893209457397461, "step": 6675} {"info/global_step": 6676, "train_info/time_within_train_step": 2.7542474269866943, "step": 6676} {"train_info/time_between_train_steps": 0.0028810501098632812, "step": 6676} {"info/global_step": 6677, "train_info/time_within_train_step": 2.7540206909179688, "step": 6677} {"train_info/time_between_train_steps": 0.002896547317504883, "step": 6677} {"info/global_step": 6678, "train_info/time_within_train_step": 2.754549503326416, "step": 6678} {"train_info/time_between_train_steps": 0.0028924942016601562, "step": 6678} {"info/global_step": 6679, "train_info/time_within_train_step": 2.752939224243164, "step": 6679} {"train_info/time_between_train_steps": 0.002897024154663086, "step": 6679} {"info/global_step": 6680, "train_info/time_within_train_step": 2.754037618637085, "step": 6680} {"train_info/time_between_train_steps": 0.0029048919677734375, "step": 6680} {"info/global_step": 6681, "train_info/time_within_train_step": 2.7539021968841553, "step": 6681} {"train_info/time_between_train_steps": 0.0028862953186035156, "step": 6681} {"info/global_step": 6682, "train_info/time_within_train_step": 2.753169298171997, "step": 6682} {"train_info/time_between_train_steps": 0.002934694290161133, "step": 6682} {"info/global_step": 6683, "train_info/time_within_train_step": 2.7509377002716064, "step": 6683} {"train_info/time_between_train_steps": 0.0028803348541259766, "step": 6683} {"info/global_step": 6684, "train_info/time_within_train_step": 2.7532684803009033, "step": 6684} {"train_info/time_between_train_steps": 0.0029256343841552734, "step": 6684} {"info/global_step": 6685, "train_info/time_within_train_step": 2.752656936645508, "step": 6685} {"train_info/time_between_train_steps": 0.002885103225708008, "step": 6685} {"info/global_step": 6686, "train_info/time_within_train_step": 2.7520158290863037, "step": 6686} {"train_info/time_between_train_steps": 0.0028874874114990234, "step": 6686} {"info/global_step": 6687, "train_info/time_within_train_step": 2.7532598972320557, "step": 6687} {"train_info/time_between_train_steps": 0.002893209457397461, "step": 6687} {"info/global_step": 6688, "train_info/time_within_train_step": 2.753389835357666, "step": 6688} {"train_info/time_between_train_steps": 0.0028781890869140625, "step": 6688} {"info/global_step": 6689, "train_info/time_within_train_step": 2.7537736892700195, "step": 6689} {"train_info/time_between_train_steps": 0.0028853416442871094, "step": 6689} {"info/global_step": 6690, "train_info/time_within_train_step": 2.754112482070923, "step": 6690} {"train_info/time_between_train_steps": 0.0029001235961914062, "step": 6690} {"info/global_step": 6691, "train_info/time_within_train_step": 2.7534239292144775, "step": 6691} {"train_info/time_between_train_steps": 0.0028831958770751953, "step": 6691} {"info/global_step": 6692, "train_info/time_within_train_step": 2.7548539638519287, "step": 6692} {"train_info/time_between_train_steps": 0.0030090808868408203, "step": 6692} {"info/global_step": 6693, "train_info/time_within_train_step": 2.755556344985962, "step": 6693} {"train_info/time_between_train_steps": 0.003066539764404297, "step": 6693} {"info/global_step": 6694, "train_info/time_within_train_step": 2.7550575733184814, "step": 6694} {"train_info/time_between_train_steps": 0.0029821395874023438, "step": 6694} {"info/global_step": 6695, "train_info/time_within_train_step": 2.755113363265991, "step": 6695} {"train_info/time_between_train_steps": 0.0029878616333007812, "step": 6695} {"info/global_step": 6696, "train_info/time_within_train_step": 2.7558655738830566, "step": 6696} {"train_info/time_between_train_steps": 0.00298309326171875, "step": 6696} {"info/global_step": 6697, "train_info/time_within_train_step": 2.7561378479003906, "step": 6697} {"train_info/time_between_train_steps": 0.0030341148376464844, "step": 6697} {"info/global_step": 6698, "train_info/time_within_train_step": 2.75490665435791, "step": 6698} {"train_info/time_between_train_steps": 0.0034215450286865234, "step": 6698} {"info/global_step": 6699, "train_info/time_within_train_step": 2.754281520843506, "step": 6699} {"train_info/time_between_train_steps": 0.003014802932739258, "step": 6699} {"info/global_step": 6700, "train_info/time_within_train_step": 2.7540957927703857, "step": 6700} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746585391, "_runtime": 19400}, "step": 6700} {"logs": {"train/loss": 3.3275, "train/learning_rate": 0.00021999999999999995, "train/epoch": 7.07, "_timestamp": 1746585391, "_runtime": 19400}, "step": 6700} {"train_info/time_between_train_steps": 0.014793157577514648, "step": 6700} {"info/global_step": 6701, "train_info/time_within_train_step": 2.7541558742523193, "step": 6701} {"train_info/time_between_train_steps": 0.0029761791229248047, "step": 6701} {"info/global_step": 6702, "train_info/time_within_train_step": 2.7544829845428467, "step": 6702} {"train_info/time_between_train_steps": 0.0029757022857666016, "step": 6702} {"info/global_step": 6703, "train_info/time_within_train_step": 2.7544972896575928, "step": 6703} {"train_info/time_between_train_steps": 0.00295257568359375, "step": 6703} {"info/global_step": 6704, "train_info/time_within_train_step": 2.7544047832489014, "step": 6704} {"train_info/time_between_train_steps": 0.00298309326171875, "step": 6704} {"info/global_step": 6705, "train_info/time_within_train_step": 2.753917694091797, "step": 6705} {"train_info/time_between_train_steps": 0.0029544830322265625, "step": 6705} {"info/global_step": 6706, "train_info/time_within_train_step": 2.7557852268218994, "step": 6706} {"train_info/time_between_train_steps": 0.0030336380004882812, "step": 6706} {"info/global_step": 6707, "train_info/time_within_train_step": 2.7547805309295654, "step": 6707} {"train_info/time_between_train_steps": 0.002900362014770508, "step": 6707} {"info/global_step": 6708, "train_info/time_within_train_step": 2.7531731128692627, "step": 6708} {"train_info/time_between_train_steps": 0.0028951168060302734, "step": 6708} {"info/global_step": 6709, "train_info/time_within_train_step": 2.752854824066162, "step": 6709} {"train_info/time_between_train_steps": 0.002898693084716797, "step": 6709} {"info/global_step": 6710, "train_info/time_within_train_step": 2.7504775524139404, "step": 6710} {"train_info/time_between_train_steps": 0.0028984546661376953, "step": 6710} {"info/global_step": 6711, "train_info/time_within_train_step": 2.753467321395874, "step": 6711} {"train_info/time_between_train_steps": 0.0028891563415527344, "step": 6711} {"info/global_step": 6712, "train_info/time_within_train_step": 2.754265546798706, "step": 6712} {"train_info/time_between_train_steps": 0.0028798580169677734, "step": 6712} {"info/global_step": 6713, "train_info/time_within_train_step": 2.7534902095794678, "step": 6713} {"train_info/time_between_train_steps": 0.0029044151306152344, "step": 6713} {"info/global_step": 6714, "train_info/time_within_train_step": 2.754127264022827, "step": 6714} {"train_info/time_between_train_steps": 0.0028913021087646484, "step": 6714} {"info/global_step": 6715, "train_info/time_within_train_step": 2.7536308765411377, "step": 6715} {"train_info/time_between_train_steps": 0.0029222965240478516, "step": 6715} {"info/global_step": 6716, "train_info/time_within_train_step": 2.7540245056152344, "step": 6716} {"train_info/time_between_train_steps": 0.0029075145721435547, "step": 6716} {"info/global_step": 6717, "train_info/time_within_train_step": 2.861508369445801, "step": 6717} {"train_info/time_between_train_steps": 0.002911090850830078, "step": 6717} {"info/global_step": 6718, "train_info/time_within_train_step": 2.754530429840088, "step": 6718} {"train_info/time_between_train_steps": 0.0029058456420898438, "step": 6718} {"info/global_step": 6719, "train_info/time_within_train_step": 2.752391815185547, "step": 6719} {"train_info/time_between_train_steps": 0.0028755664825439453, "step": 6719} {"info/global_step": 6720, "train_info/time_within_train_step": 2.753594398498535, "step": 6720} {"train_info/time_between_train_steps": 0.0028858184814453125, "step": 6720} {"info/global_step": 6721, "train_info/time_within_train_step": 2.7538135051727295, "step": 6721} {"train_info/time_between_train_steps": 0.0028753280639648438, "step": 6721} {"info/global_step": 6722, "train_info/time_within_train_step": 2.7543091773986816, "step": 6722} {"train_info/time_between_train_steps": 0.0029294490814208984, "step": 6722} {"info/global_step": 6723, "train_info/time_within_train_step": 2.753476619720459, "step": 6723} {"train_info/time_between_train_steps": 0.00286865234375, "step": 6723} {"info/global_step": 6724, "train_info/time_within_train_step": 2.7543420791625977, "step": 6724} {"train_info/time_between_train_steps": 0.002899169921875, "step": 6724} {"info/global_step": 6725, "train_info/time_within_train_step": 2.7515816688537598, "step": 6725} {"train_info/time_between_train_steps": 0.0028760433197021484, "step": 6725} {"info/global_step": 6726, "train_info/time_within_train_step": 2.7554328441619873, "step": 6726} {"train_info/time_between_train_steps": 0.0030052661895751953, "step": 6726} {"info/global_step": 6727, "train_info/time_within_train_step": 2.7557685375213623, "step": 6727} {"train_info/time_between_train_steps": 0.002974271774291992, "step": 6727} {"info/global_step": 6728, "train_info/time_within_train_step": 2.75545597076416, "step": 6728} {"train_info/time_between_train_steps": 0.003000974655151367, "step": 6728} {"info/global_step": 6729, "train_info/time_within_train_step": 2.7553153038024902, "step": 6729} {"train_info/time_between_train_steps": 0.002966165542602539, "step": 6729} {"info/global_step": 6730, "train_info/time_within_train_step": 2.7551193237304688, "step": 6730} {"train_info/time_between_train_steps": 0.0029647350311279297, "step": 6730} {"info/global_step": 6731, "train_info/time_within_train_step": 2.7531182765960693, "step": 6731} {"train_info/time_between_train_steps": 0.0029802322387695312, "step": 6731} {"info/global_step": 6732, "train_info/time_within_train_step": 2.754565477371216, "step": 6732} {"train_info/time_between_train_steps": 0.0033292770385742188, "step": 6732} {"info/global_step": 6733, "train_info/time_within_train_step": 2.7550902366638184, "step": 6733} {"train_info/time_between_train_steps": 0.0029938220977783203, "step": 6733} {"info/global_step": 6734, "train_info/time_within_train_step": 2.7552273273468018, "step": 6734} {"train_info/time_between_train_steps": 0.0029785633087158203, "step": 6734} {"info/global_step": 6735, "train_info/time_within_train_step": 2.754826307296753, "step": 6735} {"train_info/time_between_train_steps": 0.0029571056365966797, "step": 6735} {"info/global_step": 6736, "train_info/time_within_train_step": 2.754534959793091, "step": 6736} {"train_info/time_between_train_steps": 0.0030317306518554688, "step": 6736} {"info/global_step": 6737, "train_info/time_within_train_step": 2.754424810409546, "step": 6737} {"train_info/time_between_train_steps": 0.003151416778564453, "step": 6737} {"info/global_step": 6738, "train_info/time_within_train_step": 2.75441312789917, "step": 6738} {"train_info/time_between_train_steps": 0.002964019775390625, "step": 6738} {"info/global_step": 6739, "train_info/time_within_train_step": 2.7544989585876465, "step": 6739} {"train_info/time_between_train_steps": 0.002985715866088867, "step": 6739} {"info/global_step": 6740, "train_info/time_within_train_step": 2.755791664123535, "step": 6740} {"train_info/time_between_train_steps": 0.005923748016357422, "step": 6740} {"info/global_step": 6741, "train_info/time_within_train_step": 2.7566659450531006, "step": 6741} {"train_info/time_between_train_steps": 0.0060002803802490234, "step": 6741} {"info/global_step": 6742, "train_info/time_within_train_step": 2.7564074993133545, "step": 6742} {"train_info/time_between_train_steps": 0.005843400955200195, "step": 6742} {"info/global_step": 6743, "train_info/time_within_train_step": 2.754352331161499, "step": 6743} {"train_info/time_between_train_steps": 0.0059299468994140625, "step": 6743} {"info/global_step": 6744, "train_info/time_within_train_step": 2.7587504386901855, "step": 6744} {"train_info/time_between_train_steps": 0.003001689910888672, "step": 6744} {"info/global_step": 6745, "train_info/time_within_train_step": 2.7556488513946533, "step": 6745} {"train_info/time_between_train_steps": 0.0029850006103515625, "step": 6745} {"info/global_step": 6746, "train_info/time_within_train_step": 2.755115509033203, "step": 6746} {"train_info/time_between_train_steps": 0.002961397171020508, "step": 6746} {"info/global_step": 6747, "train_info/time_within_train_step": 3.346583127975464, "step": 6747} {"train_info/time_between_train_steps": 0.002989053726196289, "step": 6747} {"info/global_step": 6748, "train_info/time_within_train_step": 2.756268262863159, "step": 6748} {"train_info/time_between_train_steps": 0.0029904842376708984, "step": 6748} {"info/global_step": 6749, "train_info/time_within_train_step": 2.756110429763794, "step": 6749} {"train_info/time_between_train_steps": 0.002995014190673828, "step": 6749} {"info/global_step": 6750, "train_info/time_within_train_step": 2.7537553310394287, "step": 6750} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746585530, "_runtime": 19539}, "step": 6750} {"logs": {"train/loss": 3.3135, "train/learning_rate": 0.00021666666666666666, "train/epoch": 7.08, "_timestamp": 1746585530, "_runtime": 19539}, "step": 6750} {"train_info/time_between_train_steps": 0.006742238998413086, "step": 6750} {"info/global_step": 6751, "train_info/time_within_train_step": 2.7554421424865723, "step": 6751} {"train_info/time_between_train_steps": 0.0029654502868652344, "step": 6751} {"info/global_step": 6752, "train_info/time_within_train_step": 2.755279302597046, "step": 6752} {"train_info/time_between_train_steps": 0.0030090808868408203, "step": 6752} {"info/global_step": 6753, "train_info/time_within_train_step": 2.7553186416625977, "step": 6753} {"train_info/time_between_train_steps": 0.002977609634399414, "step": 6753} {"info/global_step": 6754, "train_info/time_within_train_step": 2.7547483444213867, "step": 6754} {"train_info/time_between_train_steps": 0.0029451847076416016, "step": 6754} {"info/global_step": 6755, "train_info/time_within_train_step": 2.754349708557129, "step": 6755} {"train_info/time_between_train_steps": 0.0030012130737304688, "step": 6755} {"info/global_step": 6756, "train_info/time_within_train_step": 2.7543387413024902, "step": 6756} {"train_info/time_between_train_steps": 0.0029876232147216797, "step": 6756} {"info/global_step": 6757, "train_info/time_within_train_step": 2.834956407546997, "step": 6757} {"train_info/time_between_train_steps": 0.0029976367950439453, "step": 6757} {"info/global_step": 6758, "train_info/time_within_train_step": 2.7547943592071533, "step": 6758} {"train_info/time_between_train_steps": 0.00299835205078125, "step": 6758} {"info/global_step": 6759, "train_info/time_within_train_step": 2.7553813457489014, "step": 6759} {"train_info/time_between_train_steps": 0.0029990673065185547, "step": 6759} {"info/global_step": 6760, "train_info/time_within_train_step": 2.7548000812530518, "step": 6760} {"train_info/time_between_train_steps": 0.0029451847076416016, "step": 6760} {"info/global_step": 6761, "train_info/time_within_train_step": 2.7542014122009277, "step": 6761} {"train_info/time_between_train_steps": 0.002988576889038086, "step": 6761} {"info/global_step": 6762, "train_info/time_within_train_step": 2.754430055618286, "step": 6762} {"train_info/time_between_train_steps": 0.0029840469360351562, "step": 6762} {"info/global_step": 6763, "train_info/time_within_train_step": 2.7549004554748535, "step": 6763} {"train_info/time_between_train_steps": 0.002961874008178711, "step": 6763} {"info/global_step": 6764, "train_info/time_within_train_step": 2.7544004917144775, "step": 6764} {"train_info/time_between_train_steps": 0.00299072265625, "step": 6764} {"info/global_step": 6765, "train_info/time_within_train_step": 2.7534337043762207, "step": 6765} {"train_info/time_between_train_steps": 0.002990245819091797, "step": 6765} {"info/global_step": 6766, "train_info/time_within_train_step": 2.754711866378784, "step": 6766} {"train_info/time_between_train_steps": 0.0030035972595214844, "step": 6766} {"info/global_step": 6767, "train_info/time_within_train_step": 2.7540106773376465, "step": 6767} {"train_info/time_between_train_steps": 0.0029752254486083984, "step": 6767} {"info/global_step": 6768, "train_info/time_within_train_step": 2.754742383956909, "step": 6768} {"train_info/time_between_train_steps": 0.002972126007080078, "step": 6768} {"info/global_step": 6769, "train_info/time_within_train_step": 2.753800630569458, "step": 6769} {"train_info/time_between_train_steps": 0.0028679370880126953, "step": 6769} {"info/global_step": 6770, "train_info/time_within_train_step": 2.7527291774749756, "step": 6770} {"train_info/time_between_train_steps": 0.0029311180114746094, "step": 6770} {"info/global_step": 6771, "train_info/time_within_train_step": 2.752930164337158, "step": 6771} {"train_info/time_between_train_steps": 0.002882242202758789, "step": 6771} {"info/global_step": 6772, "train_info/time_within_train_step": 2.7532262802124023, "step": 6772} {"train_info/time_between_train_steps": 0.0028884410858154297, "step": 6772} {"info/global_step": 6773, "train_info/time_within_train_step": 2.754213571548462, "step": 6773} {"train_info/time_between_train_steps": 0.0029752254486083984, "step": 6773} {"info/global_step": 6774, "train_info/time_within_train_step": 2.7539660930633545, "step": 6774} {"train_info/time_between_train_steps": 0.0028488636016845703, "step": 6774} {"info/global_step": 6775, "train_info/time_within_train_step": 2.754848003387451, "step": 6775} {"train_info/time_between_train_steps": 0.002885103225708008, "step": 6775} {"info/global_step": 6776, "train_info/time_within_train_step": 2.754124641418457, "step": 6776} {"train_info/time_between_train_steps": 0.002848386764526367, "step": 6776} {"info/global_step": 6777, "train_info/time_within_train_step": 2.7538726329803467, "step": 6777} {"train_info/time_between_train_steps": 0.0028867721557617188, "step": 6777} {"info/global_step": 6778, "train_info/time_within_train_step": 2.752774953842163, "step": 6778} {"train_info/time_between_train_steps": 0.0028874874114990234, "step": 6778} {"info/global_step": 6779, "train_info/time_within_train_step": 2.7544775009155273, "step": 6779} {"train_info/time_between_train_steps": 0.0028862953186035156, "step": 6779} {"info/global_step": 6780, "train_info/time_within_train_step": 2.754011869430542, "step": 6780} {"train_info/time_between_train_steps": 0.002882719039916992, "step": 6780} {"info/global_step": 6781, "train_info/time_within_train_step": 2.7530839443206787, "step": 6781} {"train_info/time_between_train_steps": 0.0028946399688720703, "step": 6781} {"info/global_step": 6782, "train_info/time_within_train_step": 2.7538626194000244, "step": 6782} {"train_info/time_between_train_steps": 0.002896547317504883, "step": 6782} {"info/global_step": 6783, "train_info/time_within_train_step": 2.753502130508423, "step": 6783} {"train_info/time_between_train_steps": 0.002870798110961914, "step": 6783} {"info/global_step": 6784, "train_info/time_within_train_step": 2.7532081604003906, "step": 6784} {"train_info/time_between_train_steps": 0.002930164337158203, "step": 6784} {"info/global_step": 6785, "train_info/time_within_train_step": 2.7532243728637695, "step": 6785} {"train_info/time_between_train_steps": 0.0029096603393554688, "step": 6785} {"info/global_step": 6786, "train_info/time_within_train_step": 2.753026247024536, "step": 6786} {"train_info/time_between_train_steps": 0.002900362014770508, "step": 6786} {"info/global_step": 6787, "train_info/time_within_train_step": 2.752701997756958, "step": 6787} {"train_info/time_between_train_steps": 0.002875089645385742, "step": 6787} {"info/global_step": 6788, "train_info/time_within_train_step": 2.7537951469421387, "step": 6788} {"train_info/time_between_train_steps": 0.0028994083404541016, "step": 6788} {"info/global_step": 6789, "train_info/time_within_train_step": 2.753936529159546, "step": 6789} {"train_info/time_between_train_steps": 0.002936124801635742, "step": 6789} {"info/global_step": 6790, "train_info/time_within_train_step": 2.7543907165527344, "step": 6790} {"train_info/time_between_train_steps": 0.002913236618041992, "step": 6790} {"info/global_step": 6791, "train_info/time_within_train_step": 2.7542221546173096, "step": 6791} {"train_info/time_between_train_steps": 0.0029129981994628906, "step": 6791} {"info/global_step": 6792, "train_info/time_within_train_step": 2.7537577152252197, "step": 6792} {"train_info/time_between_train_steps": 0.002899646759033203, "step": 6792} {"info/global_step": 6793, "train_info/time_within_train_step": 2.7540123462677, "step": 6793} {"train_info/time_between_train_steps": 0.0030198097229003906, "step": 6793} {"info/global_step": 6794, "train_info/time_within_train_step": 2.7541935443878174, "step": 6794} {"train_info/time_between_train_steps": 0.0028676986694335938, "step": 6794} {"info/global_step": 6795, "train_info/time_within_train_step": 2.753779888153076, "step": 6795} {"train_info/time_between_train_steps": 0.0029625892639160156, "step": 6795} {"info/global_step": 6796, "train_info/time_within_train_step": 2.7537293434143066, "step": 6796} {"train_info/time_between_train_steps": 0.00298309326171875, "step": 6796} {"info/global_step": 6797, "train_info/time_within_train_step": 2.7534239292144775, "step": 6797} {"train_info/time_between_train_steps": 0.0029211044311523438, "step": 6797} {"info/global_step": 6798, "train_info/time_within_train_step": 2.752450466156006, "step": 6798} {"train_info/time_between_train_steps": 0.0029952526092529297, "step": 6798} {"info/global_step": 6799, "train_info/time_within_train_step": 2.7532782554626465, "step": 6799} {"train_info/time_between_train_steps": 0.002959728240966797, "step": 6799} {"info/global_step": 6800, "train_info/time_within_train_step": 2.7532668113708496, "step": 6800} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746585668, "_runtime": 19677}, "step": 6800} {"logs": {"train/loss": 3.3067, "train/learning_rate": 0.00021333333333333333, "train/epoch": 7.08, "_timestamp": 1746585668, "_runtime": 19677}, "step": 6800} {"train_info/time_between_train_steps": 15.62965178489685, "step": 6800} {"info/global_step": 6801, "train_info/time_within_train_step": 2.532175302505493, "step": 6801} {"train_info/time_between_train_steps": 0.006304025650024414, "step": 6801} {"info/global_step": 6802, "train_info/time_within_train_step": 2.590942621231079, "step": 6802} {"train_info/time_between_train_steps": 0.0059795379638671875, "step": 6802} {"info/global_step": 6803, "train_info/time_within_train_step": 2.7164371013641357, "step": 6803} {"train_info/time_between_train_steps": 0.006143808364868164, "step": 6803} {"info/global_step": 6804, "train_info/time_within_train_step": 2.7487406730651855, "step": 6804} {"train_info/time_between_train_steps": 0.006099700927734375, "step": 6804} {"info/global_step": 6805, "train_info/time_within_train_step": 2.7486703395843506, "step": 6805} {"train_info/time_between_train_steps": 0.006061553955078125, "step": 6805} {"info/global_step": 6806, "train_info/time_within_train_step": 2.75392484664917, "step": 6806} {"train_info/time_between_train_steps": 0.00623774528503418, "step": 6806} {"info/global_step": 6807, "train_info/time_within_train_step": 2.7531838417053223, "step": 6807} {"train_info/time_between_train_steps": 0.003018617630004883, "step": 6807} {"info/global_step": 6808, "train_info/time_within_train_step": 2.753758192062378, "step": 6808} {"train_info/time_between_train_steps": 0.0063707828521728516, "step": 6808} {"info/global_step": 6809, "train_info/time_within_train_step": 2.7551541328430176, "step": 6809} {"train_info/time_between_train_steps": 0.006180286407470703, "step": 6809} {"info/global_step": 6810, "train_info/time_within_train_step": 2.755523204803467, "step": 6810} {"train_info/time_between_train_steps": 0.006216287612915039, "step": 6810} {"info/global_step": 6811, "train_info/time_within_train_step": 2.7561936378479004, "step": 6811} {"train_info/time_between_train_steps": 0.006186723709106445, "step": 6811} {"info/global_step": 6812, "train_info/time_within_train_step": 2.7564988136291504, "step": 6812} {"train_info/time_between_train_steps": 0.006192922592163086, "step": 6812} {"info/global_step": 6813, "train_info/time_within_train_step": 2.757551431655884, "step": 6813} {"train_info/time_between_train_steps": 0.006119966506958008, "step": 6813} {"info/global_step": 6814, "train_info/time_within_train_step": 2.7579493522644043, "step": 6814} {"train_info/time_between_train_steps": 0.006522417068481445, "step": 6814} {"info/global_step": 6815, "train_info/time_within_train_step": 2.7574479579925537, "step": 6815} {"train_info/time_between_train_steps": 0.006604433059692383, "step": 6815} {"info/global_step": 6816, "train_info/time_within_train_step": 2.758004903793335, "step": 6816} {"train_info/time_between_train_steps": 0.0063838958740234375, "step": 6816} {"info/global_step": 6817, "train_info/time_within_train_step": 2.759207248687744, "step": 6817} {"train_info/time_between_train_steps": 0.006453990936279297, "step": 6817} {"info/global_step": 6818, "train_info/time_within_train_step": 2.7582008838653564, "step": 6818} {"train_info/time_between_train_steps": 0.006303548812866211, "step": 6818} {"info/global_step": 6819, "train_info/time_within_train_step": 2.7580251693725586, "step": 6819} {"train_info/time_between_train_steps": 0.006485700607299805, "step": 6819} {"info/global_step": 6820, "train_info/time_within_train_step": 2.7574946880340576, "step": 6820} {"train_info/time_between_train_steps": 0.006673336029052734, "step": 6820} {"info/global_step": 6821, "train_info/time_within_train_step": 2.7573397159576416, "step": 6821} {"train_info/time_between_train_steps": 0.006853342056274414, "step": 6821} {"info/global_step": 6822, "train_info/time_within_train_step": 2.7580652236938477, "step": 6822} {"train_info/time_between_train_steps": 0.006769418716430664, "step": 6822} {"info/global_step": 6823, "train_info/time_within_train_step": 2.7586162090301514, "step": 6823} {"train_info/time_between_train_steps": 0.007091522216796875, "step": 6823} {"info/global_step": 6824, "train_info/time_within_train_step": 2.758030891418457, "step": 6824} {"train_info/time_between_train_steps": 0.0069904327392578125, "step": 6824} {"train_info/time_between_train_steps": 3.4545741081237793, "step": 6824} {"info/global_step": 6825, "train_info/time_within_train_step": 2.7145638465881348, "step": 6825} {"train_info/time_between_train_steps": 0.006458282470703125, "step": 6825} {"info/global_step": 6826, "train_info/time_within_train_step": 2.7558183670043945, "step": 6826} {"train_info/time_between_train_steps": 0.003093242645263672, "step": 6826} {"info/global_step": 6827, "train_info/time_within_train_step": 2.757840633392334, "step": 6827} {"train_info/time_between_train_steps": 0.006485462188720703, "step": 6827} {"info/global_step": 6828, "train_info/time_within_train_step": 2.7569658756256104, "step": 6828} {"train_info/time_between_train_steps": 0.0031468868255615234, "step": 6828} {"info/global_step": 6829, "train_info/time_within_train_step": 2.755812883377075, "step": 6829} {"train_info/time_between_train_steps": 0.0031137466430664062, "step": 6829} {"info/global_step": 6830, "train_info/time_within_train_step": 2.756068468093872, "step": 6830} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 6830} {"info/global_step": 6831, "train_info/time_within_train_step": 2.7559890747070312, "step": 6831} {"train_info/time_between_train_steps": 0.003131389617919922, "step": 6831} {"info/global_step": 6832, "train_info/time_within_train_step": 2.756702423095703, "step": 6832} {"train_info/time_between_train_steps": 0.0031223297119140625, "step": 6832} {"info/global_step": 6833, "train_info/time_within_train_step": 2.755368947982788, "step": 6833} {"train_info/time_between_train_steps": 0.0036439895629882812, "step": 6833} {"info/global_step": 6834, "train_info/time_within_train_step": 2.755581855773926, "step": 6834} {"train_info/time_between_train_steps": 0.0031156539916992188, "step": 6834} {"info/global_step": 6835, "train_info/time_within_train_step": 2.755963087081909, "step": 6835} {"train_info/time_between_train_steps": 0.003140687942504883, "step": 6835} {"info/global_step": 6836, "train_info/time_within_train_step": 2.7543857097625732, "step": 6836} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 6836} {"info/global_step": 6837, "train_info/time_within_train_step": 2.7546708583831787, "step": 6837} {"train_info/time_between_train_steps": 0.003160715103149414, "step": 6837} {"info/global_step": 6838, "train_info/time_within_train_step": 2.7567591667175293, "step": 6838} {"train_info/time_between_train_steps": 0.0031251907348632812, "step": 6838} {"info/global_step": 6839, "train_info/time_within_train_step": 2.756452798843384, "step": 6839} {"train_info/time_between_train_steps": 0.003110170364379883, "step": 6839} {"info/global_step": 6840, "train_info/time_within_train_step": 2.756643772125244, "step": 6840} {"train_info/time_between_train_steps": 0.00311279296875, "step": 6840} {"info/global_step": 6841, "train_info/time_within_train_step": 2.756014347076416, "step": 6841} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 6841} {"info/global_step": 6842, "train_info/time_within_train_step": 2.7559571266174316, "step": 6842} {"train_info/time_between_train_steps": 0.0032732486724853516, "step": 6842} {"info/global_step": 6843, "train_info/time_within_train_step": 2.755725860595703, "step": 6843} {"train_info/time_between_train_steps": 0.003121614456176758, "step": 6843} {"info/global_step": 6844, "train_info/time_within_train_step": 2.7560958862304688, "step": 6844} {"train_info/time_between_train_steps": 0.003175973892211914, "step": 6844} {"info/global_step": 6845, "train_info/time_within_train_step": 2.7787842750549316, "step": 6845} {"train_info/time_between_train_steps": 0.0030961036682128906, "step": 6845} {"info/global_step": 6846, "train_info/time_within_train_step": 2.7560274600982666, "step": 6846} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 6846} {"info/global_step": 6847, "train_info/time_within_train_step": 2.7553088665008545, "step": 6847} {"train_info/time_between_train_steps": 0.003131389617919922, "step": 6847} {"info/global_step": 6848, "train_info/time_within_train_step": 2.7551751136779785, "step": 6848} {"train_info/time_between_train_steps": 0.0031049251556396484, "step": 6848} {"info/global_step": 6849, "train_info/time_within_train_step": 2.7557101249694824, "step": 6849} {"train_info/time_between_train_steps": 0.0030972957611083984, "step": 6849} {"info/global_step": 6850, "train_info/time_within_train_step": 2.755312442779541, "step": 6850} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746585825, "_runtime": 19834}, "step": 6850} {"logs": {"train/loss": 3.3416, "train/learning_rate": 0.00020999999999999998, "train/epoch": 8.0, "_timestamp": 1746585825, "_runtime": 19834}, "step": 6850} {"train_info/time_between_train_steps": 0.013255596160888672, "step": 6850} {"info/global_step": 6851, "train_info/time_within_train_step": 2.97054386138916, "step": 6851} {"train_info/time_between_train_steps": 0.003155231475830078, "step": 6851} {"info/global_step": 6852, "train_info/time_within_train_step": 2.755157232284546, "step": 6852} {"train_info/time_between_train_steps": 0.003117799758911133, "step": 6852} {"info/global_step": 6853, "train_info/time_within_train_step": 2.755448341369629, "step": 6853} {"train_info/time_between_train_steps": 0.003184795379638672, "step": 6853} {"info/global_step": 6854, "train_info/time_within_train_step": 2.754645586013794, "step": 6854} {"train_info/time_between_train_steps": 0.003159761428833008, "step": 6854} {"info/global_step": 6855, "train_info/time_within_train_step": 2.757190227508545, "step": 6855} {"train_info/time_between_train_steps": 0.003351926803588867, "step": 6855} {"info/global_step": 6856, "train_info/time_within_train_step": 2.7565689086914062, "step": 6856} {"train_info/time_between_train_steps": 0.003245115280151367, "step": 6856} {"info/global_step": 6857, "train_info/time_within_train_step": 2.7598953247070312, "step": 6857} {"train_info/time_between_train_steps": 0.0033113956451416016, "step": 6857} {"info/global_step": 6858, "train_info/time_within_train_step": 2.7566847801208496, "step": 6858} {"train_info/time_between_train_steps": 0.0033292770385742188, "step": 6858} {"info/global_step": 6859, "train_info/time_within_train_step": 2.756657361984253, "step": 6859} {"train_info/time_between_train_steps": 0.0032968521118164062, "step": 6859} {"info/global_step": 6860, "train_info/time_within_train_step": 2.756664991378784, "step": 6860} {"train_info/time_between_train_steps": 0.0032777786254882812, "step": 6860} {"info/global_step": 6861, "train_info/time_within_train_step": 2.75681209564209, "step": 6861} {"train_info/time_between_train_steps": 0.003294229507446289, "step": 6861} {"info/global_step": 6862, "train_info/time_within_train_step": 2.7564995288848877, "step": 6862} {"train_info/time_between_train_steps": 0.003306150436401367, "step": 6862} {"info/global_step": 6863, "train_info/time_within_train_step": 2.757675886154175, "step": 6863} {"train_info/time_between_train_steps": 0.0033271312713623047, "step": 6863} {"info/global_step": 6864, "train_info/time_within_train_step": 2.7575197219848633, "step": 6864} {"train_info/time_between_train_steps": 0.003493785858154297, "step": 6864} {"info/global_step": 6865, "train_info/time_within_train_step": 2.758514165878296, "step": 6865} {"train_info/time_between_train_steps": 0.0032777786254882812, "step": 6865} {"info/global_step": 6866, "train_info/time_within_train_step": 2.756113052368164, "step": 6866} {"train_info/time_between_train_steps": 0.0033025741577148438, "step": 6866} {"info/global_step": 6867, "train_info/time_within_train_step": 2.7578959465026855, "step": 6867} {"train_info/time_between_train_steps": 0.003287792205810547, "step": 6867} {"info/global_step": 6868, "train_info/time_within_train_step": 2.7576122283935547, "step": 6868} {"train_info/time_between_train_steps": 0.0032508373260498047, "step": 6868} {"info/global_step": 6869, "train_info/time_within_train_step": 2.757158041000366, "step": 6869} {"train_info/time_between_train_steps": 0.0033223628997802734, "step": 6869} {"info/global_step": 6870, "train_info/time_within_train_step": 2.7563507556915283, "step": 6870} {"train_info/time_between_train_steps": 0.0032711029052734375, "step": 6870} {"info/global_step": 6871, "train_info/time_within_train_step": 2.757021188735962, "step": 6871} {"train_info/time_between_train_steps": 0.0032906532287597656, "step": 6871} {"info/global_step": 6872, "train_info/time_within_train_step": 2.75679087638855, "step": 6872} {"train_info/time_between_train_steps": 0.0032739639282226562, "step": 6872} {"info/global_step": 6873, "train_info/time_within_train_step": 2.757258892059326, "step": 6873} {"train_info/time_between_train_steps": 0.003373861312866211, "step": 6873} {"info/global_step": 6874, "train_info/time_within_train_step": 2.7554922103881836, "step": 6874} {"train_info/time_between_train_steps": 0.003274202346801758, "step": 6874} {"info/global_step": 6875, "train_info/time_within_train_step": 2.75758695602417, "step": 6875} {"train_info/time_between_train_steps": 0.003282785415649414, "step": 6875} {"info/global_step": 6876, "train_info/time_within_train_step": 2.7573859691619873, "step": 6876} {"train_info/time_between_train_steps": 0.003307342529296875, "step": 6876} {"info/global_step": 6877, "train_info/time_within_train_step": 2.7578752040863037, "step": 6877} {"train_info/time_between_train_steps": 0.0033402442932128906, "step": 6877} {"info/global_step": 6878, "train_info/time_within_train_step": 2.756410837173462, "step": 6878} {"train_info/time_between_train_steps": 0.0033152103424072266, "step": 6878} {"info/global_step": 6879, "train_info/time_within_train_step": 2.7568159103393555, "step": 6879} {"train_info/time_between_train_steps": 0.0032701492309570312, "step": 6879} {"info/global_step": 6880, "train_info/time_within_train_step": 2.7569527626037598, "step": 6880} {"train_info/time_between_train_steps": 0.003314495086669922, "step": 6880} {"info/global_step": 6881, "train_info/time_within_train_step": 2.756843328475952, "step": 6881} {"train_info/time_between_train_steps": 0.0033054351806640625, "step": 6881} {"info/global_step": 6882, "train_info/time_within_train_step": 2.757641553878784, "step": 6882} {"train_info/time_between_train_steps": 0.0033011436462402344, "step": 6882} {"info/global_step": 6883, "train_info/time_within_train_step": 2.757798194885254, "step": 6883} {"train_info/time_between_train_steps": 0.0032777786254882812, "step": 6883} {"info/global_step": 6884, "train_info/time_within_train_step": 2.756662607192993, "step": 6884} {"train_info/time_between_train_steps": 0.0032999515533447266, "step": 6884} {"info/global_step": 6885, "train_info/time_within_train_step": 2.756993532180786, "step": 6885} {"train_info/time_between_train_steps": 0.0032758712768554688, "step": 6885} {"info/global_step": 6886, "train_info/time_within_train_step": 2.7575793266296387, "step": 6886} {"train_info/time_between_train_steps": 0.003335714340209961, "step": 6886} {"info/global_step": 6887, "train_info/time_within_train_step": 2.879669666290283, "step": 6887} {"train_info/time_between_train_steps": 0.0033998489379882812, "step": 6887} {"info/global_step": 6888, "train_info/time_within_train_step": 2.7570018768310547, "step": 6888} {"train_info/time_between_train_steps": 0.003367900848388672, "step": 6888} {"info/global_step": 6889, "train_info/time_within_train_step": 2.757314682006836, "step": 6889} {"train_info/time_between_train_steps": 0.003278493881225586, "step": 6889} {"info/global_step": 6890, "train_info/time_within_train_step": 2.757312774658203, "step": 6890} {"train_info/time_between_train_steps": 0.003342866897583008, "step": 6890} {"info/global_step": 6891, "train_info/time_within_train_step": 2.7572898864746094, "step": 6891} {"train_info/time_between_train_steps": 0.003299236297607422, "step": 6891} {"info/global_step": 6892, "train_info/time_within_train_step": 2.7579827308654785, "step": 6892} {"train_info/time_between_train_steps": 0.0033245086669921875, "step": 6892} {"info/global_step": 6893, "train_info/time_within_train_step": 2.757784366607666, "step": 6893} {"train_info/time_between_train_steps": 0.0033223628997802734, "step": 6893} {"info/global_step": 6894, "train_info/time_within_train_step": 2.757615089416504, "step": 6894} {"train_info/time_between_train_steps": 0.0032825469970703125, "step": 6894} {"info/global_step": 6895, "train_info/time_within_train_step": 2.7567834854125977, "step": 6895} {"train_info/time_between_train_steps": 0.0033261775970458984, "step": 6895} {"info/global_step": 6896, "train_info/time_within_train_step": 2.756742477416992, "step": 6896} {"train_info/time_between_train_steps": 0.003303050994873047, "step": 6896} {"info/global_step": 6897, "train_info/time_within_train_step": 2.7575368881225586, "step": 6897} {"train_info/time_between_train_steps": 0.003465890884399414, "step": 6897} {"info/global_step": 6898, "train_info/time_within_train_step": 2.7573750019073486, "step": 6898} {"train_info/time_between_train_steps": 0.0033104419708251953, "step": 6898} {"info/global_step": 6899, "train_info/time_within_train_step": 2.7565650939941406, "step": 6899} {"train_info/time_between_train_steps": 0.0033075809478759766, "step": 6899} {"info/global_step": 6900, "train_info/time_within_train_step": 2.757533311843872, "step": 6900} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746585964, "_runtime": 19973}, "step": 6900} {"logs": {"train/loss": 3.2922, "train/learning_rate": 0.00020666666666666666, "train/epoch": 8.01, "_timestamp": 1746585964, "_runtime": 19973}, "step": 6900} {"train_info/time_between_train_steps": 0.013087987899780273, "step": 6900} {"info/global_step": 6901, "train_info/time_within_train_step": 2.7579548358917236, "step": 6901} {"train_info/time_between_train_steps": 0.0033369064331054688, "step": 6901} {"info/global_step": 6902, "train_info/time_within_train_step": 2.7576446533203125, "step": 6902} {"train_info/time_between_train_steps": 0.0033006668090820312, "step": 6902} {"info/global_step": 6903, "train_info/time_within_train_step": 2.7570977210998535, "step": 6903} {"train_info/time_between_train_steps": 0.0032808780670166016, "step": 6903} {"info/global_step": 6904, "train_info/time_within_train_step": 2.757718563079834, "step": 6904} {"train_info/time_between_train_steps": 0.003378629684448242, "step": 6904} {"info/global_step": 6905, "train_info/time_within_train_step": 2.7570841312408447, "step": 6905} {"train_info/time_between_train_steps": 0.003306865692138672, "step": 6905} {"info/global_step": 6906, "train_info/time_within_train_step": 2.7577457427978516, "step": 6906} {"train_info/time_between_train_steps": 0.0033206939697265625, "step": 6906} {"info/global_step": 6907, "train_info/time_within_train_step": 2.7576730251312256, "step": 6907} {"train_info/time_between_train_steps": 0.003325939178466797, "step": 6907} {"info/global_step": 6908, "train_info/time_within_train_step": 2.7577149868011475, "step": 6908} {"train_info/time_between_train_steps": 0.003336191177368164, "step": 6908} {"info/global_step": 6909, "train_info/time_within_train_step": 2.7575860023498535, "step": 6909} {"train_info/time_between_train_steps": 0.0032720565795898438, "step": 6909} {"info/global_step": 6910, "train_info/time_within_train_step": 2.7566404342651367, "step": 6910} {"train_info/time_between_train_steps": 0.003349781036376953, "step": 6910} {"info/global_step": 6911, "train_info/time_within_train_step": 2.7582387924194336, "step": 6911} {"train_info/time_between_train_steps": 0.003353595733642578, "step": 6911} {"info/global_step": 6912, "train_info/time_within_train_step": 2.757391929626465, "step": 6912} {"train_info/time_between_train_steps": 0.0033359527587890625, "step": 6912} {"info/global_step": 6913, "train_info/time_within_train_step": 2.757747173309326, "step": 6913} {"train_info/time_between_train_steps": 0.003320455551147461, "step": 6913} {"info/global_step": 6914, "train_info/time_within_train_step": 2.7563230991363525, "step": 6914} {"train_info/time_between_train_steps": 0.0032966136932373047, "step": 6914} {"info/global_step": 6915, "train_info/time_within_train_step": 2.7579948902130127, "step": 6915} {"train_info/time_between_train_steps": 0.0033464431762695312, "step": 6915} {"info/global_step": 6916, "train_info/time_within_train_step": 2.757078170776367, "step": 6916} {"train_info/time_between_train_steps": 0.0032913684844970703, "step": 6916} {"info/global_step": 6917, "train_info/time_within_train_step": 2.756995439529419, "step": 6917} {"train_info/time_between_train_steps": 0.0033245086669921875, "step": 6917} {"info/global_step": 6918, "train_info/time_within_train_step": 2.7572951316833496, "step": 6918} {"train_info/time_between_train_steps": 0.00335693359375, "step": 6918} {"info/global_step": 6919, "train_info/time_within_train_step": 2.7567899227142334, "step": 6919} {"train_info/time_between_train_steps": 0.0032999515533447266, "step": 6919} {"info/global_step": 6920, "train_info/time_within_train_step": 2.756403684616089, "step": 6920} {"train_info/time_between_train_steps": 0.003373861312866211, "step": 6920} {"info/global_step": 6921, "train_info/time_within_train_step": 2.756681203842163, "step": 6921} {"train_info/time_between_train_steps": 0.003326416015625, "step": 6921} {"info/global_step": 6922, "train_info/time_within_train_step": 2.7560067176818848, "step": 6922} {"train_info/time_between_train_steps": 0.003292560577392578, "step": 6922} {"info/global_step": 6923, "train_info/time_within_train_step": 2.7561044692993164, "step": 6923} {"train_info/time_between_train_steps": 0.003297567367553711, "step": 6923} {"info/global_step": 6924, "train_info/time_within_train_step": 2.756848096847534, "step": 6924} {"train_info/time_between_train_steps": 0.003330707550048828, "step": 6924} {"info/global_step": 6925, "train_info/time_within_train_step": 2.7562780380249023, "step": 6925} {"train_info/time_between_train_steps": 0.003325939178466797, "step": 6925} {"info/global_step": 6926, "train_info/time_within_train_step": 2.75724720954895, "step": 6926} {"train_info/time_between_train_steps": 0.0033218860626220703, "step": 6926} {"info/global_step": 6927, "train_info/time_within_train_step": 2.757232427597046, "step": 6927} {"train_info/time_between_train_steps": 0.0033540725708007812, "step": 6927} {"info/global_step": 6928, "train_info/time_within_train_step": 2.756521224975586, "step": 6928} {"train_info/time_between_train_steps": 0.0033190250396728516, "step": 6928} {"info/global_step": 6929, "train_info/time_within_train_step": 2.757704734802246, "step": 6929} {"train_info/time_between_train_steps": 0.0032885074615478516, "step": 6929} {"info/global_step": 6930, "train_info/time_within_train_step": 2.756781578063965, "step": 6930} {"train_info/time_between_train_steps": 0.003323793411254883, "step": 6930} {"info/global_step": 6931, "train_info/time_within_train_step": 2.7570319175720215, "step": 6931} {"train_info/time_between_train_steps": 0.003285646438598633, "step": 6931} {"info/global_step": 6932, "train_info/time_within_train_step": 2.756864547729492, "step": 6932} {"train_info/time_between_train_steps": 0.0033118724822998047, "step": 6932} {"info/global_step": 6933, "train_info/time_within_train_step": 2.7568089962005615, "step": 6933} {"train_info/time_between_train_steps": 0.0033261775970458984, "step": 6933} {"info/global_step": 6934, "train_info/time_within_train_step": 2.756413698196411, "step": 6934} {"train_info/time_between_train_steps": 0.003314971923828125, "step": 6934} {"info/global_step": 6935, "train_info/time_within_train_step": 2.7571849822998047, "step": 6935} {"train_info/time_between_train_steps": 0.0033104419708251953, "step": 6935} {"info/global_step": 6936, "train_info/time_within_train_step": 2.7569472789764404, "step": 6936} {"train_info/time_between_train_steps": 0.0033037662506103516, "step": 6936} {"info/global_step": 6937, "train_info/time_within_train_step": 2.757099151611328, "step": 6937} {"train_info/time_between_train_steps": 0.0033512115478515625, "step": 6937} {"info/global_step": 6938, "train_info/time_within_train_step": 2.7584288120269775, "step": 6938} {"train_info/time_between_train_steps": 0.0033109188079833984, "step": 6938} {"info/global_step": 6939, "train_info/time_within_train_step": 2.7566275596618652, "step": 6939} {"train_info/time_between_train_steps": 0.003362894058227539, "step": 6939} {"info/global_step": 6940, "train_info/time_within_train_step": 2.7566657066345215, "step": 6940} {"train_info/time_between_train_steps": 0.0032987594604492188, "step": 6940} {"info/global_step": 6941, "train_info/time_within_train_step": 2.756098747253418, "step": 6941} {"train_info/time_between_train_steps": 0.003331899642944336, "step": 6941} {"info/global_step": 6942, "train_info/time_within_train_step": 2.7579987049102783, "step": 6942} {"train_info/time_between_train_steps": 0.003294229507446289, "step": 6942} {"info/global_step": 6943, "train_info/time_within_train_step": 2.997967004776001, "step": 6943} {"train_info/time_between_train_steps": 0.0033354759216308594, "step": 6943} {"info/global_step": 6944, "train_info/time_within_train_step": 2.7573397159576416, "step": 6944} {"train_info/time_between_train_steps": 0.0033316612243652344, "step": 6944} {"info/global_step": 6945, "train_info/time_within_train_step": 2.757375717163086, "step": 6945} {"train_info/time_between_train_steps": 0.003300905227661133, "step": 6945} {"info/global_step": 6946, "train_info/time_within_train_step": 2.7569093704223633, "step": 6946} {"train_info/time_between_train_steps": 0.003278493881225586, "step": 6946} {"info/global_step": 6947, "train_info/time_within_train_step": 2.7570035457611084, "step": 6947} {"train_info/time_between_train_steps": 0.0033538341522216797, "step": 6947} {"info/global_step": 6948, "train_info/time_within_train_step": 2.7567198276519775, "step": 6948} {"train_info/time_between_train_steps": 0.0032966136932373047, "step": 6948} {"info/global_step": 6949, "train_info/time_within_train_step": 2.7575531005859375, "step": 6949} {"train_info/time_between_train_steps": 0.12857723236083984, "step": 6949} {"info/global_step": 6950, "train_info/time_within_train_step": 2.759462833404541, "step": 6950} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746586103, "_runtime": 20112}, "step": 6950} {"logs": {"train/loss": 3.2837, "train/learning_rate": 0.00020333333333333333, "train/epoch": 8.01, "_timestamp": 1746586103, "_runtime": 20112}, "step": 6950} {"train_info/time_between_train_steps": 0.010174274444580078, "step": 6950} {"info/global_step": 6951, "train_info/time_within_train_step": 2.7558999061584473, "step": 6951} {"train_info/time_between_train_steps": 0.0033087730407714844, "step": 6951} {"info/global_step": 6952, "train_info/time_within_train_step": 2.7552108764648438, "step": 6952} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 6952} {"info/global_step": 6953, "train_info/time_within_train_step": 2.7548763751983643, "step": 6953} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 6953} {"info/global_step": 6954, "train_info/time_within_train_step": 2.7552130222320557, "step": 6954} {"train_info/time_between_train_steps": 0.0031614303588867188, "step": 6954} {"info/global_step": 6955, "train_info/time_within_train_step": 2.754936933517456, "step": 6955} {"train_info/time_between_train_steps": 0.0031576156616210938, "step": 6955} {"info/global_step": 6956, "train_info/time_within_train_step": 2.756016731262207, "step": 6956} {"train_info/time_between_train_steps": 0.003191232681274414, "step": 6956} {"info/global_step": 6957, "train_info/time_within_train_step": 2.754969358444214, "step": 6957} {"train_info/time_between_train_steps": 0.0031282901763916016, "step": 6957} {"info/global_step": 6958, "train_info/time_within_train_step": 2.7561957836151123, "step": 6958} {"train_info/time_between_train_steps": 0.0031566619873046875, "step": 6958} {"info/global_step": 6959, "train_info/time_within_train_step": 2.7560412883758545, "step": 6959} {"train_info/time_between_train_steps": 0.0031418800354003906, "step": 6959} {"info/global_step": 6960, "train_info/time_within_train_step": 2.7561676502227783, "step": 6960} {"train_info/time_between_train_steps": 0.0031502246856689453, "step": 6960} {"info/global_step": 6961, "train_info/time_within_train_step": 2.755990505218506, "step": 6961} {"train_info/time_between_train_steps": 0.0032088756561279297, "step": 6961} {"info/global_step": 6962, "train_info/time_within_train_step": 2.756598949432373, "step": 6962} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 6962} {"info/global_step": 6963, "train_info/time_within_train_step": 2.756652593612671, "step": 6963} {"train_info/time_between_train_steps": 0.0031480789184570312, "step": 6963} {"info/global_step": 6964, "train_info/time_within_train_step": 2.755660057067871, "step": 6964} {"train_info/time_between_train_steps": 0.0031359195709228516, "step": 6964} {"info/global_step": 6965, "train_info/time_within_train_step": 2.756405830383301, "step": 6965} {"train_info/time_between_train_steps": 0.0031392574310302734, "step": 6965} {"info/global_step": 6966, "train_info/time_within_train_step": 2.75583815574646, "step": 6966} {"train_info/time_between_train_steps": 0.0031349658966064453, "step": 6966} {"info/global_step": 6967, "train_info/time_within_train_step": 2.7538394927978516, "step": 6967} {"train_info/time_between_train_steps": 0.003145456314086914, "step": 6967} {"info/global_step": 6968, "train_info/time_within_train_step": 2.754974365234375, "step": 6968} {"train_info/time_between_train_steps": 0.0031676292419433594, "step": 6968} {"info/global_step": 6969, "train_info/time_within_train_step": 2.754737138748169, "step": 6969} {"train_info/time_between_train_steps": 0.0031435489654541016, "step": 6969} {"info/global_step": 6970, "train_info/time_within_train_step": 2.754784107208252, "step": 6970} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 6970} {"info/global_step": 6971, "train_info/time_within_train_step": 2.756120443344116, "step": 6971} {"train_info/time_between_train_steps": 0.003188610076904297, "step": 6971} {"info/global_step": 6972, "train_info/time_within_train_step": 2.7551798820495605, "step": 6972} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 6972} {"info/global_step": 6973, "train_info/time_within_train_step": 2.755052328109741, "step": 6973} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 6973} {"info/global_step": 6974, "train_info/time_within_train_step": 2.7567267417907715, "step": 6974} {"train_info/time_between_train_steps": 0.003133058547973633, "step": 6974} {"info/global_step": 6975, "train_info/time_within_train_step": 2.757317066192627, "step": 6975} {"train_info/time_between_train_steps": 0.003147602081298828, "step": 6975} {"info/global_step": 6976, "train_info/time_within_train_step": 2.756553888320923, "step": 6976} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 6976} {"info/global_step": 6977, "train_info/time_within_train_step": 2.756629467010498, "step": 6977} {"train_info/time_between_train_steps": 0.0031282901763916016, "step": 6977} {"info/global_step": 6978, "train_info/time_within_train_step": 2.756497621536255, "step": 6978} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 6978} {"info/global_step": 6979, "train_info/time_within_train_step": 2.7551188468933105, "step": 6979} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 6979} {"info/global_step": 6980, "train_info/time_within_train_step": 2.7553446292877197, "step": 6980} {"train_info/time_between_train_steps": 0.003125905990600586, "step": 6980} {"info/global_step": 6981, "train_info/time_within_train_step": 2.7554004192352295, "step": 6981} {"train_info/time_between_train_steps": 0.0031442642211914062, "step": 6981} {"info/global_step": 6982, "train_info/time_within_train_step": 2.7548301219940186, "step": 6982} {"train_info/time_between_train_steps": 0.003144502639770508, "step": 6982} {"info/global_step": 6983, "train_info/time_within_train_step": 2.755042552947998, "step": 6983} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 6983} {"info/global_step": 6984, "train_info/time_within_train_step": 2.7551939487457275, "step": 6984} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 6984} {"info/global_step": 6985, "train_info/time_within_train_step": 2.7543563842773438, "step": 6985} {"train_info/time_between_train_steps": 0.0031249523162841797, "step": 6985} {"info/global_step": 6986, "train_info/time_within_train_step": 2.755004405975342, "step": 6986} {"train_info/time_between_train_steps": 0.003130674362182617, "step": 6986} {"info/global_step": 6987, "train_info/time_within_train_step": 2.75640606880188, "step": 6987} {"train_info/time_between_train_steps": 0.0031387805938720703, "step": 6987} {"info/global_step": 6988, "train_info/time_within_train_step": 2.75594425201416, "step": 6988} {"train_info/time_between_train_steps": 0.003137826919555664, "step": 6988} {"info/global_step": 6989, "train_info/time_within_train_step": 2.7570548057556152, "step": 6989} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 6989} {"info/global_step": 6990, "train_info/time_within_train_step": 2.756107807159424, "step": 6990} {"train_info/time_between_train_steps": 0.003142118453979492, "step": 6990} {"info/global_step": 6991, "train_info/time_within_train_step": 2.756032943725586, "step": 6991} {"train_info/time_between_train_steps": 0.003138303756713867, "step": 6991} {"info/global_step": 6992, "train_info/time_within_train_step": 2.7563202381134033, "step": 6992} {"train_info/time_between_train_steps": 0.0032074451446533203, "step": 6992} {"info/global_step": 6993, "train_info/time_within_train_step": 2.757115364074707, "step": 6993} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 6993} {"info/global_step": 6994, "train_info/time_within_train_step": 2.7559354305267334, "step": 6994} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 6994} {"info/global_step": 6995, "train_info/time_within_train_step": 2.7547547817230225, "step": 6995} {"train_info/time_between_train_steps": 0.0031311511993408203, "step": 6995} {"info/global_step": 6996, "train_info/time_within_train_step": 3.3359932899475098, "step": 6996} {"train_info/time_between_train_steps": 0.003201007843017578, "step": 6996} {"info/global_step": 6997, "train_info/time_within_train_step": 2.778454542160034, "step": 6997} {"train_info/time_between_train_steps": 0.0031349658966064453, "step": 6997} {"info/global_step": 6998, "train_info/time_within_train_step": 2.754884719848633, "step": 6998} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 6998} {"info/global_step": 6999, "train_info/time_within_train_step": 2.996004343032837, "step": 6999} {"train_info/time_between_train_steps": 0.0031828880310058594, "step": 6999} {"info/global_step": 7000, "train_info/time_within_train_step": 2.754077911376953, "step": 7000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746586242, "_runtime": 20251}, "step": 7000} {"logs": {"train/loss": 3.2697, "train/learning_rate": 0.00019999999999999998, "train/epoch": 8.02, "_timestamp": 1746586242, "_runtime": 20251}, "step": 7000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746586247, "_runtime": 20256}, "step": 7000} {"logs": {"eval/loss": 4.760046005249023, "eval/runtime": 5.1787, "eval/samples_per_second": 36.689, "eval/steps_per_second": 1.159, "train/epoch": 8.02, "_timestamp": 1746586247, "_runtime": 20256}, "step": 7000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746586247, "_runtime": 20256}, "step": 7000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.760046005249023, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 116.75129694793064, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1787, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 36.689, "train/epoch": 8.02, "_timestamp": 1746586247, "_runtime": 20256}, "step": 7000} {"train_info/time_between_train_steps": 18.111838579177856, "step": 7000} {"info/global_step": 7001, "train_info/time_within_train_step": 2.5314781665802, "step": 7001} {"train_info/time_between_train_steps": 0.0033507347106933594, "step": 7001} {"info/global_step": 7002, "train_info/time_within_train_step": 2.5818185806274414, "step": 7002} {"train_info/time_between_train_steps": 0.003338336944580078, "step": 7002} {"info/global_step": 7003, "train_info/time_within_train_step": 2.731471300125122, "step": 7003} {"train_info/time_between_train_steps": 0.003309965133666992, "step": 7003} {"info/global_step": 7004, "train_info/time_within_train_step": 2.749478340148926, "step": 7004} {"train_info/time_between_train_steps": 0.003334522247314453, "step": 7004} {"info/global_step": 7005, "train_info/time_within_train_step": 2.7547409534454346, "step": 7005} {"train_info/time_between_train_steps": 0.0034089088439941406, "step": 7005} {"info/global_step": 7006, "train_info/time_within_train_step": 2.756181478500366, "step": 7006} {"train_info/time_between_train_steps": 0.0033028125762939453, "step": 7006} {"info/global_step": 7007, "train_info/time_within_train_step": 2.7555246353149414, "step": 7007} {"train_info/time_between_train_steps": 0.0034258365631103516, "step": 7007} {"info/global_step": 7008, "train_info/time_within_train_step": 2.7549638748168945, "step": 7008} {"train_info/time_between_train_steps": 0.0031425952911376953, "step": 7008} {"info/global_step": 7009, "train_info/time_within_train_step": 2.753645658493042, "step": 7009} {"train_info/time_between_train_steps": 0.003155231475830078, "step": 7009} {"info/global_step": 7010, "train_info/time_within_train_step": 2.753974199295044, "step": 7010} {"train_info/time_between_train_steps": 0.0031321048736572266, "step": 7010} {"info/global_step": 7011, "train_info/time_within_train_step": 2.755021333694458, "step": 7011} {"train_info/time_between_train_steps": 0.003091573715209961, "step": 7011} {"info/global_step": 7012, "train_info/time_within_train_step": 2.8803043365478516, "step": 7012} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 7012} {"info/global_step": 7013, "train_info/time_within_train_step": 2.755779981613159, "step": 7013} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 7013} {"info/global_step": 7014, "train_info/time_within_train_step": 2.7567756175994873, "step": 7014} {"train_info/time_between_train_steps": 0.003299713134765625, "step": 7014} {"info/global_step": 7015, "train_info/time_within_train_step": 2.7571542263031006, "step": 7015} {"train_info/time_between_train_steps": 0.0033392906188964844, "step": 7015} {"info/global_step": 7016, "train_info/time_within_train_step": 2.757708787918091, "step": 7016} {"train_info/time_between_train_steps": 0.0033330917358398438, "step": 7016} {"info/global_step": 7017, "train_info/time_within_train_step": 2.7581262588500977, "step": 7017} {"train_info/time_between_train_steps": 0.003324747085571289, "step": 7017} {"info/global_step": 7018, "train_info/time_within_train_step": 2.757984161376953, "step": 7018} {"train_info/time_between_train_steps": 0.0033197402954101562, "step": 7018} {"info/global_step": 7019, "train_info/time_within_train_step": 2.7577691078186035, "step": 7019} {"train_info/time_between_train_steps": 0.0034117698669433594, "step": 7019} {"info/global_step": 7020, "train_info/time_within_train_step": 2.7576205730438232, "step": 7020} {"train_info/time_between_train_steps": 0.003380298614501953, "step": 7020} {"info/global_step": 7021, "train_info/time_within_train_step": 2.7574613094329834, "step": 7021} {"train_info/time_between_train_steps": 0.0034356117248535156, "step": 7021} {"info/global_step": 7022, "train_info/time_within_train_step": 2.7574877738952637, "step": 7022} {"train_info/time_between_train_steps": 0.003501415252685547, "step": 7022} {"info/global_step": 7023, "train_info/time_within_train_step": 2.755474090576172, "step": 7023} {"train_info/time_between_train_steps": 0.0035393238067626953, "step": 7023} {"info/global_step": 7024, "train_info/time_within_train_step": 2.7567741870880127, "step": 7024} {"train_info/time_between_train_steps": 0.0035026073455810547, "step": 7024} {"info/global_step": 7025, "train_info/time_within_train_step": 2.757763385772705, "step": 7025} {"train_info/time_between_train_steps": 0.0035562515258789062, "step": 7025} {"info/global_step": 7026, "train_info/time_within_train_step": 2.7570793628692627, "step": 7026} {"train_info/time_between_train_steps": 0.003540515899658203, "step": 7026} {"info/global_step": 7027, "train_info/time_within_train_step": 2.7582457065582275, "step": 7027} {"train_info/time_between_train_steps": 0.0036623477935791016, "step": 7027} {"info/global_step": 7028, "train_info/time_within_train_step": 2.7579545974731445, "step": 7028} {"train_info/time_between_train_steps": 0.0034856796264648438, "step": 7028} {"info/global_step": 7029, "train_info/time_within_train_step": 2.7578282356262207, "step": 7029} {"train_info/time_between_train_steps": 0.003548145294189453, "step": 7029} {"info/global_step": 7030, "train_info/time_within_train_step": 2.7563936710357666, "step": 7030} {"train_info/time_between_train_steps": 0.003573894500732422, "step": 7030} {"info/global_step": 7031, "train_info/time_within_train_step": 2.758284330368042, "step": 7031} {"train_info/time_between_train_steps": 0.0035505294799804688, "step": 7031} {"info/global_step": 7032, "train_info/time_within_train_step": 2.7578914165496826, "step": 7032} {"train_info/time_between_train_steps": 0.003530263900756836, "step": 7032} {"info/global_step": 7033, "train_info/time_within_train_step": 2.757807493209839, "step": 7033} {"train_info/time_between_train_steps": 0.0035576820373535156, "step": 7033} {"info/global_step": 7034, "train_info/time_within_train_step": 2.7572057247161865, "step": 7034} {"train_info/time_between_train_steps": 0.003534555435180664, "step": 7034} {"info/global_step": 7035, "train_info/time_within_train_step": 2.7574350833892822, "step": 7035} {"train_info/time_between_train_steps": 0.003484964370727539, "step": 7035} {"info/global_step": 7036, "train_info/time_within_train_step": 2.7578186988830566, "step": 7036} {"train_info/time_between_train_steps": 0.0035965442657470703, "step": 7036} {"info/global_step": 7037, "train_info/time_within_train_step": 2.757756233215332, "step": 7037} {"train_info/time_between_train_steps": 0.0035865306854248047, "step": 7037} {"info/global_step": 7038, "train_info/time_within_train_step": 2.757082462310791, "step": 7038} {"train_info/time_between_train_steps": 0.0035452842712402344, "step": 7038} {"info/global_step": 7039, "train_info/time_within_train_step": 2.7562625408172607, "step": 7039} {"train_info/time_between_train_steps": 0.0036406517028808594, "step": 7039} {"info/global_step": 7040, "train_info/time_within_train_step": 2.757690906524658, "step": 7040} {"train_info/time_between_train_steps": 0.0035331249237060547, "step": 7040} {"info/global_step": 7041, "train_info/time_within_train_step": 2.7565131187438965, "step": 7041} {"train_info/time_between_train_steps": 0.003351449966430664, "step": 7041} {"info/global_step": 7042, "train_info/time_within_train_step": 2.755251169204712, "step": 7042} {"train_info/time_between_train_steps": 0.00335693359375, "step": 7042} {"info/global_step": 7043, "train_info/time_within_train_step": 2.7549502849578857, "step": 7043} {"train_info/time_between_train_steps": 0.0033676624298095703, "step": 7043} {"info/global_step": 7044, "train_info/time_within_train_step": 2.755690336227417, "step": 7044} {"train_info/time_between_train_steps": 0.003402233123779297, "step": 7044} {"info/global_step": 7045, "train_info/time_within_train_step": 2.7565038204193115, "step": 7045} {"train_info/time_between_train_steps": 0.0033788681030273438, "step": 7045} {"info/global_step": 7046, "train_info/time_within_train_step": 2.7551090717315674, "step": 7046} {"train_info/time_between_train_steps": 0.003352642059326172, "step": 7046} {"info/global_step": 7047, "train_info/time_within_train_step": 2.756115198135376, "step": 7047} {"train_info/time_between_train_steps": 0.003374338150024414, "step": 7047} {"info/global_step": 7048, "train_info/time_within_train_step": 2.755225658416748, "step": 7048} {"train_info/time_between_train_steps": 0.003358125686645508, "step": 7048} {"info/global_step": 7049, "train_info/time_within_train_step": 2.755272150039673, "step": 7049} {"train_info/time_between_train_steps": 0.0033702850341796875, "step": 7049} {"info/global_step": 7050, "train_info/time_within_train_step": 2.756035804748535, "step": 7050} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746586398, "_runtime": 20407}, "step": 7050} {"logs": {"train/loss": 3.2588, "train/learning_rate": 0.00019666666666666666, "train/epoch": 8.02, "_timestamp": 1746586398, "_runtime": 20407}, "step": 7050} {"train_info/time_between_train_steps": 0.006489276885986328, "step": 7050} {"info/global_step": 7051, "train_info/time_within_train_step": 2.7557332515716553, "step": 7051} {"train_info/time_between_train_steps": 0.0033669471740722656, "step": 7051} {"info/global_step": 7052, "train_info/time_within_train_step": 2.754467010498047, "step": 7052} {"train_info/time_between_train_steps": 0.003329038619995117, "step": 7052} {"info/global_step": 7053, "train_info/time_within_train_step": 3.067432403564453, "step": 7053} {"train_info/time_between_train_steps": 0.0032415390014648438, "step": 7053} {"info/global_step": 7054, "train_info/time_within_train_step": 2.7542312145233154, "step": 7054} {"train_info/time_between_train_steps": 0.0031702518463134766, "step": 7054} {"info/global_step": 7055, "train_info/time_within_train_step": 2.7548179626464844, "step": 7055} {"train_info/time_between_train_steps": 0.0031621456146240234, "step": 7055} {"info/global_step": 7056, "train_info/time_within_train_step": 2.75394344329834, "step": 7056} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 7056} {"info/global_step": 7057, "train_info/time_within_train_step": 2.7546072006225586, "step": 7057} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 7057} {"info/global_step": 7058, "train_info/time_within_train_step": 2.7544503211975098, "step": 7058} {"train_info/time_between_train_steps": 0.0031824111938476562, "step": 7058} {"info/global_step": 7059, "train_info/time_within_train_step": 2.754584789276123, "step": 7059} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 7059} {"info/global_step": 7060, "train_info/time_within_train_step": 2.754578113555908, "step": 7060} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 7060} {"info/global_step": 7061, "train_info/time_within_train_step": 2.755215644836426, "step": 7061} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 7061} {"info/global_step": 7062, "train_info/time_within_train_step": 2.7556092739105225, "step": 7062} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 7062} {"info/global_step": 7063, "train_info/time_within_train_step": 2.755741834640503, "step": 7063} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 7063} {"info/global_step": 7064, "train_info/time_within_train_step": 2.7543208599090576, "step": 7064} {"train_info/time_between_train_steps": 0.003184795379638672, "step": 7064} {"info/global_step": 7065, "train_info/time_within_train_step": 2.754061460494995, "step": 7065} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 7065} {"info/global_step": 7066, "train_info/time_within_train_step": 2.754880905151367, "step": 7066} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 7066} {"info/global_step": 7067, "train_info/time_within_train_step": 2.755094051361084, "step": 7067} {"train_info/time_between_train_steps": 0.003170490264892578, "step": 7067} {"info/global_step": 7068, "train_info/time_within_train_step": 2.7542788982391357, "step": 7068} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 7068} {"info/global_step": 7069, "train_info/time_within_train_step": 2.7540314197540283, "step": 7069} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 7069} {"info/global_step": 7070, "train_info/time_within_train_step": 2.7542812824249268, "step": 7070} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 7070} {"info/global_step": 7071, "train_info/time_within_train_step": 2.7550501823425293, "step": 7071} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 7071} {"info/global_step": 7072, "train_info/time_within_train_step": 2.7557373046875, "step": 7072} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 7072} {"info/global_step": 7073, "train_info/time_within_train_step": 2.755415678024292, "step": 7073} {"train_info/time_between_train_steps": 0.003179788589477539, "step": 7073} {"info/global_step": 7074, "train_info/time_within_train_step": 2.7567026615142822, "step": 7074} {"train_info/time_between_train_steps": 0.13400602340698242, "step": 7074} {"info/global_step": 7075, "train_info/time_within_train_step": 2.754807949066162, "step": 7075} {"train_info/time_between_train_steps": 0.0036385059356689453, "step": 7075} {"info/global_step": 7076, "train_info/time_within_train_step": 2.754819393157959, "step": 7076} {"train_info/time_between_train_steps": 0.0031898021697998047, "step": 7076} {"info/global_step": 7077, "train_info/time_within_train_step": 2.754295587539673, "step": 7077} {"train_info/time_between_train_steps": 0.0031824111938476562, "step": 7077} {"info/global_step": 7078, "train_info/time_within_train_step": 2.755763053894043, "step": 7078} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 7078} {"info/global_step": 7079, "train_info/time_within_train_step": 2.755486249923706, "step": 7079} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 7079} {"info/global_step": 7080, "train_info/time_within_train_step": 2.755117893218994, "step": 7080} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 7080} {"info/global_step": 7081, "train_info/time_within_train_step": 2.7549829483032227, "step": 7081} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 7081} {"info/global_step": 7082, "train_info/time_within_train_step": 2.754321575164795, "step": 7082} {"train_info/time_between_train_steps": 0.0031638145446777344, "step": 7082} {"info/global_step": 7083, "train_info/time_within_train_step": 2.7550785541534424, "step": 7083} {"train_info/time_between_train_steps": 0.003148317337036133, "step": 7083} {"info/global_step": 7084, "train_info/time_within_train_step": 2.755319595336914, "step": 7084} {"train_info/time_between_train_steps": 0.0031495094299316406, "step": 7084} {"info/global_step": 7085, "train_info/time_within_train_step": 2.754774570465088, "step": 7085} {"train_info/time_between_train_steps": 0.003170490264892578, "step": 7085} {"info/global_step": 7086, "train_info/time_within_train_step": 2.753716230392456, "step": 7086} {"train_info/time_between_train_steps": 0.0031404495239257812, "step": 7086} {"info/global_step": 7087, "train_info/time_within_train_step": 2.7542331218719482, "step": 7087} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 7087} {"info/global_step": 7088, "train_info/time_within_train_step": 2.754317283630371, "step": 7088} {"train_info/time_between_train_steps": 0.0032269954681396484, "step": 7088} {"info/global_step": 7089, "train_info/time_within_train_step": 2.7558865547180176, "step": 7089} {"train_info/time_between_train_steps": 0.003339529037475586, "step": 7089} {"info/global_step": 7090, "train_info/time_within_train_step": 2.756010055541992, "step": 7090} {"train_info/time_between_train_steps": 0.003309965133666992, "step": 7090} {"info/global_step": 7091, "train_info/time_within_train_step": 2.7557196617126465, "step": 7091} {"train_info/time_between_train_steps": 0.003338336944580078, "step": 7091} {"info/global_step": 7092, "train_info/time_within_train_step": 2.756711959838867, "step": 7092} {"train_info/time_between_train_steps": 0.0033054351806640625, "step": 7092} {"info/global_step": 7093, "train_info/time_within_train_step": 2.755774974822998, "step": 7093} {"train_info/time_between_train_steps": 0.003307342529296875, "step": 7093} {"info/global_step": 7094, "train_info/time_within_train_step": 2.755223512649536, "step": 7094} {"train_info/time_between_train_steps": 0.0033333301544189453, "step": 7094} {"info/global_step": 7095, "train_info/time_within_train_step": 3.010430097579956, "step": 7095} {"train_info/time_between_train_steps": 0.0033333301544189453, "step": 7095} {"info/global_step": 7096, "train_info/time_within_train_step": 2.7563772201538086, "step": 7096} {"train_info/time_between_train_steps": 0.0033788681030273438, "step": 7096} {"info/global_step": 7097, "train_info/time_within_train_step": 2.7561631202697754, "step": 7097} {"train_info/time_between_train_steps": 0.003330230712890625, "step": 7097} {"info/global_step": 7098, "train_info/time_within_train_step": 2.755333423614502, "step": 7098} {"train_info/time_between_train_steps": 0.0033202171325683594, "step": 7098} {"info/global_step": 7099, "train_info/time_within_train_step": 2.7547690868377686, "step": 7099} {"train_info/time_between_train_steps": 0.0033948421478271484, "step": 7099} {"info/global_step": 7100, "train_info/time_within_train_step": 2.7543535232543945, "step": 7100} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746586536, "_runtime": 20545}, "step": 7100} {"logs": {"train/loss": 3.2479, "train/learning_rate": 0.00019333333333333333, "train/epoch": 8.03, "_timestamp": 1746586536, "_runtime": 20545}, "step": 7100} {"train_info/time_between_train_steps": 0.0069806575775146484, "step": 7100} {"info/global_step": 7101, "train_info/time_within_train_step": 2.7553014755249023, "step": 7101} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 7101} {"info/global_step": 7102, "train_info/time_within_train_step": 2.7549679279327393, "step": 7102} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 7102} {"info/global_step": 7103, "train_info/time_within_train_step": 2.7548954486846924, "step": 7103} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 7103} {"info/global_step": 7104, "train_info/time_within_train_step": 2.7538132667541504, "step": 7104} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 7104} {"info/global_step": 7105, "train_info/time_within_train_step": 2.7541897296905518, "step": 7105} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 7105} {"info/global_step": 7106, "train_info/time_within_train_step": 2.754635810852051, "step": 7106} {"train_info/time_between_train_steps": 0.00318145751953125, "step": 7106} {"info/global_step": 7107, "train_info/time_within_train_step": 2.7545166015625, "step": 7107} {"train_info/time_between_train_steps": 0.0031921863555908203, "step": 7107} {"info/global_step": 7108, "train_info/time_within_train_step": 2.7544760704040527, "step": 7108} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 7108} {"info/global_step": 7109, "train_info/time_within_train_step": 2.7548270225524902, "step": 7109} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 7109} {"info/global_step": 7110, "train_info/time_within_train_step": 2.75150203704834, "step": 7110} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 7110} {"info/global_step": 7111, "train_info/time_within_train_step": 2.7545742988586426, "step": 7111} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 7111} {"info/global_step": 7112, "train_info/time_within_train_step": 2.7540786266326904, "step": 7112} {"train_info/time_between_train_steps": 0.003220081329345703, "step": 7112} {"info/global_step": 7113, "train_info/time_within_train_step": 2.7548739910125732, "step": 7113} {"train_info/time_between_train_steps": 0.003220081329345703, "step": 7113} {"info/global_step": 7114, "train_info/time_within_train_step": 2.754835605621338, "step": 7114} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 7114} {"info/global_step": 7115, "train_info/time_within_train_step": 2.7550032138824463, "step": 7115} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 7115} {"info/global_step": 7116, "train_info/time_within_train_step": 2.7537031173706055, "step": 7116} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 7116} {"info/global_step": 7117, "train_info/time_within_train_step": 2.752577781677246, "step": 7117} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 7117} {"info/global_step": 7118, "train_info/time_within_train_step": 2.753560781478882, "step": 7118} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 7118} {"info/global_step": 7119, "train_info/time_within_train_step": 2.7544400691986084, "step": 7119} {"train_info/time_between_train_steps": 0.003326892852783203, "step": 7119} {"info/global_step": 7120, "train_info/time_within_train_step": 2.7555992603302, "step": 7120} {"train_info/time_between_train_steps": 0.003289937973022461, "step": 7120} {"info/global_step": 7121, "train_info/time_within_train_step": 2.756614923477173, "step": 7121} {"train_info/time_between_train_steps": 0.0034325122833251953, "step": 7121} {"info/global_step": 7122, "train_info/time_within_train_step": 2.75645112991333, "step": 7122} {"train_info/time_between_train_steps": 0.0035021305084228516, "step": 7122} {"info/global_step": 7123, "train_info/time_within_train_step": 2.756319761276245, "step": 7123} {"train_info/time_between_train_steps": 0.003492116928100586, "step": 7123} {"info/global_step": 7124, "train_info/time_within_train_step": 2.7563717365264893, "step": 7124} {"train_info/time_between_train_steps": 0.0034198760986328125, "step": 7124} {"info/global_step": 7125, "train_info/time_within_train_step": 2.7565994262695312, "step": 7125} {"train_info/time_between_train_steps": 0.0035867691040039062, "step": 7125} {"info/global_step": 7126, "train_info/time_within_train_step": 2.7554519176483154, "step": 7126} {"train_info/time_between_train_steps": 0.003413677215576172, "step": 7126} {"info/global_step": 7127, "train_info/time_within_train_step": 2.755544900894165, "step": 7127} {"train_info/time_between_train_steps": 0.003481626510620117, "step": 7127} {"info/global_step": 7128, "train_info/time_within_train_step": 2.7558302879333496, "step": 7128} {"train_info/time_between_train_steps": 0.003456592559814453, "step": 7128} {"info/global_step": 7129, "train_info/time_within_train_step": 2.755662441253662, "step": 7129} {"train_info/time_between_train_steps": 0.0035126209259033203, "step": 7129} {"info/global_step": 7130, "train_info/time_within_train_step": 2.75494122505188, "step": 7130} {"train_info/time_between_train_steps": 0.0035479068756103516, "step": 7130} {"info/global_step": 7131, "train_info/time_within_train_step": 2.754899740219116, "step": 7131} {"train_info/time_between_train_steps": 0.0034775733947753906, "step": 7131} {"info/global_step": 7132, "train_info/time_within_train_step": 2.755643129348755, "step": 7132} {"train_info/time_between_train_steps": 0.0035240650177001953, "step": 7132} {"info/global_step": 7133, "train_info/time_within_train_step": 2.7556686401367188, "step": 7133} {"train_info/time_between_train_steps": 0.003389596939086914, "step": 7133} {"info/global_step": 7134, "train_info/time_within_train_step": 2.7550551891326904, "step": 7134} {"train_info/time_between_train_steps": 0.0033736228942871094, "step": 7134} {"info/global_step": 7135, "train_info/time_within_train_step": 2.7548906803131104, "step": 7135} {"train_info/time_between_train_steps": 0.0035142898559570312, "step": 7135} {"info/global_step": 7136, "train_info/time_within_train_step": 3.093256950378418, "step": 7136} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 7136} {"info/global_step": 7137, "train_info/time_within_train_step": 2.8976542949676514, "step": 7137} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 7137} {"info/global_step": 7138, "train_info/time_within_train_step": 2.7553048133850098, "step": 7138} {"train_info/time_between_train_steps": 0.0031692981719970703, "step": 7138} {"info/global_step": 7139, "train_info/time_within_train_step": 2.7543256282806396, "step": 7139} {"train_info/time_between_train_steps": 0.003192424774169922, "step": 7139} {"info/global_step": 7140, "train_info/time_within_train_step": 2.754859685897827, "step": 7140} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 7140} {"info/global_step": 7141, "train_info/time_within_train_step": 2.7517967224121094, "step": 7141} {"train_info/time_between_train_steps": 0.0032210350036621094, "step": 7141} {"info/global_step": 7142, "train_info/time_within_train_step": 2.7554514408111572, "step": 7142} {"train_info/time_between_train_steps": 0.0031685829162597656, "step": 7142} {"info/global_step": 7143, "train_info/time_within_train_step": 2.7549145221710205, "step": 7143} {"train_info/time_between_train_steps": 0.0036439895629882812, "step": 7143} {"info/global_step": 7144, "train_info/time_within_train_step": 2.7557451725006104, "step": 7144} {"train_info/time_between_train_steps": 0.0031588077545166016, "step": 7144} {"info/global_step": 7145, "train_info/time_within_train_step": 2.7554819583892822, "step": 7145} {"train_info/time_between_train_steps": 0.003183126449584961, "step": 7145} {"info/global_step": 7146, "train_info/time_within_train_step": 2.7556965351104736, "step": 7146} {"train_info/time_between_train_steps": 0.003231525421142578, "step": 7146} {"info/global_step": 7147, "train_info/time_within_train_step": 2.7535107135772705, "step": 7147} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 7147} {"info/global_step": 7148, "train_info/time_within_train_step": 2.7549116611480713, "step": 7148} {"train_info/time_between_train_steps": 0.003177642822265625, "step": 7148} {"info/global_step": 7149, "train_info/time_within_train_step": 2.755641460418701, "step": 7149} {"train_info/time_between_train_steps": 0.003154277801513672, "step": 7149} {"info/global_step": 7150, "train_info/time_within_train_step": 2.7539401054382324, "step": 7150} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746586675, "_runtime": 20684}, "step": 7150} {"logs": {"train/loss": 3.2399, "train/learning_rate": 0.00018999999999999998, "train/epoch": 8.03, "_timestamp": 1746586675, "_runtime": 20684}, "step": 7150} {"train_info/time_between_train_steps": 0.006886482238769531, "step": 7150} {"info/global_step": 7151, "train_info/time_within_train_step": 2.754481792449951, "step": 7151} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 7151} {"info/global_step": 7152, "train_info/time_within_train_step": 2.753584623336792, "step": 7152} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 7152} {"info/global_step": 7153, "train_info/time_within_train_step": 2.7540431022644043, "step": 7153} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 7153} {"info/global_step": 7154, "train_info/time_within_train_step": 2.754124164581299, "step": 7154} {"train_info/time_between_train_steps": 0.0032351016998291016, "step": 7154} {"info/global_step": 7155, "train_info/time_within_train_step": 2.754809856414795, "step": 7155} {"train_info/time_between_train_steps": 0.003201007843017578, "step": 7155} {"info/global_step": 7156, "train_info/time_within_train_step": 2.754084587097168, "step": 7156} {"train_info/time_between_train_steps": 0.003240823745727539, "step": 7156} {"info/global_step": 7157, "train_info/time_within_train_step": 2.755032777786255, "step": 7157} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 7157} {"info/global_step": 7158, "train_info/time_within_train_step": 2.754690647125244, "step": 7158} {"train_info/time_between_train_steps": 0.0031332969665527344, "step": 7158} {"info/global_step": 7159, "train_info/time_within_train_step": 2.7548677921295166, "step": 7159} {"train_info/time_between_train_steps": 0.003374338150024414, "step": 7159} {"info/global_step": 7160, "train_info/time_within_train_step": 2.7566182613372803, "step": 7160} {"train_info/time_between_train_steps": 0.0033614635467529297, "step": 7160} {"info/global_step": 7161, "train_info/time_within_train_step": 2.756561040878296, "step": 7161} {"train_info/time_between_train_steps": 0.0033490657806396484, "step": 7161} {"info/global_step": 7162, "train_info/time_within_train_step": 2.755689859390259, "step": 7162} {"train_info/time_between_train_steps": 0.003353118896484375, "step": 7162} {"info/global_step": 7163, "train_info/time_within_train_step": 2.756751298904419, "step": 7163} {"train_info/time_between_train_steps": 0.0033626556396484375, "step": 7163} {"info/global_step": 7164, "train_info/time_within_train_step": 2.7571043968200684, "step": 7164} {"train_info/time_between_train_steps": 0.003340005874633789, "step": 7164} {"info/global_step": 7165, "train_info/time_within_train_step": 2.756693124771118, "step": 7165} {"train_info/time_between_train_steps": 0.0033457279205322266, "step": 7165} {"info/global_step": 7166, "train_info/time_within_train_step": 2.7565791606903076, "step": 7166} {"train_info/time_between_train_steps": 0.003321409225463867, "step": 7166} {"info/global_step": 7167, "train_info/time_within_train_step": 2.756187915802002, "step": 7167} {"train_info/time_between_train_steps": 0.0033266544342041016, "step": 7167} {"info/global_step": 7168, "train_info/time_within_train_step": 2.7557177543640137, "step": 7168} {"train_info/time_between_train_steps": 0.0033457279205322266, "step": 7168} {"info/global_step": 7169, "train_info/time_within_train_step": 2.7553155422210693, "step": 7169} {"train_info/time_between_train_steps": 0.0034410953521728516, "step": 7169} {"info/global_step": 7170, "train_info/time_within_train_step": 2.756084680557251, "step": 7170} {"train_info/time_between_train_steps": 0.0034263134002685547, "step": 7170} {"info/global_step": 7171, "train_info/time_within_train_step": 2.755647897720337, "step": 7171} {"train_info/time_between_train_steps": 0.0036172866821289062, "step": 7171} {"info/global_step": 7172, "train_info/time_within_train_step": 2.7566447257995605, "step": 7172} {"train_info/time_between_train_steps": 0.003528118133544922, "step": 7172} {"info/global_step": 7173, "train_info/time_within_train_step": 2.757129192352295, "step": 7173} {"train_info/time_between_train_steps": 0.003484964370727539, "step": 7173} {"info/global_step": 7174, "train_info/time_within_train_step": 2.756070852279663, "step": 7174} {"train_info/time_between_train_steps": 0.003509521484375, "step": 7174} {"info/global_step": 7175, "train_info/time_within_train_step": 2.7569117546081543, "step": 7175} {"train_info/time_between_train_steps": 0.003576517105102539, "step": 7175} {"info/global_step": 7176, "train_info/time_within_train_step": 2.7563788890838623, "step": 7176} {"train_info/time_between_train_steps": 0.0035660266876220703, "step": 7176} {"info/global_step": 7177, "train_info/time_within_train_step": 2.757709264755249, "step": 7177} {"train_info/time_between_train_steps": 0.003543853759765625, "step": 7177} {"info/global_step": 7178, "train_info/time_within_train_step": 2.7580320835113525, "step": 7178} {"train_info/time_between_train_steps": 0.003612041473388672, "step": 7178} {"info/global_step": 7179, "train_info/time_within_train_step": 2.7577877044677734, "step": 7179} {"train_info/time_between_train_steps": 0.003475189208984375, "step": 7179} {"info/global_step": 7180, "train_info/time_within_train_step": 2.75708270072937, "step": 7180} {"train_info/time_between_train_steps": 0.0035734176635742188, "step": 7180} {"info/global_step": 7181, "train_info/time_within_train_step": 2.7568798065185547, "step": 7181} {"train_info/time_between_train_steps": 0.003487825393676758, "step": 7181} {"info/global_step": 7182, "train_info/time_within_train_step": 2.757704496383667, "step": 7182} {"train_info/time_between_train_steps": 0.0035996437072753906, "step": 7182} {"info/global_step": 7183, "train_info/time_within_train_step": 2.7561042308807373, "step": 7183} {"train_info/time_between_train_steps": 0.0036118030548095703, "step": 7183} {"info/global_step": 7184, "train_info/time_within_train_step": 2.755715847015381, "step": 7184} {"train_info/time_between_train_steps": 0.0035915374755859375, "step": 7184} {"info/global_step": 7185, "train_info/time_within_train_step": 2.7576839923858643, "step": 7185} {"train_info/time_between_train_steps": 0.003634929656982422, "step": 7185} {"info/global_step": 7186, "train_info/time_within_train_step": 2.757899045944214, "step": 7186} {"train_info/time_between_train_steps": 0.003625154495239258, "step": 7186} {"info/global_step": 7187, "train_info/time_within_train_step": 2.7580406665802, "step": 7187} {"train_info/time_between_train_steps": 0.003550291061401367, "step": 7187} {"info/global_step": 7188, "train_info/time_within_train_step": 2.7572083473205566, "step": 7188} {"train_info/time_between_train_steps": 0.0034923553466796875, "step": 7188} {"info/global_step": 7189, "train_info/time_within_train_step": 2.7567057609558105, "step": 7189} {"train_info/time_between_train_steps": 0.003536701202392578, "step": 7189} {"info/global_step": 7190, "train_info/time_within_train_step": 2.757544994354248, "step": 7190} {"train_info/time_between_train_steps": 0.0034842491149902344, "step": 7190} {"info/global_step": 7191, "train_info/time_within_train_step": 2.757018566131592, "step": 7191} {"train_info/time_between_train_steps": 0.003554821014404297, "step": 7191} {"info/global_step": 7192, "train_info/time_within_train_step": 2.757697105407715, "step": 7192} {"train_info/time_between_train_steps": 0.00348663330078125, "step": 7192} {"info/global_step": 7193, "train_info/time_within_train_step": 2.7579667568206787, "step": 7193} {"train_info/time_between_train_steps": 0.0034780502319335938, "step": 7193} {"info/global_step": 7194, "train_info/time_within_train_step": 2.7591118812561035, "step": 7194} {"train_info/time_between_train_steps": 0.00354766845703125, "step": 7194} {"info/global_step": 7195, "train_info/time_within_train_step": 2.756870746612549, "step": 7195} {"train_info/time_between_train_steps": 0.0034766197204589844, "step": 7195} {"info/global_step": 7196, "train_info/time_within_train_step": 2.757561206817627, "step": 7196} {"train_info/time_between_train_steps": 0.0035338401794433594, "step": 7196} {"info/global_step": 7197, "train_info/time_within_train_step": 2.756875514984131, "step": 7197} {"train_info/time_between_train_steps": 0.0035266876220703125, "step": 7197} {"info/global_step": 7198, "train_info/time_within_train_step": 2.7554867267608643, "step": 7198} {"train_info/time_between_train_steps": 0.003589630126953125, "step": 7198} {"info/global_step": 7199, "train_info/time_within_train_step": 2.755683422088623, "step": 7199} {"train_info/time_between_train_steps": 0.17412590980529785, "step": 7199} {"info/global_step": 7200, "train_info/time_within_train_step": 2.757472515106201, "step": 7200} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746586813, "_runtime": 20822}, "step": 7200} {"logs": {"train/loss": 3.2432, "train/learning_rate": 0.00018666666666666666, "train/epoch": 8.04, "_timestamp": 1746586813, "_runtime": 20822}, "step": 7200} {"train_info/time_between_train_steps": 14.428149700164795, "step": 7200} {"info/global_step": 7201, "train_info/time_within_train_step": 2.5334577560424805, "step": 7201} {"train_info/time_between_train_steps": 0.0034618377685546875, "step": 7201} {"info/global_step": 7202, "train_info/time_within_train_step": 2.5991384983062744, "step": 7202} {"train_info/time_between_train_steps": 0.003574848175048828, "step": 7202} {"info/global_step": 7203, "train_info/time_within_train_step": 2.7405378818511963, "step": 7203} {"train_info/time_between_train_steps": 0.0034911632537841797, "step": 7203} {"info/global_step": 7204, "train_info/time_within_train_step": 2.749540328979492, "step": 7204} {"train_info/time_between_train_steps": 0.0035567283630371094, "step": 7204} {"info/global_step": 7205, "train_info/time_within_train_step": 2.7511956691741943, "step": 7205} {"train_info/time_between_train_steps": 0.0034482479095458984, "step": 7205} {"info/global_step": 7206, "train_info/time_within_train_step": 2.7565927505493164, "step": 7206} {"train_info/time_between_train_steps": 0.0034956932067871094, "step": 7206} {"info/global_step": 7207, "train_info/time_within_train_step": 2.7567837238311768, "step": 7207} {"train_info/time_between_train_steps": 0.0033767223358154297, "step": 7207} {"info/global_step": 7208, "train_info/time_within_train_step": 2.7564775943756104, "step": 7208} {"train_info/time_between_train_steps": 0.003376007080078125, "step": 7208} {"info/global_step": 7209, "train_info/time_within_train_step": 2.7568905353546143, "step": 7209} {"train_info/time_between_train_steps": 0.0034720897674560547, "step": 7209} {"info/global_step": 7210, "train_info/time_within_train_step": 2.7576956748962402, "step": 7210} {"train_info/time_between_train_steps": 0.003231525421142578, "step": 7210} {"info/global_step": 7211, "train_info/time_within_train_step": 2.7566845417022705, "step": 7211} {"train_info/time_between_train_steps": 0.0032918453216552734, "step": 7211} {"info/global_step": 7212, "train_info/time_within_train_step": 3.0578629970550537, "step": 7212} {"train_info/time_between_train_steps": 0.003206014633178711, "step": 7212} {"info/global_step": 7213, "train_info/time_within_train_step": 2.7545218467712402, "step": 7213} {"train_info/time_between_train_steps": 0.003269672393798828, "step": 7213} {"info/global_step": 7214, "train_info/time_within_train_step": 2.756812810897827, "step": 7214} {"train_info/time_between_train_steps": 0.003190755844116211, "step": 7214} {"info/global_step": 7215, "train_info/time_within_train_step": 2.7559680938720703, "step": 7215} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 7215} {"info/global_step": 7216, "train_info/time_within_train_step": 2.755844831466675, "step": 7216} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 7216} {"info/global_step": 7217, "train_info/time_within_train_step": 2.755516290664673, "step": 7217} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 7217} {"info/global_step": 7218, "train_info/time_within_train_step": 2.7558982372283936, "step": 7218} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 7218} {"info/global_step": 7219, "train_info/time_within_train_step": 2.7563462257385254, "step": 7219} {"train_info/time_between_train_steps": 0.003307342529296875, "step": 7219} {"info/global_step": 7220, "train_info/time_within_train_step": 2.7576711177825928, "step": 7220} {"train_info/time_between_train_steps": 0.003387451171875, "step": 7220} {"info/global_step": 7221, "train_info/time_within_train_step": 2.7578814029693604, "step": 7221} {"train_info/time_between_train_steps": 0.0065364837646484375, "step": 7221} {"info/global_step": 7222, "train_info/time_within_train_step": 2.7564167976379395, "step": 7222} {"train_info/time_between_train_steps": 0.0031919479370117188, "step": 7222} {"info/global_step": 7223, "train_info/time_within_train_step": 2.7565829753875732, "step": 7223} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 7223} {"info/global_step": 7224, "train_info/time_within_train_step": 2.757415533065796, "step": 7224} {"train_info/time_between_train_steps": 0.0032722949981689453, "step": 7224} {"info/global_step": 7225, "train_info/time_within_train_step": 2.756585121154785, "step": 7225} {"train_info/time_between_train_steps": 0.003155231475830078, "step": 7225} {"info/global_step": 7226, "train_info/time_within_train_step": 2.755398750305176, "step": 7226} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 7226} {"info/global_step": 7227, "train_info/time_within_train_step": 2.7569515705108643, "step": 7227} {"train_info/time_between_train_steps": 0.003162384033203125, "step": 7227} {"info/global_step": 7228, "train_info/time_within_train_step": 2.7574856281280518, "step": 7228} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 7228} {"info/global_step": 7229, "train_info/time_within_train_step": 2.7571709156036377, "step": 7229} {"train_info/time_between_train_steps": 0.006598234176635742, "step": 7229} {"info/global_step": 7230, "train_info/time_within_train_step": 2.753833293914795, "step": 7230} {"train_info/time_between_train_steps": 0.003141164779663086, "step": 7230} {"info/global_step": 7231, "train_info/time_within_train_step": 2.755129337310791, "step": 7231} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 7231} {"info/global_step": 7232, "train_info/time_within_train_step": 2.7566263675689697, "step": 7232} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 7232} {"info/global_step": 7233, "train_info/time_within_train_step": 2.7563552856445312, "step": 7233} {"train_info/time_between_train_steps": 0.003146648406982422, "step": 7233} {"info/global_step": 7234, "train_info/time_within_train_step": 2.755831480026245, "step": 7234} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 7234} {"info/global_step": 7235, "train_info/time_within_train_step": 2.7553772926330566, "step": 7235} {"train_info/time_between_train_steps": 0.0033326148986816406, "step": 7235} {"info/global_step": 7236, "train_info/time_within_train_step": 2.75506329536438, "step": 7236} {"train_info/time_between_train_steps": 0.0031676292419433594, "step": 7236} {"info/global_step": 7237, "train_info/time_within_train_step": 2.755949020385742, "step": 7237} {"train_info/time_between_train_steps": 0.003267049789428711, "step": 7237} {"info/global_step": 7238, "train_info/time_within_train_step": 2.756510019302368, "step": 7238} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 7238} {"info/global_step": 7239, "train_info/time_within_train_step": 2.756394386291504, "step": 7239} {"train_info/time_between_train_steps": 0.003159046173095703, "step": 7239} {"info/global_step": 7240, "train_info/time_within_train_step": 2.756078004837036, "step": 7240} {"train_info/time_between_train_steps": 0.0032253265380859375, "step": 7240} {"info/global_step": 7241, "train_info/time_within_train_step": 2.756847381591797, "step": 7241} {"train_info/time_between_train_steps": 0.0034148693084716797, "step": 7241} {"info/global_step": 7242, "train_info/time_within_train_step": 2.7579565048217773, "step": 7242} {"train_info/time_between_train_steps": 0.0034699440002441406, "step": 7242} {"info/global_step": 7243, "train_info/time_within_train_step": 2.7581229209899902, "step": 7243} {"train_info/time_between_train_steps": 0.0034613609313964844, "step": 7243} {"info/global_step": 7244, "train_info/time_within_train_step": 2.757605791091919, "step": 7244} {"train_info/time_between_train_steps": 0.003529071807861328, "step": 7244} {"info/global_step": 7245, "train_info/time_within_train_step": 2.7573659420013428, "step": 7245} {"train_info/time_between_train_steps": 0.0035407543182373047, "step": 7245} {"info/global_step": 7246, "train_info/time_within_train_step": 3.3380937576293945, "step": 7246} {"train_info/time_between_train_steps": 0.0035228729248046875, "step": 7246} {"info/global_step": 7247, "train_info/time_within_train_step": 2.7567148208618164, "step": 7247} {"train_info/time_between_train_steps": 0.003481149673461914, "step": 7247} {"info/global_step": 7248, "train_info/time_within_train_step": 2.756918430328369, "step": 7248} {"train_info/time_between_train_steps": 0.0035185813903808594, "step": 7248} {"info/global_step": 7249, "train_info/time_within_train_step": 2.757734537124634, "step": 7249} {"train_info/time_between_train_steps": 0.0034449100494384766, "step": 7249} {"info/global_step": 7250, "train_info/time_within_train_step": 2.757540702819824, "step": 7250} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746586967, "_runtime": 20976}, "step": 7250} {"logs": {"train/loss": 3.2319, "train/learning_rate": 0.00018333333333333334, "train/epoch": 8.04, "_timestamp": 1746586967, "_runtime": 20976}, "step": 7250} {"train_info/time_between_train_steps": 0.014569759368896484, "step": 7250} {"info/global_step": 7251, "train_info/time_within_train_step": 2.7567946910858154, "step": 7251} {"train_info/time_between_train_steps": 0.006557464599609375, "step": 7251} {"info/global_step": 7252, "train_info/time_within_train_step": 2.757016181945801, "step": 7252} {"train_info/time_between_train_steps": 0.006619930267333984, "step": 7252} {"info/global_step": 7253, "train_info/time_within_train_step": 2.7589643001556396, "step": 7253} {"train_info/time_between_train_steps": 0.006688356399536133, "step": 7253} {"info/global_step": 7254, "train_info/time_within_train_step": 2.759953737258911, "step": 7254} {"train_info/time_between_train_steps": 0.006712198257446289, "step": 7254} {"info/global_step": 7255, "train_info/time_within_train_step": 2.759124517440796, "step": 7255} {"train_info/time_between_train_steps": 0.00669097900390625, "step": 7255} {"info/global_step": 7256, "train_info/time_within_train_step": 2.7586400508880615, "step": 7256} {"train_info/time_between_train_steps": 0.006783246994018555, "step": 7256} {"info/global_step": 7257, "train_info/time_within_train_step": 2.7584524154663086, "step": 7257} {"train_info/time_between_train_steps": 0.006688356399536133, "step": 7257} {"info/global_step": 7258, "train_info/time_within_train_step": 2.7601277828216553, "step": 7258} {"train_info/time_between_train_steps": 0.006589174270629883, "step": 7258} {"info/global_step": 7259, "train_info/time_within_train_step": 2.7577126026153564, "step": 7259} {"train_info/time_between_train_steps": 0.006643533706665039, "step": 7259} {"info/global_step": 7260, "train_info/time_within_train_step": 2.7592215538024902, "step": 7260} {"train_info/time_between_train_steps": 0.006728172302246094, "step": 7260} {"info/global_step": 7261, "train_info/time_within_train_step": 2.7583518028259277, "step": 7261} {"train_info/time_between_train_steps": 0.006600618362426758, "step": 7261} {"info/global_step": 7262, "train_info/time_within_train_step": 2.896998643875122, "step": 7262} {"train_info/time_between_train_steps": 0.006700754165649414, "step": 7262} {"info/global_step": 7263, "train_info/time_within_train_step": 2.7568881511688232, "step": 7263} {"train_info/time_between_train_steps": 0.006493806838989258, "step": 7263} {"info/global_step": 7264, "train_info/time_within_train_step": 2.7588071823120117, "step": 7264} {"train_info/time_between_train_steps": 0.006634712219238281, "step": 7264} {"info/global_step": 7265, "train_info/time_within_train_step": 2.759683847427368, "step": 7265} {"train_info/time_between_train_steps": 0.00720524787902832, "step": 7265} {"info/global_step": 7266, "train_info/time_within_train_step": 2.757869243621826, "step": 7266} {"train_info/time_between_train_steps": 0.0065310001373291016, "step": 7266} {"info/global_step": 7267, "train_info/time_within_train_step": 2.7577130794525146, "step": 7267} {"train_info/time_between_train_steps": 0.00657343864440918, "step": 7267} {"info/global_step": 7268, "train_info/time_within_train_step": 2.756620407104492, "step": 7268} {"train_info/time_between_train_steps": 0.00764775276184082, "step": 7268} {"info/global_step": 7269, "train_info/time_within_train_step": 2.759456157684326, "step": 7269} {"train_info/time_between_train_steps": 0.006659746170043945, "step": 7269} {"info/global_step": 7270, "train_info/time_within_train_step": 2.7601585388183594, "step": 7270} {"train_info/time_between_train_steps": 0.006665945053100586, "step": 7270} {"info/global_step": 7271, "train_info/time_within_train_step": 2.756319999694824, "step": 7271} {"train_info/time_between_train_steps": 0.006672382354736328, "step": 7271} {"info/global_step": 7272, "train_info/time_within_train_step": 2.760375499725342, "step": 7272} {"train_info/time_between_train_steps": 0.006628751754760742, "step": 7272} {"info/global_step": 7273, "train_info/time_within_train_step": 2.757556200027466, "step": 7273} {"train_info/time_between_train_steps": 0.006754636764526367, "step": 7273} {"info/global_step": 7274, "train_info/time_within_train_step": 2.759328603744507, "step": 7274} {"train_info/time_between_train_steps": 0.0066471099853515625, "step": 7274} {"info/global_step": 7275, "train_info/time_within_train_step": 2.758293390274048, "step": 7275} {"train_info/time_between_train_steps": 0.006670475006103516, "step": 7275} {"info/global_step": 7276, "train_info/time_within_train_step": 2.756965398788452, "step": 7276} {"train_info/time_between_train_steps": 0.006638765335083008, "step": 7276} {"info/global_step": 7277, "train_info/time_within_train_step": 2.758078098297119, "step": 7277} {"train_info/time_between_train_steps": 0.0066602230072021484, "step": 7277} {"info/global_step": 7278, "train_info/time_within_train_step": 2.7578771114349365, "step": 7278} {"train_info/time_between_train_steps": 0.006583690643310547, "step": 7278} {"info/global_step": 7279, "train_info/time_within_train_step": 2.757324457168579, "step": 7279} {"train_info/time_between_train_steps": 0.006764888763427734, "step": 7279} {"info/global_step": 7280, "train_info/time_within_train_step": 2.7582383155822754, "step": 7280} {"train_info/time_between_train_steps": 0.006607770919799805, "step": 7280} {"info/global_step": 7281, "train_info/time_within_train_step": 2.757068157196045, "step": 7281} {"train_info/time_between_train_steps": 0.006639003753662109, "step": 7281} {"info/global_step": 7282, "train_info/time_within_train_step": 2.758488893508911, "step": 7282} {"train_info/time_between_train_steps": 0.006775379180908203, "step": 7282} {"info/global_step": 7283, "train_info/time_within_train_step": 2.7579994201660156, "step": 7283} {"train_info/time_between_train_steps": 0.0034193992614746094, "step": 7283} {"info/global_step": 7284, "train_info/time_within_train_step": 2.7546675205230713, "step": 7284} {"train_info/time_between_train_steps": 0.0032782554626464844, "step": 7284} {"info/global_step": 7285, "train_info/time_within_train_step": 2.755312442779541, "step": 7285} {"train_info/time_between_train_steps": 0.0032613277435302734, "step": 7285} {"info/global_step": 7286, "train_info/time_within_train_step": 2.756138801574707, "step": 7286} {"train_info/time_between_train_steps": 0.0032417774200439453, "step": 7286} {"info/global_step": 7287, "train_info/time_within_train_step": 2.755178451538086, "step": 7287} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 7287} {"info/global_step": 7288, "train_info/time_within_train_step": 2.7556233406066895, "step": 7288} {"train_info/time_between_train_steps": 0.00341033935546875, "step": 7288} {"info/global_step": 7289, "train_info/time_within_train_step": 2.7552075386047363, "step": 7289} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 7289} {"info/global_step": 7290, "train_info/time_within_train_step": 2.755117416381836, "step": 7290} {"train_info/time_between_train_steps": 0.0031702518463134766, "step": 7290} {"info/global_step": 7291, "train_info/time_within_train_step": 2.755129098892212, "step": 7291} {"train_info/time_between_train_steps": 0.0032358169555664062, "step": 7291} {"info/global_step": 7292, "train_info/time_within_train_step": 2.756294012069702, "step": 7292} {"train_info/time_between_train_steps": 0.0033693313598632812, "step": 7292} {"info/global_step": 7293, "train_info/time_within_train_step": 2.7568302154541016, "step": 7293} {"train_info/time_between_train_steps": 0.003451108932495117, "step": 7293} {"info/global_step": 7294, "train_info/time_within_train_step": 2.7583577632904053, "step": 7294} {"train_info/time_between_train_steps": 0.003409147262573242, "step": 7294} {"info/global_step": 7295, "train_info/time_within_train_step": 2.7568726539611816, "step": 7295} {"train_info/time_between_train_steps": 0.003383159637451172, "step": 7295} {"info/global_step": 7296, "train_info/time_within_train_step": 2.7572834491729736, "step": 7296} {"train_info/time_between_train_steps": 0.003339529037475586, "step": 7296} {"info/global_step": 7297, "train_info/time_within_train_step": 2.7553629875183105, "step": 7297} {"train_info/time_between_train_steps": 0.0033664703369140625, "step": 7297} {"info/global_step": 7298, "train_info/time_within_train_step": 2.7564890384674072, "step": 7298} {"train_info/time_between_train_steps": 0.0034630298614501953, "step": 7298} {"info/global_step": 7299, "train_info/time_within_train_step": 2.7572920322418213, "step": 7299} {"train_info/time_between_train_steps": 0.0033500194549560547, "step": 7299} {"info/global_step": 7300, "train_info/time_within_train_step": 2.7557876110076904, "step": 7300} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746587105, "_runtime": 21114}, "step": 7300} {"logs": {"train/loss": 3.2196, "train/learning_rate": 0.00017999999999999998, "train/epoch": 8.05, "_timestamp": 1746587105, "_runtime": 21114}, "step": 7300} {"train_info/time_between_train_steps": 0.006615877151489258, "step": 7300} {"info/global_step": 7301, "train_info/time_within_train_step": 2.7561357021331787, "step": 7301} {"train_info/time_between_train_steps": 0.003293752670288086, "step": 7301} {"info/global_step": 7302, "train_info/time_within_train_step": 2.7568697929382324, "step": 7302} {"train_info/time_between_train_steps": 0.003331899642944336, "step": 7302} {"info/global_step": 7303, "train_info/time_within_train_step": 2.756679058074951, "step": 7303} {"train_info/time_between_train_steps": 0.003334522247314453, "step": 7303} {"info/global_step": 7304, "train_info/time_within_train_step": 3.0129029750823975, "step": 7304} {"train_info/time_between_train_steps": 0.003358125686645508, "step": 7304} {"info/global_step": 7305, "train_info/time_within_train_step": 2.758127450942993, "step": 7305} {"train_info/time_between_train_steps": 0.0033805370330810547, "step": 7305} {"info/global_step": 7306, "train_info/time_within_train_step": 2.7568275928497314, "step": 7306} {"train_info/time_between_train_steps": 0.0033371448516845703, "step": 7306} {"info/global_step": 7307, "train_info/time_within_train_step": 2.7568063735961914, "step": 7307} {"train_info/time_between_train_steps": 0.003282308578491211, "step": 7307} {"info/global_step": 7308, "train_info/time_within_train_step": 2.7552590370178223, "step": 7308} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 7308} {"info/global_step": 7309, "train_info/time_within_train_step": 2.7539188861846924, "step": 7309} {"train_info/time_between_train_steps": 0.0031516551971435547, "step": 7309} {"info/global_step": 7310, "train_info/time_within_train_step": 2.7556490898132324, "step": 7310} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 7310} {"info/global_step": 7311, "train_info/time_within_train_step": 2.7540128231048584, "step": 7311} {"train_info/time_between_train_steps": 0.003150463104248047, "step": 7311} {"info/global_step": 7312, "train_info/time_within_train_step": 2.7555482387542725, "step": 7312} {"train_info/time_between_train_steps": 0.0031456947326660156, "step": 7312} {"info/global_step": 7313, "train_info/time_within_train_step": 2.7552709579467773, "step": 7313} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 7313} {"info/global_step": 7314, "train_info/time_within_train_step": 2.753904342651367, "step": 7314} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 7314} {"info/global_step": 7315, "train_info/time_within_train_step": 2.7555882930755615, "step": 7315} {"train_info/time_between_train_steps": 0.003160238265991211, "step": 7315} {"info/global_step": 7316, "train_info/time_within_train_step": 2.7554285526275635, "step": 7316} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 7316} {"info/global_step": 7317, "train_info/time_within_train_step": 2.753749132156372, "step": 7317} {"train_info/time_between_train_steps": 0.0031862258911132812, "step": 7317} {"info/global_step": 7318, "train_info/time_within_train_step": 2.754148244857788, "step": 7318} {"train_info/time_between_train_steps": 0.0031347274780273438, "step": 7318} {"info/global_step": 7319, "train_info/time_within_train_step": 2.7545366287231445, "step": 7319} {"train_info/time_between_train_steps": 0.0031321048736572266, "step": 7319} {"info/global_step": 7320, "train_info/time_within_train_step": 2.754056692123413, "step": 7320} {"train_info/time_between_train_steps": 0.003151416778564453, "step": 7320} {"info/global_step": 7321, "train_info/time_within_train_step": 2.7540602684020996, "step": 7321} {"train_info/time_between_train_steps": 0.0031270980834960938, "step": 7321} {"info/global_step": 7322, "train_info/time_within_train_step": 2.7549405097961426, "step": 7322} {"train_info/time_between_train_steps": 0.0031194686889648438, "step": 7322} {"info/global_step": 7323, "train_info/time_within_train_step": 2.7558441162109375, "step": 7323} {"train_info/time_between_train_steps": 0.0031058788299560547, "step": 7323} {"info/global_step": 7324, "train_info/time_within_train_step": 2.753530502319336, "step": 7324} {"train_info/time_between_train_steps": 0.09118366241455078, "step": 7324} {"info/global_step": 7325, "train_info/time_within_train_step": 2.7563416957855225, "step": 7325} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 7325} {"info/global_step": 7326, "train_info/time_within_train_step": 2.7549116611480713, "step": 7326} {"train_info/time_between_train_steps": 0.0032052993774414062, "step": 7326} {"info/global_step": 7327, "train_info/time_within_train_step": 2.7547385692596436, "step": 7327} {"train_info/time_between_train_steps": 0.0031309127807617188, "step": 7327} {"info/global_step": 7328, "train_info/time_within_train_step": 2.7560207843780518, "step": 7328} {"train_info/time_between_train_steps": 0.003208160400390625, "step": 7328} {"info/global_step": 7329, "train_info/time_within_train_step": 2.7545080184936523, "step": 7329} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 7329} {"info/global_step": 7330, "train_info/time_within_train_step": 2.755021095275879, "step": 7330} {"train_info/time_between_train_steps": 0.0031309127807617188, "step": 7330} {"info/global_step": 7331, "train_info/time_within_train_step": 2.7553250789642334, "step": 7331} {"train_info/time_between_train_steps": 0.0031385421752929688, "step": 7331} {"info/global_step": 7332, "train_info/time_within_train_step": 2.7547988891601562, "step": 7332} {"train_info/time_between_train_steps": 0.003155946731567383, "step": 7332} {"info/global_step": 7333, "train_info/time_within_train_step": 2.755629301071167, "step": 7333} {"train_info/time_between_train_steps": 0.0031270980834960938, "step": 7333} {"info/global_step": 7334, "train_info/time_within_train_step": 2.7534642219543457, "step": 7334} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 7334} {"info/global_step": 7335, "train_info/time_within_train_step": 2.755552053451538, "step": 7335} {"train_info/time_between_train_steps": 0.0031697750091552734, "step": 7335} {"info/global_step": 7336, "train_info/time_within_train_step": 2.7539725303649902, "step": 7336} {"train_info/time_between_train_steps": 0.003155231475830078, "step": 7336} {"info/global_step": 7337, "train_info/time_within_train_step": 2.755535125732422, "step": 7337} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 7337} {"info/global_step": 7338, "train_info/time_within_train_step": 2.7545764446258545, "step": 7338} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 7338} {"info/global_step": 7339, "train_info/time_within_train_step": 2.75504207611084, "step": 7339} {"train_info/time_between_train_steps": 0.0031845569610595703, "step": 7339} {"info/global_step": 7340, "train_info/time_within_train_step": 2.754624843597412, "step": 7340} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 7340} {"info/global_step": 7341, "train_info/time_within_train_step": 2.7544021606445312, "step": 7341} {"train_info/time_between_train_steps": 0.003160238265991211, "step": 7341} {"info/global_step": 7342, "train_info/time_within_train_step": 2.7546863555908203, "step": 7342} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 7342} {"info/global_step": 7343, "train_info/time_within_train_step": 2.7546334266662598, "step": 7343} {"train_info/time_between_train_steps": 0.0031354427337646484, "step": 7343} {"info/global_step": 7344, "train_info/time_within_train_step": 2.7552506923675537, "step": 7344} {"train_info/time_between_train_steps": 0.003107786178588867, "step": 7344} {"info/global_step": 7345, "train_info/time_within_train_step": 2.7553489208221436, "step": 7345} {"train_info/time_between_train_steps": 0.003128528594970703, "step": 7345} {"info/global_step": 7346, "train_info/time_within_train_step": 2.756040573120117, "step": 7346} {"train_info/time_between_train_steps": 0.0031423568725585938, "step": 7346} {"info/global_step": 7347, "train_info/time_within_train_step": 2.754317283630371, "step": 7347} {"train_info/time_between_train_steps": 0.0031309127807617188, "step": 7347} {"info/global_step": 7348, "train_info/time_within_train_step": 2.754626750946045, "step": 7348} {"train_info/time_between_train_steps": 0.003318309783935547, "step": 7348} {"info/global_step": 7349, "train_info/time_within_train_step": 2.7552945613861084, "step": 7349} {"train_info/time_between_train_steps": 0.0031294822692871094, "step": 7349} {"info/global_step": 7350, "train_info/time_within_train_step": 2.7544336318969727, "step": 7350} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746587244, "_runtime": 21253}, "step": 7350} {"logs": {"train/loss": 3.2103, "train/learning_rate": 0.00017666666666666666, "train/epoch": 8.05, "_timestamp": 1746587244, "_runtime": 21253}, "step": 7350} {"train_info/time_between_train_steps": 0.0068018436431884766, "step": 7350} {"info/global_step": 7351, "train_info/time_within_train_step": 2.755139112472534, "step": 7351} {"train_info/time_between_train_steps": 0.003153085708618164, "step": 7351} {"info/global_step": 7352, "train_info/time_within_train_step": 2.7556190490722656, "step": 7352} {"train_info/time_between_train_steps": 0.0031299591064453125, "step": 7352} {"info/global_step": 7353, "train_info/time_within_train_step": 2.7511818408966064, "step": 7353} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 7353} {"info/global_step": 7354, "train_info/time_within_train_step": 2.7553725242614746, "step": 7354} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 7354} {"info/global_step": 7355, "train_info/time_within_train_step": 2.7546699047088623, "step": 7355} {"train_info/time_between_train_steps": 0.003135204315185547, "step": 7355} {"info/global_step": 7356, "train_info/time_within_train_step": 2.754422664642334, "step": 7356} {"train_info/time_between_train_steps": 0.003119230270385742, "step": 7356} {"info/global_step": 7357, "train_info/time_within_train_step": 2.754584312438965, "step": 7357} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 7357} {"info/global_step": 7358, "train_info/time_within_train_step": 2.754692792892456, "step": 7358} {"train_info/time_between_train_steps": 0.003159761428833008, "step": 7358} {"info/global_step": 7359, "train_info/time_within_train_step": 2.7548158168792725, "step": 7359} {"train_info/time_between_train_steps": 0.003199338912963867, "step": 7359} {"info/global_step": 7360, "train_info/time_within_train_step": 2.991997480392456, "step": 7360} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 7360} {"info/global_step": 7361, "train_info/time_within_train_step": 2.7554023265838623, "step": 7361} {"train_info/time_between_train_steps": 0.003151416778564453, "step": 7361} {"info/global_step": 7362, "train_info/time_within_train_step": 2.754784345626831, "step": 7362} {"train_info/time_between_train_steps": 0.0031690597534179688, "step": 7362} {"info/global_step": 7363, "train_info/time_within_train_step": 2.755279302597046, "step": 7363} {"train_info/time_between_train_steps": 0.003200054168701172, "step": 7363} {"info/global_step": 7364, "train_info/time_within_train_step": 2.7549736499786377, "step": 7364} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 7364} {"info/global_step": 7365, "train_info/time_within_train_step": 2.7571046352386475, "step": 7365} {"train_info/time_between_train_steps": 0.018119335174560547, "step": 7365} {"info/global_step": 7366, "train_info/time_within_train_step": 2.7550718784332275, "step": 7366} {"train_info/time_between_train_steps": 0.0029342174530029297, "step": 7366} {"info/global_step": 7367, "train_info/time_within_train_step": 2.7555184364318848, "step": 7367} {"train_info/time_between_train_steps": 0.002873659133911133, "step": 7367} {"info/global_step": 7368, "train_info/time_within_train_step": 2.754042387008667, "step": 7368} {"train_info/time_between_train_steps": 0.0028803348541259766, "step": 7368} {"info/global_step": 7369, "train_info/time_within_train_step": 2.753203868865967, "step": 7369} {"train_info/time_between_train_steps": 0.002826213836669922, "step": 7369} {"info/global_step": 7370, "train_info/time_within_train_step": 2.751434803009033, "step": 7370} {"train_info/time_between_train_steps": 0.00287628173828125, "step": 7370} {"info/global_step": 7371, "train_info/time_within_train_step": 2.753272533416748, "step": 7371} {"train_info/time_between_train_steps": 0.0028629302978515625, "step": 7371} {"info/global_step": 7372, "train_info/time_within_train_step": 2.7531824111938477, "step": 7372} {"train_info/time_between_train_steps": 0.002904176712036133, "step": 7372} {"info/global_step": 7373, "train_info/time_within_train_step": 2.754666566848755, "step": 7373} {"train_info/time_between_train_steps": 0.002847909927368164, "step": 7373} {"info/global_step": 7374, "train_info/time_within_train_step": 2.7528798580169678, "step": 7374} {"train_info/time_between_train_steps": 0.0028717517852783203, "step": 7374} {"info/global_step": 7375, "train_info/time_within_train_step": 2.7523117065429688, "step": 7375} {"train_info/time_between_train_steps": 0.0028569698333740234, "step": 7375} {"info/global_step": 7376, "train_info/time_within_train_step": 2.7526328563690186, "step": 7376} {"train_info/time_between_train_steps": 0.0028676986694335938, "step": 7376} {"info/global_step": 7377, "train_info/time_within_train_step": 2.7525687217712402, "step": 7377} {"train_info/time_between_train_steps": 0.0028696060180664062, "step": 7377} {"info/global_step": 7378, "train_info/time_within_train_step": 2.753659725189209, "step": 7378} {"train_info/time_between_train_steps": 0.0028836727142333984, "step": 7378} {"info/global_step": 7379, "train_info/time_within_train_step": 2.7533557415008545, "step": 7379} {"train_info/time_between_train_steps": 0.0028634071350097656, "step": 7379} {"info/global_step": 7380, "train_info/time_within_train_step": 2.752807378768921, "step": 7380} {"train_info/time_between_train_steps": 0.0028786659240722656, "step": 7380} {"info/global_step": 7381, "train_info/time_within_train_step": 2.754544258117676, "step": 7381} {"train_info/time_between_train_steps": 0.002914905548095703, "step": 7381} {"info/global_step": 7382, "train_info/time_within_train_step": 2.7539315223693848, "step": 7382} {"train_info/time_between_train_steps": 0.0028731822967529297, "step": 7382} {"info/global_step": 7383, "train_info/time_within_train_step": 2.7539141178131104, "step": 7383} {"train_info/time_between_train_steps": 0.0029380321502685547, "step": 7383} {"info/global_step": 7384, "train_info/time_within_train_step": 2.7543890476226807, "step": 7384} {"train_info/time_between_train_steps": 0.002869844436645508, "step": 7384} {"info/global_step": 7385, "train_info/time_within_train_step": 2.754450798034668, "step": 7385} {"train_info/time_between_train_steps": 0.002850055694580078, "step": 7385} {"info/global_step": 7386, "train_info/time_within_train_step": 2.753373861312866, "step": 7386} {"train_info/time_between_train_steps": 0.0028672218322753906, "step": 7386} {"info/global_step": 7387, "train_info/time_within_train_step": 2.7543811798095703, "step": 7387} {"train_info/time_between_train_steps": 0.002875089645385742, "step": 7387} {"info/global_step": 7388, "train_info/time_within_train_step": 2.754417896270752, "step": 7388} {"train_info/time_between_train_steps": 0.0028913021087646484, "step": 7388} {"info/global_step": 7389, "train_info/time_within_train_step": 2.754086971282959, "step": 7389} {"train_info/time_between_train_steps": 0.0028650760650634766, "step": 7389} {"info/global_step": 7390, "train_info/time_within_train_step": 2.752817392349243, "step": 7390} {"train_info/time_between_train_steps": 0.0028769969940185547, "step": 7390} {"info/global_step": 7391, "train_info/time_within_train_step": 2.7544174194335938, "step": 7391} {"train_info/time_between_train_steps": 0.002843618392944336, "step": 7391} {"info/global_step": 7392, "train_info/time_within_train_step": 2.7538633346557617, "step": 7392} {"train_info/time_between_train_steps": 0.002930164337158203, "step": 7392} {"info/global_step": 7393, "train_info/time_within_train_step": 2.7543580532073975, "step": 7393} {"train_info/time_between_train_steps": 0.0028409957885742188, "step": 7393} {"info/global_step": 7394, "train_info/time_within_train_step": 2.7541935443878174, "step": 7394} {"train_info/time_between_train_steps": 0.0029175281524658203, "step": 7394} {"info/global_step": 7395, "train_info/time_within_train_step": 2.7533421516418457, "step": 7395} {"train_info/time_between_train_steps": 0.002871990203857422, "step": 7395} {"info/global_step": 7396, "train_info/time_within_train_step": 2.7542636394500732, "step": 7396} {"train_info/time_between_train_steps": 0.0028998851776123047, "step": 7396} {"info/global_step": 7397, "train_info/time_within_train_step": 2.7550926208496094, "step": 7397} {"train_info/time_between_train_steps": 0.002847433090209961, "step": 7397} {"info/global_step": 7398, "train_info/time_within_train_step": 2.7556676864624023, "step": 7398} {"train_info/time_between_train_steps": 0.002859354019165039, "step": 7398} {"info/global_step": 7399, "train_info/time_within_train_step": 2.7553462982177734, "step": 7399} {"train_info/time_between_train_steps": 0.002840757369995117, "step": 7399} {"info/global_step": 7400, "train_info/time_within_train_step": 2.755345106124878, "step": 7400} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746587382, "_runtime": 21391}, "step": 7400} {"logs": {"train/loss": 3.2103, "train/learning_rate": 0.0001733333333333333, "train/epoch": 8.06, "_timestamp": 1746587382, "_runtime": 21391}, "step": 7400} {"train_info/time_between_train_steps": 13.474567651748657, "step": 7400} {"info/global_step": 7401, "train_info/time_within_train_step": 2.5285627841949463, "step": 7401} {"train_info/time_between_train_steps": 0.0029654502868652344, "step": 7401} {"info/global_step": 7402, "train_info/time_within_train_step": 2.5801939964294434, "step": 7402} {"train_info/time_between_train_steps": 0.00299072265625, "step": 7402} {"info/global_step": 7403, "train_info/time_within_train_step": 2.911611795425415, "step": 7403} {"train_info/time_between_train_steps": 0.003057241439819336, "step": 7403} {"info/global_step": 7404, "train_info/time_within_train_step": 2.732314348220825, "step": 7404} {"train_info/time_between_train_steps": 0.0029723644256591797, "step": 7404} {"info/global_step": 7405, "train_info/time_within_train_step": 2.7521872520446777, "step": 7405} {"train_info/time_between_train_steps": 0.002852201461791992, "step": 7405} {"info/global_step": 7406, "train_info/time_within_train_step": 2.7544467449188232, "step": 7406} {"train_info/time_between_train_steps": 0.0028426647186279297, "step": 7406} {"info/global_step": 7407, "train_info/time_within_train_step": 2.7542059421539307, "step": 7407} {"train_info/time_between_train_steps": 0.002902984619140625, "step": 7407} {"info/global_step": 7408, "train_info/time_within_train_step": 2.7550251483917236, "step": 7408} {"train_info/time_between_train_steps": 0.0028600692749023438, "step": 7408} {"info/global_step": 7409, "train_info/time_within_train_step": 2.754721164703369, "step": 7409} {"train_info/time_between_train_steps": 0.0028645992279052734, "step": 7409} {"info/global_step": 7410, "train_info/time_within_train_step": 2.7529635429382324, "step": 7410} {"train_info/time_between_train_steps": 0.0028731822967529297, "step": 7410} {"info/global_step": 7411, "train_info/time_within_train_step": 2.7545342445373535, "step": 7411} {"train_info/time_between_train_steps": 0.0028793811798095703, "step": 7411} {"info/global_step": 7412, "train_info/time_within_train_step": 2.755326509475708, "step": 7412} {"train_info/time_between_train_steps": 0.0028536319732666016, "step": 7412} {"info/global_step": 7413, "train_info/time_within_train_step": 2.7545270919799805, "step": 7413} {"train_info/time_between_train_steps": 0.002887725830078125, "step": 7413} {"info/global_step": 7414, "train_info/time_within_train_step": 2.7551231384277344, "step": 7414} {"train_info/time_between_train_steps": 0.0028638839721679688, "step": 7414} {"info/global_step": 7415, "train_info/time_within_train_step": 2.7560503482818604, "step": 7415} {"train_info/time_between_train_steps": 0.0028617382049560547, "step": 7415} {"info/global_step": 7416, "train_info/time_within_train_step": 2.7557125091552734, "step": 7416} {"train_info/time_between_train_steps": 0.002863645553588867, "step": 7416} {"info/global_step": 7417, "train_info/time_within_train_step": 2.7560317516326904, "step": 7417} {"train_info/time_between_train_steps": 0.0028836727142333984, "step": 7417} {"info/global_step": 7418, "train_info/time_within_train_step": 2.755899429321289, "step": 7418} {"train_info/time_between_train_steps": 0.002847909927368164, "step": 7418} {"info/global_step": 7419, "train_info/time_within_train_step": 2.7557241916656494, "step": 7419} {"train_info/time_between_train_steps": 0.002858400344848633, "step": 7419} {"info/global_step": 7420, "train_info/time_within_train_step": 2.7559385299682617, "step": 7420} {"train_info/time_between_train_steps": 0.002874612808227539, "step": 7420} {"info/global_step": 7421, "train_info/time_within_train_step": 2.7547664642333984, "step": 7421} {"train_info/time_between_train_steps": 0.0028536319732666016, "step": 7421} {"info/global_step": 7422, "train_info/time_within_train_step": 2.7556188106536865, "step": 7422} {"train_info/time_between_train_steps": 0.0028743743896484375, "step": 7422} {"info/global_step": 7423, "train_info/time_within_train_step": 2.7559878826141357, "step": 7423} {"train_info/time_between_train_steps": 0.002872467041015625, "step": 7423} {"info/global_step": 7424, "train_info/time_within_train_step": 2.7557175159454346, "step": 7424} {"train_info/time_between_train_steps": 0.0028657913208007812, "step": 7424} {"info/global_step": 7425, "train_info/time_within_train_step": 2.7560455799102783, "step": 7425} {"train_info/time_between_train_steps": 0.0028748512268066406, "step": 7425} {"info/global_step": 7426, "train_info/time_within_train_step": 2.7556309700012207, "step": 7426} {"train_info/time_between_train_steps": 0.0029277801513671875, "step": 7426} {"info/global_step": 7427, "train_info/time_within_train_step": 2.7551467418670654, "step": 7427} {"train_info/time_between_train_steps": 0.0028655529022216797, "step": 7427} {"info/global_step": 7428, "train_info/time_within_train_step": 2.7555439472198486, "step": 7428} {"train_info/time_between_train_steps": 0.0029134750366210938, "step": 7428} {"info/global_step": 7429, "train_info/time_within_train_step": 2.7553634643554688, "step": 7429} {"train_info/time_between_train_steps": 0.0028603076934814453, "step": 7429} {"info/global_step": 7430, "train_info/time_within_train_step": 2.756782293319702, "step": 7430} {"train_info/time_between_train_steps": 0.002858400344848633, "step": 7430} {"info/global_step": 7431, "train_info/time_within_train_step": 2.7554469108581543, "step": 7431} {"train_info/time_between_train_steps": 0.0028727054595947266, "step": 7431} {"info/global_step": 7432, "train_info/time_within_train_step": 2.7553043365478516, "step": 7432} {"train_info/time_between_train_steps": 0.002861499786376953, "step": 7432} {"info/global_step": 7433, "train_info/time_within_train_step": 2.755389928817749, "step": 7433} {"train_info/time_between_train_steps": 0.002846956253051758, "step": 7433} {"info/global_step": 7434, "train_info/time_within_train_step": 2.755303144454956, "step": 7434} {"train_info/time_between_train_steps": 0.002958059310913086, "step": 7434} {"info/global_step": 7435, "train_info/time_within_train_step": 2.756483793258667, "step": 7435} {"train_info/time_between_train_steps": 0.002962350845336914, "step": 7435} {"info/global_step": 7436, "train_info/time_within_train_step": 2.75657320022583, "step": 7436} {"train_info/time_between_train_steps": 0.0029647350311279297, "step": 7436} {"info/global_step": 7437, "train_info/time_within_train_step": 2.756412982940674, "step": 7437} {"train_info/time_between_train_steps": 0.0029709339141845703, "step": 7437} {"info/global_step": 7438, "train_info/time_within_train_step": 2.7570905685424805, "step": 7438} {"train_info/time_between_train_steps": 0.0029401779174804688, "step": 7438} {"info/global_step": 7439, "train_info/time_within_train_step": 2.7571585178375244, "step": 7439} {"train_info/time_between_train_steps": 0.002982616424560547, "step": 7439} {"info/global_step": 7440, "train_info/time_within_train_step": 2.756513833999634, "step": 7440} {"train_info/time_between_train_steps": 0.0029754638671875, "step": 7440} {"info/global_step": 7441, "train_info/time_within_train_step": 2.7552976608276367, "step": 7441} {"train_info/time_between_train_steps": 0.0029485225677490234, "step": 7441} {"info/global_step": 7442, "train_info/time_within_train_step": 2.7563211917877197, "step": 7442} {"train_info/time_between_train_steps": 0.0029299259185791016, "step": 7442} {"info/global_step": 7443, "train_info/time_within_train_step": 2.7555580139160156, "step": 7443} {"train_info/time_between_train_steps": 0.002977609634399414, "step": 7443} {"info/global_step": 7444, "train_info/time_within_train_step": 2.7562363147735596, "step": 7444} {"train_info/time_between_train_steps": 0.002943277359008789, "step": 7444} {"info/global_step": 7445, "train_info/time_within_train_step": 2.756474733352661, "step": 7445} {"train_info/time_between_train_steps": 0.0029375553131103516, "step": 7445} {"info/global_step": 7446, "train_info/time_within_train_step": 2.7561731338500977, "step": 7446} {"train_info/time_between_train_steps": 0.002968311309814453, "step": 7446} {"info/global_step": 7447, "train_info/time_within_train_step": 2.756335973739624, "step": 7447} {"train_info/time_between_train_steps": 0.0029489994049072266, "step": 7447} {"info/global_step": 7448, "train_info/time_within_train_step": 2.7559797763824463, "step": 7448} {"train_info/time_between_train_steps": 0.0029926300048828125, "step": 7448} {"info/global_step": 7449, "train_info/time_within_train_step": 2.7560763359069824, "step": 7449} {"train_info/time_between_train_steps": 0.002981901168823242, "step": 7449} {"info/global_step": 7450, "train_info/time_within_train_step": 2.7562947273254395, "step": 7450} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746587533, "_runtime": 21542}, "step": 7450} {"logs": {"train/loss": 3.1996, "train/learning_rate": 0.00016999999999999999, "train/epoch": 8.06, "_timestamp": 1746587533, "_runtime": 21542}, "step": 7450} {"train_info/time_between_train_steps": 0.006303548812866211, "step": 7450} {"info/global_step": 7451, "train_info/time_within_train_step": 2.757174253463745, "step": 7451} {"train_info/time_between_train_steps": 0.002927541732788086, "step": 7451} {"info/global_step": 7452, "train_info/time_within_train_step": 2.7557601928710938, "step": 7452} {"train_info/time_between_train_steps": 0.00295257568359375, "step": 7452} {"info/global_step": 7453, "train_info/time_within_train_step": 2.7557435035705566, "step": 7453} {"train_info/time_between_train_steps": 0.0029861927032470703, "step": 7453} {"info/global_step": 7454, "train_info/time_within_train_step": 2.755603075027466, "step": 7454} {"train_info/time_between_train_steps": 0.002977609634399414, "step": 7454} {"info/global_step": 7455, "train_info/time_within_train_step": 2.756199598312378, "step": 7455} {"train_info/time_between_train_steps": 0.0029535293579101562, "step": 7455} {"info/global_step": 7456, "train_info/time_within_train_step": 2.7553319931030273, "step": 7456} {"train_info/time_between_train_steps": 0.0029687881469726562, "step": 7456} {"info/global_step": 7457, "train_info/time_within_train_step": 2.755337953567505, "step": 7457} {"train_info/time_between_train_steps": 0.002981901168823242, "step": 7457} {"info/global_step": 7458, "train_info/time_within_train_step": 2.755011558532715, "step": 7458} {"train_info/time_between_train_steps": 0.0029366016387939453, "step": 7458} {"info/global_step": 7459, "train_info/time_within_train_step": 2.7557225227355957, "step": 7459} {"train_info/time_between_train_steps": 0.002993345260620117, "step": 7459} {"info/global_step": 7460, "train_info/time_within_train_step": 2.755387306213379, "step": 7460} {"train_info/time_between_train_steps": 0.0029637813568115234, "step": 7460} {"info/global_step": 7461, "train_info/time_within_train_step": 2.7555460929870605, "step": 7461} {"train_info/time_between_train_steps": 0.0029935836791992188, "step": 7461} {"info/global_step": 7462, "train_info/time_within_train_step": 2.7546005249023438, "step": 7462} {"train_info/time_between_train_steps": 0.0028848648071289062, "step": 7462} {"info/global_step": 7463, "train_info/time_within_train_step": 2.754836320877075, "step": 7463} {"train_info/time_between_train_steps": 0.002877950668334961, "step": 7463} {"info/global_step": 7464, "train_info/time_within_train_step": 2.755124092102051, "step": 7464} {"train_info/time_between_train_steps": 0.0028197765350341797, "step": 7464} {"info/global_step": 7465, "train_info/time_within_train_step": 2.7544543743133545, "step": 7465} {"train_info/time_between_train_steps": 0.002869129180908203, "step": 7465} {"info/global_step": 7466, "train_info/time_within_train_step": 2.753976345062256, "step": 7466} {"train_info/time_between_train_steps": 0.0028657913208007812, "step": 7466} {"info/global_step": 7467, "train_info/time_within_train_step": 2.7548272609710693, "step": 7467} {"train_info/time_between_train_steps": 0.0028815269470214844, "step": 7467} {"info/global_step": 7468, "train_info/time_within_train_step": 2.7544617652893066, "step": 7468} {"train_info/time_between_train_steps": 0.0028533935546875, "step": 7468} {"info/global_step": 7469, "train_info/time_within_train_step": 2.7551746368408203, "step": 7469} {"train_info/time_between_train_steps": 0.0028672218322753906, "step": 7469} {"info/global_step": 7470, "train_info/time_within_train_step": 2.754112482070923, "step": 7470} {"train_info/time_between_train_steps": 0.002917051315307617, "step": 7470} {"info/global_step": 7471, "train_info/time_within_train_step": 2.754167079925537, "step": 7471} {"train_info/time_between_train_steps": 0.0028715133666992188, "step": 7471} {"info/global_step": 7472, "train_info/time_within_train_step": 2.7524406909942627, "step": 7472} {"train_info/time_between_train_steps": 0.0029370784759521484, "step": 7472} {"info/global_step": 7473, "train_info/time_within_train_step": 2.754220724105835, "step": 7473} {"train_info/time_between_train_steps": 0.0028831958770751953, "step": 7473} {"info/global_step": 7474, "train_info/time_within_train_step": 2.7541658878326416, "step": 7474} {"train_info/time_between_train_steps": 0.002854585647583008, "step": 7474} {"info/global_step": 7475, "train_info/time_within_train_step": 2.7547495365142822, "step": 7475} {"train_info/time_between_train_steps": 0.002871274948120117, "step": 7475} {"info/global_step": 7476, "train_info/time_within_train_step": 2.7545013427734375, "step": 7476} {"train_info/time_between_train_steps": 0.002847433090209961, "step": 7476} {"info/global_step": 7477, "train_info/time_within_train_step": 2.7531163692474365, "step": 7477} {"train_info/time_between_train_steps": 0.002836465835571289, "step": 7477} {"info/global_step": 7478, "train_info/time_within_train_step": 2.754995107650757, "step": 7478} {"train_info/time_between_train_steps": 0.0028700828552246094, "step": 7478} {"info/global_step": 7479, "train_info/time_within_train_step": 2.7542362213134766, "step": 7479} {"train_info/time_between_train_steps": 0.0028443336486816406, "step": 7479} {"info/global_step": 7480, "train_info/time_within_train_step": 2.7543632984161377, "step": 7480} {"train_info/time_between_train_steps": 0.00286865234375, "step": 7480} {"info/global_step": 7481, "train_info/time_within_train_step": 2.7551140785217285, "step": 7481} {"train_info/time_between_train_steps": 0.0029277801513671875, "step": 7481} {"info/global_step": 7482, "train_info/time_within_train_step": 2.755638837814331, "step": 7482} {"train_info/time_between_train_steps": 0.002875804901123047, "step": 7482} {"info/global_step": 7483, "train_info/time_within_train_step": 2.754326105117798, "step": 7483} {"train_info/time_between_train_steps": 0.0029358863830566406, "step": 7483} {"info/global_step": 7484, "train_info/time_within_train_step": 2.754011631011963, "step": 7484} {"train_info/time_between_train_steps": 0.002850055694580078, "step": 7484} {"info/global_step": 7485, "train_info/time_within_train_step": 2.7544665336608887, "step": 7485} {"train_info/time_between_train_steps": 0.0028464794158935547, "step": 7485} {"info/global_step": 7486, "train_info/time_within_train_step": 2.755115270614624, "step": 7486} {"train_info/time_between_train_steps": 0.002911090850830078, "step": 7486} {"info/global_step": 7487, "train_info/time_within_train_step": 2.7542366981506348, "step": 7487} {"train_info/time_between_train_steps": 0.002868175506591797, "step": 7487} {"info/global_step": 7488, "train_info/time_within_train_step": 2.753939151763916, "step": 7488} {"train_info/time_between_train_steps": 0.0028803348541259766, "step": 7488} {"info/global_step": 7489, "train_info/time_within_train_step": 2.754563093185425, "step": 7489} {"train_info/time_between_train_steps": 0.0028853416442871094, "step": 7489} {"info/global_step": 7490, "train_info/time_within_train_step": 2.753479480743408, "step": 7490} {"train_info/time_between_train_steps": 0.002870798110961914, "step": 7490} {"info/global_step": 7491, "train_info/time_within_train_step": 2.7541463375091553, "step": 7491} {"train_info/time_between_train_steps": 0.002863168716430664, "step": 7491} {"info/global_step": 7492, "train_info/time_within_train_step": 2.753870964050293, "step": 7492} {"train_info/time_between_train_steps": 0.002956867218017578, "step": 7492} {"info/global_step": 7493, "train_info/time_within_train_step": 2.7536611557006836, "step": 7493} {"train_info/time_between_train_steps": 0.002889394760131836, "step": 7493} {"info/global_step": 7494, "train_info/time_within_train_step": 2.7548980712890625, "step": 7494} {"train_info/time_between_train_steps": 0.002930164337158203, "step": 7494} {"info/global_step": 7495, "train_info/time_within_train_step": 2.7557172775268555, "step": 7495} {"train_info/time_between_train_steps": 0.00299835205078125, "step": 7495} {"info/global_step": 7496, "train_info/time_within_train_step": 3.356926679611206, "step": 7496} {"train_info/time_between_train_steps": 0.002986431121826172, "step": 7496} {"info/global_step": 7497, "train_info/time_within_train_step": 2.7548978328704834, "step": 7497} {"train_info/time_between_train_steps": 0.0029752254486083984, "step": 7497} {"info/global_step": 7498, "train_info/time_within_train_step": 2.755624532699585, "step": 7498} {"train_info/time_between_train_steps": 0.002994537353515625, "step": 7498} {"info/global_step": 7499, "train_info/time_within_train_step": 2.756326198577881, "step": 7499} {"train_info/time_between_train_steps": 0.0030024051666259766, "step": 7499} {"info/global_step": 7500, "train_info/time_within_train_step": 2.754664182662964, "step": 7500} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746587672, "_runtime": 21681}, "step": 7500} {"logs": {"train/loss": 3.1866, "train/learning_rate": 0.00016666666666666666, "train/epoch": 8.07, "_timestamp": 1746587672, "_runtime": 21681}, "step": 7500} {"train_info/time_between_train_steps": 0.006663322448730469, "step": 7500} {"info/global_step": 7501, "train_info/time_within_train_step": 2.7555627822875977, "step": 7501} {"train_info/time_between_train_steps": 0.0029268264770507812, "step": 7501} {"info/global_step": 7502, "train_info/time_within_train_step": 2.755030393600464, "step": 7502} {"train_info/time_between_train_steps": 0.002917051315307617, "step": 7502} {"info/global_step": 7503, "train_info/time_within_train_step": 2.75612735748291, "step": 7503} {"train_info/time_between_train_steps": 0.0030450820922851562, "step": 7503} {"info/global_step": 7504, "train_info/time_within_train_step": 2.755370616912842, "step": 7504} {"train_info/time_between_train_steps": 0.0029997825622558594, "step": 7504} {"info/global_step": 7505, "train_info/time_within_train_step": 2.7549502849578857, "step": 7505} {"train_info/time_between_train_steps": 0.0029344558715820312, "step": 7505} {"info/global_step": 7506, "train_info/time_within_train_step": 2.75528883934021, "step": 7506} {"train_info/time_between_train_steps": 0.003002166748046875, "step": 7506} {"info/global_step": 7507, "train_info/time_within_train_step": 2.7558743953704834, "step": 7507} {"train_info/time_between_train_steps": 0.00295257568359375, "step": 7507} {"info/global_step": 7508, "train_info/time_within_train_step": 2.756232261657715, "step": 7508} {"train_info/time_between_train_steps": 0.002971649169921875, "step": 7508} {"info/global_step": 7509, "train_info/time_within_train_step": 2.7545814514160156, "step": 7509} {"train_info/time_between_train_steps": 0.002964496612548828, "step": 7509} {"info/global_step": 7510, "train_info/time_within_train_step": 2.754793882369995, "step": 7510} {"train_info/time_between_train_steps": 0.0030062198638916016, "step": 7510} {"info/global_step": 7511, "train_info/time_within_train_step": 2.7559475898742676, "step": 7511} {"train_info/time_between_train_steps": 0.0030825138092041016, "step": 7511} {"info/global_step": 7512, "train_info/time_within_train_step": 2.7546005249023438, "step": 7512} {"train_info/time_between_train_steps": 0.0029904842376708984, "step": 7512} {"info/global_step": 7513, "train_info/time_within_train_step": 2.8905861377716064, "step": 7513} {"train_info/time_between_train_steps": 0.003057718276977539, "step": 7513} {"info/global_step": 7514, "train_info/time_within_train_step": 2.7551252841949463, "step": 7514} {"train_info/time_between_train_steps": 0.003027200698852539, "step": 7514} {"info/global_step": 7515, "train_info/time_within_train_step": 2.755775213241577, "step": 7515} {"train_info/time_between_train_steps": 0.0029671192169189453, "step": 7515} {"info/global_step": 7516, "train_info/time_within_train_step": 2.7541391849517822, "step": 7516} {"train_info/time_between_train_steps": 0.0029659271240234375, "step": 7516} {"info/global_step": 7517, "train_info/time_within_train_step": 2.754845380783081, "step": 7517} {"train_info/time_between_train_steps": 0.003490447998046875, "step": 7517} {"info/global_step": 7518, "train_info/time_within_train_step": 2.7551867961883545, "step": 7518} {"train_info/time_between_train_steps": 0.002959012985229492, "step": 7518} {"info/global_step": 7519, "train_info/time_within_train_step": 2.7551863193511963, "step": 7519} {"train_info/time_between_train_steps": 0.0028641223907470703, "step": 7519} {"info/global_step": 7520, "train_info/time_within_train_step": 2.753814220428467, "step": 7520} {"train_info/time_between_train_steps": 0.002859354019165039, "step": 7520} {"info/global_step": 7521, "train_info/time_within_train_step": 2.7531275749206543, "step": 7521} {"train_info/time_between_train_steps": 0.0028634071350097656, "step": 7521} {"info/global_step": 7522, "train_info/time_within_train_step": 2.7530949115753174, "step": 7522} {"train_info/time_between_train_steps": 0.0029861927032470703, "step": 7522} {"info/global_step": 7523, "train_info/time_within_train_step": 2.7534658908843994, "step": 7523} {"train_info/time_between_train_steps": 0.0028526782989501953, "step": 7523} {"info/global_step": 7524, "train_info/time_within_train_step": 2.7531819343566895, "step": 7524} {"train_info/time_between_train_steps": 0.0028777122497558594, "step": 7524} {"info/global_step": 7525, "train_info/time_within_train_step": 2.7528836727142334, "step": 7525} {"train_info/time_between_train_steps": 0.0028645992279052734, "step": 7525} {"info/global_step": 7526, "train_info/time_within_train_step": 2.754753351211548, "step": 7526} {"train_info/time_between_train_steps": 0.002889394760131836, "step": 7526} {"info/global_step": 7527, "train_info/time_within_train_step": 2.753046751022339, "step": 7527} {"train_info/time_between_train_steps": 0.002849102020263672, "step": 7527} {"info/global_step": 7528, "train_info/time_within_train_step": 2.7530481815338135, "step": 7528} {"train_info/time_between_train_steps": 0.0028760433197021484, "step": 7528} {"info/global_step": 7529, "train_info/time_within_train_step": 2.7529282569885254, "step": 7529} {"train_info/time_between_train_steps": 0.002913236618041992, "step": 7529} {"info/global_step": 7530, "train_info/time_within_train_step": 2.7530927658081055, "step": 7530} {"train_info/time_between_train_steps": 0.0028831958770751953, "step": 7530} {"info/global_step": 7531, "train_info/time_within_train_step": 2.75341534614563, "step": 7531} {"train_info/time_between_train_steps": 0.0028748512268066406, "step": 7531} {"info/global_step": 7532, "train_info/time_within_train_step": 2.753788948059082, "step": 7532} {"train_info/time_between_train_steps": 0.002872467041015625, "step": 7532} {"info/global_step": 7533, "train_info/time_within_train_step": 2.754380941390991, "step": 7533} {"train_info/time_between_train_steps": 0.002862215042114258, "step": 7533} {"info/global_step": 7534, "train_info/time_within_train_step": 2.7549731731414795, "step": 7534} {"train_info/time_between_train_steps": 0.0028438568115234375, "step": 7534} {"info/global_step": 7535, "train_info/time_within_train_step": 2.753732442855835, "step": 7535} {"train_info/time_between_train_steps": 0.002902507781982422, "step": 7535} {"info/global_step": 7536, "train_info/time_within_train_step": 2.7542741298675537, "step": 7536} {"train_info/time_between_train_steps": 0.0029573440551757812, "step": 7536} {"info/global_step": 7537, "train_info/time_within_train_step": 2.754359722137451, "step": 7537} {"train_info/time_between_train_steps": 0.0028781890869140625, "step": 7537} {"info/global_step": 7538, "train_info/time_within_train_step": 2.7538607120513916, "step": 7538} {"train_info/time_between_train_steps": 0.0028922557830810547, "step": 7538} {"info/global_step": 7539, "train_info/time_within_train_step": 2.752509355545044, "step": 7539} {"train_info/time_between_train_steps": 0.002876758575439453, "step": 7539} {"info/global_step": 7540, "train_info/time_within_train_step": 2.754230499267578, "step": 7540} {"train_info/time_between_train_steps": 0.002877473831176758, "step": 7540} {"info/global_step": 7541, "train_info/time_within_train_step": 2.753885269165039, "step": 7541} {"train_info/time_between_train_steps": 0.002893686294555664, "step": 7541} {"info/global_step": 7542, "train_info/time_within_train_step": 2.754127025604248, "step": 7542} {"train_info/time_between_train_steps": 0.0028634071350097656, "step": 7542} {"info/global_step": 7543, "train_info/time_within_train_step": 2.7543976306915283, "step": 7543} {"train_info/time_between_train_steps": 0.002900362014770508, "step": 7543} {"info/global_step": 7544, "train_info/time_within_train_step": 2.7538576126098633, "step": 7544} {"train_info/time_between_train_steps": 0.0028727054595947266, "step": 7544} {"info/global_step": 7545, "train_info/time_within_train_step": 2.7535386085510254, "step": 7545} {"train_info/time_between_train_steps": 0.002869129180908203, "step": 7545} {"info/global_step": 7546, "train_info/time_within_train_step": 2.753896474838257, "step": 7546} {"train_info/time_between_train_steps": 0.002892017364501953, "step": 7546} {"info/global_step": 7547, "train_info/time_within_train_step": 2.7541401386260986, "step": 7547} {"train_info/time_between_train_steps": 0.0028951168060302734, "step": 7547} {"info/global_step": 7548, "train_info/time_within_train_step": 2.754265308380127, "step": 7548} {"train_info/time_between_train_steps": 0.0028777122497558594, "step": 7548} {"info/global_step": 7549, "train_info/time_within_train_step": 2.754528284072876, "step": 7549} {"train_info/time_between_train_steps": 0.002945423126220703, "step": 7549} {"info/global_step": 7550, "train_info/time_within_train_step": 2.7541394233703613, "step": 7550} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746587810, "_runtime": 21819}, "step": 7550} {"logs": {"train/loss": 3.184, "train/learning_rate": 0.0001633333333333333, "train/epoch": 8.07, "_timestamp": 1746587810, "_runtime": 21819}, "step": 7550} {"train_info/time_between_train_steps": 0.007984638214111328, "step": 7550} {"info/global_step": 7551, "train_info/time_within_train_step": 2.7555840015411377, "step": 7551} {"train_info/time_between_train_steps": 0.002840280532836914, "step": 7551} {"info/global_step": 7552, "train_info/time_within_train_step": 2.7540571689605713, "step": 7552} {"train_info/time_between_train_steps": 0.0028672218322753906, "step": 7552} {"info/global_step": 7553, "train_info/time_within_train_step": 2.754952907562256, "step": 7553} {"train_info/time_between_train_steps": 0.0028641223907470703, "step": 7553} {"info/global_step": 7554, "train_info/time_within_train_step": 2.7547242641448975, "step": 7554} {"train_info/time_between_train_steps": 0.0029115676879882812, "step": 7554} {"info/global_step": 7555, "train_info/time_within_train_step": 2.754305601119995, "step": 7555} {"train_info/time_between_train_steps": 0.0028722286224365234, "step": 7555} {"info/global_step": 7556, "train_info/time_within_train_step": 2.7550086975097656, "step": 7556} {"train_info/time_between_train_steps": 0.0028777122497558594, "step": 7556} {"info/global_step": 7557, "train_info/time_within_train_step": 2.754938840866089, "step": 7557} {"train_info/time_between_train_steps": 0.002893209457397461, "step": 7557} {"info/global_step": 7558, "train_info/time_within_train_step": 2.7532033920288086, "step": 7558} {"train_info/time_between_train_steps": 0.0028929710388183594, "step": 7558} {"info/global_step": 7559, "train_info/time_within_train_step": 2.7533092498779297, "step": 7559} {"train_info/time_between_train_steps": 0.002864360809326172, "step": 7559} {"info/global_step": 7560, "train_info/time_within_train_step": 2.753645896911621, "step": 7560} {"train_info/time_between_train_steps": 0.002940654754638672, "step": 7560} {"info/global_step": 7561, "train_info/time_within_train_step": 2.7531216144561768, "step": 7561} {"train_info/time_between_train_steps": 0.002897500991821289, "step": 7561} {"info/global_step": 7562, "train_info/time_within_train_step": 2.754012107849121, "step": 7562} {"train_info/time_between_train_steps": 0.0029752254486083984, "step": 7562} {"info/global_step": 7563, "train_info/time_within_train_step": 2.7548322677612305, "step": 7563} {"train_info/time_between_train_steps": 0.0029840469360351562, "step": 7563} {"info/global_step": 7564, "train_info/time_within_train_step": 2.755777359008789, "step": 7564} {"train_info/time_between_train_steps": 0.0030012130737304688, "step": 7564} {"info/global_step": 7565, "train_info/time_within_train_step": 2.7553932666778564, "step": 7565} {"train_info/time_between_train_steps": 0.0029516220092773438, "step": 7565} {"info/global_step": 7566, "train_info/time_within_train_step": 2.7566494941711426, "step": 7566} {"train_info/time_between_train_steps": 0.003031015396118164, "step": 7566} {"info/global_step": 7567, "train_info/time_within_train_step": 2.7565994262695312, "step": 7567} {"train_info/time_between_train_steps": 0.0029947757720947266, "step": 7567} {"info/global_step": 7568, "train_info/time_within_train_step": 2.755918025970459, "step": 7568} {"train_info/time_between_train_steps": 0.0029904842376708984, "step": 7568} {"info/global_step": 7569, "train_info/time_within_train_step": 2.75616192817688, "step": 7569} {"train_info/time_between_train_steps": 0.0030014514923095703, "step": 7569} {"info/global_step": 7570, "train_info/time_within_train_step": 2.7554526329040527, "step": 7570} {"train_info/time_between_train_steps": 0.002978801727294922, "step": 7570} {"info/global_step": 7571, "train_info/time_within_train_step": 2.75485897064209, "step": 7571} {"train_info/time_between_train_steps": 0.0034859180450439453, "step": 7571} {"info/global_step": 7572, "train_info/time_within_train_step": 2.8540232181549072, "step": 7572} {"train_info/time_between_train_steps": 0.003190755844116211, "step": 7572} {"info/global_step": 7573, "train_info/time_within_train_step": 2.7545909881591797, "step": 7573} {"train_info/time_between_train_steps": 0.0030155181884765625, "step": 7573} {"info/global_step": 7574, "train_info/time_within_train_step": 2.7534589767456055, "step": 7574} {"train_info/time_between_train_steps": 0.00286865234375, "step": 7574} {"info/global_step": 7575, "train_info/time_within_train_step": 2.752737283706665, "step": 7575} {"train_info/time_between_train_steps": 0.002884387969970703, "step": 7575} {"info/global_step": 7576, "train_info/time_within_train_step": 2.752840757369995, "step": 7576} {"train_info/time_between_train_steps": 0.00286102294921875, "step": 7576} {"info/global_step": 7577, "train_info/time_within_train_step": 2.7535393238067627, "step": 7577} {"train_info/time_between_train_steps": 0.002871274948120117, "step": 7577} {"info/global_step": 7578, "train_info/time_within_train_step": 2.753830909729004, "step": 7578} {"train_info/time_between_train_steps": 0.0029058456420898438, "step": 7578} {"info/global_step": 7579, "train_info/time_within_train_step": 2.753714084625244, "step": 7579} {"train_info/time_between_train_steps": 0.0028984546661376953, "step": 7579} {"info/global_step": 7580, "train_info/time_within_train_step": 2.7545924186706543, "step": 7580} {"train_info/time_between_train_steps": 0.0028409957885742188, "step": 7580} {"info/global_step": 7581, "train_info/time_within_train_step": 2.754075765609741, "step": 7581} {"train_info/time_between_train_steps": 0.0028924942016601562, "step": 7581} {"info/global_step": 7582, "train_info/time_within_train_step": 2.754573106765747, "step": 7582} {"train_info/time_between_train_steps": 0.0029125213623046875, "step": 7582} {"info/global_step": 7583, "train_info/time_within_train_step": 2.7547004222869873, "step": 7583} {"train_info/time_between_train_steps": 0.0028650760650634766, "step": 7583} {"info/global_step": 7584, "train_info/time_within_train_step": 2.7541074752807617, "step": 7584} {"train_info/time_between_train_steps": 0.002889871597290039, "step": 7584} {"info/global_step": 7585, "train_info/time_within_train_step": 2.753941774368286, "step": 7585} {"train_info/time_between_train_steps": 0.0028693675994873047, "step": 7585} {"info/global_step": 7586, "train_info/time_within_train_step": 2.756072998046875, "step": 7586} {"train_info/time_between_train_steps": 0.002983570098876953, "step": 7586} {"info/global_step": 7587, "train_info/time_within_train_step": 2.7550203800201416, "step": 7587} {"train_info/time_between_train_steps": 0.0030090808868408203, "step": 7587} {"info/global_step": 7588, "train_info/time_within_train_step": 2.7559478282928467, "step": 7588} {"train_info/time_between_train_steps": 0.002949953079223633, "step": 7588} {"info/global_step": 7589, "train_info/time_within_train_step": 2.753577947616577, "step": 7589} {"train_info/time_between_train_steps": 0.0030057430267333984, "step": 7589} {"info/global_step": 7590, "train_info/time_within_train_step": 2.7537147998809814, "step": 7590} {"train_info/time_between_train_steps": 0.0029900074005126953, "step": 7590} {"info/global_step": 7591, "train_info/time_within_train_step": 2.754600763320923, "step": 7591} {"train_info/time_between_train_steps": 0.0030066967010498047, "step": 7591} {"info/global_step": 7592, "train_info/time_within_train_step": 2.755246877670288, "step": 7592} {"train_info/time_between_train_steps": 0.0029697418212890625, "step": 7592} {"info/global_step": 7593, "train_info/time_within_train_step": 2.755628824234009, "step": 7593} {"train_info/time_between_train_steps": 0.0030298233032226562, "step": 7593} {"info/global_step": 7594, "train_info/time_within_train_step": 2.755250930786133, "step": 7594} {"train_info/time_between_train_steps": 0.0029680728912353516, "step": 7594} {"info/global_step": 7595, "train_info/time_within_train_step": 2.755807876586914, "step": 7595} {"train_info/time_between_train_steps": 0.002984285354614258, "step": 7595} {"info/global_step": 7596, "train_info/time_within_train_step": 2.755828619003296, "step": 7596} {"train_info/time_between_train_steps": 0.0028846263885498047, "step": 7596} {"info/global_step": 7597, "train_info/time_within_train_step": 2.755157709121704, "step": 7597} {"train_info/time_between_train_steps": 0.0028662681579589844, "step": 7597} {"info/global_step": 7598, "train_info/time_within_train_step": 2.7555320262908936, "step": 7598} {"train_info/time_between_train_steps": 0.0028717517852783203, "step": 7598} {"info/global_step": 7599, "train_info/time_within_train_step": 2.7540557384490967, "step": 7599} {"train_info/time_between_train_steps": 0.002866029739379883, "step": 7599} {"info/global_step": 7600, "train_info/time_within_train_step": 2.7544145584106445, "step": 7600} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746587948, "_runtime": 21957}, "step": 7600} {"logs": {"train/loss": 3.1694, "train/learning_rate": 0.00015999999999999999, "train/epoch": 8.08, "_timestamp": 1746587948, "_runtime": 21957}, "step": 7600} {"train_info/time_between_train_steps": 18.906731128692627, "step": 7600} {"info/global_step": 7601, "train_info/time_within_train_step": 2.5430006980895996, "step": 7601} {"train_info/time_between_train_steps": 0.0029549598693847656, "step": 7601} {"info/global_step": 7602, "train_info/time_within_train_step": 2.5723588466644287, "step": 7602} {"train_info/time_between_train_steps": 0.0029518604278564453, "step": 7602} {"info/global_step": 7603, "train_info/time_within_train_step": 2.7056336402893066, "step": 7603} {"train_info/time_between_train_steps": 0.002969503402709961, "step": 7603} {"info/global_step": 7604, "train_info/time_within_train_step": 2.7472970485687256, "step": 7604} {"train_info/time_between_train_steps": 0.0029752254486083984, "step": 7604} {"info/global_step": 7605, "train_info/time_within_train_step": 2.7515411376953125, "step": 7605} {"train_info/time_between_train_steps": 0.0029752254486083984, "step": 7605} {"info/global_step": 7606, "train_info/time_within_train_step": 2.753789186477661, "step": 7606} {"train_info/time_between_train_steps": 0.0029494762420654297, "step": 7606} {"info/global_step": 7607, "train_info/time_within_train_step": 2.755101203918457, "step": 7607} {"train_info/time_between_train_steps": 0.002977609634399414, "step": 7607} {"info/global_step": 7608, "train_info/time_within_train_step": 2.7556493282318115, "step": 7608} {"train_info/time_between_train_steps": 0.002964496612548828, "step": 7608} {"info/global_step": 7609, "train_info/time_within_train_step": 2.755798816680908, "step": 7609} {"train_info/time_between_train_steps": 0.003010272979736328, "step": 7609} {"info/global_step": 7610, "train_info/time_within_train_step": 2.7561357021331787, "step": 7610} {"train_info/time_between_train_steps": 0.002995014190673828, "step": 7610} {"info/global_step": 7611, "train_info/time_within_train_step": 2.7534561157226562, "step": 7611} {"train_info/time_between_train_steps": 0.0028858184814453125, "step": 7611} {"info/global_step": 7612, "train_info/time_within_train_step": 2.7546803951263428, "step": 7612} {"train_info/time_between_train_steps": 0.002929210662841797, "step": 7612} {"info/global_step": 7613, "train_info/time_within_train_step": 2.754880666732788, "step": 7613} {"train_info/time_between_train_steps": 0.002874612808227539, "step": 7613} {"info/global_step": 7614, "train_info/time_within_train_step": 2.7544751167297363, "step": 7614} {"train_info/time_between_train_steps": 0.0029227733612060547, "step": 7614} {"info/global_step": 7615, "train_info/time_within_train_step": 2.755265951156616, "step": 7615} {"train_info/time_between_train_steps": 0.002880573272705078, "step": 7615} {"info/global_step": 7616, "train_info/time_within_train_step": 2.827193021774292, "step": 7616} {"train_info/time_between_train_steps": 0.002994537353515625, "step": 7616} {"info/global_step": 7617, "train_info/time_within_train_step": 2.7563529014587402, "step": 7617} {"train_info/time_between_train_steps": 0.003024578094482422, "step": 7617} {"info/global_step": 7618, "train_info/time_within_train_step": 2.7557363510131836, "step": 7618} {"train_info/time_between_train_steps": 0.0029566287994384766, "step": 7618} {"info/global_step": 7619, "train_info/time_within_train_step": 2.755744218826294, "step": 7619} {"train_info/time_between_train_steps": 0.0029692649841308594, "step": 7619} {"info/global_step": 7620, "train_info/time_within_train_step": 2.7572860717773438, "step": 7620} {"train_info/time_between_train_steps": 0.002983570098876953, "step": 7620} {"info/global_step": 7621, "train_info/time_within_train_step": 2.7561569213867188, "step": 7621} {"train_info/time_between_train_steps": 0.002973794937133789, "step": 7621} {"info/global_step": 7622, "train_info/time_within_train_step": 2.7555971145629883, "step": 7622} {"train_info/time_between_train_steps": 0.0029823780059814453, "step": 7622} {"info/global_step": 7623, "train_info/time_within_train_step": 2.7581229209899902, "step": 7623} {"train_info/time_between_train_steps": 0.0029981136322021484, "step": 7623} {"info/global_step": 7624, "train_info/time_within_train_step": 2.757185935974121, "step": 7624} {"train_info/time_between_train_steps": 0.0029685497283935547, "step": 7624} {"info/global_step": 7625, "train_info/time_within_train_step": 2.756420135498047, "step": 7625} {"train_info/time_between_train_steps": 0.0029697418212890625, "step": 7625} {"info/global_step": 7626, "train_info/time_within_train_step": 2.7567789554595947, "step": 7626} {"train_info/time_between_train_steps": 0.0029418468475341797, "step": 7626} {"info/global_step": 7627, "train_info/time_within_train_step": 2.7573208808898926, "step": 7627} {"train_info/time_between_train_steps": 0.0031282901763916016, "step": 7627} {"info/global_step": 7628, "train_info/time_within_train_step": 2.756028890609741, "step": 7628} {"train_info/time_between_train_steps": 0.002964496612548828, "step": 7628} {"info/global_step": 7629, "train_info/time_within_train_step": 2.7569398880004883, "step": 7629} {"train_info/time_between_train_steps": 0.0029516220092773438, "step": 7629} {"info/global_step": 7630, "train_info/time_within_train_step": 2.755653142929077, "step": 7630} {"train_info/time_between_train_steps": 0.003025054931640625, "step": 7630} {"info/global_step": 7631, "train_info/time_within_train_step": 2.7549195289611816, "step": 7631} {"train_info/time_between_train_steps": 0.0029783248901367188, "step": 7631} {"info/global_step": 7632, "train_info/time_within_train_step": 2.7543749809265137, "step": 7632} {"train_info/time_between_train_steps": 0.0029616355895996094, "step": 7632} {"info/global_step": 7633, "train_info/time_within_train_step": 2.7567319869995117, "step": 7633} {"train_info/time_between_train_steps": 0.0029754638671875, "step": 7633} {"info/global_step": 7634, "train_info/time_within_train_step": 2.755070686340332, "step": 7634} {"train_info/time_between_train_steps": 0.0029675960540771484, "step": 7634} {"info/global_step": 7635, "train_info/time_within_train_step": 2.755441665649414, "step": 7635} {"train_info/time_between_train_steps": 0.0029764175415039062, "step": 7635} {"info/global_step": 7636, "train_info/time_within_train_step": 2.754727840423584, "step": 7636} {"train_info/time_between_train_steps": 0.003064870834350586, "step": 7636} {"info/global_step": 7637, "train_info/time_within_train_step": 2.7561709880828857, "step": 7637} {"train_info/time_between_train_steps": 0.0029859542846679688, "step": 7637} {"info/global_step": 7638, "train_info/time_within_train_step": 2.7555742263793945, "step": 7638} {"train_info/time_between_train_steps": 0.0029592514038085938, "step": 7638} {"info/global_step": 7639, "train_info/time_within_train_step": 2.7577459812164307, "step": 7639} {"train_info/time_between_train_steps": 0.0030651092529296875, "step": 7639} {"info/global_step": 7640, "train_info/time_within_train_step": 2.757563829421997, "step": 7640} {"train_info/time_between_train_steps": 0.0030257701873779297, "step": 7640} {"info/global_step": 7641, "train_info/time_within_train_step": 2.75608229637146, "step": 7641} {"train_info/time_between_train_steps": 0.0030083656311035156, "step": 7641} {"info/global_step": 7642, "train_info/time_within_train_step": 2.7558753490448, "step": 7642} {"train_info/time_between_train_steps": 0.0029823780059814453, "step": 7642} {"info/global_step": 7643, "train_info/time_within_train_step": 2.756078004837036, "step": 7643} {"train_info/time_between_train_steps": 0.0030317306518554688, "step": 7643} {"info/global_step": 7644, "train_info/time_within_train_step": 2.7568519115448, "step": 7644} {"train_info/time_between_train_steps": 0.0029840469360351562, "step": 7644} {"info/global_step": 7645, "train_info/time_within_train_step": 2.755988597869873, "step": 7645} {"train_info/time_between_train_steps": 0.0029702186584472656, "step": 7645} {"info/global_step": 7646, "train_info/time_within_train_step": 2.7552733421325684, "step": 7646} {"train_info/time_between_train_steps": 0.0031464099884033203, "step": 7646} {"info/global_step": 7647, "train_info/time_within_train_step": 2.754072904586792, "step": 7647} {"train_info/time_between_train_steps": 0.0030558109283447266, "step": 7647} {"info/global_step": 7648, "train_info/time_within_train_step": 2.755033493041992, "step": 7648} {"train_info/time_between_train_steps": 0.003046274185180664, "step": 7648} {"info/global_step": 7649, "train_info/time_within_train_step": 2.7540640830993652, "step": 7649} {"train_info/time_between_train_steps": 0.0030527114868164062, "step": 7649} {"info/global_step": 7650, "train_info/time_within_train_step": 2.755255937576294, "step": 7650} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746588105, "_runtime": 22114}, "step": 7650} {"logs": {"train/loss": 3.1587, "train/learning_rate": 0.00015666666666666666, "train/epoch": 8.08, "_timestamp": 1746588105, "_runtime": 22114}, "step": 7650} {"train_info/time_between_train_steps": 0.00702214241027832, "step": 7650} {"info/global_step": 7651, "train_info/time_within_train_step": 2.755741834640503, "step": 7651} {"train_info/time_between_train_steps": 0.0030798912048339844, "step": 7651} {"info/global_step": 7652, "train_info/time_within_train_step": 2.756411075592041, "step": 7652} {"train_info/time_between_train_steps": 0.00307464599609375, "step": 7652} {"info/global_step": 7653, "train_info/time_within_train_step": 2.7550604343414307, "step": 7653} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 7653} {"info/global_step": 7654, "train_info/time_within_train_step": 2.7562520503997803, "step": 7654} {"train_info/time_between_train_steps": 0.003082275390625, "step": 7654} {"info/global_step": 7655, "train_info/time_within_train_step": 2.8046531677246094, "step": 7655} {"train_info/time_between_train_steps": 0.0032167434692382812, "step": 7655} {"info/global_step": 7656, "train_info/time_within_train_step": 2.7567262649536133, "step": 7656} {"train_info/time_between_train_steps": 0.0033113956451416016, "step": 7656} {"info/global_step": 7657, "train_info/time_within_train_step": 2.7548673152923584, "step": 7657} {"train_info/time_between_train_steps": 0.003100156784057617, "step": 7657} {"info/global_step": 7658, "train_info/time_within_train_step": 2.755793571472168, "step": 7658} {"train_info/time_between_train_steps": 0.0031189918518066406, "step": 7658} {"info/global_step": 7659, "train_info/time_within_train_step": 2.7562081813812256, "step": 7659} {"train_info/time_between_train_steps": 0.0030345916748046875, "step": 7659} {"info/global_step": 7660, "train_info/time_within_train_step": 2.7541770935058594, "step": 7660} {"train_info/time_between_train_steps": 0.0029456615447998047, "step": 7660} {"info/global_step": 7661, "train_info/time_within_train_step": 2.7545337677001953, "step": 7661} {"train_info/time_between_train_steps": 0.00299072265625, "step": 7661} {"info/global_step": 7662, "train_info/time_within_train_step": 2.753330707550049, "step": 7662} {"train_info/time_between_train_steps": 0.0030221939086914062, "step": 7662} {"info/global_step": 7663, "train_info/time_within_train_step": 2.754539966583252, "step": 7663} {"train_info/time_between_train_steps": 0.0030999183654785156, "step": 7663} {"info/global_step": 7664, "train_info/time_within_train_step": 2.7528021335601807, "step": 7664} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 7664} {"info/global_step": 7665, "train_info/time_within_train_step": 2.752338409423828, "step": 7665} {"train_info/time_between_train_steps": 0.002971172332763672, "step": 7665} {"info/global_step": 7666, "train_info/time_within_train_step": 2.753761053085327, "step": 7666} {"train_info/time_between_train_steps": 0.0029981136322021484, "step": 7666} {"info/global_step": 7667, "train_info/time_within_train_step": 2.753850221633911, "step": 7667} {"train_info/time_between_train_steps": 0.0030639171600341797, "step": 7667} {"info/global_step": 7668, "train_info/time_within_train_step": 2.752533197402954, "step": 7668} {"train_info/time_between_train_steps": 0.0031332969665527344, "step": 7668} {"info/global_step": 7669, "train_info/time_within_train_step": 2.7549962997436523, "step": 7669} {"train_info/time_between_train_steps": 0.0030565261840820312, "step": 7669} {"info/global_step": 7670, "train_info/time_within_train_step": 2.755587577819824, "step": 7670} {"train_info/time_between_train_steps": 0.0031690597534179688, "step": 7670} {"info/global_step": 7671, "train_info/time_within_train_step": 2.755579948425293, "step": 7671} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 7671} {"info/global_step": 7672, "train_info/time_within_train_step": 2.755469799041748, "step": 7672} {"train_info/time_between_train_steps": 0.0033049583435058594, "step": 7672} {"info/global_step": 7673, "train_info/time_within_train_step": 2.756065845489502, "step": 7673} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 7673} {"info/global_step": 7674, "train_info/time_within_train_step": 2.755811929702759, "step": 7674} {"train_info/time_between_train_steps": 0.003309011459350586, "step": 7674} {"info/global_step": 7675, "train_info/time_within_train_step": 2.75453519821167, "step": 7675} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 7675} {"info/global_step": 7676, "train_info/time_within_train_step": 2.7549328804016113, "step": 7676} {"train_info/time_between_train_steps": 0.0032362937927246094, "step": 7676} {"info/global_step": 7677, "train_info/time_within_train_step": 2.754460573196411, "step": 7677} {"train_info/time_between_train_steps": 0.0033261775970458984, "step": 7677} {"train_info/time_between_train_steps": 3.0319406986236572, "step": 7677} {"info/global_step": 7678, "train_info/time_within_train_step": 2.721369743347168, "step": 7678} {"train_info/time_between_train_steps": 0.003154754638671875, "step": 7678} {"info/global_step": 7679, "train_info/time_within_train_step": 2.754469633102417, "step": 7679} {"train_info/time_between_train_steps": 0.003147125244140625, "step": 7679} {"info/global_step": 7680, "train_info/time_within_train_step": 2.7544898986816406, "step": 7680} {"train_info/time_between_train_steps": 0.0031235218048095703, "step": 7680} {"info/global_step": 7681, "train_info/time_within_train_step": 2.9723989963531494, "step": 7681} {"train_info/time_between_train_steps": 0.0031278133392333984, "step": 7681} {"info/global_step": 7682, "train_info/time_within_train_step": 2.7543962001800537, "step": 7682} {"train_info/time_between_train_steps": 0.0031189918518066406, "step": 7682} {"info/global_step": 7683, "train_info/time_within_train_step": 2.754687547683716, "step": 7683} {"train_info/time_between_train_steps": 0.0031201839447021484, "step": 7683} {"info/global_step": 7684, "train_info/time_within_train_step": 2.752260684967041, "step": 7684} {"train_info/time_between_train_steps": 0.003202199935913086, "step": 7684} {"info/global_step": 7685, "train_info/time_within_train_step": 2.7548749446868896, "step": 7685} {"train_info/time_between_train_steps": 0.003100156784057617, "step": 7685} {"info/global_step": 7686, "train_info/time_within_train_step": 2.7540104389190674, "step": 7686} {"train_info/time_between_train_steps": 0.003116130828857422, "step": 7686} {"info/global_step": 7687, "train_info/time_within_train_step": 2.7534685134887695, "step": 7687} {"train_info/time_between_train_steps": 0.003114938735961914, "step": 7687} {"info/global_step": 7688, "train_info/time_within_train_step": 2.7534399032592773, "step": 7688} {"train_info/time_between_train_steps": 0.003614187240600586, "step": 7688} {"info/global_step": 7689, "train_info/time_within_train_step": 2.7531487941741943, "step": 7689} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 7689} {"info/global_step": 7690, "train_info/time_within_train_step": 2.7538225650787354, "step": 7690} {"train_info/time_between_train_steps": 0.003142118453979492, "step": 7690} {"info/global_step": 7691, "train_info/time_within_train_step": 2.7556400299072266, "step": 7691} {"train_info/time_between_train_steps": 0.003274202346801758, "step": 7691} {"info/global_step": 7692, "train_info/time_within_train_step": 2.756763219833374, "step": 7692} {"train_info/time_between_train_steps": 0.0032761096954345703, "step": 7692} {"info/global_step": 7693, "train_info/time_within_train_step": 2.7566726207733154, "step": 7693} {"train_info/time_between_train_steps": 0.003274679183959961, "step": 7693} {"info/global_step": 7694, "train_info/time_within_train_step": 2.756243944168091, "step": 7694} {"train_info/time_between_train_steps": 0.003276824951171875, "step": 7694} {"info/global_step": 7695, "train_info/time_within_train_step": 2.7573652267456055, "step": 7695} {"train_info/time_between_train_steps": 0.003353118896484375, "step": 7695} {"info/global_step": 7696, "train_info/time_within_train_step": 2.7568366527557373, "step": 7696} {"train_info/time_between_train_steps": 0.0032787322998046875, "step": 7696} {"info/global_step": 7697, "train_info/time_within_train_step": 2.7557406425476074, "step": 7697} {"train_info/time_between_train_steps": 0.003292083740234375, "step": 7697} {"info/global_step": 7698, "train_info/time_within_train_step": 2.756471633911133, "step": 7698} {"train_info/time_between_train_steps": 0.003254413604736328, "step": 7698} {"info/global_step": 7699, "train_info/time_within_train_step": 2.756293535232544, "step": 7699} {"train_info/time_between_train_steps": 0.003329038619995117, "step": 7699} {"info/global_step": 7700, "train_info/time_within_train_step": 2.755768060684204, "step": 7700} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746588246, "_runtime": 22255}, "step": 7700} {"logs": {"train/loss": 3.1963, "train/learning_rate": 0.0001533333333333333, "train/epoch": 9.0, "_timestamp": 1746588246, "_runtime": 22255}, "step": 7700} {"train_info/time_between_train_steps": 0.007205009460449219, "step": 7700} {"info/global_step": 7701, "train_info/time_within_train_step": 2.7562806606292725, "step": 7701} {"train_info/time_between_train_steps": 0.0033416748046875, "step": 7701} {"info/global_step": 7702, "train_info/time_within_train_step": 2.756462335586548, "step": 7702} {"train_info/time_between_train_steps": 0.0032663345336914062, "step": 7702} {"info/global_step": 7703, "train_info/time_within_train_step": 2.7546226978302, "step": 7703} {"train_info/time_between_train_steps": 0.0033681392669677734, "step": 7703} {"info/global_step": 7704, "train_info/time_within_train_step": 2.755689859390259, "step": 7704} {"train_info/time_between_train_steps": 0.0032999515533447266, "step": 7704} {"info/global_step": 7705, "train_info/time_within_train_step": 2.755915880203247, "step": 7705} {"train_info/time_between_train_steps": 0.0032830238342285156, "step": 7705} {"info/global_step": 7706, "train_info/time_within_train_step": 2.7562198638916016, "step": 7706} {"train_info/time_between_train_steps": 0.0033142566680908203, "step": 7706} {"info/global_step": 7707, "train_info/time_within_train_step": 2.756890296936035, "step": 7707} {"train_info/time_between_train_steps": 0.0032944679260253906, "step": 7707} {"info/global_step": 7708, "train_info/time_within_train_step": 2.7556393146514893, "step": 7708} {"train_info/time_between_train_steps": 0.003282785415649414, "step": 7708} {"info/global_step": 7709, "train_info/time_within_train_step": 2.7553727626800537, "step": 7709} {"train_info/time_between_train_steps": 0.0032155513763427734, "step": 7709} {"info/global_step": 7710, "train_info/time_within_train_step": 2.7565767765045166, "step": 7710} {"train_info/time_between_train_steps": 0.0032846927642822266, "step": 7710} {"info/global_step": 7711, "train_info/time_within_train_step": 2.7575762271881104, "step": 7711} {"train_info/time_between_train_steps": 0.0032722949981689453, "step": 7711} {"info/global_step": 7712, "train_info/time_within_train_step": 2.755492687225342, "step": 7712} {"train_info/time_between_train_steps": 0.0033087730407714844, "step": 7712} {"info/global_step": 7713, "train_info/time_within_train_step": 2.7562432289123535, "step": 7713} {"train_info/time_between_train_steps": 0.0032732486724853516, "step": 7713} {"info/global_step": 7714, "train_info/time_within_train_step": 2.75634765625, "step": 7714} {"train_info/time_between_train_steps": 0.003284454345703125, "step": 7714} {"info/global_step": 7715, "train_info/time_within_train_step": 2.7562344074249268, "step": 7715} {"train_info/time_between_train_steps": 0.0032796859741210938, "step": 7715} {"info/global_step": 7716, "train_info/time_within_train_step": 2.755875825881958, "step": 7716} {"train_info/time_between_train_steps": 0.0033202171325683594, "step": 7716} {"info/global_step": 7717, "train_info/time_within_train_step": 2.757211685180664, "step": 7717} {"train_info/time_between_train_steps": 0.0032858848571777344, "step": 7717} {"info/global_step": 7718, "train_info/time_within_train_step": 2.756470203399658, "step": 7718} {"train_info/time_between_train_steps": 0.0032656192779541016, "step": 7718} {"info/global_step": 7719, "train_info/time_within_train_step": 2.75640606880188, "step": 7719} {"train_info/time_between_train_steps": 0.003264188766479492, "step": 7719} {"info/global_step": 7720, "train_info/time_within_train_step": 2.755862236022949, "step": 7720} {"train_info/time_between_train_steps": 0.003106832504272461, "step": 7720} {"info/global_step": 7721, "train_info/time_within_train_step": 2.7559444904327393, "step": 7721} {"train_info/time_between_train_steps": 0.0031104087829589844, "step": 7721} {"info/global_step": 7722, "train_info/time_within_train_step": 2.7550792694091797, "step": 7722} {"train_info/time_between_train_steps": 0.003124713897705078, "step": 7722} {"info/global_step": 7723, "train_info/time_within_train_step": 2.756377935409546, "step": 7723} {"train_info/time_between_train_steps": 0.003122091293334961, "step": 7723} {"info/global_step": 7724, "train_info/time_within_train_step": 2.755251407623291, "step": 7724} {"train_info/time_between_train_steps": 0.0031054019927978516, "step": 7724} {"info/global_step": 7725, "train_info/time_within_train_step": 2.754955768585205, "step": 7725} {"train_info/time_between_train_steps": 0.0031158924102783203, "step": 7725} {"info/global_step": 7726, "train_info/time_within_train_step": 2.7552404403686523, "step": 7726} {"train_info/time_between_train_steps": 0.0031027793884277344, "step": 7726} {"info/global_step": 7727, "train_info/time_within_train_step": 2.7554068565368652, "step": 7727} {"train_info/time_between_train_steps": 0.0031375885009765625, "step": 7727} {"info/global_step": 7728, "train_info/time_within_train_step": 2.75508975982666, "step": 7728} {"train_info/time_between_train_steps": 0.003097057342529297, "step": 7728} {"info/global_step": 7729, "train_info/time_within_train_step": 2.7549455165863037, "step": 7729} {"train_info/time_between_train_steps": 0.0030965805053710938, "step": 7729} {"info/global_step": 7730, "train_info/time_within_train_step": 2.75480318069458, "step": 7730} {"train_info/time_between_train_steps": 0.0031206607818603516, "step": 7730} {"info/global_step": 7731, "train_info/time_within_train_step": 2.7552542686462402, "step": 7731} {"train_info/time_between_train_steps": 0.0031180381774902344, "step": 7731} {"info/global_step": 7732, "train_info/time_within_train_step": 2.7551512718200684, "step": 7732} {"train_info/time_between_train_steps": 0.003095388412475586, "step": 7732} {"info/global_step": 7733, "train_info/time_within_train_step": 2.7549960613250732, "step": 7733} {"train_info/time_between_train_steps": 0.0031540393829345703, "step": 7733} {"info/global_step": 7734, "train_info/time_within_train_step": 2.7553811073303223, "step": 7734} {"train_info/time_between_train_steps": 0.0031125545501708984, "step": 7734} {"info/global_step": 7735, "train_info/time_within_train_step": 2.7557923793792725, "step": 7735} {"train_info/time_between_train_steps": 0.0031058788299560547, "step": 7735} {"info/global_step": 7736, "train_info/time_within_train_step": 2.755671501159668, "step": 7736} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 7736} {"info/global_step": 7737, "train_info/time_within_train_step": 2.7554502487182617, "step": 7737} {"train_info/time_between_train_steps": 0.0031049251556396484, "step": 7737} {"info/global_step": 7738, "train_info/time_within_train_step": 2.973256826400757, "step": 7738} {"train_info/time_between_train_steps": 0.0030803680419921875, "step": 7738} {"info/global_step": 7739, "train_info/time_within_train_step": 2.755178928375244, "step": 7739} {"train_info/time_between_train_steps": 0.00310516357421875, "step": 7739} {"info/global_step": 7740, "train_info/time_within_train_step": 2.8769266605377197, "step": 7740} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 7740} {"info/global_step": 7741, "train_info/time_within_train_step": 2.7547709941864014, "step": 7741} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 7741} {"info/global_step": 7742, "train_info/time_within_train_step": 2.754892349243164, "step": 7742} {"train_info/time_between_train_steps": 0.003130674362182617, "step": 7742} {"info/global_step": 7743, "train_info/time_within_train_step": 2.754497528076172, "step": 7743} {"train_info/time_between_train_steps": 0.003104686737060547, "step": 7743} {"info/global_step": 7744, "train_info/time_within_train_step": 2.7548916339874268, "step": 7744} {"train_info/time_between_train_steps": 0.0033032894134521484, "step": 7744} {"info/global_step": 7745, "train_info/time_within_train_step": 2.755631446838379, "step": 7745} {"train_info/time_between_train_steps": 0.0033416748046875, "step": 7745} {"info/global_step": 7746, "train_info/time_within_train_step": 3.326761484146118, "step": 7746} {"train_info/time_between_train_steps": 0.0033502578735351562, "step": 7746} {"info/global_step": 7747, "train_info/time_within_train_step": 2.756164789199829, "step": 7747} {"train_info/time_between_train_steps": 0.0032966136932373047, "step": 7747} {"info/global_step": 7748, "train_info/time_within_train_step": 2.7554714679718018, "step": 7748} {"train_info/time_between_train_steps": 0.0033211708068847656, "step": 7748} {"info/global_step": 7749, "train_info/time_within_train_step": 2.756704330444336, "step": 7749} {"train_info/time_between_train_steps": 0.003366231918334961, "step": 7749} {"info/global_step": 7750, "train_info/time_within_train_step": 2.756307363510132, "step": 7750} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746588385, "_runtime": 22394}, "step": 7750} {"logs": {"train/loss": 3.1506, "train/learning_rate": 0.00015, "train/epoch": 9.01, "_timestamp": 1746588385, "_runtime": 22394}, "step": 7750} {"train_info/time_between_train_steps": 0.006999015808105469, "step": 7750} {"info/global_step": 7751, "train_info/time_within_train_step": 2.7574779987335205, "step": 7751} {"train_info/time_between_train_steps": 0.003307342529296875, "step": 7751} {"info/global_step": 7752, "train_info/time_within_train_step": 2.7557897567749023, "step": 7752} {"train_info/time_between_train_steps": 0.0034208297729492188, "step": 7752} {"info/global_step": 7753, "train_info/time_within_train_step": 2.7572810649871826, "step": 7753} {"train_info/time_between_train_steps": 0.003331422805786133, "step": 7753} {"info/global_step": 7754, "train_info/time_within_train_step": 2.7575199604034424, "step": 7754} {"train_info/time_between_train_steps": 0.0032765865325927734, "step": 7754} {"info/global_step": 7755, "train_info/time_within_train_step": 2.755547285079956, "step": 7755} {"train_info/time_between_train_steps": 0.0032968521118164062, "step": 7755} {"info/global_step": 7756, "train_info/time_within_train_step": 2.7571616172790527, "step": 7756} {"train_info/time_between_train_steps": 0.0032911300659179688, "step": 7756} {"info/global_step": 7757, "train_info/time_within_train_step": 2.75589919090271, "step": 7757} {"train_info/time_between_train_steps": 0.0032777786254882812, "step": 7757} {"info/global_step": 7758, "train_info/time_within_train_step": 2.751969814300537, "step": 7758} {"train_info/time_between_train_steps": 0.003567218780517578, "step": 7758} {"info/global_step": 7759, "train_info/time_within_train_step": 2.754638195037842, "step": 7759} {"train_info/time_between_train_steps": 0.0031423568725585938, "step": 7759} {"info/global_step": 7760, "train_info/time_within_train_step": 2.7534308433532715, "step": 7760} {"train_info/time_between_train_steps": 0.003121614456176758, "step": 7760} {"info/global_step": 7761, "train_info/time_within_train_step": 2.754657745361328, "step": 7761} {"train_info/time_between_train_steps": 0.003133535385131836, "step": 7761} {"info/global_step": 7762, "train_info/time_within_train_step": 2.753696918487549, "step": 7762} {"train_info/time_between_train_steps": 0.0031151771545410156, "step": 7762} {"info/global_step": 7763, "train_info/time_within_train_step": 2.7544522285461426, "step": 7763} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 7763} {"info/global_step": 7764, "train_info/time_within_train_step": 2.7542824745178223, "step": 7764} {"train_info/time_between_train_steps": 0.0031561851501464844, "step": 7764} {"info/global_step": 7765, "train_info/time_within_train_step": 2.7545764446258545, "step": 7765} {"train_info/time_between_train_steps": 0.0033004283905029297, "step": 7765} {"info/global_step": 7766, "train_info/time_within_train_step": 2.756439447402954, "step": 7766} {"train_info/time_between_train_steps": 0.0032753944396972656, "step": 7766} {"info/global_step": 7767, "train_info/time_within_train_step": 2.756192445755005, "step": 7767} {"train_info/time_between_train_steps": 0.003307819366455078, "step": 7767} {"info/global_step": 7768, "train_info/time_within_train_step": 2.7568869590759277, "step": 7768} {"train_info/time_between_train_steps": 0.0033311843872070312, "step": 7768} {"info/global_step": 7769, "train_info/time_within_train_step": 2.7565255165100098, "step": 7769} {"train_info/time_between_train_steps": 0.0032536983489990234, "step": 7769} {"info/global_step": 7770, "train_info/time_within_train_step": 2.755903720855713, "step": 7770} {"train_info/time_between_train_steps": 0.003445863723754883, "step": 7770} {"info/global_step": 7771, "train_info/time_within_train_step": 2.7557566165924072, "step": 7771} {"train_info/time_between_train_steps": 0.003281831741333008, "step": 7771} {"info/global_step": 7772, "train_info/time_within_train_step": 2.754804849624634, "step": 7772} {"train_info/time_between_train_steps": 0.003361940383911133, "step": 7772} {"info/global_step": 7773, "train_info/time_within_train_step": 2.756556749343872, "step": 7773} {"train_info/time_between_train_steps": 0.003287076950073242, "step": 7773} {"info/global_step": 7774, "train_info/time_within_train_step": 2.7563016414642334, "step": 7774} {"train_info/time_between_train_steps": 0.003329038619995117, "step": 7774} {"info/global_step": 7775, "train_info/time_within_train_step": 2.755087375640869, "step": 7775} {"train_info/time_between_train_steps": 0.0033135414123535156, "step": 7775} {"info/global_step": 7776, "train_info/time_within_train_step": 2.756442070007324, "step": 7776} {"train_info/time_between_train_steps": 0.003312826156616211, "step": 7776} {"info/global_step": 7777, "train_info/time_within_train_step": 2.756197452545166, "step": 7777} {"train_info/time_between_train_steps": 0.0032782554626464844, "step": 7777} {"info/global_step": 7778, "train_info/time_within_train_step": 2.7564985752105713, "step": 7778} {"train_info/time_between_train_steps": 0.0032875537872314453, "step": 7778} {"info/global_step": 7779, "train_info/time_within_train_step": 2.99100923538208, "step": 7779} {"train_info/time_between_train_steps": 0.003299713134765625, "step": 7779} {"info/global_step": 7780, "train_info/time_within_train_step": 2.757080554962158, "step": 7780} {"train_info/time_between_train_steps": 0.0032911300659179688, "step": 7780} {"info/global_step": 7781, "train_info/time_within_train_step": 2.757319927215576, "step": 7781} {"train_info/time_between_train_steps": 0.0033135414123535156, "step": 7781} {"info/global_step": 7782, "train_info/time_within_train_step": 2.756606101989746, "step": 7782} {"train_info/time_between_train_steps": 0.0033142566680908203, "step": 7782} {"info/global_step": 7783, "train_info/time_within_train_step": 2.7558305263519287, "step": 7783} {"train_info/time_between_train_steps": 0.0032787322998046875, "step": 7783} {"info/global_step": 7784, "train_info/time_within_train_step": 2.756908655166626, "step": 7784} {"train_info/time_between_train_steps": 0.0033261775970458984, "step": 7784} {"info/global_step": 7785, "train_info/time_within_train_step": 2.7555091381073, "step": 7785} {"train_info/time_between_train_steps": 0.0033197402954101562, "step": 7785} {"info/global_step": 7786, "train_info/time_within_train_step": 2.756723403930664, "step": 7786} {"train_info/time_between_train_steps": 0.003342866897583008, "step": 7786} {"info/global_step": 7787, "train_info/time_within_train_step": 2.754523992538452, "step": 7787} {"train_info/time_between_train_steps": 0.0033097267150878906, "step": 7787} {"info/global_step": 7788, "train_info/time_within_train_step": 2.7555274963378906, "step": 7788} {"train_info/time_between_train_steps": 0.003288745880126953, "step": 7788} {"info/global_step": 7789, "train_info/time_within_train_step": 2.755258798599243, "step": 7789} {"train_info/time_between_train_steps": 0.003300189971923828, "step": 7789} {"info/global_step": 7790, "train_info/time_within_train_step": 2.7557642459869385, "step": 7790} {"train_info/time_between_train_steps": 0.003292083740234375, "step": 7790} {"info/global_step": 7791, "train_info/time_within_train_step": 2.756442070007324, "step": 7791} {"train_info/time_between_train_steps": 0.003273487091064453, "step": 7791} {"info/global_step": 7792, "train_info/time_within_train_step": 2.757450580596924, "step": 7792} {"train_info/time_between_train_steps": 0.0033254623413085938, "step": 7792} {"info/global_step": 7793, "train_info/time_within_train_step": 2.756666421890259, "step": 7793} {"train_info/time_between_train_steps": 0.0032939910888671875, "step": 7793} {"info/global_step": 7794, "train_info/time_within_train_step": 2.757097005844116, "step": 7794} {"train_info/time_between_train_steps": 0.0032885074615478516, "step": 7794} {"info/global_step": 7795, "train_info/time_within_train_step": 2.7565441131591797, "step": 7795} {"train_info/time_between_train_steps": 0.0033082962036132812, "step": 7795} {"info/global_step": 7796, "train_info/time_within_train_step": 2.7559971809387207, "step": 7796} {"train_info/time_between_train_steps": 0.0032837390899658203, "step": 7796} {"info/global_step": 7797, "train_info/time_within_train_step": 2.756727695465088, "step": 7797} {"train_info/time_between_train_steps": 0.0032663345336914062, "step": 7797} {"info/global_step": 7798, "train_info/time_within_train_step": 2.7575736045837402, "step": 7798} {"train_info/time_between_train_steps": 0.0033354759216308594, "step": 7798} {"info/global_step": 7799, "train_info/time_within_train_step": 2.7632179260253906, "step": 7799} {"train_info/time_between_train_steps": 0.0032722949981689453, "step": 7799} {"info/global_step": 7800, "train_info/time_within_train_step": 2.7556099891662598, "step": 7800} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746588524, "_runtime": 22533}, "step": 7800} {"logs": {"train/loss": 3.1414, "train/learning_rate": 0.00014666666666666664, "train/epoch": 9.01, "_timestamp": 1746588524, "_runtime": 22533}, "step": 7800} {"train_info/time_between_train_steps": 13.115613222122192, "step": 7800} {"info/global_step": 7801, "train_info/time_within_train_step": 2.5377602577209473, "step": 7801} {"train_info/time_between_train_steps": 0.003108501434326172, "step": 7801} {"info/global_step": 7802, "train_info/time_within_train_step": 2.588819742202759, "step": 7802} {"train_info/time_between_train_steps": 0.1274397373199463, "step": 7802} {"info/global_step": 7803, "train_info/time_within_train_step": 2.7157418727874756, "step": 7803} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 7803} {"info/global_step": 7804, "train_info/time_within_train_step": 2.7500784397125244, "step": 7804} {"train_info/time_between_train_steps": 0.0031921863555908203, "step": 7804} {"info/global_step": 7805, "train_info/time_within_train_step": 2.75069260597229, "step": 7805} {"train_info/time_between_train_steps": 0.0031135082244873047, "step": 7805} {"info/global_step": 7806, "train_info/time_within_train_step": 2.755798816680908, "step": 7806} {"train_info/time_between_train_steps": 0.0031919479370117188, "step": 7806} {"info/global_step": 7807, "train_info/time_within_train_step": 2.754976272583008, "step": 7807} {"train_info/time_between_train_steps": 0.003123760223388672, "step": 7807} {"info/global_step": 7808, "train_info/time_within_train_step": 2.755336284637451, "step": 7808} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 7808} {"info/global_step": 7809, "train_info/time_within_train_step": 2.755401849746704, "step": 7809} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 7809} {"info/global_step": 7810, "train_info/time_within_train_step": 2.7557692527770996, "step": 7810} {"train_info/time_between_train_steps": 0.0031342506408691406, "step": 7810} {"info/global_step": 7811, "train_info/time_within_train_step": 2.756779193878174, "step": 7811} {"train_info/time_between_train_steps": 0.0031299591064453125, "step": 7811} {"info/global_step": 7812, "train_info/time_within_train_step": 2.756183624267578, "step": 7812} {"train_info/time_between_train_steps": 0.0031430721282958984, "step": 7812} {"info/global_step": 7813, "train_info/time_within_train_step": 2.756337881088257, "step": 7813} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 7813} {"info/global_step": 7814, "train_info/time_within_train_step": 2.7555692195892334, "step": 7814} {"train_info/time_between_train_steps": 0.003127574920654297, "step": 7814} {"info/global_step": 7815, "train_info/time_within_train_step": 2.7558352947235107, "step": 7815} {"train_info/time_between_train_steps": 0.003155946731567383, "step": 7815} {"info/global_step": 7816, "train_info/time_within_train_step": 2.7561585903167725, "step": 7816} {"train_info/time_between_train_steps": 0.003128528594970703, "step": 7816} {"info/global_step": 7817, "train_info/time_within_train_step": 2.7553961277008057, "step": 7817} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 7817} {"info/global_step": 7818, "train_info/time_within_train_step": 2.7563626766204834, "step": 7818} {"train_info/time_between_train_steps": 0.0031261444091796875, "step": 7818} {"info/global_step": 7819, "train_info/time_within_train_step": 2.7555630207061768, "step": 7819} {"train_info/time_between_train_steps": 0.0031807422637939453, "step": 7819} {"info/global_step": 7820, "train_info/time_within_train_step": 2.756241798400879, "step": 7820} {"train_info/time_between_train_steps": 0.003127574920654297, "step": 7820} {"info/global_step": 7821, "train_info/time_within_train_step": 2.756376266479492, "step": 7821} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 7821} {"info/global_step": 7822, "train_info/time_within_train_step": 2.7565698623657227, "step": 7822} {"train_info/time_between_train_steps": 0.0031173229217529297, "step": 7822} {"info/global_step": 7823, "train_info/time_within_train_step": 2.7568931579589844, "step": 7823} {"train_info/time_between_train_steps": 0.003131866455078125, "step": 7823} {"info/global_step": 7824, "train_info/time_within_train_step": 2.7559831142425537, "step": 7824} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 7824} {"info/global_step": 7825, "train_info/time_within_train_step": 2.755924701690674, "step": 7825} {"train_info/time_between_train_steps": 0.0031135082244873047, "step": 7825} {"info/global_step": 7826, "train_info/time_within_train_step": 2.7576637268066406, "step": 7826} {"train_info/time_between_train_steps": 0.003349781036376953, "step": 7826} {"info/global_step": 7827, "train_info/time_within_train_step": 2.757883310317993, "step": 7827} {"train_info/time_between_train_steps": 0.0033295154571533203, "step": 7827} {"info/global_step": 7828, "train_info/time_within_train_step": 2.757181406021118, "step": 7828} {"train_info/time_between_train_steps": 0.003343820571899414, "step": 7828} {"info/global_step": 7829, "train_info/time_within_train_step": 2.7565245628356934, "step": 7829} {"train_info/time_between_train_steps": 0.003306150436401367, "step": 7829} {"info/global_step": 7830, "train_info/time_within_train_step": 2.7558772563934326, "step": 7830} {"train_info/time_between_train_steps": 0.0033724308013916016, "step": 7830} {"info/global_step": 7831, "train_info/time_within_train_step": 2.7570550441741943, "step": 7831} {"train_info/time_between_train_steps": 0.003286123275756836, "step": 7831} {"info/global_step": 7832, "train_info/time_within_train_step": 2.9988162517547607, "step": 7832} {"train_info/time_between_train_steps": 0.003332376480102539, "step": 7832} {"info/global_step": 7833, "train_info/time_within_train_step": 2.7584848403930664, "step": 7833} {"train_info/time_between_train_steps": 0.00328826904296875, "step": 7833} {"info/global_step": 7834, "train_info/time_within_train_step": 2.7579517364501953, "step": 7834} {"train_info/time_between_train_steps": 0.0032765865325927734, "step": 7834} {"info/global_step": 7835, "train_info/time_within_train_step": 2.757363796234131, "step": 7835} {"train_info/time_between_train_steps": 0.003314495086669922, "step": 7835} {"info/global_step": 7836, "train_info/time_within_train_step": 2.758455991744995, "step": 7836} {"train_info/time_between_train_steps": 0.0033054351806640625, "step": 7836} {"info/global_step": 7837, "train_info/time_within_train_step": 2.756225824356079, "step": 7837} {"train_info/time_between_train_steps": 0.003354310989379883, "step": 7837} {"info/global_step": 7838, "train_info/time_within_train_step": 2.757472515106201, "step": 7838} {"train_info/time_between_train_steps": 0.0033006668090820312, "step": 7838} {"info/global_step": 7839, "train_info/time_within_train_step": 2.7577285766601562, "step": 7839} {"train_info/time_between_train_steps": 0.003365755081176758, "step": 7839} {"info/global_step": 7840, "train_info/time_within_train_step": 2.75685453414917, "step": 7840} {"train_info/time_between_train_steps": 0.0033164024353027344, "step": 7840} {"info/global_step": 7841, "train_info/time_within_train_step": 2.757014036178589, "step": 7841} {"train_info/time_between_train_steps": 0.0033304691314697266, "step": 7841} {"info/global_step": 7842, "train_info/time_within_train_step": 2.7570977210998535, "step": 7842} {"train_info/time_between_train_steps": 0.0032842159271240234, "step": 7842} {"info/global_step": 7843, "train_info/time_within_train_step": 2.7579407691955566, "step": 7843} {"train_info/time_between_train_steps": 0.003330230712890625, "step": 7843} {"info/global_step": 7844, "train_info/time_within_train_step": 2.756772518157959, "step": 7844} {"train_info/time_between_train_steps": 0.003329753875732422, "step": 7844} {"info/global_step": 7845, "train_info/time_within_train_step": 2.756873607635498, "step": 7845} {"train_info/time_between_train_steps": 0.003291606903076172, "step": 7845} {"info/global_step": 7846, "train_info/time_within_train_step": 2.756512403488159, "step": 7846} {"train_info/time_between_train_steps": 0.003291606903076172, "step": 7846} {"info/global_step": 7847, "train_info/time_within_train_step": 2.757413148880005, "step": 7847} {"train_info/time_between_train_steps": 0.00331878662109375, "step": 7847} {"info/global_step": 7848, "train_info/time_within_train_step": 2.7570972442626953, "step": 7848} {"train_info/time_between_train_steps": 0.0033452510833740234, "step": 7848} {"info/global_step": 7849, "train_info/time_within_train_step": 2.758397340774536, "step": 7849} {"train_info/time_between_train_steps": 0.0033295154571533203, "step": 7849} {"info/global_step": 7850, "train_info/time_within_train_step": 2.7578601837158203, "step": 7850} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746588675, "_runtime": 22684}, "step": 7850} {"logs": {"train/loss": 3.1301, "train/learning_rate": 0.00014333333333333334, "train/epoch": 9.02, "_timestamp": 1746588675, "_runtime": 22684}, "step": 7850} {"train_info/time_between_train_steps": 0.007102251052856445, "step": 7850} {"info/global_step": 7851, "train_info/time_within_train_step": 2.7586333751678467, "step": 7851} {"train_info/time_between_train_steps": 0.0032842159271240234, "step": 7851} {"info/global_step": 7852, "train_info/time_within_train_step": 2.759443759918213, "step": 7852} {"train_info/time_between_train_steps": 0.0033082962036132812, "step": 7852} {"info/global_step": 7853, "train_info/time_within_train_step": 2.758305072784424, "step": 7853} {"train_info/time_between_train_steps": 0.003281831741333008, "step": 7853} {"info/global_step": 7854, "train_info/time_within_train_step": 2.7574098110198975, "step": 7854} {"train_info/time_between_train_steps": 0.003365039825439453, "step": 7854} {"info/global_step": 7855, "train_info/time_within_train_step": 2.7570865154266357, "step": 7855} {"train_info/time_between_train_steps": 0.003305673599243164, "step": 7855} {"info/global_step": 7856, "train_info/time_within_train_step": 2.75732159614563, "step": 7856} {"train_info/time_between_train_steps": 0.0033130645751953125, "step": 7856} {"info/global_step": 7857, "train_info/time_within_train_step": 2.757800579071045, "step": 7857} {"train_info/time_between_train_steps": 0.0033111572265625, "step": 7857} {"info/global_step": 7858, "train_info/time_within_train_step": 2.7562954425811768, "step": 7858} {"train_info/time_between_train_steps": 0.003314971923828125, "step": 7858} {"info/global_step": 7859, "train_info/time_within_train_step": 2.7566771507263184, "step": 7859} {"train_info/time_between_train_steps": 0.0033669471740722656, "step": 7859} {"info/global_step": 7860, "train_info/time_within_train_step": 2.756232500076294, "step": 7860} {"train_info/time_between_train_steps": 0.0032935142517089844, "step": 7860} {"info/global_step": 7861, "train_info/time_within_train_step": 2.7560672760009766, "step": 7861} {"train_info/time_between_train_steps": 0.0033500194549560547, "step": 7861} {"info/global_step": 7862, "train_info/time_within_train_step": 2.757141590118408, "step": 7862} {"train_info/time_between_train_steps": 0.003422260284423828, "step": 7862} {"info/global_step": 7863, "train_info/time_within_train_step": 2.7573914527893066, "step": 7863} {"train_info/time_between_train_steps": 0.003343820571899414, "step": 7863} {"info/global_step": 7864, "train_info/time_within_train_step": 2.756091833114624, "step": 7864} {"train_info/time_between_train_steps": 0.00327301025390625, "step": 7864} {"info/global_step": 7865, "train_info/time_within_train_step": 2.8833019733428955, "step": 7865} {"train_info/time_between_train_steps": 0.0033032894134521484, "step": 7865} {"info/global_step": 7866, "train_info/time_within_train_step": 2.7583138942718506, "step": 7866} {"train_info/time_between_train_steps": 0.003315448760986328, "step": 7866} {"info/global_step": 7867, "train_info/time_within_train_step": 2.7577269077301025, "step": 7867} {"train_info/time_between_train_steps": 0.003332376480102539, "step": 7867} {"info/global_step": 7868, "train_info/time_within_train_step": 2.756953001022339, "step": 7868} {"train_info/time_between_train_steps": 0.003309011459350586, "step": 7868} {"info/global_step": 7869, "train_info/time_within_train_step": 2.757262706756592, "step": 7869} {"train_info/time_between_train_steps": 0.0033049583435058594, "step": 7869} {"info/global_step": 7870, "train_info/time_within_train_step": 2.755807399749756, "step": 7870} {"train_info/time_between_train_steps": 0.0034148693084716797, "step": 7870} {"info/global_step": 7871, "train_info/time_within_train_step": 2.7557811737060547, "step": 7871} {"train_info/time_between_train_steps": 0.0033049583435058594, "step": 7871} {"info/global_step": 7872, "train_info/time_within_train_step": 2.7575411796569824, "step": 7872} {"train_info/time_between_train_steps": 0.0033485889434814453, "step": 7872} {"info/global_step": 7873, "train_info/time_within_train_step": 2.756272315979004, "step": 7873} {"train_info/time_between_train_steps": 0.0033087730407714844, "step": 7873} {"info/global_step": 7874, "train_info/time_within_train_step": 2.758253812789917, "step": 7874} {"train_info/time_between_train_steps": 0.0033211708068847656, "step": 7874} {"info/global_step": 7875, "train_info/time_within_train_step": 2.756880044937134, "step": 7875} {"train_info/time_between_train_steps": 0.0033233165740966797, "step": 7875} {"info/global_step": 7876, "train_info/time_within_train_step": 2.7573444843292236, "step": 7876} {"train_info/time_between_train_steps": 0.003320455551147461, "step": 7876} {"info/global_step": 7877, "train_info/time_within_train_step": 2.7579638957977295, "step": 7877} {"train_info/time_between_train_steps": 0.0032989978790283203, "step": 7877} {"info/global_step": 7878, "train_info/time_within_train_step": 2.7577154636383057, "step": 7878} {"train_info/time_between_train_steps": 0.0033168792724609375, "step": 7878} {"info/global_step": 7879, "train_info/time_within_train_step": 2.7574644088745117, "step": 7879} {"train_info/time_between_train_steps": 0.003317117691040039, "step": 7879} {"info/global_step": 7880, "train_info/time_within_train_step": 2.7562766075134277, "step": 7880} {"train_info/time_between_train_steps": 0.003289937973022461, "step": 7880} {"info/global_step": 7881, "train_info/time_within_train_step": 2.7581403255462646, "step": 7881} {"train_info/time_between_train_steps": 0.0033779144287109375, "step": 7881} {"info/global_step": 7882, "train_info/time_within_train_step": 2.7578885555267334, "step": 7882} {"train_info/time_between_train_steps": 0.0032951831817626953, "step": 7882} {"info/global_step": 7883, "train_info/time_within_train_step": 2.7575907707214355, "step": 7883} {"train_info/time_between_train_steps": 0.003197908401489258, "step": 7883} {"info/global_step": 7884, "train_info/time_within_train_step": 2.7526938915252686, "step": 7884} {"train_info/time_between_train_steps": 0.0031387805938720703, "step": 7884} {"info/global_step": 7885, "train_info/time_within_train_step": 2.7547428607940674, "step": 7885} {"train_info/time_between_train_steps": 0.003143310546875, "step": 7885} {"info/global_step": 7886, "train_info/time_within_train_step": 2.7545077800750732, "step": 7886} {"train_info/time_between_train_steps": 0.003149747848510742, "step": 7886} {"info/global_step": 7887, "train_info/time_within_train_step": 2.754441261291504, "step": 7887} {"train_info/time_between_train_steps": 0.0031213760375976562, "step": 7887} {"info/global_step": 7888, "train_info/time_within_train_step": 2.7544002532958984, "step": 7888} {"train_info/time_between_train_steps": 0.003148317337036133, "step": 7888} {"info/global_step": 7889, "train_info/time_within_train_step": 2.7548201084136963, "step": 7889} {"train_info/time_between_train_steps": 0.0031387805938720703, "step": 7889} {"info/global_step": 7890, "train_info/time_within_train_step": 2.755206823348999, "step": 7890} {"train_info/time_between_train_steps": 0.003140687942504883, "step": 7890} {"info/global_step": 7891, "train_info/time_within_train_step": 2.755523681640625, "step": 7891} {"train_info/time_between_train_steps": 0.003130197525024414, "step": 7891} {"info/global_step": 7892, "train_info/time_within_train_step": 2.755953788757324, "step": 7892} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 7892} {"info/global_step": 7893, "train_info/time_within_train_step": 2.7553608417510986, "step": 7893} {"train_info/time_between_train_steps": 0.003139972686767578, "step": 7893} {"info/global_step": 7894, "train_info/time_within_train_step": 2.7561254501342773, "step": 7894} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 7894} {"info/global_step": 7895, "train_info/time_within_train_step": 2.7560811042785645, "step": 7895} {"train_info/time_between_train_steps": 0.003111600875854492, "step": 7895} {"info/global_step": 7896, "train_info/time_within_train_step": 2.7566983699798584, "step": 7896} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 7896} {"info/global_step": 7897, "train_info/time_within_train_step": 2.7563774585723877, "step": 7897} {"train_info/time_between_train_steps": 0.003119230270385742, "step": 7897} {"info/global_step": 7898, "train_info/time_within_train_step": 2.756011724472046, "step": 7898} {"train_info/time_between_train_steps": 0.0031244754791259766, "step": 7898} {"info/global_step": 7899, "train_info/time_within_train_step": 2.755673885345459, "step": 7899} {"train_info/time_between_train_steps": 0.0031423568725585938, "step": 7899} {"info/global_step": 7900, "train_info/time_within_train_step": 2.7546379566192627, "step": 7900} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746588813, "_runtime": 22822}, "step": 7900} {"logs": {"train/loss": 3.1141, "train/learning_rate": 0.00014, "train/epoch": 9.02, "_timestamp": 1746588813, "_runtime": 22822}, "step": 7900} {"train_info/time_between_train_steps": 0.006371974945068359, "step": 7900} {"info/global_step": 7901, "train_info/time_within_train_step": 2.754866123199463, "step": 7901} {"train_info/time_between_train_steps": 0.003125429153442383, "step": 7901} {"info/global_step": 7902, "train_info/time_within_train_step": 2.754246950149536, "step": 7902} {"train_info/time_between_train_steps": 0.0031359195709228516, "step": 7902} {"info/global_step": 7903, "train_info/time_within_train_step": 2.754150390625, "step": 7903} {"train_info/time_between_train_steps": 0.0031325817108154297, "step": 7903} {"info/global_step": 7904, "train_info/time_within_train_step": 2.7557294368743896, "step": 7904} {"train_info/time_between_train_steps": 0.003133535385131836, "step": 7904} {"info/global_step": 7905, "train_info/time_within_train_step": 2.7550551891326904, "step": 7905} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 7905} {"info/global_step": 7906, "train_info/time_within_train_step": 2.755709648132324, "step": 7906} {"train_info/time_between_train_steps": 0.003136873245239258, "step": 7906} {"info/global_step": 7907, "train_info/time_within_train_step": 2.7548742294311523, "step": 7907} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 7907} {"info/global_step": 7908, "train_info/time_within_train_step": 2.7541005611419678, "step": 7908} {"train_info/time_between_train_steps": 0.0031189918518066406, "step": 7908} {"info/global_step": 7909, "train_info/time_within_train_step": 2.755624771118164, "step": 7909} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 7909} {"info/global_step": 7910, "train_info/time_within_train_step": 2.7551772594451904, "step": 7910} {"train_info/time_between_train_steps": 0.0031571388244628906, "step": 7910} {"info/global_step": 7911, "train_info/time_within_train_step": 2.754423141479492, "step": 7911} {"train_info/time_between_train_steps": 0.0031464099884033203, "step": 7911} {"info/global_step": 7912, "train_info/time_within_train_step": 2.755516767501831, "step": 7912} {"train_info/time_between_train_steps": 0.003120899200439453, "step": 7912} {"info/global_step": 7913, "train_info/time_within_train_step": 2.7546749114990234, "step": 7913} {"train_info/time_between_train_steps": 0.003129720687866211, "step": 7913} {"info/global_step": 7914, "train_info/time_within_train_step": 2.755643844604492, "step": 7914} {"train_info/time_between_train_steps": 0.003336668014526367, "step": 7914} {"info/global_step": 7915, "train_info/time_within_train_step": 2.7557454109191895, "step": 7915} {"train_info/time_between_train_steps": 0.0032815933227539062, "step": 7915} {"info/global_step": 7916, "train_info/time_within_train_step": 2.7567293643951416, "step": 7916} {"train_info/time_between_train_steps": 0.0033397674560546875, "step": 7916} {"info/global_step": 7917, "train_info/time_within_train_step": 2.7567102909088135, "step": 7917} {"train_info/time_between_train_steps": 0.0033228397369384766, "step": 7917} {"info/global_step": 7918, "train_info/time_within_train_step": 2.7543234825134277, "step": 7918} {"train_info/time_between_train_steps": 0.0033059120178222656, "step": 7918} {"info/global_step": 7919, "train_info/time_within_train_step": 2.7564728260040283, "step": 7919} {"train_info/time_between_train_steps": 0.0033104419708251953, "step": 7919} {"info/global_step": 7920, "train_info/time_within_train_step": 2.753941535949707, "step": 7920} {"train_info/time_between_train_steps": 0.0032727718353271484, "step": 7920} {"info/global_step": 7921, "train_info/time_within_train_step": 2.7564666271209717, "step": 7921} {"train_info/time_between_train_steps": 0.003280162811279297, "step": 7921} {"info/global_step": 7922, "train_info/time_within_train_step": 2.756035327911377, "step": 7922} {"train_info/time_between_train_steps": 0.003294706344604492, "step": 7922} {"info/global_step": 7923, "train_info/time_within_train_step": 2.7567763328552246, "step": 7923} {"train_info/time_between_train_steps": 0.003304004669189453, "step": 7923} {"info/global_step": 7924, "train_info/time_within_train_step": 2.755645990371704, "step": 7924} {"train_info/time_between_train_steps": 0.0032732486724853516, "step": 7924} {"info/global_step": 7925, "train_info/time_within_train_step": 3.008842945098877, "step": 7925} {"train_info/time_between_train_steps": 0.0033228397369384766, "step": 7925} {"info/global_step": 7926, "train_info/time_within_train_step": 2.757205009460449, "step": 7926} {"train_info/time_between_train_steps": 0.003291606903076172, "step": 7926} {"info/global_step": 7927, "train_info/time_within_train_step": 2.7573914527893066, "step": 7927} {"train_info/time_between_train_steps": 0.12942266464233398, "step": 7927} {"info/global_step": 7928, "train_info/time_within_train_step": 2.754826545715332, "step": 7928} {"train_info/time_between_train_steps": 0.0031478404998779297, "step": 7928} {"info/global_step": 7929, "train_info/time_within_train_step": 2.755622148513794, "step": 7929} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 7929} {"info/global_step": 7930, "train_info/time_within_train_step": 2.7552895545959473, "step": 7930} {"train_info/time_between_train_steps": 0.0031197071075439453, "step": 7930} {"info/global_step": 7931, "train_info/time_within_train_step": 2.755952835083008, "step": 7931} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 7931} {"info/global_step": 7932, "train_info/time_within_train_step": 2.755399703979492, "step": 7932} {"train_info/time_between_train_steps": 0.0031392574310302734, "step": 7932} {"info/global_step": 7933, "train_info/time_within_train_step": 2.7549726963043213, "step": 7933} {"train_info/time_between_train_steps": 0.003165721893310547, "step": 7933} {"info/global_step": 7934, "train_info/time_within_train_step": 2.755150556564331, "step": 7934} {"train_info/time_between_train_steps": 0.003155231475830078, "step": 7934} {"info/global_step": 7935, "train_info/time_within_train_step": 2.7553844451904297, "step": 7935} {"train_info/time_between_train_steps": 0.003119945526123047, "step": 7935} {"info/global_step": 7936, "train_info/time_within_train_step": 2.7559003829956055, "step": 7936} {"train_info/time_between_train_steps": 0.003171205520629883, "step": 7936} {"info/global_step": 7937, "train_info/time_within_train_step": 2.755333662033081, "step": 7937} {"train_info/time_between_train_steps": 0.0031280517578125, "step": 7937} {"info/global_step": 7938, "train_info/time_within_train_step": 2.756166458129883, "step": 7938} {"train_info/time_between_train_steps": 0.0033392906188964844, "step": 7938} {"info/global_step": 7939, "train_info/time_within_train_step": 2.7553396224975586, "step": 7939} {"train_info/time_between_train_steps": 0.0033235549926757812, "step": 7939} {"info/global_step": 7940, "train_info/time_within_train_step": 2.7555992603302, "step": 7940} {"train_info/time_between_train_steps": 0.0033152103424072266, "step": 7940} {"info/global_step": 7941, "train_info/time_within_train_step": 2.755683183670044, "step": 7941} {"train_info/time_between_train_steps": 0.0032918453216552734, "step": 7941} {"info/global_step": 7942, "train_info/time_within_train_step": 2.756661891937256, "step": 7942} {"train_info/time_between_train_steps": 0.003357410430908203, "step": 7942} {"info/global_step": 7943, "train_info/time_within_train_step": 2.7574856281280518, "step": 7943} {"train_info/time_between_train_steps": 0.003301858901977539, "step": 7943} {"info/global_step": 7944, "train_info/time_within_train_step": 2.75669002532959, "step": 7944} {"train_info/time_between_train_steps": 0.0033020973205566406, "step": 7944} {"info/global_step": 7945, "train_info/time_within_train_step": 2.7565507888793945, "step": 7945} {"train_info/time_between_train_steps": 0.0033190250396728516, "step": 7945} {"info/global_step": 7946, "train_info/time_within_train_step": 2.7570526599884033, "step": 7946} {"train_info/time_between_train_steps": 0.0032804012298583984, "step": 7946} {"info/global_step": 7947, "train_info/time_within_train_step": 2.756930112838745, "step": 7947} {"train_info/time_between_train_steps": 0.0033092498779296875, "step": 7947} {"info/global_step": 7948, "train_info/time_within_train_step": 2.7570443153381348, "step": 7948} {"train_info/time_between_train_steps": 0.003305673599243164, "step": 7948} {"info/global_step": 7949, "train_info/time_within_train_step": 2.757822036743164, "step": 7949} {"train_info/time_between_train_steps": 0.003359556198120117, "step": 7949} {"info/global_step": 7950, "train_info/time_within_train_step": 2.758608818054199, "step": 7950} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746588952, "_runtime": 22961}, "step": 7950} {"logs": {"train/loss": 3.1068, "train/learning_rate": 0.00013666666666666666, "train/epoch": 9.03, "_timestamp": 1746588952, "_runtime": 22961}, "step": 7950} {"train_info/time_between_train_steps": 0.0070285797119140625, "step": 7950} {"info/global_step": 7951, "train_info/time_within_train_step": 2.75716495513916, "step": 7951} {"train_info/time_between_train_steps": 0.0033278465270996094, "step": 7951} {"info/global_step": 7952, "train_info/time_within_train_step": 2.756157636642456, "step": 7952} {"train_info/time_between_train_steps": 0.00330352783203125, "step": 7952} {"info/global_step": 7953, "train_info/time_within_train_step": 2.757324695587158, "step": 7953} {"train_info/time_between_train_steps": 0.0033388137817382812, "step": 7953} {"info/global_step": 7954, "train_info/time_within_train_step": 2.7565855979919434, "step": 7954} {"train_info/time_between_train_steps": 0.0033445358276367188, "step": 7954} {"info/global_step": 7955, "train_info/time_within_train_step": 2.7578890323638916, "step": 7955} {"train_info/time_between_train_steps": 0.0032744407653808594, "step": 7955} {"info/global_step": 7956, "train_info/time_within_train_step": 2.7563703060150146, "step": 7956} {"train_info/time_between_train_steps": 0.0032880306243896484, "step": 7956} {"info/global_step": 7957, "train_info/time_within_train_step": 2.7567484378814697, "step": 7957} {"train_info/time_between_train_steps": 0.0033159255981445312, "step": 7957} {"info/global_step": 7958, "train_info/time_within_train_step": 2.7566919326782227, "step": 7958} {"train_info/time_between_train_steps": 0.003304719924926758, "step": 7958} {"info/global_step": 7959, "train_info/time_within_train_step": 2.756779909133911, "step": 7959} {"train_info/time_between_train_steps": 0.003342866897583008, "step": 7959} {"info/global_step": 7960, "train_info/time_within_train_step": 2.7571423053741455, "step": 7960} {"train_info/time_between_train_steps": 0.003347635269165039, "step": 7960} {"info/global_step": 7961, "train_info/time_within_train_step": 2.7558343410491943, "step": 7961} {"train_info/time_between_train_steps": 0.0032808780670166016, "step": 7961} {"info/global_step": 7962, "train_info/time_within_train_step": 2.7567169666290283, "step": 7962} {"train_info/time_between_train_steps": 0.003434896469116211, "step": 7962} {"info/global_step": 7963, "train_info/time_within_train_step": 2.756889581680298, "step": 7963} {"train_info/time_between_train_steps": 0.0032808780670166016, "step": 7963} {"info/global_step": 7964, "train_info/time_within_train_step": 2.7562947273254395, "step": 7964} {"train_info/time_between_train_steps": 0.003342866897583008, "step": 7964} {"info/global_step": 7965, "train_info/time_within_train_step": 2.7573323249816895, "step": 7965} {"train_info/time_between_train_steps": 0.0033164024353027344, "step": 7965} {"info/global_step": 7966, "train_info/time_within_train_step": 2.7583439350128174, "step": 7966} {"train_info/time_between_train_steps": 0.003324747085571289, "step": 7966} {"info/global_step": 7967, "train_info/time_within_train_step": 2.7573089599609375, "step": 7967} {"train_info/time_between_train_steps": 0.003287792205810547, "step": 7967} {"info/global_step": 7968, "train_info/time_within_train_step": 2.7562925815582275, "step": 7968} {"train_info/time_between_train_steps": 0.0032927989959716797, "step": 7968} {"info/global_step": 7969, "train_info/time_within_train_step": 2.7576024532318115, "step": 7969} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 7969} {"info/global_step": 7970, "train_info/time_within_train_step": 2.7550575733184814, "step": 7970} {"train_info/time_between_train_steps": 0.0031235218048095703, "step": 7970} {"info/global_step": 7971, "train_info/time_within_train_step": 2.7556989192962646, "step": 7971} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 7971} {"info/global_step": 7972, "train_info/time_within_train_step": 2.7562143802642822, "step": 7972} {"train_info/time_between_train_steps": 0.0031328201293945312, "step": 7972} {"info/global_step": 7973, "train_info/time_within_train_step": 2.7561256885528564, "step": 7973} {"train_info/time_between_train_steps": 0.003124713897705078, "step": 7973} {"info/global_step": 7974, "train_info/time_within_train_step": 2.753666639328003, "step": 7974} {"train_info/time_between_train_steps": 0.0031342506408691406, "step": 7974} {"info/global_step": 7975, "train_info/time_within_train_step": 2.7553658485412598, "step": 7975} {"train_info/time_between_train_steps": 0.003130674362182617, "step": 7975} {"info/global_step": 7976, "train_info/time_within_train_step": 2.754802942276001, "step": 7976} {"train_info/time_between_train_steps": 0.0031495094299316406, "step": 7976} {"info/global_step": 7977, "train_info/time_within_train_step": 2.7552709579467773, "step": 7977} {"train_info/time_between_train_steps": 0.003113985061645508, "step": 7977} {"info/global_step": 7978, "train_info/time_within_train_step": 2.7544236183166504, "step": 7978} {"train_info/time_between_train_steps": 0.003138303756713867, "step": 7978} {"info/global_step": 7979, "train_info/time_within_train_step": 2.7549095153808594, "step": 7979} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 7979} {"info/global_step": 7980, "train_info/time_within_train_step": 2.755206823348999, "step": 7980} {"train_info/time_between_train_steps": 0.0031845569610595703, "step": 7980} {"info/global_step": 7981, "train_info/time_within_train_step": 2.754229784011841, "step": 7981} {"train_info/time_between_train_steps": 0.0030961036682128906, "step": 7981} {"info/global_step": 7982, "train_info/time_within_train_step": 2.755495071411133, "step": 7982} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 7982} {"info/global_step": 7983, "train_info/time_within_train_step": 2.7547500133514404, "step": 7983} {"train_info/time_between_train_steps": 0.003106832504272461, "step": 7983} {"info/global_step": 7984, "train_info/time_within_train_step": 2.7545440196990967, "step": 7984} {"train_info/time_between_train_steps": 0.0031080245971679688, "step": 7984} {"info/global_step": 7985, "train_info/time_within_train_step": 2.7547199726104736, "step": 7985} {"train_info/time_between_train_steps": 0.003133058547973633, "step": 7985} {"info/global_step": 7986, "train_info/time_within_train_step": 2.754312753677368, "step": 7986} {"train_info/time_between_train_steps": 0.003122568130493164, "step": 7986} {"info/global_step": 7987, "train_info/time_within_train_step": 2.7540552616119385, "step": 7987} {"train_info/time_between_train_steps": 0.003137350082397461, "step": 7987} {"info/global_step": 7988, "train_info/time_within_train_step": 2.7547619342803955, "step": 7988} {"train_info/time_between_train_steps": 0.003131389617919922, "step": 7988} {"info/global_step": 7989, "train_info/time_within_train_step": 2.7539963722229004, "step": 7989} {"train_info/time_between_train_steps": 0.003133535385131836, "step": 7989} {"info/global_step": 7990, "train_info/time_within_train_step": 2.8790276050567627, "step": 7990} {"train_info/time_between_train_steps": 0.00313568115234375, "step": 7990} {"info/global_step": 7991, "train_info/time_within_train_step": 2.7538914680480957, "step": 7991} {"train_info/time_between_train_steps": 0.0031664371490478516, "step": 7991} {"info/global_step": 7992, "train_info/time_within_train_step": 2.7533481121063232, "step": 7992} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 7992} {"info/global_step": 7993, "train_info/time_within_train_step": 2.7553701400756836, "step": 7993} {"train_info/time_between_train_steps": 0.0031821727752685547, "step": 7993} {"info/global_step": 7994, "train_info/time_within_train_step": 2.753291130065918, "step": 7994} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 7994} {"info/global_step": 7995, "train_info/time_within_train_step": 2.7539353370666504, "step": 7995} {"train_info/time_between_train_steps": 0.0033304691314697266, "step": 7995} {"info/global_step": 7996, "train_info/time_within_train_step": 3.3236024379730225, "step": 7996} {"train_info/time_between_train_steps": 0.0033104419708251953, "step": 7996} {"info/global_step": 7997, "train_info/time_within_train_step": 2.756629467010498, "step": 7997} {"train_info/time_between_train_steps": 0.0033202171325683594, "step": 7997} {"info/global_step": 7998, "train_info/time_within_train_step": 2.75604248046875, "step": 7998} {"train_info/time_between_train_steps": 0.003316164016723633, "step": 7998} {"info/global_step": 7999, "train_info/time_within_train_step": 2.7573273181915283, "step": 7999} {"train_info/time_between_train_steps": 0.0033295154571533203, "step": 7999} {"info/global_step": 8000, "train_info/time_within_train_step": 2.7564096450805664, "step": 8000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746589090, "_runtime": 23099}, "step": 8000} {"logs": {"train/loss": 3.0976, "train/learning_rate": 0.0001333333333333333, "train/epoch": 9.03, "_timestamp": 1746589090, "_runtime": 23099}, "step": 8000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746589095, "_runtime": 23104}, "step": 8000} {"logs": {"eval/loss": 4.820436000823975, "eval/runtime": 5.126, "eval/samples_per_second": 37.066, "eval/steps_per_second": 1.171, "train/epoch": 9.03, "_timestamp": 1746589095, "_runtime": 23104}, "step": 8000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746589095, "_runtime": 23104}, "step": 8000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.820436000823975, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 124.01915144593909, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.126, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 37.066, "train/epoch": 9.03, "_timestamp": 1746589095, "_runtime": 23104}, "step": 8000} {"train_info/time_between_train_steps": 18.34610867500305, "step": 8000} {"info/global_step": 8001, "train_info/time_within_train_step": 2.5447936058044434, "step": 8001} {"train_info/time_between_train_steps": 0.003301382064819336, "step": 8001} {"info/global_step": 8002, "train_info/time_within_train_step": 2.5667312145233154, "step": 8002} {"train_info/time_between_train_steps": 0.0033271312713623047, "step": 8002} {"info/global_step": 8003, "train_info/time_within_train_step": 2.7307372093200684, "step": 8003} {"train_info/time_between_train_steps": 0.0033490657806396484, "step": 8003} {"info/global_step": 8004, "train_info/time_within_train_step": 2.750518798828125, "step": 8004} {"train_info/time_between_train_steps": 0.0033059120178222656, "step": 8004} {"info/global_step": 8005, "train_info/time_within_train_step": 2.7569472789764404, "step": 8005} {"train_info/time_between_train_steps": 0.0033333301544189453, "step": 8005} {"info/global_step": 8006, "train_info/time_within_train_step": 2.758310079574585, "step": 8006} {"train_info/time_between_train_steps": 0.0033025741577148438, "step": 8006} {"info/global_step": 8007, "train_info/time_within_train_step": 2.757153034210205, "step": 8007} {"train_info/time_between_train_steps": 0.0032846927642822266, "step": 8007} {"info/global_step": 8008, "train_info/time_within_train_step": 2.757432699203491, "step": 8008} {"train_info/time_between_train_steps": 0.0033333301544189453, "step": 8008} {"info/global_step": 8009, "train_info/time_within_train_step": 3.021635055541992, "step": 8009} {"train_info/time_between_train_steps": 0.003298521041870117, "step": 8009} {"info/global_step": 8010, "train_info/time_within_train_step": 2.757553815841675, "step": 8010} {"train_info/time_between_train_steps": 0.0033261775970458984, "step": 8010} {"info/global_step": 8011, "train_info/time_within_train_step": 2.757885456085205, "step": 8011} {"train_info/time_between_train_steps": 0.003342151641845703, "step": 8011} {"info/global_step": 8012, "train_info/time_within_train_step": 2.7584025859832764, "step": 8012} {"train_info/time_between_train_steps": 0.0033292770385742188, "step": 8012} {"info/global_step": 8013, "train_info/time_within_train_step": 2.7578229904174805, "step": 8013} {"train_info/time_between_train_steps": 0.0033240318298339844, "step": 8013} {"info/global_step": 8014, "train_info/time_within_train_step": 2.7590324878692627, "step": 8014} {"train_info/time_between_train_steps": 0.0034399032592773438, "step": 8014} {"info/global_step": 8015, "train_info/time_within_train_step": 2.7572121620178223, "step": 8015} {"train_info/time_between_train_steps": 0.0033600330352783203, "step": 8015} {"info/global_step": 8016, "train_info/time_within_train_step": 2.7565460205078125, "step": 8016} {"train_info/time_between_train_steps": 0.003137826919555664, "step": 8016} {"info/global_step": 8017, "train_info/time_within_train_step": 2.7574706077575684, "step": 8017} {"train_info/time_between_train_steps": 0.003160715103149414, "step": 8017} {"info/global_step": 8018, "train_info/time_within_train_step": 2.757281541824341, "step": 8018} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 8018} {"info/global_step": 8019, "train_info/time_within_train_step": 2.7573790550231934, "step": 8019} {"train_info/time_between_train_steps": 0.0031757354736328125, "step": 8019} {"info/global_step": 8020, "train_info/time_within_train_step": 2.7555336952209473, "step": 8020} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 8020} {"info/global_step": 8021, "train_info/time_within_train_step": 2.7585067749023438, "step": 8021} {"train_info/time_between_train_steps": 0.003349781036376953, "step": 8021} {"info/global_step": 8022, "train_info/time_within_train_step": 2.7577502727508545, "step": 8022} {"train_info/time_between_train_steps": 0.0032634735107421875, "step": 8022} {"info/global_step": 8023, "train_info/time_within_train_step": 2.756106376647949, "step": 8023} {"train_info/time_between_train_steps": 0.0032067298889160156, "step": 8023} {"info/global_step": 8024, "train_info/time_within_train_step": 2.7570016384124756, "step": 8024} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 8024} {"info/global_step": 8025, "train_info/time_within_train_step": 2.7574334144592285, "step": 8025} {"train_info/time_between_train_steps": 0.0031349658966064453, "step": 8025} {"info/global_step": 8026, "train_info/time_within_train_step": 2.7574925422668457, "step": 8026} {"train_info/time_between_train_steps": 0.003274679183959961, "step": 8026} {"info/global_step": 8027, "train_info/time_within_train_step": 2.764104127883911, "step": 8027} {"train_info/time_between_train_steps": 0.003374338150024414, "step": 8027} {"info/global_step": 8028, "train_info/time_within_train_step": 2.7572147846221924, "step": 8028} {"train_info/time_between_train_steps": 0.0032286643981933594, "step": 8028} {"info/global_step": 8029, "train_info/time_within_train_step": 2.7558114528656006, "step": 8029} {"train_info/time_between_train_steps": 0.003206014633178711, "step": 8029} {"info/global_step": 8030, "train_info/time_within_train_step": 2.754878520965576, "step": 8030} {"train_info/time_between_train_steps": 0.0032508373260498047, "step": 8030} {"info/global_step": 8031, "train_info/time_within_train_step": 2.7564926147460938, "step": 8031} {"train_info/time_between_train_steps": 0.003201007843017578, "step": 8031} {"info/global_step": 8032, "train_info/time_within_train_step": 2.755551338195801, "step": 8032} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 8032} {"info/global_step": 8033, "train_info/time_within_train_step": 2.755563735961914, "step": 8033} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 8033} {"info/global_step": 8034, "train_info/time_within_train_step": 2.7565157413482666, "step": 8034} {"train_info/time_between_train_steps": 0.0032241344451904297, "step": 8034} {"info/global_step": 8035, "train_info/time_within_train_step": 2.7566933631896973, "step": 8035} {"train_info/time_between_train_steps": 0.0032155513763427734, "step": 8035} {"info/global_step": 8036, "train_info/time_within_train_step": 2.7569682598114014, "step": 8036} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 8036} {"info/global_step": 8037, "train_info/time_within_train_step": 2.758152961730957, "step": 8037} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 8037} {"info/global_step": 8038, "train_info/time_within_train_step": 2.757728099822998, "step": 8038} {"train_info/time_between_train_steps": 0.0032243728637695312, "step": 8038} {"info/global_step": 8039, "train_info/time_within_train_step": 2.756824493408203, "step": 8039} {"train_info/time_between_train_steps": 0.003210783004760742, "step": 8039} {"info/global_step": 8040, "train_info/time_within_train_step": 2.754791498184204, "step": 8040} {"train_info/time_between_train_steps": 0.003228902816772461, "step": 8040} {"info/global_step": 8041, "train_info/time_within_train_step": 2.756725549697876, "step": 8041} {"train_info/time_between_train_steps": 0.0032219886779785156, "step": 8041} {"info/global_step": 8042, "train_info/time_within_train_step": 2.7570114135742188, "step": 8042} {"train_info/time_between_train_steps": 0.0032320022583007812, "step": 8042} {"info/global_step": 8043, "train_info/time_within_train_step": 2.7561376094818115, "step": 8043} {"train_info/time_between_train_steps": 0.0032608509063720703, "step": 8043} {"info/global_step": 8044, "train_info/time_within_train_step": 2.7555859088897705, "step": 8044} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 8044} {"info/global_step": 8045, "train_info/time_within_train_step": 2.757662773132324, "step": 8045} {"train_info/time_between_train_steps": 0.0032300949096679688, "step": 8045} {"info/global_step": 8046, "train_info/time_within_train_step": 2.7551445960998535, "step": 8046} {"train_info/time_between_train_steps": 0.0031387805938720703, "step": 8046} {"info/global_step": 8047, "train_info/time_within_train_step": 2.756241798400879, "step": 8047} {"train_info/time_between_train_steps": 0.003192424774169922, "step": 8047} {"info/global_step": 8048, "train_info/time_within_train_step": 2.7551686763763428, "step": 8048} {"train_info/time_between_train_steps": 0.0032134056091308594, "step": 8048} {"info/global_step": 8049, "train_info/time_within_train_step": 2.7559776306152344, "step": 8049} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 8049} {"info/global_step": 8050, "train_info/time_within_train_step": 3.0355465412139893, "step": 8050} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746589247, "_runtime": 23256}, "step": 8050} {"logs": {"train/loss": 3.1052, "train/learning_rate": 0.00013, "train/epoch": 9.04, "_timestamp": 1746589247, "_runtime": 23256}, "step": 8050} {"train_info/time_between_train_steps": 0.0068378448486328125, "step": 8050} {"info/global_step": 8051, "train_info/time_within_train_step": 2.7543411254882812, "step": 8051} {"train_info/time_between_train_steps": 0.0031435489654541016, "step": 8051} {"info/global_step": 8052, "train_info/time_within_train_step": 2.755929708480835, "step": 8052} {"train_info/time_between_train_steps": 0.13347530364990234, "step": 8052} {"info/global_step": 8053, "train_info/time_within_train_step": 2.783735990524292, "step": 8053} {"train_info/time_between_train_steps": 0.003337860107421875, "step": 8053} {"info/global_step": 8054, "train_info/time_within_train_step": 2.7584774494171143, "step": 8054} {"train_info/time_between_train_steps": 0.0033359527587890625, "step": 8054} {"info/global_step": 8055, "train_info/time_within_train_step": 2.757938861846924, "step": 8055} {"train_info/time_between_train_steps": 0.0033397674560546875, "step": 8055} {"info/global_step": 8056, "train_info/time_within_train_step": 2.758335590362549, "step": 8056} {"train_info/time_between_train_steps": 0.0033800601959228516, "step": 8056} {"info/global_step": 8057, "train_info/time_within_train_step": 2.75764799118042, "step": 8057} {"train_info/time_between_train_steps": 0.0033464431762695312, "step": 8057} {"info/global_step": 8058, "train_info/time_within_train_step": 2.7569398880004883, "step": 8058} {"train_info/time_between_train_steps": 0.003287076950073242, "step": 8058} {"info/global_step": 8059, "train_info/time_within_train_step": 2.757309913635254, "step": 8059} {"train_info/time_between_train_steps": 0.003329038619995117, "step": 8059} {"info/global_step": 8060, "train_info/time_within_train_step": 2.7570416927337646, "step": 8060} {"train_info/time_between_train_steps": 0.0033049583435058594, "step": 8060} {"info/global_step": 8061, "train_info/time_within_train_step": 2.7585506439208984, "step": 8061} {"train_info/time_between_train_steps": 0.003351926803588867, "step": 8061} {"info/global_step": 8062, "train_info/time_within_train_step": 2.7564473152160645, "step": 8062} {"train_info/time_between_train_steps": 0.0033392906188964844, "step": 8062} {"info/global_step": 8063, "train_info/time_within_train_step": 2.7577128410339355, "step": 8063} {"train_info/time_between_train_steps": 0.0033419132232666016, "step": 8063} {"info/global_step": 8064, "train_info/time_within_train_step": 2.7580032348632812, "step": 8064} {"train_info/time_between_train_steps": 0.0033180713653564453, "step": 8064} {"info/global_step": 8065, "train_info/time_within_train_step": 2.757014274597168, "step": 8065} {"train_info/time_between_train_steps": 0.0033669471740722656, "step": 8065} {"info/global_step": 8066, "train_info/time_within_train_step": 2.758371591567993, "step": 8066} {"train_info/time_between_train_steps": 0.003389120101928711, "step": 8066} {"info/global_step": 8067, "train_info/time_within_train_step": 2.758680820465088, "step": 8067} {"train_info/time_between_train_steps": 0.0033309459686279297, "step": 8067} {"info/global_step": 8068, "train_info/time_within_train_step": 2.7571794986724854, "step": 8068} {"train_info/time_between_train_steps": 0.0033142566680908203, "step": 8068} {"info/global_step": 8069, "train_info/time_within_train_step": 2.7571191787719727, "step": 8069} {"train_info/time_between_train_steps": 0.003278970718383789, "step": 8069} {"info/global_step": 8070, "train_info/time_within_train_step": 2.7573060989379883, "step": 8070} {"train_info/time_between_train_steps": 0.0034329891204833984, "step": 8070} {"info/global_step": 8071, "train_info/time_within_train_step": 2.756885528564453, "step": 8071} {"train_info/time_between_train_steps": 0.003318309783935547, "step": 8071} {"info/global_step": 8072, "train_info/time_within_train_step": 2.7573742866516113, "step": 8072} {"train_info/time_between_train_steps": 0.003312826156616211, "step": 8072} {"info/global_step": 8073, "train_info/time_within_train_step": 2.7569832801818848, "step": 8073} {"train_info/time_between_train_steps": 0.0033042430877685547, "step": 8073} {"info/global_step": 8074, "train_info/time_within_train_step": 2.7557015419006348, "step": 8074} {"train_info/time_between_train_steps": 0.0033731460571289062, "step": 8074} {"info/global_step": 8075, "train_info/time_within_train_step": 2.7572946548461914, "step": 8075} {"train_info/time_between_train_steps": 0.00331878662109375, "step": 8075} {"info/global_step": 8076, "train_info/time_within_train_step": 2.754978656768799, "step": 8076} {"train_info/time_between_train_steps": 0.003297090530395508, "step": 8076} {"info/global_step": 8077, "train_info/time_within_train_step": 2.7561824321746826, "step": 8077} {"train_info/time_between_train_steps": 0.0033905506134033203, "step": 8077} {"info/global_step": 8078, "train_info/time_within_train_step": 2.756603479385376, "step": 8078} {"train_info/time_between_train_steps": 0.003448963165283203, "step": 8078} {"info/global_step": 8079, "train_info/time_within_train_step": 2.758694648742676, "step": 8079} {"train_info/time_between_train_steps": 0.003325939178466797, "step": 8079} {"info/global_step": 8080, "train_info/time_within_train_step": 2.758359432220459, "step": 8080} {"train_info/time_between_train_steps": 0.003846883773803711, "step": 8080} {"info/global_step": 8081, "train_info/time_within_train_step": 2.757627010345459, "step": 8081} {"train_info/time_between_train_steps": 0.0032896995544433594, "step": 8081} {"info/global_step": 8082, "train_info/time_within_train_step": 2.7585184574127197, "step": 8082} {"train_info/time_between_train_steps": 0.0033533573150634766, "step": 8082} {"info/global_step": 8083, "train_info/time_within_train_step": 2.757669448852539, "step": 8083} {"train_info/time_between_train_steps": 0.0033800601959228516, "step": 8083} {"info/global_step": 8084, "train_info/time_within_train_step": 2.7557530403137207, "step": 8084} {"train_info/time_between_train_steps": 0.0032987594604492188, "step": 8084} {"info/global_step": 8085, "train_info/time_within_train_step": 2.757051706314087, "step": 8085} {"train_info/time_between_train_steps": 0.003353118896484375, "step": 8085} {"info/global_step": 8086, "train_info/time_within_train_step": 2.756680488586426, "step": 8086} {"train_info/time_between_train_steps": 0.0033109188079833984, "step": 8086} {"info/global_step": 8087, "train_info/time_within_train_step": 2.757283926010132, "step": 8087} {"train_info/time_between_train_steps": 0.003336191177368164, "step": 8087} {"info/global_step": 8088, "train_info/time_within_train_step": 2.757179021835327, "step": 8088} {"train_info/time_between_train_steps": 0.003352642059326172, "step": 8088} {"info/global_step": 8089, "train_info/time_within_train_step": 2.7573390007019043, "step": 8089} {"train_info/time_between_train_steps": 0.0033283233642578125, "step": 8089} {"info/global_step": 8090, "train_info/time_within_train_step": 2.7571768760681152, "step": 8090} {"train_info/time_between_train_steps": 0.0033333301544189453, "step": 8090} {"info/global_step": 8091, "train_info/time_within_train_step": 3.025362968444824, "step": 8091} {"train_info/time_between_train_steps": 0.0033245086669921875, "step": 8091} {"info/global_step": 8092, "train_info/time_within_train_step": 2.756732225418091, "step": 8092} {"train_info/time_between_train_steps": 0.0032930374145507812, "step": 8092} {"info/global_step": 8093, "train_info/time_within_train_step": 2.7560906410217285, "step": 8093} {"train_info/time_between_train_steps": 0.003307819366455078, "step": 8093} {"info/global_step": 8094, "train_info/time_within_train_step": 2.7565982341766357, "step": 8094} {"train_info/time_between_train_steps": 0.0033311843872070312, "step": 8094} {"info/global_step": 8095, "train_info/time_within_train_step": 2.7574191093444824, "step": 8095} {"train_info/time_between_train_steps": 0.0033538341522216797, "step": 8095} {"info/global_step": 8096, "train_info/time_within_train_step": 2.756589412689209, "step": 8096} {"train_info/time_between_train_steps": 0.003374338150024414, "step": 8096} {"info/global_step": 8097, "train_info/time_within_train_step": 2.756777763366699, "step": 8097} {"train_info/time_between_train_steps": 0.003309488296508789, "step": 8097} {"info/global_step": 8098, "train_info/time_within_train_step": 2.7568552494049072, "step": 8098} {"train_info/time_between_train_steps": 0.003345489501953125, "step": 8098} {"info/global_step": 8099, "train_info/time_within_train_step": 2.7574827671051025, "step": 8099} {"train_info/time_between_train_steps": 0.0032181739807128906, "step": 8099} {"info/global_step": 8100, "train_info/time_within_train_step": 2.7556040287017822, "step": 8100} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746589386, "_runtime": 23395}, "step": 8100} {"logs": {"train/loss": 3.0966, "train/learning_rate": 0.00012666666666666666, "train/epoch": 9.04, "_timestamp": 1746589386, "_runtime": 23395}, "step": 8100} {"train_info/time_between_train_steps": 0.006716012954711914, "step": 8100} {"info/global_step": 8101, "train_info/time_within_train_step": 2.755823850631714, "step": 8101} {"train_info/time_between_train_steps": 0.0031270980834960938, "step": 8101} {"info/global_step": 8102, "train_info/time_within_train_step": 2.755186080932617, "step": 8102} {"train_info/time_between_train_steps": 0.003141164779663086, "step": 8102} {"info/global_step": 8103, "train_info/time_within_train_step": 2.756492853164673, "step": 8103} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 8103} {"info/global_step": 8104, "train_info/time_within_train_step": 2.7558577060699463, "step": 8104} {"train_info/time_between_train_steps": 0.003122568130493164, "step": 8104} {"info/global_step": 8105, "train_info/time_within_train_step": 2.7563393115997314, "step": 8105} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 8105} {"info/global_step": 8106, "train_info/time_within_train_step": 2.756805658340454, "step": 8106} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 8106} {"info/global_step": 8107, "train_info/time_within_train_step": 2.7561073303222656, "step": 8107} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 8107} {"info/global_step": 8108, "train_info/time_within_train_step": 2.7569522857666016, "step": 8108} {"train_info/time_between_train_steps": 0.0031592845916748047, "step": 8108} {"info/global_step": 8109, "train_info/time_within_train_step": 2.7559762001037598, "step": 8109} {"train_info/time_between_train_steps": 0.003143787384033203, "step": 8109} {"info/global_step": 8110, "train_info/time_within_train_step": 2.756035566329956, "step": 8110} {"train_info/time_between_train_steps": 0.0031371116638183594, "step": 8110} {"info/global_step": 8111, "train_info/time_within_train_step": 2.75620174407959, "step": 8111} {"train_info/time_between_train_steps": 0.0031676292419433594, "step": 8111} {"info/global_step": 8112, "train_info/time_within_train_step": 2.7549593448638916, "step": 8112} {"train_info/time_between_train_steps": 0.003128528594970703, "step": 8112} {"info/global_step": 8113, "train_info/time_within_train_step": 2.7563600540161133, "step": 8113} {"train_info/time_between_train_steps": 0.003158092498779297, "step": 8113} {"info/global_step": 8114, "train_info/time_within_train_step": 2.7555737495422363, "step": 8114} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 8114} {"info/global_step": 8115, "train_info/time_within_train_step": 2.8848648071289062, "step": 8115} {"train_info/time_between_train_steps": 0.003133058547973633, "step": 8115} {"info/global_step": 8116, "train_info/time_within_train_step": 2.7554266452789307, "step": 8116} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 8116} {"info/global_step": 8117, "train_info/time_within_train_step": 2.756099224090576, "step": 8117} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 8117} {"info/global_step": 8118, "train_info/time_within_train_step": 2.756124496459961, "step": 8118} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 8118} {"info/global_step": 8119, "train_info/time_within_train_step": 2.7573132514953613, "step": 8119} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 8119} {"info/global_step": 8120, "train_info/time_within_train_step": 2.7561099529266357, "step": 8120} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 8120} {"info/global_step": 8121, "train_info/time_within_train_step": 2.7568819522857666, "step": 8121} {"train_info/time_between_train_steps": 0.0031442642211914062, "step": 8121} {"info/global_step": 8122, "train_info/time_within_train_step": 2.7563834190368652, "step": 8122} {"train_info/time_between_train_steps": 0.0031585693359375, "step": 8122} {"info/global_step": 8123, "train_info/time_within_train_step": 2.754894256591797, "step": 8123} {"train_info/time_between_train_steps": 0.003173351287841797, "step": 8123} {"info/global_step": 8124, "train_info/time_within_train_step": 2.755899667739868, "step": 8124} {"train_info/time_between_train_steps": 0.003149271011352539, "step": 8124} {"info/global_step": 8125, "train_info/time_within_train_step": 2.7568249702453613, "step": 8125} {"train_info/time_between_train_steps": 0.003335237503051758, "step": 8125} {"info/global_step": 8126, "train_info/time_within_train_step": 2.7562713623046875, "step": 8126} {"train_info/time_between_train_steps": 0.0031592845916748047, "step": 8126} {"info/global_step": 8127, "train_info/time_within_train_step": 2.7564892768859863, "step": 8127} {"train_info/time_between_train_steps": 0.0031447410583496094, "step": 8127} {"info/global_step": 8128, "train_info/time_within_train_step": 2.754650592803955, "step": 8128} {"train_info/time_between_train_steps": 0.0031592845916748047, "step": 8128} {"info/global_step": 8129, "train_info/time_within_train_step": 2.7561721801757812, "step": 8129} {"train_info/time_between_train_steps": 0.0032007694244384766, "step": 8129} {"info/global_step": 8130, "train_info/time_within_train_step": 2.755521535873413, "step": 8130} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 8130} {"info/global_step": 8131, "train_info/time_within_train_step": 2.7559165954589844, "step": 8131} {"train_info/time_between_train_steps": 0.0032434463500976562, "step": 8131} {"info/global_step": 8132, "train_info/time_within_train_step": 2.754634380340576, "step": 8132} {"train_info/time_between_train_steps": 0.003123760223388672, "step": 8132} {"info/global_step": 8133, "train_info/time_within_train_step": 2.75490665435791, "step": 8133} {"train_info/time_between_train_steps": 0.003149271011352539, "step": 8133} {"info/global_step": 8134, "train_info/time_within_train_step": 2.756814479827881, "step": 8134} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 8134} {"info/global_step": 8135, "train_info/time_within_train_step": 2.755561590194702, "step": 8135} {"train_info/time_between_train_steps": 0.0031621456146240234, "step": 8135} {"info/global_step": 8136, "train_info/time_within_train_step": 2.756564140319824, "step": 8136} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 8136} {"info/global_step": 8137, "train_info/time_within_train_step": 2.7557289600372314, "step": 8137} {"train_info/time_between_train_steps": 0.0031709671020507812, "step": 8137} {"info/global_step": 8138, "train_info/time_within_train_step": 2.7562122344970703, "step": 8138} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 8138} {"info/global_step": 8139, "train_info/time_within_train_step": 2.755276679992676, "step": 8139} {"train_info/time_between_train_steps": 0.0031397342681884766, "step": 8139} {"info/global_step": 8140, "train_info/time_within_train_step": 2.755702495574951, "step": 8140} {"train_info/time_between_train_steps": 0.0032210350036621094, "step": 8140} {"info/global_step": 8141, "train_info/time_within_train_step": 2.7551040649414062, "step": 8141} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 8141} {"info/global_step": 8142, "train_info/time_within_train_step": 2.7549068927764893, "step": 8142} {"train_info/time_between_train_steps": 0.0031332969665527344, "step": 8142} {"info/global_step": 8143, "train_info/time_within_train_step": 2.7557992935180664, "step": 8143} {"train_info/time_between_train_steps": 0.0031812191009521484, "step": 8143} {"info/global_step": 8144, "train_info/time_within_train_step": 2.7536873817443848, "step": 8144} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 8144} {"info/global_step": 8145, "train_info/time_within_train_step": 2.7555837631225586, "step": 8145} {"train_info/time_between_train_steps": 0.0031278133392333984, "step": 8145} {"info/global_step": 8146, "train_info/time_within_train_step": 2.754225969314575, "step": 8146} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 8146} {"info/global_step": 8147, "train_info/time_within_train_step": 2.7552971839904785, "step": 8147} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 8147} {"info/global_step": 8148, "train_info/time_within_train_step": 2.7549819946289062, "step": 8148} {"train_info/time_between_train_steps": 0.0031464099884033203, "step": 8148} {"info/global_step": 8149, "train_info/time_within_train_step": 2.7533414363861084, "step": 8149} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 8149} {"info/global_step": 8150, "train_info/time_within_train_step": 2.75544810295105, "step": 8150} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746589524, "_runtime": 23533}, "step": 8150} {"logs": {"train/loss": 3.0815, "train/learning_rate": 0.0001233333333333333, "train/epoch": 9.05, "_timestamp": 1746589524, "_runtime": 23533}, "step": 8150} {"train_info/time_between_train_steps": 0.0064373016357421875, "step": 8150} {"info/global_step": 8151, "train_info/time_within_train_step": 2.754606008529663, "step": 8151} {"train_info/time_between_train_steps": 0.0031342506408691406, "step": 8151} {"info/global_step": 8152, "train_info/time_within_train_step": 2.755239486694336, "step": 8152} {"train_info/time_between_train_steps": 0.0031566619873046875, "step": 8152} {"info/global_step": 8153, "train_info/time_within_train_step": 2.756525993347168, "step": 8153} {"train_info/time_between_train_steps": 0.0031430721282958984, "step": 8153} {"info/global_step": 8154, "train_info/time_within_train_step": 2.756483316421509, "step": 8154} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 8154} {"info/global_step": 8155, "train_info/time_within_train_step": 2.7559401988983154, "step": 8155} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 8155} {"info/global_step": 8156, "train_info/time_within_train_step": 2.756296396255493, "step": 8156} {"train_info/time_between_train_steps": 0.0031311511993408203, "step": 8156} {"info/global_step": 8157, "train_info/time_within_train_step": 2.75587797164917, "step": 8157} {"train_info/time_between_train_steps": 0.0031540393829345703, "step": 8157} {"info/global_step": 8158, "train_info/time_within_train_step": 2.755437135696411, "step": 8158} {"train_info/time_between_train_steps": 0.0031299591064453125, "step": 8158} {"info/global_step": 8159, "train_info/time_within_train_step": 2.7552573680877686, "step": 8159} {"train_info/time_between_train_steps": 0.003102540969848633, "step": 8159} {"info/global_step": 8160, "train_info/time_within_train_step": 2.755650281906128, "step": 8160} {"train_info/time_between_train_steps": 0.0036361217498779297, "step": 8160} {"info/global_step": 8161, "train_info/time_within_train_step": 2.7559118270874023, "step": 8161} {"train_info/time_between_train_steps": 0.0031659603118896484, "step": 8161} {"info/global_step": 8162, "train_info/time_within_train_step": 2.755993366241455, "step": 8162} {"train_info/time_between_train_steps": 0.0031745433807373047, "step": 8162} {"info/global_step": 8163, "train_info/time_within_train_step": 2.756474733352661, "step": 8163} {"train_info/time_between_train_steps": 0.0031354427337646484, "step": 8163} {"info/global_step": 8164, "train_info/time_within_train_step": 2.7553460597991943, "step": 8164} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 8164} {"info/global_step": 8165, "train_info/time_within_train_step": 2.7569034099578857, "step": 8165} {"train_info/time_between_train_steps": 0.0031309127807617188, "step": 8165} {"info/global_step": 8166, "train_info/time_within_train_step": 2.7558164596557617, "step": 8166} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 8166} {"info/global_step": 8167, "train_info/time_within_train_step": 2.7547647953033447, "step": 8167} {"train_info/time_between_train_steps": 0.0031538009643554688, "step": 8167} {"info/global_step": 8168, "train_info/time_within_train_step": 2.754791021347046, "step": 8168} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 8168} {"info/global_step": 8169, "train_info/time_within_train_step": 2.7558794021606445, "step": 8169} {"train_info/time_between_train_steps": 0.003181934356689453, "step": 8169} {"info/global_step": 8170, "train_info/time_within_train_step": 2.754619836807251, "step": 8170} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 8170} {"info/global_step": 8171, "train_info/time_within_train_step": 2.755650281906128, "step": 8171} {"train_info/time_between_train_steps": 0.0032100677490234375, "step": 8171} {"info/global_step": 8172, "train_info/time_within_train_step": 2.755662679672241, "step": 8172} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 8172} {"info/global_step": 8173, "train_info/time_within_train_step": 2.7565770149230957, "step": 8173} {"train_info/time_between_train_steps": 0.003197193145751953, "step": 8173} {"info/global_step": 8174, "train_info/time_within_train_step": 2.7560930252075195, "step": 8174} {"train_info/time_between_train_steps": 0.0031325817108154297, "step": 8174} {"info/global_step": 8175, "train_info/time_within_train_step": 2.7560551166534424, "step": 8175} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 8175} {"info/global_step": 8176, "train_info/time_within_train_step": 2.7560386657714844, "step": 8176} {"train_info/time_between_train_steps": 0.003149271011352539, "step": 8176} {"info/global_step": 8177, "train_info/time_within_train_step": 2.756427049636841, "step": 8177} {"train_info/time_between_train_steps": 0.09553790092468262, "step": 8177} {"info/global_step": 8178, "train_info/time_within_train_step": 2.758136749267578, "step": 8178} {"train_info/time_between_train_steps": 0.003379344940185547, "step": 8178} {"info/global_step": 8179, "train_info/time_within_train_step": 2.757765531539917, "step": 8179} {"train_info/time_between_train_steps": 0.0033304691314697266, "step": 8179} {"info/global_step": 8180, "train_info/time_within_train_step": 2.7575645446777344, "step": 8180} {"train_info/time_between_train_steps": 0.0032982826232910156, "step": 8180} {"info/global_step": 8181, "train_info/time_within_train_step": 2.7577171325683594, "step": 8181} {"train_info/time_between_train_steps": 0.003384828567504883, "step": 8181} {"info/global_step": 8182, "train_info/time_within_train_step": 2.758053779602051, "step": 8182} {"train_info/time_between_train_steps": 0.003404378890991211, "step": 8182} {"info/global_step": 8183, "train_info/time_within_train_step": 2.758226156234741, "step": 8183} {"train_info/time_between_train_steps": 0.0033180713653564453, "step": 8183} {"info/global_step": 8184, "train_info/time_within_train_step": 3.02173113822937, "step": 8184} {"train_info/time_between_train_steps": 0.0033833980560302734, "step": 8184} {"info/global_step": 8185, "train_info/time_within_train_step": 2.7571961879730225, "step": 8185} {"train_info/time_between_train_steps": 0.0033338069915771484, "step": 8185} {"info/global_step": 8186, "train_info/time_within_train_step": 2.756566286087036, "step": 8186} {"train_info/time_between_train_steps": 0.003406047821044922, "step": 8186} {"info/global_step": 8187, "train_info/time_within_train_step": 2.7574219703674316, "step": 8187} {"train_info/time_between_train_steps": 0.0033779144287109375, "step": 8187} {"info/global_step": 8188, "train_info/time_within_train_step": 2.7570059299468994, "step": 8188} {"train_info/time_between_train_steps": 0.0033426284790039062, "step": 8188} {"info/global_step": 8189, "train_info/time_within_train_step": 2.7563819885253906, "step": 8189} {"train_info/time_between_train_steps": 0.0033617019653320312, "step": 8189} {"info/global_step": 8190, "train_info/time_within_train_step": 2.756300210952759, "step": 8190} {"train_info/time_between_train_steps": 0.0033342838287353516, "step": 8190} {"info/global_step": 8191, "train_info/time_within_train_step": 2.7566885948181152, "step": 8191} {"train_info/time_between_train_steps": 0.0033621788024902344, "step": 8191} {"info/global_step": 8192, "train_info/time_within_train_step": 2.756086826324463, "step": 8192} {"train_info/time_between_train_steps": 0.003354310989379883, "step": 8192} {"info/global_step": 8193, "train_info/time_within_train_step": 2.756627082824707, "step": 8193} {"train_info/time_between_train_steps": 0.003397703170776367, "step": 8193} {"info/global_step": 8194, "train_info/time_within_train_step": 2.7563345432281494, "step": 8194} {"train_info/time_between_train_steps": 0.003334522247314453, "step": 8194} {"info/global_step": 8195, "train_info/time_within_train_step": 2.7582850456237793, "step": 8195} {"train_info/time_between_train_steps": 0.0035474300384521484, "step": 8195} {"info/global_step": 8196, "train_info/time_within_train_step": 2.757561445236206, "step": 8196} {"train_info/time_between_train_steps": 0.003345966339111328, "step": 8196} {"info/global_step": 8197, "train_info/time_within_train_step": 2.756885051727295, "step": 8197} {"train_info/time_between_train_steps": 0.0033321380615234375, "step": 8197} {"info/global_step": 8198, "train_info/time_within_train_step": 2.758136034011841, "step": 8198} {"train_info/time_between_train_steps": 0.0033435821533203125, "step": 8198} {"info/global_step": 8199, "train_info/time_within_train_step": 2.758028507232666, "step": 8199} {"train_info/time_between_train_steps": 0.0033559799194335938, "step": 8199} {"info/global_step": 8200, "train_info/time_within_train_step": 2.7587220668792725, "step": 8200} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746589662, "_runtime": 23671}, "step": 8200} {"logs": {"train/loss": 3.0729, "train/learning_rate": 0.00011999999999999999, "train/epoch": 9.05, "_timestamp": 1746589662, "_runtime": 23671}, "step": 8200} {"train_info/time_between_train_steps": 13.180069208145142, "step": 8200} {"info/global_step": 8201, "train_info/time_within_train_step": 2.5394222736358643, "step": 8201} {"train_info/time_between_train_steps": 0.0037958621978759766, "step": 8201} {"info/global_step": 8202, "train_info/time_within_train_step": 2.5946290493011475, "step": 8202} {"train_info/time_between_train_steps": 0.0031423568725585938, "step": 8202} {"info/global_step": 8203, "train_info/time_within_train_step": 2.7172467708587646, "step": 8203} {"train_info/time_between_train_steps": 0.0032165050506591797, "step": 8203} {"info/global_step": 8204, "train_info/time_within_train_step": 2.750800848007202, "step": 8204} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 8204} {"info/global_step": 8205, "train_info/time_within_train_step": 2.755523681640625, "step": 8205} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 8205} {"info/global_step": 8206, "train_info/time_within_train_step": 2.756669044494629, "step": 8206} {"train_info/time_between_train_steps": 0.003190279006958008, "step": 8206} {"info/global_step": 8207, "train_info/time_within_train_step": 2.7555267810821533, "step": 8207} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 8207} {"info/global_step": 8208, "train_info/time_within_train_step": 2.755295515060425, "step": 8208} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 8208} {"info/global_step": 8209, "train_info/time_within_train_step": 2.757498264312744, "step": 8209} {"train_info/time_between_train_steps": 0.003353595733642578, "step": 8209} {"info/global_step": 8210, "train_info/time_within_train_step": 2.7581989765167236, "step": 8210} {"train_info/time_between_train_steps": 0.0033416748046875, "step": 8210} {"info/global_step": 8211, "train_info/time_within_train_step": 2.758922815322876, "step": 8211} {"train_info/time_between_train_steps": 0.003387451171875, "step": 8211} {"info/global_step": 8212, "train_info/time_within_train_step": 2.7597758769989014, "step": 8212} {"train_info/time_between_train_steps": 0.003361225128173828, "step": 8212} {"info/global_step": 8213, "train_info/time_within_train_step": 2.758437395095825, "step": 8213} {"train_info/time_between_train_steps": 0.0033164024353027344, "step": 8213} {"info/global_step": 8214, "train_info/time_within_train_step": 2.7587928771972656, "step": 8214} {"train_info/time_between_train_steps": 0.0033512115478515625, "step": 8214} {"info/global_step": 8215, "train_info/time_within_train_step": 2.7586629390716553, "step": 8215} {"train_info/time_between_train_steps": 0.0033309459686279297, "step": 8215} {"info/global_step": 8216, "train_info/time_within_train_step": 2.7591753005981445, "step": 8216} {"train_info/time_between_train_steps": 0.003395557403564453, "step": 8216} {"info/global_step": 8217, "train_info/time_within_train_step": 2.7589292526245117, "step": 8217} {"train_info/time_between_train_steps": 0.003355264663696289, "step": 8217} {"info/global_step": 8218, "train_info/time_within_train_step": 2.7596025466918945, "step": 8218} {"train_info/time_between_train_steps": 0.01977229118347168, "step": 8218} {"info/global_step": 8219, "train_info/time_within_train_step": 2.759612560272217, "step": 8219} {"train_info/time_between_train_steps": 0.002996683120727539, "step": 8219} {"info/global_step": 8220, "train_info/time_within_train_step": 2.759014368057251, "step": 8220} {"train_info/time_between_train_steps": 0.002958536148071289, "step": 8220} {"info/global_step": 8221, "train_info/time_within_train_step": 2.758528709411621, "step": 8221} {"train_info/time_between_train_steps": 0.0029442310333251953, "step": 8221} {"info/global_step": 8222, "train_info/time_within_train_step": 2.7575085163116455, "step": 8222} {"train_info/time_between_train_steps": 0.002962827682495117, "step": 8222} {"info/global_step": 8223, "train_info/time_within_train_step": 2.7575411796569824, "step": 8223} {"train_info/time_between_train_steps": 0.002952098846435547, "step": 8223} {"info/global_step": 8224, "train_info/time_within_train_step": 2.758908748626709, "step": 8224} {"train_info/time_between_train_steps": 0.002972841262817383, "step": 8224} {"info/global_step": 8225, "train_info/time_within_train_step": 2.757028102874756, "step": 8225} {"train_info/time_between_train_steps": 0.002937793731689453, "step": 8225} {"info/global_step": 8226, "train_info/time_within_train_step": 2.75774884223938, "step": 8226} {"train_info/time_between_train_steps": 0.0029675960540771484, "step": 8226} {"info/global_step": 8227, "train_info/time_within_train_step": 2.7563552856445312, "step": 8227} {"train_info/time_between_train_steps": 0.0029876232147216797, "step": 8227} {"info/global_step": 8228, "train_info/time_within_train_step": 2.75771427154541, "step": 8228} {"train_info/time_between_train_steps": 0.0029594898223876953, "step": 8228} {"info/global_step": 8229, "train_info/time_within_train_step": 2.7567570209503174, "step": 8229} {"train_info/time_between_train_steps": 0.002995014190673828, "step": 8229} {"info/global_step": 8230, "train_info/time_within_train_step": 2.7555644512176514, "step": 8230} {"train_info/time_between_train_steps": 0.0028803348541259766, "step": 8230} {"info/global_step": 8231, "train_info/time_within_train_step": 2.990791082382202, "step": 8231} {"train_info/time_between_train_steps": 0.0028612613677978516, "step": 8231} {"info/global_step": 8232, "train_info/time_within_train_step": 2.755518674850464, "step": 8232} {"train_info/time_between_train_steps": 0.002853870391845703, "step": 8232} {"info/global_step": 8233, "train_info/time_within_train_step": 2.755728244781494, "step": 8233} {"train_info/time_between_train_steps": 0.002842426300048828, "step": 8233} {"info/global_step": 8234, "train_info/time_within_train_step": 2.7560386657714844, "step": 8234} {"train_info/time_between_train_steps": 0.0028543472290039062, "step": 8234} {"info/global_step": 8235, "train_info/time_within_train_step": 2.7562003135681152, "step": 8235} {"train_info/time_between_train_steps": 0.0028808116912841797, "step": 8235} {"info/global_step": 8236, "train_info/time_within_train_step": 2.75689697265625, "step": 8236} {"train_info/time_between_train_steps": 0.0028586387634277344, "step": 8236} {"info/global_step": 8237, "train_info/time_within_train_step": 2.756608724594116, "step": 8237} {"train_info/time_between_train_steps": 0.002893209457397461, "step": 8237} {"info/global_step": 8238, "train_info/time_within_train_step": 2.755441665649414, "step": 8238} {"train_info/time_between_train_steps": 0.0029036998748779297, "step": 8238} {"info/global_step": 8239, "train_info/time_within_train_step": 2.755382537841797, "step": 8239} {"train_info/time_between_train_steps": 0.002856016159057617, "step": 8239} {"info/global_step": 8240, "train_info/time_within_train_step": 2.7546162605285645, "step": 8240} {"train_info/time_between_train_steps": 0.002883434295654297, "step": 8240} {"info/global_step": 8241, "train_info/time_within_train_step": 2.755850315093994, "step": 8241} {"train_info/time_between_train_steps": 0.002895832061767578, "step": 8241} {"info/global_step": 8242, "train_info/time_within_train_step": 2.7550454139709473, "step": 8242} {"train_info/time_between_train_steps": 0.002881288528442383, "step": 8242} {"info/global_step": 8243, "train_info/time_within_train_step": 2.7549679279327393, "step": 8243} {"train_info/time_between_train_steps": 0.002928495407104492, "step": 8243} {"info/global_step": 8244, "train_info/time_within_train_step": 2.754047155380249, "step": 8244} {"train_info/time_between_train_steps": 0.0028667449951171875, "step": 8244} {"info/global_step": 8245, "train_info/time_within_train_step": 2.7555952072143555, "step": 8245} {"train_info/time_between_train_steps": 0.002891063690185547, "step": 8245} {"info/global_step": 8246, "train_info/time_within_train_step": 3.344872236251831, "step": 8246} {"train_info/time_between_train_steps": 0.002946138381958008, "step": 8246} {"info/global_step": 8247, "train_info/time_within_train_step": 2.7567965984344482, "step": 8247} {"train_info/time_between_train_steps": 0.002990245819091797, "step": 8247} {"info/global_step": 8248, "train_info/time_within_train_step": 2.757153272628784, "step": 8248} {"train_info/time_between_train_steps": 0.0030400753021240234, "step": 8248} {"info/global_step": 8249, "train_info/time_within_train_step": 2.756054639816284, "step": 8249} {"train_info/time_between_train_steps": 0.0030214786529541016, "step": 8249} {"info/global_step": 8250, "train_info/time_within_train_step": 2.7570888996124268, "step": 8250} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746589814, "_runtime": 23823}, "step": 8250} {"logs": {"train/loss": 3.0713, "train/learning_rate": 0.00011666666666666665, "train/epoch": 9.06, "_timestamp": 1746589814, "_runtime": 23823}, "step": 8250} {"train_info/time_between_train_steps": 0.0063686370849609375, "step": 8250} {"info/global_step": 8251, "train_info/time_within_train_step": 2.7574820518493652, "step": 8251} {"train_info/time_between_train_steps": 0.0029799938201904297, "step": 8251} {"info/global_step": 8252, "train_info/time_within_train_step": 2.757721424102783, "step": 8252} {"train_info/time_between_train_steps": 0.0029816627502441406, "step": 8252} {"info/global_step": 8253, "train_info/time_within_train_step": 2.756157875061035, "step": 8253} {"train_info/time_between_train_steps": 0.003036022186279297, "step": 8253} {"info/global_step": 8254, "train_info/time_within_train_step": 2.7575109004974365, "step": 8254} {"train_info/time_between_train_steps": 0.003000974655151367, "step": 8254} {"info/global_step": 8255, "train_info/time_within_train_step": 2.7572152614593506, "step": 8255} {"train_info/time_between_train_steps": 0.002971172332763672, "step": 8255} {"info/global_step": 8256, "train_info/time_within_train_step": 2.757280111312866, "step": 8256} {"train_info/time_between_train_steps": 0.0030219554901123047, "step": 8256} {"info/global_step": 8257, "train_info/time_within_train_step": 2.756315231323242, "step": 8257} {"train_info/time_between_train_steps": 0.002985239028930664, "step": 8257} {"info/global_step": 8258, "train_info/time_within_train_step": 2.7569363117218018, "step": 8258} {"train_info/time_between_train_steps": 0.002958536148071289, "step": 8258} {"info/global_step": 8259, "train_info/time_within_train_step": 2.7564611434936523, "step": 8259} {"train_info/time_between_train_steps": 0.002965688705444336, "step": 8259} {"info/global_step": 8260, "train_info/time_within_train_step": 2.7569923400878906, "step": 8260} {"train_info/time_between_train_steps": 0.0029840469360351562, "step": 8260} {"info/global_step": 8261, "train_info/time_within_train_step": 2.7554688453674316, "step": 8261} {"train_info/time_between_train_steps": 0.002965211868286133, "step": 8261} {"info/global_step": 8262, "train_info/time_within_train_step": 2.7570557594299316, "step": 8262} {"train_info/time_between_train_steps": 0.003162384033203125, "step": 8262} {"info/global_step": 8263, "train_info/time_within_train_step": 2.7572786808013916, "step": 8263} {"train_info/time_between_train_steps": 0.0028998851776123047, "step": 8263} {"info/global_step": 8264, "train_info/time_within_train_step": 2.757587432861328, "step": 8264} {"train_info/time_between_train_steps": 0.002883434295654297, "step": 8264} {"info/global_step": 8265, "train_info/time_within_train_step": 2.7566356658935547, "step": 8265} {"train_info/time_between_train_steps": 0.0029211044311523438, "step": 8265} {"info/global_step": 8266, "train_info/time_within_train_step": 2.7566940784454346, "step": 8266} {"train_info/time_between_train_steps": 0.002887248992919922, "step": 8266} {"info/global_step": 8267, "train_info/time_within_train_step": 2.7561612129211426, "step": 8267} {"train_info/time_between_train_steps": 0.0028924942016601562, "step": 8267} {"info/global_step": 8268, "train_info/time_within_train_step": 2.7565362453460693, "step": 8268} {"train_info/time_between_train_steps": 0.002866506576538086, "step": 8268} {"info/global_step": 8269, "train_info/time_within_train_step": 2.755937099456787, "step": 8269} {"train_info/time_between_train_steps": 0.0028955936431884766, "step": 8269} {"info/global_step": 8270, "train_info/time_within_train_step": 2.756302833557129, "step": 8270} {"train_info/time_between_train_steps": 0.002869129180908203, "step": 8270} {"info/global_step": 8271, "train_info/time_within_train_step": 2.756129503250122, "step": 8271} {"train_info/time_between_train_steps": 0.002894878387451172, "step": 8271} {"info/global_step": 8272, "train_info/time_within_train_step": 2.7568359375, "step": 8272} {"train_info/time_between_train_steps": 0.00286865234375, "step": 8272} {"info/global_step": 8273, "train_info/time_within_train_step": 2.7543439865112305, "step": 8273} {"train_info/time_between_train_steps": 0.0028839111328125, "step": 8273} {"info/global_step": 8274, "train_info/time_within_train_step": 2.7556519508361816, "step": 8274} {"train_info/time_between_train_steps": 0.0028772354125976562, "step": 8274} {"info/global_step": 8275, "train_info/time_within_train_step": 2.7559032440185547, "step": 8275} {"train_info/time_between_train_steps": 0.0028591156005859375, "step": 8275} {"info/global_step": 8276, "train_info/time_within_train_step": 2.7551276683807373, "step": 8276} {"train_info/time_between_train_steps": 0.0028963088989257812, "step": 8276} {"info/global_step": 8277, "train_info/time_within_train_step": 2.755922555923462, "step": 8277} {"train_info/time_between_train_steps": 0.002909421920776367, "step": 8277} {"info/global_step": 8278, "train_info/time_within_train_step": 2.754728078842163, "step": 8278} {"train_info/time_between_train_steps": 0.002898693084716797, "step": 8278} {"info/global_step": 8279, "train_info/time_within_train_step": 2.7556471824645996, "step": 8279} {"train_info/time_between_train_steps": 0.0028634071350097656, "step": 8279} {"info/global_step": 8280, "train_info/time_within_train_step": 2.7540953159332275, "step": 8280} {"train_info/time_between_train_steps": 0.0028798580169677734, "step": 8280} {"info/global_step": 8281, "train_info/time_within_train_step": 2.754777669906616, "step": 8281} {"train_info/time_between_train_steps": 0.0028607845306396484, "step": 8281} {"info/global_step": 8282, "train_info/time_within_train_step": 2.75508451461792, "step": 8282} {"train_info/time_between_train_steps": 0.002888202667236328, "step": 8282} {"info/global_step": 8283, "train_info/time_within_train_step": 2.7561559677124023, "step": 8283} {"train_info/time_between_train_steps": 0.002904653549194336, "step": 8283} {"info/global_step": 8284, "train_info/time_within_train_step": 2.7553751468658447, "step": 8284} {"train_info/time_between_train_steps": 0.00289154052734375, "step": 8284} {"info/global_step": 8285, "train_info/time_within_train_step": 2.7557339668273926, "step": 8285} {"train_info/time_between_train_steps": 0.0028705596923828125, "step": 8285} {"info/global_step": 8286, "train_info/time_within_train_step": 2.7562615871429443, "step": 8286} {"train_info/time_between_train_steps": 0.0028753280639648438, "step": 8286} {"info/global_step": 8287, "train_info/time_within_train_step": 2.7563071250915527, "step": 8287} {"train_info/time_between_train_steps": 0.0029363632202148438, "step": 8287} {"info/global_step": 8288, "train_info/time_within_train_step": 2.7556471824645996, "step": 8288} {"train_info/time_between_train_steps": 0.0028533935546875, "step": 8288} {"info/global_step": 8289, "train_info/time_within_train_step": 2.755012273788452, "step": 8289} {"train_info/time_between_train_steps": 0.0029227733612060547, "step": 8289} {"info/global_step": 8290, "train_info/time_within_train_step": 2.754763603210449, "step": 8290} {"train_info/time_between_train_steps": 0.002860546112060547, "step": 8290} {"info/global_step": 8291, "train_info/time_within_train_step": 2.7550976276397705, "step": 8291} {"train_info/time_between_train_steps": 0.0030531883239746094, "step": 8291} {"info/global_step": 8292, "train_info/time_within_train_step": 2.7547247409820557, "step": 8292} {"train_info/time_between_train_steps": 0.002900838851928711, "step": 8292} {"info/global_step": 8293, "train_info/time_within_train_step": 2.75669527053833, "step": 8293} {"train_info/time_between_train_steps": 0.0028753280639648438, "step": 8293} {"info/global_step": 8294, "train_info/time_within_train_step": 2.7559030055999756, "step": 8294} {"train_info/time_between_train_steps": 0.0028870105743408203, "step": 8294} {"info/global_step": 8295, "train_info/time_within_train_step": 2.7553534507751465, "step": 8295} {"train_info/time_between_train_steps": 0.00290679931640625, "step": 8295} {"info/global_step": 8296, "train_info/time_within_train_step": 2.7545578479766846, "step": 8296} {"train_info/time_between_train_steps": 0.0028994083404541016, "step": 8296} {"info/global_step": 8297, "train_info/time_within_train_step": 2.7549145221710205, "step": 8297} {"train_info/time_between_train_steps": 0.002882719039916992, "step": 8297} {"info/global_step": 8298, "train_info/time_within_train_step": 2.7552075386047363, "step": 8298} {"train_info/time_between_train_steps": 0.0028667449951171875, "step": 8298} {"info/global_step": 8299, "train_info/time_within_train_step": 2.756065607070923, "step": 8299} {"train_info/time_between_train_steps": 0.0028688907623291016, "step": 8299} {"info/global_step": 8300, "train_info/time_within_train_step": 2.7546839714050293, "step": 8300} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746589952, "_runtime": 23961}, "step": 8300} {"logs": {"train/loss": 3.0655, "train/learning_rate": 0.00011333333333333331, "train/epoch": 9.06, "_timestamp": 1746589952, "_runtime": 23961}, "step": 8300} {"train_info/time_between_train_steps": 0.006471872329711914, "step": 8300} {"info/global_step": 8301, "train_info/time_within_train_step": 2.7555992603302, "step": 8301} {"train_info/time_between_train_steps": 0.0028934478759765625, "step": 8301} {"info/global_step": 8302, "train_info/time_within_train_step": 2.7554821968078613, "step": 8302} {"train_info/time_between_train_steps": 0.0029153823852539062, "step": 8302} {"info/global_step": 8303, "train_info/time_within_train_step": 2.7542922496795654, "step": 8303} {"train_info/time_between_train_steps": 0.0028977394104003906, "step": 8303} {"info/global_step": 8304, "train_info/time_within_train_step": 2.7561635971069336, "step": 8304} {"train_info/time_between_train_steps": 0.002897977828979492, "step": 8304} {"info/global_step": 8305, "train_info/time_within_train_step": 2.755134344100952, "step": 8305} {"train_info/time_between_train_steps": 0.0029439926147460938, "step": 8305} {"info/global_step": 8306, "train_info/time_within_train_step": 2.756176233291626, "step": 8306} {"train_info/time_between_train_steps": 0.0029075145721435547, "step": 8306} {"info/global_step": 8307, "train_info/time_within_train_step": 2.755715847015381, "step": 8307} {"train_info/time_between_train_steps": 0.002855539321899414, "step": 8307} {"info/global_step": 8308, "train_info/time_within_train_step": 2.7558369636535645, "step": 8308} {"train_info/time_between_train_steps": 0.002869129180908203, "step": 8308} {"info/global_step": 8309, "train_info/time_within_train_step": 2.755575180053711, "step": 8309} {"train_info/time_between_train_steps": 0.003015279769897461, "step": 8309} {"info/global_step": 8310, "train_info/time_within_train_step": 2.7570395469665527, "step": 8310} {"train_info/time_between_train_steps": 0.003073453903198242, "step": 8310} {"info/global_step": 8311, "train_info/time_within_train_step": 2.7558753490448, "step": 8311} {"train_info/time_between_train_steps": 0.0029888153076171875, "step": 8311} {"info/global_step": 8312, "train_info/time_within_train_step": 2.756246566772461, "step": 8312} {"train_info/time_between_train_steps": 0.0030167102813720703, "step": 8312} {"info/global_step": 8313, "train_info/time_within_train_step": 2.75612473487854, "step": 8313} {"train_info/time_between_train_steps": 0.0034918785095214844, "step": 8313} {"info/global_step": 8314, "train_info/time_within_train_step": 2.7554962635040283, "step": 8314} {"train_info/time_between_train_steps": 0.0029671192169189453, "step": 8314} {"info/global_step": 8315, "train_info/time_within_train_step": 2.756582021713257, "step": 8315} {"train_info/time_between_train_steps": 0.002997159957885742, "step": 8315} {"info/global_step": 8316, "train_info/time_within_train_step": 2.756664514541626, "step": 8316} {"train_info/time_between_train_steps": 0.0029993057250976562, "step": 8316} {"info/global_step": 8317, "train_info/time_within_train_step": 2.7571027278900146, "step": 8317} {"train_info/time_between_train_steps": 0.0029497146606445312, "step": 8317} {"info/global_step": 8318, "train_info/time_within_train_step": 2.7562804222106934, "step": 8318} {"train_info/time_between_train_steps": 0.002991914749145508, "step": 8318} {"info/global_step": 8319, "train_info/time_within_train_step": 2.7570765018463135, "step": 8319} {"train_info/time_between_train_steps": 0.0030198097229003906, "step": 8319} {"info/global_step": 8320, "train_info/time_within_train_step": 2.755920171737671, "step": 8320} {"train_info/time_between_train_steps": 0.0029747486114501953, "step": 8320} {"info/global_step": 8321, "train_info/time_within_train_step": 2.7559657096862793, "step": 8321} {"train_info/time_between_train_steps": 0.002994537353515625, "step": 8321} {"info/global_step": 8322, "train_info/time_within_train_step": 2.756953716278076, "step": 8322} {"train_info/time_between_train_steps": 0.0029554367065429688, "step": 8322} {"info/global_step": 8323, "train_info/time_within_train_step": 2.758657217025757, "step": 8323} {"train_info/time_between_train_steps": 0.0029888153076171875, "step": 8323} {"info/global_step": 8324, "train_info/time_within_train_step": 2.7566237449645996, "step": 8324} {"train_info/time_between_train_steps": 0.0030388832092285156, "step": 8324} {"info/global_step": 8325, "train_info/time_within_train_step": 2.7575600147247314, "step": 8325} {"train_info/time_between_train_steps": 0.0029947757720947266, "step": 8325} {"info/global_step": 8326, "train_info/time_within_train_step": 2.7553746700286865, "step": 8326} {"train_info/time_between_train_steps": 0.0030002593994140625, "step": 8326} {"info/global_step": 8327, "train_info/time_within_train_step": 2.7543771266937256, "step": 8327} {"train_info/time_between_train_steps": 0.002981424331665039, "step": 8327} {"info/global_step": 8328, "train_info/time_within_train_step": 2.7563884258270264, "step": 8328} {"train_info/time_between_train_steps": 0.002977132797241211, "step": 8328} {"info/global_step": 8329, "train_info/time_within_train_step": 2.756354808807373, "step": 8329} {"train_info/time_between_train_steps": 0.003000020980834961, "step": 8329} {"info/global_step": 8330, "train_info/time_within_train_step": 2.756385326385498, "step": 8330} {"train_info/time_between_train_steps": 0.002986431121826172, "step": 8330} {"info/global_step": 8331, "train_info/time_within_train_step": 2.7550487518310547, "step": 8331} {"train_info/time_between_train_steps": 0.002980470657348633, "step": 8331} {"info/global_step": 8332, "train_info/time_within_train_step": 2.756995677947998, "step": 8332} {"train_info/time_between_train_steps": 0.003004789352416992, "step": 8332} {"info/global_step": 8333, "train_info/time_within_train_step": 2.7561075687408447, "step": 8333} {"train_info/time_between_train_steps": 0.003001689910888672, "step": 8333} {"info/global_step": 8334, "train_info/time_within_train_step": 2.7576284408569336, "step": 8334} {"train_info/time_between_train_steps": 0.002980470657348633, "step": 8334} {"info/global_step": 8335, "train_info/time_within_train_step": 2.7580389976501465, "step": 8335} {"train_info/time_between_train_steps": 0.0029990673065185547, "step": 8335} {"info/global_step": 8336, "train_info/time_within_train_step": 2.7569499015808105, "step": 8336} {"train_info/time_between_train_steps": 0.0029959678649902344, "step": 8336} {"info/global_step": 8337, "train_info/time_within_train_step": 2.7577273845672607, "step": 8337} {"train_info/time_between_train_steps": 0.0030307769775390625, "step": 8337} {"info/global_step": 8338, "train_info/time_within_train_step": 2.7582807540893555, "step": 8338} {"train_info/time_between_train_steps": 0.0030257701873779297, "step": 8338} {"info/global_step": 8339, "train_info/time_within_train_step": 2.757067918777466, "step": 8339} {"train_info/time_between_train_steps": 0.0029785633087158203, "step": 8339} {"info/global_step": 8340, "train_info/time_within_train_step": 2.7528746128082275, "step": 8340} {"train_info/time_between_train_steps": 0.0030198097229003906, "step": 8340} {"info/global_step": 8341, "train_info/time_within_train_step": 2.7578821182250977, "step": 8341} {"train_info/time_between_train_steps": 0.003016233444213867, "step": 8341} {"info/global_step": 8342, "train_info/time_within_train_step": 2.7564756870269775, "step": 8342} {"train_info/time_between_train_steps": 0.0029878616333007812, "step": 8342} {"info/global_step": 8343, "train_info/time_within_train_step": 2.923103094100952, "step": 8343} {"train_info/time_between_train_steps": 0.0029706954956054688, "step": 8343} {"info/global_step": 8344, "train_info/time_within_train_step": 2.7572386264801025, "step": 8344} {"train_info/time_between_train_steps": 0.0029799938201904297, "step": 8344} {"info/global_step": 8345, "train_info/time_within_train_step": 2.7565066814422607, "step": 8345} {"train_info/time_between_train_steps": 0.0029764175415039062, "step": 8345} {"info/global_step": 8346, "train_info/time_within_train_step": 2.758395195007324, "step": 8346} {"train_info/time_between_train_steps": 0.0030231475830078125, "step": 8346} {"info/global_step": 8347, "train_info/time_within_train_step": 2.756924629211426, "step": 8347} {"train_info/time_between_train_steps": 0.002974987030029297, "step": 8347} {"info/global_step": 8348, "train_info/time_within_train_step": 2.7569046020507812, "step": 8348} {"train_info/time_between_train_steps": 0.0029189586639404297, "step": 8348} {"info/global_step": 8349, "train_info/time_within_train_step": 2.755842924118042, "step": 8349} {"train_info/time_between_train_steps": 0.002921581268310547, "step": 8349} {"info/global_step": 8350, "train_info/time_within_train_step": 2.7550582885742188, "step": 8350} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746590091, "_runtime": 24100}, "step": 8350} {"logs": {"train/loss": 3.0516, "train/learning_rate": 0.00010999999999999998, "train/epoch": 9.07, "_timestamp": 1746590091, "_runtime": 24100}, "step": 8350} {"train_info/time_between_train_steps": 0.006040334701538086, "step": 8350} {"info/global_step": 8351, "train_info/time_within_train_step": 2.7558162212371826, "step": 8351} {"train_info/time_between_train_steps": 0.002869844436645508, "step": 8351} {"info/global_step": 8352, "train_info/time_within_train_step": 2.7561676502227783, "step": 8352} {"train_info/time_between_train_steps": 0.002866506576538086, "step": 8352} {"info/global_step": 8353, "train_info/time_within_train_step": 2.7561800479888916, "step": 8353} {"train_info/time_between_train_steps": 0.0028748512268066406, "step": 8353} {"info/global_step": 8354, "train_info/time_within_train_step": 2.75618839263916, "step": 8354} {"train_info/time_between_train_steps": 0.0030357837677001953, "step": 8354} {"info/global_step": 8355, "train_info/time_within_train_step": 2.756086587905884, "step": 8355} {"train_info/time_between_train_steps": 0.002923250198364258, "step": 8355} {"info/global_step": 8356, "train_info/time_within_train_step": 2.756247043609619, "step": 8356} {"train_info/time_between_train_steps": 0.0028944015502929688, "step": 8356} {"info/global_step": 8357, "train_info/time_within_train_step": 2.755995988845825, "step": 8357} {"train_info/time_between_train_steps": 0.002857208251953125, "step": 8357} {"info/global_step": 8358, "train_info/time_within_train_step": 2.756748676300049, "step": 8358} {"train_info/time_between_train_steps": 0.002890348434448242, "step": 8358} {"info/global_step": 8359, "train_info/time_within_train_step": 2.7557058334350586, "step": 8359} {"train_info/time_between_train_steps": 0.002935171127319336, "step": 8359} {"info/global_step": 8360, "train_info/time_within_train_step": 2.7535910606384277, "step": 8360} {"train_info/time_between_train_steps": 0.0028743743896484375, "step": 8360} {"info/global_step": 8361, "train_info/time_within_train_step": 2.7569408416748047, "step": 8361} {"train_info/time_between_train_steps": 0.002863645553588867, "step": 8361} {"info/global_step": 8362, "train_info/time_within_train_step": 2.755061626434326, "step": 8362} {"train_info/time_between_train_steps": 0.0029153823852539062, "step": 8362} {"info/global_step": 8363, "train_info/time_within_train_step": 2.7558069229125977, "step": 8363} {"train_info/time_between_train_steps": 0.0028569698333740234, "step": 8363} {"info/global_step": 8364, "train_info/time_within_train_step": 2.756378650665283, "step": 8364} {"train_info/time_between_train_steps": 0.003015756607055664, "step": 8364} {"info/global_step": 8365, "train_info/time_within_train_step": 2.757397174835205, "step": 8365} {"train_info/time_between_train_steps": 0.0029816627502441406, "step": 8365} {"info/global_step": 8366, "train_info/time_within_train_step": 2.756152868270874, "step": 8366} {"train_info/time_between_train_steps": 0.002992868423461914, "step": 8366} {"info/global_step": 8367, "train_info/time_within_train_step": 2.756826400756836, "step": 8367} {"train_info/time_between_train_steps": 0.003039836883544922, "step": 8367} {"info/global_step": 8368, "train_info/time_within_train_step": 2.7581112384796143, "step": 8368} {"train_info/time_between_train_steps": 0.002985239028930664, "step": 8368} {"info/global_step": 8369, "train_info/time_within_train_step": 2.757061719894409, "step": 8369} {"train_info/time_between_train_steps": 0.0029795169830322266, "step": 8369} {"info/global_step": 8370, "train_info/time_within_train_step": 2.7562079429626465, "step": 8370} {"train_info/time_between_train_steps": 0.003040790557861328, "step": 8370} {"info/global_step": 8371, "train_info/time_within_train_step": 2.7561874389648438, "step": 8371} {"train_info/time_between_train_steps": 0.002965688705444336, "step": 8371} {"info/global_step": 8372, "train_info/time_within_train_step": 2.7566990852355957, "step": 8372} {"train_info/time_between_train_steps": 0.0030112266540527344, "step": 8372} {"info/global_step": 8373, "train_info/time_within_train_step": 2.7570924758911133, "step": 8373} {"train_info/time_between_train_steps": 0.003009319305419922, "step": 8373} {"info/global_step": 8374, "train_info/time_within_train_step": 2.756248950958252, "step": 8374} {"train_info/time_between_train_steps": 0.0029680728912353516, "step": 8374} {"info/global_step": 8375, "train_info/time_within_train_step": 2.7567942142486572, "step": 8375} {"train_info/time_between_train_steps": 0.0029916763305664062, "step": 8375} {"info/global_step": 8376, "train_info/time_within_train_step": 2.7579450607299805, "step": 8376} {"train_info/time_between_train_steps": 0.002999544143676758, "step": 8376} {"info/global_step": 8377, "train_info/time_within_train_step": 2.756686210632324, "step": 8377} {"train_info/time_between_train_steps": 0.003003835678100586, "step": 8377} {"info/global_step": 8378, "train_info/time_within_train_step": 2.7575623989105225, "step": 8378} {"train_info/time_between_train_steps": 0.002984762191772461, "step": 8378} {"info/global_step": 8379, "train_info/time_within_train_step": 2.7576260566711426, "step": 8379} {"train_info/time_between_train_steps": 0.0029904842376708984, "step": 8379} {"info/global_step": 8380, "train_info/time_within_train_step": 2.756859064102173, "step": 8380} {"train_info/time_between_train_steps": 0.0030035972595214844, "step": 8380} {"info/global_step": 8381, "train_info/time_within_train_step": 2.7565431594848633, "step": 8381} {"train_info/time_between_train_steps": 0.0030260086059570312, "step": 8381} {"info/global_step": 8382, "train_info/time_within_train_step": 2.7566959857940674, "step": 8382} {"train_info/time_between_train_steps": 0.0030002593994140625, "step": 8382} {"info/global_step": 8383, "train_info/time_within_train_step": 2.7570111751556396, "step": 8383} {"train_info/time_between_train_steps": 0.002990245819091797, "step": 8383} {"info/global_step": 8384, "train_info/time_within_train_step": 2.756586790084839, "step": 8384} {"train_info/time_between_train_steps": 0.00299835205078125, "step": 8384} {"info/global_step": 8385, "train_info/time_within_train_step": 2.7571756839752197, "step": 8385} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 8385} {"info/global_step": 8386, "train_info/time_within_train_step": 2.7563095092773438, "step": 8386} {"train_info/time_between_train_steps": 0.0032491683959960938, "step": 8386} {"info/global_step": 8387, "train_info/time_within_train_step": 2.756570816040039, "step": 8387} {"train_info/time_between_train_steps": 0.002980470657348633, "step": 8387} {"info/global_step": 8388, "train_info/time_within_train_step": 2.756917715072632, "step": 8388} {"train_info/time_between_train_steps": 0.002991914749145508, "step": 8388} {"info/global_step": 8389, "train_info/time_within_train_step": 2.757512331008911, "step": 8389} {"train_info/time_between_train_steps": 0.003015279769897461, "step": 8389} {"info/global_step": 8390, "train_info/time_within_train_step": 2.7569806575775146, "step": 8390} {"train_info/time_between_train_steps": 0.0030059814453125, "step": 8390} {"info/global_step": 8391, "train_info/time_within_train_step": 2.756810426712036, "step": 8391} {"train_info/time_between_train_steps": 0.00299835205078125, "step": 8391} {"info/global_step": 8392, "train_info/time_within_train_step": 2.7568843364715576, "step": 8392} {"train_info/time_between_train_steps": 0.0030164718627929688, "step": 8392} {"info/global_step": 8393, "train_info/time_within_train_step": 2.757962465286255, "step": 8393} {"train_info/time_between_train_steps": 0.003027677536010742, "step": 8393} {"info/global_step": 8394, "train_info/time_within_train_step": 2.7562332153320312, "step": 8394} {"train_info/time_between_train_steps": 0.0029802322387695312, "step": 8394} {"info/global_step": 8395, "train_info/time_within_train_step": 2.757180690765381, "step": 8395} {"train_info/time_between_train_steps": 0.0029594898223876953, "step": 8395} {"info/global_step": 8396, "train_info/time_within_train_step": 2.7581138610839844, "step": 8396} {"train_info/time_between_train_steps": 0.003025054931640625, "step": 8396} {"info/global_step": 8397, "train_info/time_within_train_step": 2.7576911449432373, "step": 8397} {"train_info/time_between_train_steps": 0.0029706954956054688, "step": 8397} {"info/global_step": 8398, "train_info/time_within_train_step": 2.757812738418579, "step": 8398} {"train_info/time_between_train_steps": 0.002978801727294922, "step": 8398} {"info/global_step": 8399, "train_info/time_within_train_step": 2.756424903869629, "step": 8399} {"train_info/time_between_train_steps": 0.0029850006103515625, "step": 8399} {"info/global_step": 8400, "train_info/time_within_train_step": 2.7546818256378174, "step": 8400} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746590229, "_runtime": 24238}, "step": 8400} {"logs": {"train/loss": 3.0481, "train/learning_rate": 0.00010666666666666667, "train/epoch": 9.07, "_timestamp": 1746590229, "_runtime": 24238}, "step": 8400} {"train_info/time_between_train_steps": 13.212231874465942, "step": 8400} {"info/global_step": 8401, "train_info/time_within_train_step": 2.657252788543701, "step": 8401} {"train_info/time_between_train_steps": 0.0030641555786132812, "step": 8401} {"info/global_step": 8402, "train_info/time_within_train_step": 2.5979764461517334, "step": 8402} {"train_info/time_between_train_steps": 0.0030891895294189453, "step": 8402} {"info/global_step": 8403, "train_info/time_within_train_step": 2.7336020469665527, "step": 8403} {"train_info/time_between_train_steps": 0.0029985904693603516, "step": 8403} {"info/global_step": 8404, "train_info/time_within_train_step": 2.749436616897583, "step": 8404} {"train_info/time_between_train_steps": 0.0029935836791992188, "step": 8404} {"info/global_step": 8405, "train_info/time_within_train_step": 2.7534449100494385, "step": 8405} {"train_info/time_between_train_steps": 0.003055095672607422, "step": 8405} {"info/global_step": 8406, "train_info/time_within_train_step": 2.7561612129211426, "step": 8406} {"train_info/time_between_train_steps": 0.0029616355895996094, "step": 8406} {"info/global_step": 8407, "train_info/time_within_train_step": 2.756760597229004, "step": 8407} {"train_info/time_between_train_steps": 0.0030105113983154297, "step": 8407} {"info/global_step": 8408, "train_info/time_within_train_step": 2.756295680999756, "step": 8408} {"train_info/time_between_train_steps": 0.0029740333557128906, "step": 8408} {"info/global_step": 8409, "train_info/time_within_train_step": 2.757509231567383, "step": 8409} {"train_info/time_between_train_steps": 0.0030150413513183594, "step": 8409} {"info/global_step": 8410, "train_info/time_within_train_step": 2.757059097290039, "step": 8410} {"train_info/time_between_train_steps": 0.003040790557861328, "step": 8410} {"info/global_step": 8411, "train_info/time_within_train_step": 2.757493495941162, "step": 8411} {"train_info/time_between_train_steps": 0.0029561519622802734, "step": 8411} {"info/global_step": 8412, "train_info/time_within_train_step": 2.757570743560791, "step": 8412} {"train_info/time_between_train_steps": 0.003016948699951172, "step": 8412} {"info/global_step": 8413, "train_info/time_within_train_step": 2.756653308868408, "step": 8413} {"train_info/time_between_train_steps": 0.0030117034912109375, "step": 8413} {"info/global_step": 8414, "train_info/time_within_train_step": 2.755156993865967, "step": 8414} {"train_info/time_between_train_steps": 0.003042936325073242, "step": 8414} {"info/global_step": 8415, "train_info/time_within_train_step": 2.756951332092285, "step": 8415} {"train_info/time_between_train_steps": 0.003023386001586914, "step": 8415} {"info/global_step": 8416, "train_info/time_within_train_step": 2.756474494934082, "step": 8416} {"train_info/time_between_train_steps": 0.002988576889038086, "step": 8416} {"info/global_step": 8417, "train_info/time_within_train_step": 2.757962226867676, "step": 8417} {"train_info/time_between_train_steps": 0.0031735897064208984, "step": 8417} {"info/global_step": 8418, "train_info/time_within_train_step": 2.7572062015533447, "step": 8418} {"train_info/time_between_train_steps": 0.0029778480529785156, "step": 8418} {"info/global_step": 8419, "train_info/time_within_train_step": 2.756804943084717, "step": 8419} {"train_info/time_between_train_steps": 0.0029861927032470703, "step": 8419} {"info/global_step": 8420, "train_info/time_within_train_step": 2.7585809230804443, "step": 8420} {"train_info/time_between_train_steps": 0.0029709339141845703, "step": 8420} {"info/global_step": 8421, "train_info/time_within_train_step": 2.7566020488739014, "step": 8421} {"train_info/time_between_train_steps": 0.00308990478515625, "step": 8421} {"info/global_step": 8422, "train_info/time_within_train_step": 2.7576661109924316, "step": 8422} {"train_info/time_between_train_steps": 0.002988100051879883, "step": 8422} {"info/global_step": 8423, "train_info/time_within_train_step": 2.758500814437866, "step": 8423} {"train_info/time_between_train_steps": 0.0030059814453125, "step": 8423} {"info/global_step": 8424, "train_info/time_within_train_step": 2.757580518722534, "step": 8424} {"train_info/time_between_train_steps": 0.003024578094482422, "step": 8424} {"info/global_step": 8425, "train_info/time_within_train_step": 2.758268356323242, "step": 8425} {"train_info/time_between_train_steps": 0.003149271011352539, "step": 8425} {"info/global_step": 8426, "train_info/time_within_train_step": 2.75692081451416, "step": 8426} {"train_info/time_between_train_steps": 0.0030379295349121094, "step": 8426} {"info/global_step": 8427, "train_info/time_within_train_step": 2.7572133541107178, "step": 8427} {"train_info/time_between_train_steps": 0.002987384796142578, "step": 8427} {"info/global_step": 8428, "train_info/time_within_train_step": 2.7565557956695557, "step": 8428} {"train_info/time_between_train_steps": 0.0030128955841064453, "step": 8428} {"info/global_step": 8429, "train_info/time_within_train_step": 2.757819652557373, "step": 8429} {"train_info/time_between_train_steps": 0.0029540061950683594, "step": 8429} {"info/global_step": 8430, "train_info/time_within_train_step": 2.757114887237549, "step": 8430} {"train_info/time_between_train_steps": 0.003049135208129883, "step": 8430} {"info/global_step": 8431, "train_info/time_within_train_step": 2.757462978363037, "step": 8431} {"train_info/time_between_train_steps": 0.0029799938201904297, "step": 8431} {"info/global_step": 8432, "train_info/time_within_train_step": 2.7567684650421143, "step": 8432} {"train_info/time_between_train_steps": 0.003053426742553711, "step": 8432} {"info/global_step": 8433, "train_info/time_within_train_step": 2.756978750228882, "step": 8433} {"train_info/time_between_train_steps": 0.003219127655029297, "step": 8433} {"info/global_step": 8434, "train_info/time_within_train_step": 2.7577884197235107, "step": 8434} {"train_info/time_between_train_steps": 0.0029964447021484375, "step": 8434} {"info/global_step": 8435, "train_info/time_within_train_step": 2.7575490474700928, "step": 8435} {"train_info/time_between_train_steps": 0.0029745101928710938, "step": 8435} {"info/global_step": 8436, "train_info/time_within_train_step": 2.7575812339782715, "step": 8436} {"train_info/time_between_train_steps": 0.003084421157836914, "step": 8436} {"info/global_step": 8437, "train_info/time_within_train_step": 2.7578697204589844, "step": 8437} {"train_info/time_between_train_steps": 0.003113269805908203, "step": 8437} {"info/global_step": 8438, "train_info/time_within_train_step": 2.7578275203704834, "step": 8438} {"train_info/time_between_train_steps": 0.003106355667114258, "step": 8438} {"info/global_step": 8439, "train_info/time_within_train_step": 2.758406162261963, "step": 8439} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 8439} {"info/global_step": 8440, "train_info/time_within_train_step": 2.758384943008423, "step": 8440} {"train_info/time_between_train_steps": 0.0032019615173339844, "step": 8440} {"info/global_step": 8441, "train_info/time_within_train_step": 2.757026195526123, "step": 8441} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 8441} {"info/global_step": 8442, "train_info/time_within_train_step": 2.756840229034424, "step": 8442} {"train_info/time_between_train_steps": 0.0031065940856933594, "step": 8442} {"info/global_step": 8443, "train_info/time_within_train_step": 2.7569093704223633, "step": 8443} {"train_info/time_between_train_steps": 0.003091573715209961, "step": 8443} {"info/global_step": 8444, "train_info/time_within_train_step": 2.7553625106811523, "step": 8444} {"train_info/time_between_train_steps": 0.0031337738037109375, "step": 8444} {"info/global_step": 8445, "train_info/time_within_train_step": 2.756645679473877, "step": 8445} {"train_info/time_between_train_steps": 0.003184795379638672, "step": 8445} {"info/global_step": 8446, "train_info/time_within_train_step": 2.7567825317382812, "step": 8446} {"train_info/time_between_train_steps": 0.003082275390625, "step": 8446} {"info/global_step": 8447, "train_info/time_within_train_step": 2.756834030151367, "step": 8447} {"train_info/time_between_train_steps": 0.003162860870361328, "step": 8447} {"info/global_step": 8448, "train_info/time_within_train_step": 2.7576510906219482, "step": 8448} {"train_info/time_between_train_steps": 0.0031108856201171875, "step": 8448} {"info/global_step": 8449, "train_info/time_within_train_step": 2.757075071334839, "step": 8449} {"train_info/time_between_train_steps": 0.003092527389526367, "step": 8449} {"info/global_step": 8450, "train_info/time_within_train_step": 2.757267951965332, "step": 8450} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746590380, "_runtime": 24389}, "step": 8450} {"logs": {"train/loss": 3.0341, "train/learning_rate": 0.00010333333333333333, "train/epoch": 9.08, "_timestamp": 1746590380, "_runtime": 24389}, "step": 8450} {"train_info/time_between_train_steps": 0.006362438201904297, "step": 8450} {"info/global_step": 8451, "train_info/time_within_train_step": 2.7572317123413086, "step": 8451} {"train_info/time_between_train_steps": 0.003078460693359375, "step": 8451} {"info/global_step": 8452, "train_info/time_within_train_step": 2.75779128074646, "step": 8452} {"train_info/time_between_train_steps": 0.0030663013458251953, "step": 8452} {"info/global_step": 8453, "train_info/time_within_train_step": 2.757617235183716, "step": 8453} {"train_info/time_between_train_steps": 0.0031180381774902344, "step": 8453} {"info/global_step": 8454, "train_info/time_within_train_step": 2.757740020751953, "step": 8454} {"train_info/time_between_train_steps": 0.003142118453979492, "step": 8454} {"info/global_step": 8455, "train_info/time_within_train_step": 2.7570254802703857, "step": 8455} {"train_info/time_between_train_steps": 0.003136157989501953, "step": 8455} {"info/global_step": 8456, "train_info/time_within_train_step": 2.757357358932495, "step": 8456} {"train_info/time_between_train_steps": 0.003131389617919922, "step": 8456} {"info/global_step": 8457, "train_info/time_within_train_step": 2.757244110107422, "step": 8457} {"train_info/time_between_train_steps": 0.003110170364379883, "step": 8457} {"info/global_step": 8458, "train_info/time_within_train_step": 2.7566113471984863, "step": 8458} {"train_info/time_between_train_steps": 0.00305938720703125, "step": 8458} {"info/global_step": 8459, "train_info/time_within_train_step": 2.7564806938171387, "step": 8459} {"train_info/time_between_train_steps": 0.0030477046966552734, "step": 8459} {"info/global_step": 8460, "train_info/time_within_train_step": 2.75534987449646, "step": 8460} {"train_info/time_between_train_steps": 0.002964019775390625, "step": 8460} {"info/global_step": 8461, "train_info/time_within_train_step": 2.757484197616577, "step": 8461} {"train_info/time_between_train_steps": 0.0030875205993652344, "step": 8461} {"info/global_step": 8462, "train_info/time_within_train_step": 2.75773286819458, "step": 8462} {"train_info/time_between_train_steps": 0.0031023025512695312, "step": 8462} {"info/global_step": 8463, "train_info/time_within_train_step": 2.757446050643921, "step": 8463} {"train_info/time_between_train_steps": 0.0031135082244873047, "step": 8463} {"info/global_step": 8464, "train_info/time_within_train_step": 2.7563304901123047, "step": 8464} {"train_info/time_between_train_steps": 0.003100872039794922, "step": 8464} {"info/global_step": 8465, "train_info/time_within_train_step": 2.756922483444214, "step": 8465} {"train_info/time_between_train_steps": 0.003147125244140625, "step": 8465} {"info/global_step": 8466, "train_info/time_within_train_step": 2.7566983699798584, "step": 8466} {"train_info/time_between_train_steps": 0.003135204315185547, "step": 8466} {"info/global_step": 8467, "train_info/time_within_train_step": 2.758101463317871, "step": 8467} {"train_info/time_between_train_steps": 0.003083944320678711, "step": 8467} {"info/global_step": 8468, "train_info/time_within_train_step": 2.7579166889190674, "step": 8468} {"train_info/time_between_train_steps": 0.003112316131591797, "step": 8468} {"info/global_step": 8469, "train_info/time_within_train_step": 2.758021593093872, "step": 8469} {"train_info/time_between_train_steps": 0.0030226707458496094, "step": 8469} {"info/global_step": 8470, "train_info/time_within_train_step": 2.7567062377929688, "step": 8470} {"train_info/time_between_train_steps": 0.0030455589294433594, "step": 8470} {"info/global_step": 8471, "train_info/time_within_train_step": 2.75712251663208, "step": 8471} {"train_info/time_between_train_steps": 0.0029816627502441406, "step": 8471} {"info/global_step": 8472, "train_info/time_within_train_step": 2.7557530403137207, "step": 8472} {"train_info/time_between_train_steps": 0.002979278564453125, "step": 8472} {"info/global_step": 8473, "train_info/time_within_train_step": 2.75531268119812, "step": 8473} {"train_info/time_between_train_steps": 0.003004789352416992, "step": 8473} {"info/global_step": 8474, "train_info/time_within_train_step": 2.755486011505127, "step": 8474} {"train_info/time_between_train_steps": 0.002976655960083008, "step": 8474} {"info/global_step": 8475, "train_info/time_within_train_step": 2.754922866821289, "step": 8475} {"train_info/time_between_train_steps": 0.0029642581939697266, "step": 8475} {"info/global_step": 8476, "train_info/time_within_train_step": 2.7556748390197754, "step": 8476} {"train_info/time_between_train_steps": 0.0030090808868408203, "step": 8476} {"info/global_step": 8477, "train_info/time_within_train_step": 2.7548539638519287, "step": 8477} {"train_info/time_between_train_steps": 0.00299835205078125, "step": 8477} {"info/global_step": 8478, "train_info/time_within_train_step": 2.7562665939331055, "step": 8478} {"train_info/time_between_train_steps": 0.002942800521850586, "step": 8478} {"info/global_step": 8479, "train_info/time_within_train_step": 2.755112648010254, "step": 8479} {"train_info/time_between_train_steps": 0.002981424331665039, "step": 8479} {"info/global_step": 8480, "train_info/time_within_train_step": 2.754870891571045, "step": 8480} {"train_info/time_between_train_steps": 0.003004789352416992, "step": 8480} {"info/global_step": 8481, "train_info/time_within_train_step": 2.7546908855438232, "step": 8481} {"train_info/time_between_train_steps": 0.0030045509338378906, "step": 8481} {"info/global_step": 8482, "train_info/time_within_train_step": 2.7558817863464355, "step": 8482} {"train_info/time_between_train_steps": 0.002965688705444336, "step": 8482} {"info/global_step": 8483, "train_info/time_within_train_step": 2.7553884983062744, "step": 8483} {"train_info/time_between_train_steps": 0.0030002593994140625, "step": 8483} {"info/global_step": 8484, "train_info/time_within_train_step": 2.7558603286743164, "step": 8484} {"train_info/time_between_train_steps": 0.003015279769897461, "step": 8484} {"info/global_step": 8485, "train_info/time_within_train_step": 2.75521183013916, "step": 8485} {"train_info/time_between_train_steps": 0.0029802322387695312, "step": 8485} {"info/global_step": 8486, "train_info/time_within_train_step": 2.7538814544677734, "step": 8486} {"train_info/time_between_train_steps": 0.002967357635498047, "step": 8486} {"info/global_step": 8487, "train_info/time_within_train_step": 2.754340171813965, "step": 8487} {"train_info/time_between_train_steps": 0.0029964447021484375, "step": 8487} {"info/global_step": 8488, "train_info/time_within_train_step": 2.7539498805999756, "step": 8488} {"train_info/time_between_train_steps": 0.0030570030212402344, "step": 8488} {"info/global_step": 8489, "train_info/time_within_train_step": 2.7541325092315674, "step": 8489} {"train_info/time_between_train_steps": 0.0029544830322265625, "step": 8489} {"info/global_step": 8490, "train_info/time_within_train_step": 2.7544071674346924, "step": 8490} {"train_info/time_between_train_steps": 0.0029649734497070312, "step": 8490} {"info/global_step": 8491, "train_info/time_within_train_step": 2.7539525032043457, "step": 8491} {"train_info/time_between_train_steps": 0.0029430389404296875, "step": 8491} {"info/global_step": 8492, "train_info/time_within_train_step": 2.7547998428344727, "step": 8492} {"train_info/time_between_train_steps": 0.0029668807983398438, "step": 8492} {"info/global_step": 8493, "train_info/time_within_train_step": 2.75498628616333, "step": 8493} {"train_info/time_between_train_steps": 0.002990245819091797, "step": 8493} {"info/global_step": 8494, "train_info/time_within_train_step": 2.753736972808838, "step": 8494} {"train_info/time_between_train_steps": 0.0030329227447509766, "step": 8494} {"info/global_step": 8495, "train_info/time_within_train_step": 2.756951332092285, "step": 8495} {"train_info/time_between_train_steps": 0.002955198287963867, "step": 8495} {"info/global_step": 8496, "train_info/time_within_train_step": 3.348198890686035, "step": 8496} {"train_info/time_between_train_steps": 0.002996683120727539, "step": 8496} {"info/global_step": 8497, "train_info/time_within_train_step": 2.7554640769958496, "step": 8497} {"train_info/time_between_train_steps": 0.003030538558959961, "step": 8497} {"info/global_step": 8498, "train_info/time_within_train_step": 2.756474256515503, "step": 8498} {"train_info/time_between_train_steps": 0.0030603408813476562, "step": 8498} {"info/global_step": 8499, "train_info/time_within_train_step": 2.7564432621002197, "step": 8499} {"train_info/time_between_train_steps": 0.0029785633087158203, "step": 8499} {"info/global_step": 8500, "train_info/time_within_train_step": 2.7559585571289062, "step": 8500} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746590518, "_runtime": 24527}, "step": 8500} {"logs": {"train/loss": 3.0244, "train/learning_rate": 9.999999999999999e-05, "train/epoch": 9.08, "_timestamp": 1746590518, "_runtime": 24527}, "step": 8500} {"train_info/time_between_train_steps": 0.0067560672760009766, "step": 8500} {"info/global_step": 8501, "train_info/time_within_train_step": 2.756314754486084, "step": 8501} {"train_info/time_between_train_steps": 0.0030100345611572266, "step": 8501} {"info/global_step": 8502, "train_info/time_within_train_step": 2.7558422088623047, "step": 8502} {"train_info/time_between_train_steps": 0.003003358840942383, "step": 8502} {"info/global_step": 8503, "train_info/time_within_train_step": 2.754716634750366, "step": 8503} {"train_info/time_between_train_steps": 0.003066539764404297, "step": 8503} {"info/global_step": 8504, "train_info/time_within_train_step": 2.8101654052734375, "step": 8504} {"train_info/time_between_train_steps": 0.003063678741455078, "step": 8504} {"info/global_step": 8505, "train_info/time_within_train_step": 2.7534873485565186, "step": 8505} {"train_info/time_between_train_steps": 0.0028884410858154297, "step": 8505} {"info/global_step": 8506, "train_info/time_within_train_step": 2.755284070968628, "step": 8506} {"train_info/time_between_train_steps": 0.0029916763305664062, "step": 8506} {"info/global_step": 8507, "train_info/time_within_train_step": 2.756206750869751, "step": 8507} {"train_info/time_between_train_steps": 0.0030455589294433594, "step": 8507} {"info/global_step": 8508, "train_info/time_within_train_step": 2.756333112716675, "step": 8508} {"train_info/time_between_train_steps": 0.0031092166900634766, "step": 8508} {"info/global_step": 8509, "train_info/time_within_train_step": 2.7576515674591064, "step": 8509} {"train_info/time_between_train_steps": 0.0030951499938964844, "step": 8509} {"info/global_step": 8510, "train_info/time_within_train_step": 2.756887912750244, "step": 8510} {"train_info/time_between_train_steps": 0.0030975341796875, "step": 8510} {"info/global_step": 8511, "train_info/time_within_train_step": 2.7563376426696777, "step": 8511} {"train_info/time_between_train_steps": 0.0030548572540283203, "step": 8511} {"info/global_step": 8512, "train_info/time_within_train_step": 2.757054328918457, "step": 8512} {"train_info/time_between_train_steps": 0.003177165985107422, "step": 8512} {"info/global_step": 8513, "train_info/time_within_train_step": 2.7559814453125, "step": 8513} {"train_info/time_between_train_steps": 0.0030329227447509766, "step": 8513} {"info/global_step": 8514, "train_info/time_within_train_step": 2.75589656829834, "step": 8514} {"train_info/time_between_train_steps": 0.003133058547973633, "step": 8514} {"info/global_step": 8515, "train_info/time_within_train_step": 2.75494384765625, "step": 8515} {"train_info/time_between_train_steps": 0.003024578094482422, "step": 8515} {"info/global_step": 8516, "train_info/time_within_train_step": 2.75533390045166, "step": 8516} {"train_info/time_between_train_steps": 0.0029363632202148438, "step": 8516} {"info/global_step": 8517, "train_info/time_within_train_step": 2.75591778755188, "step": 8517} {"train_info/time_between_train_steps": 0.0032215118408203125, "step": 8517} {"info/global_step": 8518, "train_info/time_within_train_step": 2.756161689758301, "step": 8518} {"train_info/time_between_train_steps": 0.003374814987182617, "step": 8518} {"info/global_step": 8519, "train_info/time_within_train_step": 2.75702166557312, "step": 8519} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 8519} {"info/global_step": 8520, "train_info/time_within_train_step": 2.7571308612823486, "step": 8520} {"train_info/time_between_train_steps": 0.003230571746826172, "step": 8520} {"info/global_step": 8521, "train_info/time_within_train_step": 2.757282257080078, "step": 8521} {"train_info/time_between_train_steps": 0.0034825801849365234, "step": 8521} {"info/global_step": 8522, "train_info/time_within_train_step": 2.755934000015259, "step": 8522} {"train_info/time_between_train_steps": 0.0029649734497070312, "step": 8522} {"info/global_step": 8523, "train_info/time_within_train_step": 2.757840633392334, "step": 8523} {"train_info/time_between_train_steps": 0.0032744407653808594, "step": 8523} {"info/global_step": 8524, "train_info/time_within_train_step": 2.7571914196014404, "step": 8524} {"train_info/time_between_train_steps": 0.0031664371490478516, "step": 8524} {"info/global_step": 8525, "train_info/time_within_train_step": 2.757073163986206, "step": 8525} {"train_info/time_between_train_steps": 0.003203868865966797, "step": 8525} {"info/global_step": 8526, "train_info/time_within_train_step": 2.757720708847046, "step": 8526} {"train_info/time_between_train_steps": 0.003166675567626953, "step": 8526} {"info/global_step": 8527, "train_info/time_within_train_step": 2.7563865184783936, "step": 8527} {"train_info/time_between_train_steps": 0.0032258033752441406, "step": 8527} {"info/global_step": 8528, "train_info/time_within_train_step": 2.7566916942596436, "step": 8528} {"train_info/time_between_train_steps": 0.0032122135162353516, "step": 8528} {"info/global_step": 8529, "train_info/time_within_train_step": 2.7554478645324707, "step": 8529} {"train_info/time_between_train_steps": 0.003496885299682617, "step": 8529} {"info/global_step": 8530, "train_info/time_within_train_step": 2.7575981616973877, "step": 8530} {"train_info/time_between_train_steps": 0.003645181655883789, "step": 8530} {"train_info/time_between_train_steps": 3.298861503601074, "step": 8530} {"info/global_step": 8531, "train_info/time_within_train_step": 2.6816415786743164, "step": 8531} {"train_info/time_between_train_steps": 0.0031151771545410156, "step": 8531} {"info/global_step": 8532, "train_info/time_within_train_step": 2.754197597503662, "step": 8532} {"train_info/time_between_train_steps": 0.0031223297119140625, "step": 8532} {"info/global_step": 8533, "train_info/time_within_train_step": 2.7549850940704346, "step": 8533} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 8533} {"info/global_step": 8534, "train_info/time_within_train_step": 2.754875421524048, "step": 8534} {"train_info/time_between_train_steps": 0.0031120777130126953, "step": 8534} {"info/global_step": 8535, "train_info/time_within_train_step": 2.7562918663024902, "step": 8535} {"train_info/time_between_train_steps": 0.0031147003173828125, "step": 8535} {"info/global_step": 8536, "train_info/time_within_train_step": 2.7556569576263428, "step": 8536} {"train_info/time_between_train_steps": 0.0031080245971679688, "step": 8536} {"info/global_step": 8537, "train_info/time_within_train_step": 2.754915952682495, "step": 8537} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 8537} {"info/global_step": 8538, "train_info/time_within_train_step": 2.755720615386963, "step": 8538} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 8538} {"info/global_step": 8539, "train_info/time_within_train_step": 2.753343105316162, "step": 8539} {"train_info/time_between_train_steps": 0.003117084503173828, "step": 8539} {"info/global_step": 8540, "train_info/time_within_train_step": 2.7550642490386963, "step": 8540} {"train_info/time_between_train_steps": 0.0032842159271240234, "step": 8540} {"info/global_step": 8541, "train_info/time_within_train_step": 2.756963014602661, "step": 8541} {"train_info/time_between_train_steps": 0.0033457279205322266, "step": 8541} {"info/global_step": 8542, "train_info/time_within_train_step": 2.7581777572631836, "step": 8542} {"train_info/time_between_train_steps": 0.003299236297607422, "step": 8542} {"info/global_step": 8543, "train_info/time_within_train_step": 2.7575647830963135, "step": 8543} {"train_info/time_between_train_steps": 0.0033156871795654297, "step": 8543} {"info/global_step": 8544, "train_info/time_within_train_step": 2.757033109664917, "step": 8544} {"train_info/time_between_train_steps": 0.0033769607543945312, "step": 8544} {"info/global_step": 8545, "train_info/time_within_train_step": 2.7586140632629395, "step": 8545} {"train_info/time_between_train_steps": 0.0032739639282226562, "step": 8545} {"info/global_step": 8546, "train_info/time_within_train_step": 2.7573187351226807, "step": 8546} {"train_info/time_between_train_steps": 0.003339052200317383, "step": 8546} {"info/global_step": 8547, "train_info/time_within_train_step": 2.757490634918213, "step": 8547} {"train_info/time_between_train_steps": 0.0032854080200195312, "step": 8547} {"info/global_step": 8548, "train_info/time_within_train_step": 2.757451057434082, "step": 8548} {"train_info/time_between_train_steps": 0.0033462047576904297, "step": 8548} {"info/global_step": 8549, "train_info/time_within_train_step": 2.7570438385009766, "step": 8549} {"train_info/time_between_train_steps": 0.0033092498779296875, "step": 8549} {"info/global_step": 8550, "train_info/time_within_train_step": 2.756889820098877, "step": 8550} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746590660, "_runtime": 24669}, "step": 8550} {"logs": {"train/loss": 3.0638, "train/learning_rate": 9.666666666666667e-05, "train/epoch": 10.0, "_timestamp": 1746590660, "_runtime": 24669}, "step": 8550} {"train_info/time_between_train_steps": 0.006265163421630859, "step": 8550} {"info/global_step": 8551, "train_info/time_within_train_step": 2.7580361366271973, "step": 8551} {"train_info/time_between_train_steps": 0.003261566162109375, "step": 8551} {"info/global_step": 8552, "train_info/time_within_train_step": 2.7576746940612793, "step": 8552} {"train_info/time_between_train_steps": 0.003330230712890625, "step": 8552} {"info/global_step": 8553, "train_info/time_within_train_step": 2.756993532180786, "step": 8553} {"train_info/time_between_train_steps": 0.0033216476440429688, "step": 8553} {"info/global_step": 8554, "train_info/time_within_train_step": 2.757227659225464, "step": 8554} {"train_info/time_between_train_steps": 0.0032913684844970703, "step": 8554} {"info/global_step": 8555, "train_info/time_within_train_step": 2.7575178146362305, "step": 8555} {"train_info/time_between_train_steps": 0.0033512115478515625, "step": 8555} {"info/global_step": 8556, "train_info/time_within_train_step": 2.757138967514038, "step": 8556} {"train_info/time_between_train_steps": 0.0033102035522460938, "step": 8556} {"info/global_step": 8557, "train_info/time_within_train_step": 2.757538318634033, "step": 8557} {"train_info/time_between_train_steps": 0.0033342838287353516, "step": 8557} {"info/global_step": 8558, "train_info/time_within_train_step": 2.7569632530212402, "step": 8558} {"train_info/time_between_train_steps": 0.003325939178466797, "step": 8558} {"info/global_step": 8559, "train_info/time_within_train_step": 2.7577719688415527, "step": 8559} {"train_info/time_between_train_steps": 0.0032873153686523438, "step": 8559} {"info/global_step": 8560, "train_info/time_within_train_step": 2.755481004714966, "step": 8560} {"train_info/time_between_train_steps": 0.003131866455078125, "step": 8560} {"info/global_step": 8561, "train_info/time_within_train_step": 2.755061149597168, "step": 8561} {"train_info/time_between_train_steps": 0.0031175613403320312, "step": 8561} {"info/global_step": 8562, "train_info/time_within_train_step": 2.7552521228790283, "step": 8562} {"train_info/time_between_train_steps": 0.0030786991119384766, "step": 8562} {"info/global_step": 8563, "train_info/time_within_train_step": 2.755727767944336, "step": 8563} {"train_info/time_between_train_steps": 0.0031228065490722656, "step": 8563} {"info/global_step": 8564, "train_info/time_within_train_step": 2.7555108070373535, "step": 8564} {"train_info/time_between_train_steps": 0.003195524215698242, "step": 8564} {"info/global_step": 8565, "train_info/time_within_train_step": 2.7558231353759766, "step": 8565} {"train_info/time_between_train_steps": 0.0031151771545410156, "step": 8565} {"info/global_step": 8566, "train_info/time_within_train_step": 2.7562308311462402, "step": 8566} {"train_info/time_between_train_steps": 0.0031125545501708984, "step": 8566} {"info/global_step": 8567, "train_info/time_within_train_step": 2.7556893825531006, "step": 8567} {"train_info/time_between_train_steps": 0.003158092498779297, "step": 8567} {"info/global_step": 8568, "train_info/time_within_train_step": 2.7563223838806152, "step": 8568} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 8568} {"info/global_step": 8569, "train_info/time_within_train_step": 2.754861354827881, "step": 8569} {"train_info/time_between_train_steps": 0.0031168460845947266, "step": 8569} {"info/global_step": 8570, "train_info/time_within_train_step": 2.7560534477233887, "step": 8570} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 8570} {"info/global_step": 8571, "train_info/time_within_train_step": 2.755260944366455, "step": 8571} {"train_info/time_between_train_steps": 0.0030994415283203125, "step": 8571} {"info/global_step": 8572, "train_info/time_within_train_step": 2.7557833194732666, "step": 8572} {"train_info/time_between_train_steps": 0.0031287670135498047, "step": 8572} {"info/global_step": 8573, "train_info/time_within_train_step": 2.755506992340088, "step": 8573} {"train_info/time_between_train_steps": 0.0031125545501708984, "step": 8573} {"info/global_step": 8574, "train_info/time_within_train_step": 2.756556272506714, "step": 8574} {"train_info/time_between_train_steps": 0.0031120777130126953, "step": 8574} {"info/global_step": 8575, "train_info/time_within_train_step": 2.7557504177093506, "step": 8575} {"train_info/time_between_train_steps": 0.0031328201293945312, "step": 8575} {"info/global_step": 8576, "train_info/time_within_train_step": 2.755791425704956, "step": 8576} {"train_info/time_between_train_steps": 0.003201007843017578, "step": 8576} {"info/global_step": 8577, "train_info/time_within_train_step": 2.7557830810546875, "step": 8577} {"train_info/time_between_train_steps": 0.0032186508178710938, "step": 8577} {"info/global_step": 8578, "train_info/time_within_train_step": 2.75620698928833, "step": 8578} {"train_info/time_between_train_steps": 0.0031375885009765625, "step": 8578} {"info/global_step": 8579, "train_info/time_within_train_step": 2.7559304237365723, "step": 8579} {"train_info/time_between_train_steps": 0.003137350082397461, "step": 8579} {"info/global_step": 8580, "train_info/time_within_train_step": 2.755542039871216, "step": 8580} {"train_info/time_between_train_steps": 0.003117799758911133, "step": 8580} {"info/global_step": 8581, "train_info/time_within_train_step": 2.7590532302856445, "step": 8581} {"train_info/time_between_train_steps": 0.0031282901763916016, "step": 8581} {"info/global_step": 8582, "train_info/time_within_train_step": 2.7560501098632812, "step": 8582} {"train_info/time_between_train_steps": 0.0031347274780273438, "step": 8582} {"info/global_step": 8583, "train_info/time_within_train_step": 2.7562012672424316, "step": 8583} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 8583} {"info/global_step": 8584, "train_info/time_within_train_step": 2.7561776638031006, "step": 8584} {"train_info/time_between_train_steps": 0.0031397342681884766, "step": 8584} {"info/global_step": 8585, "train_info/time_within_train_step": 2.756204128265381, "step": 8585} {"train_info/time_between_train_steps": 0.0031151771545410156, "step": 8585} {"info/global_step": 8586, "train_info/time_within_train_step": 2.7561895847320557, "step": 8586} {"train_info/time_between_train_steps": 0.0031273365020751953, "step": 8586} {"info/global_step": 8587, "train_info/time_within_train_step": 2.7562506198883057, "step": 8587} {"train_info/time_between_train_steps": 0.0031113624572753906, "step": 8587} {"info/global_step": 8588, "train_info/time_within_train_step": 2.7559356689453125, "step": 8588} {"train_info/time_between_train_steps": 0.003237009048461914, "step": 8588} {"info/global_step": 8589, "train_info/time_within_train_step": 2.756255626678467, "step": 8589} {"train_info/time_between_train_steps": 0.003104686737060547, "step": 8589} {"info/global_step": 8590, "train_info/time_within_train_step": 2.7554452419281006, "step": 8590} {"train_info/time_between_train_steps": 0.0031037330627441406, "step": 8590} {"info/global_step": 8591, "train_info/time_within_train_step": 2.7551517486572266, "step": 8591} {"train_info/time_between_train_steps": 0.0031151771545410156, "step": 8591} {"info/global_step": 8592, "train_info/time_within_train_step": 2.755704641342163, "step": 8592} {"train_info/time_between_train_steps": 0.0031211376190185547, "step": 8592} {"info/global_step": 8593, "train_info/time_within_train_step": 2.8782052993774414, "step": 8593} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 8593} {"info/global_step": 8594, "train_info/time_within_train_step": 2.756673812866211, "step": 8594} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 8594} {"info/global_step": 8595, "train_info/time_within_train_step": 2.756427526473999, "step": 8595} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 8595} {"info/global_step": 8596, "train_info/time_within_train_step": 2.756828546524048, "step": 8596} {"train_info/time_between_train_steps": 0.0031185150146484375, "step": 8596} {"info/global_step": 8597, "train_info/time_within_train_step": 2.7564361095428467, "step": 8597} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 8597} {"info/global_step": 8598, "train_info/time_within_train_step": 2.7552459239959717, "step": 8598} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 8598} {"info/global_step": 8599, "train_info/time_within_train_step": 2.7572131156921387, "step": 8599} {"train_info/time_between_train_steps": 0.0032656192779541016, "step": 8599} {"info/global_step": 8600, "train_info/time_within_train_step": 2.7567358016967773, "step": 8600} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746590798, "_runtime": 24807}, "step": 8600} {"logs": {"train/loss": 3.0207, "train/learning_rate": 9.333333333333333e-05, "train/epoch": 10.01, "_timestamp": 1746590798, "_runtime": 24807}, "step": 8600} {"train_info/time_between_train_steps": 13.554368734359741, "step": 8600} {"info/global_step": 8601, "train_info/time_within_train_step": 2.5322940349578857, "step": 8601} {"train_info/time_between_train_steps": 0.003159046173095703, "step": 8601} {"info/global_step": 8602, "train_info/time_within_train_step": 2.5922775268554688, "step": 8602} {"train_info/time_between_train_steps": 0.003180980682373047, "step": 8602} {"info/global_step": 8603, "train_info/time_within_train_step": 2.7333788871765137, "step": 8603} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 8603} {"info/global_step": 8604, "train_info/time_within_train_step": 2.9841763973236084, "step": 8604} {"train_info/time_between_train_steps": 0.003122568130493164, "step": 8604} {"info/global_step": 8605, "train_info/time_within_train_step": 2.750819683074951, "step": 8605} {"train_info/time_between_train_steps": 0.0031168460845947266, "step": 8605} {"info/global_step": 8606, "train_info/time_within_train_step": 2.7564165592193604, "step": 8606} {"train_info/time_between_train_steps": 0.0031299591064453125, "step": 8606} {"info/global_step": 8607, "train_info/time_within_train_step": 2.754713773727417, "step": 8607} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 8607} {"info/global_step": 8608, "train_info/time_within_train_step": 2.7555456161499023, "step": 8608} {"train_info/time_between_train_steps": 0.0031180381774902344, "step": 8608} {"info/global_step": 8609, "train_info/time_within_train_step": 2.7552146911621094, "step": 8609} {"train_info/time_between_train_steps": 0.003281831741333008, "step": 8609} {"info/global_step": 8610, "train_info/time_within_train_step": 2.7567052841186523, "step": 8610} {"train_info/time_between_train_steps": 0.003117084503173828, "step": 8610} {"info/global_step": 8611, "train_info/time_within_train_step": 2.7557175159454346, "step": 8611} {"train_info/time_between_train_steps": 0.0031549930572509766, "step": 8611} {"info/global_step": 8612, "train_info/time_within_train_step": 2.756920099258423, "step": 8612} {"train_info/time_between_train_steps": 0.003141641616821289, "step": 8612} {"info/global_step": 8613, "train_info/time_within_train_step": 2.756808280944824, "step": 8613} {"train_info/time_between_train_steps": 0.0031387805938720703, "step": 8613} {"info/global_step": 8614, "train_info/time_within_train_step": 2.756847381591797, "step": 8614} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 8614} {"info/global_step": 8615, "train_info/time_within_train_step": 2.7575957775115967, "step": 8615} {"train_info/time_between_train_steps": 0.003131866455078125, "step": 8615} {"info/global_step": 8616, "train_info/time_within_train_step": 2.7572638988494873, "step": 8616} {"train_info/time_between_train_steps": 0.0031239986419677734, "step": 8616} {"info/global_step": 8617, "train_info/time_within_train_step": 2.75730562210083, "step": 8617} {"train_info/time_between_train_steps": 0.0031347274780273438, "step": 8617} {"info/global_step": 8618, "train_info/time_within_train_step": 2.756277322769165, "step": 8618} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 8618} {"info/global_step": 8619, "train_info/time_within_train_step": 2.756636381149292, "step": 8619} {"train_info/time_between_train_steps": 0.0031156539916992188, "step": 8619} {"info/global_step": 8620, "train_info/time_within_train_step": 2.755964994430542, "step": 8620} {"train_info/time_between_train_steps": 0.0031621456146240234, "step": 8620} {"info/global_step": 8621, "train_info/time_within_train_step": 2.756664514541626, "step": 8621} {"train_info/time_between_train_steps": 0.0031392574310302734, "step": 8621} {"info/global_step": 8622, "train_info/time_within_train_step": 2.7558441162109375, "step": 8622} {"train_info/time_between_train_steps": 0.003116607666015625, "step": 8622} {"info/global_step": 8623, "train_info/time_within_train_step": 2.7561161518096924, "step": 8623} {"train_info/time_between_train_steps": 0.0031571388244628906, "step": 8623} {"info/global_step": 8624, "train_info/time_within_train_step": 2.756446123123169, "step": 8624} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 8624} {"info/global_step": 8625, "train_info/time_within_train_step": 2.75689959526062, "step": 8625} {"train_info/time_between_train_steps": 0.0031273365020751953, "step": 8625} {"info/global_step": 8626, "train_info/time_within_train_step": 2.7567107677459717, "step": 8626} {"train_info/time_between_train_steps": 0.0031495094299316406, "step": 8626} {"info/global_step": 8627, "train_info/time_within_train_step": 2.7559545040130615, "step": 8627} {"train_info/time_between_train_steps": 0.0031228065490722656, "step": 8627} {"info/global_step": 8628, "train_info/time_within_train_step": 2.7556405067443848, "step": 8628} {"train_info/time_between_train_steps": 0.0031375885009765625, "step": 8628} {"info/global_step": 8629, "train_info/time_within_train_step": 2.7561745643615723, "step": 8629} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 8629} {"info/global_step": 8630, "train_info/time_within_train_step": 2.75675892829895, "step": 8630} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 8630} {"info/global_step": 8631, "train_info/time_within_train_step": 2.7563302516937256, "step": 8631} {"train_info/time_between_train_steps": 0.003141164779663086, "step": 8631} {"info/global_step": 8632, "train_info/time_within_train_step": 2.7569549083709717, "step": 8632} {"train_info/time_between_train_steps": 0.0031425952911376953, "step": 8632} {"info/global_step": 8633, "train_info/time_within_train_step": 2.7552733421325684, "step": 8633} {"train_info/time_between_train_steps": 0.003099203109741211, "step": 8633} {"info/global_step": 8634, "train_info/time_within_train_step": 2.7560184001922607, "step": 8634} {"train_info/time_between_train_steps": 0.0031201839447021484, "step": 8634} {"info/global_step": 8635, "train_info/time_within_train_step": 2.7557990550994873, "step": 8635} {"train_info/time_between_train_steps": 0.0032134056091308594, "step": 8635} {"info/global_step": 8636, "train_info/time_within_train_step": 2.7554056644439697, "step": 8636} {"train_info/time_between_train_steps": 0.003130197525024414, "step": 8636} {"info/global_step": 8637, "train_info/time_within_train_step": 2.756579637527466, "step": 8637} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 8637} {"info/global_step": 8638, "train_info/time_within_train_step": 2.7555360794067383, "step": 8638} {"train_info/time_between_train_steps": 0.003139972686767578, "step": 8638} {"info/global_step": 8639, "train_info/time_within_train_step": 2.7566494941711426, "step": 8639} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 8639} {"info/global_step": 8640, "train_info/time_within_train_step": 2.7565975189208984, "step": 8640} {"train_info/time_between_train_steps": 0.0031652450561523438, "step": 8640} {"info/global_step": 8641, "train_info/time_within_train_step": 2.7568588256835938, "step": 8641} {"train_info/time_between_train_steps": 0.0031347274780273438, "step": 8641} {"info/global_step": 8642, "train_info/time_within_train_step": 2.755955457687378, "step": 8642} {"train_info/time_between_train_steps": 0.003139019012451172, "step": 8642} {"info/global_step": 8643, "train_info/time_within_train_step": 2.7570502758026123, "step": 8643} {"train_info/time_between_train_steps": 0.0031442642211914062, "step": 8643} {"info/global_step": 8644, "train_info/time_within_train_step": 2.756911039352417, "step": 8644} {"train_info/time_between_train_steps": 0.0031228065490722656, "step": 8644} {"info/global_step": 8645, "train_info/time_within_train_step": 2.7565863132476807, "step": 8645} {"train_info/time_between_train_steps": 0.003157377243041992, "step": 8645} {"info/global_step": 8646, "train_info/time_within_train_step": 2.7565574645996094, "step": 8646} {"train_info/time_between_train_steps": 0.0031430721282958984, "step": 8646} {"info/global_step": 8647, "train_info/time_within_train_step": 2.7561235427856445, "step": 8647} {"train_info/time_between_train_steps": 0.003134489059448242, "step": 8647} {"info/global_step": 8648, "train_info/time_within_train_step": 2.755714178085327, "step": 8648} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 8648} {"info/global_step": 8649, "train_info/time_within_train_step": 2.7548201084136963, "step": 8649} {"train_info/time_between_train_steps": 0.003168821334838867, "step": 8649} {"info/global_step": 8650, "train_info/time_within_train_step": 2.7565221786499023, "step": 8650} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746590950, "_runtime": 24959}, "step": 8650} {"logs": {"train/loss": 3.012, "train/learning_rate": 8.999999999999999e-05, "train/epoch": 10.01, "_timestamp": 1746590950, "_runtime": 24959}, "step": 8650} {"train_info/time_between_train_steps": 0.00726008415222168, "step": 8650} {"info/global_step": 8651, "train_info/time_within_train_step": 2.7566287517547607, "step": 8651} {"train_info/time_between_train_steps": 0.003097057342529297, "step": 8651} {"info/global_step": 8652, "train_info/time_within_train_step": 2.7553493976593018, "step": 8652} {"train_info/time_between_train_steps": 0.003080129623413086, "step": 8652} {"info/global_step": 8653, "train_info/time_within_train_step": 2.755622625350952, "step": 8653} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 8653} {"info/global_step": 8654, "train_info/time_within_train_step": 2.756974220275879, "step": 8654} {"train_info/time_between_train_steps": 0.0032851696014404297, "step": 8654} {"info/global_step": 8655, "train_info/time_within_train_step": 2.757175922393799, "step": 8655} {"train_info/time_between_train_steps": 0.1281266212463379, "step": 8655} {"info/global_step": 8656, "train_info/time_within_train_step": 2.757577896118164, "step": 8656} {"train_info/time_between_train_steps": 0.003300189971923828, "step": 8656} {"info/global_step": 8657, "train_info/time_within_train_step": 2.7577497959136963, "step": 8657} {"train_info/time_between_train_steps": 0.003304004669189453, "step": 8657} {"info/global_step": 8658, "train_info/time_within_train_step": 2.7585175037384033, "step": 8658} {"train_info/time_between_train_steps": 0.0034792423248291016, "step": 8658} {"info/global_step": 8659, "train_info/time_within_train_step": 2.757777452468872, "step": 8659} {"train_info/time_between_train_steps": 0.003328084945678711, "step": 8659} {"info/global_step": 8660, "train_info/time_within_train_step": 2.757967472076416, "step": 8660} {"train_info/time_between_train_steps": 0.003293275833129883, "step": 8660} {"info/global_step": 8661, "train_info/time_within_train_step": 2.7573792934417725, "step": 8661} {"train_info/time_between_train_steps": 0.003413677215576172, "step": 8661} {"info/global_step": 8662, "train_info/time_within_train_step": 2.757746934890747, "step": 8662} {"train_info/time_between_train_steps": 0.003315448760986328, "step": 8662} {"info/global_step": 8663, "train_info/time_within_train_step": 2.757425308227539, "step": 8663} {"train_info/time_between_train_steps": 0.003320455551147461, "step": 8663} {"info/global_step": 8664, "train_info/time_within_train_step": 2.756915807723999, "step": 8664} {"train_info/time_between_train_steps": 0.0033719539642333984, "step": 8664} {"info/global_step": 8665, "train_info/time_within_train_step": 2.7581865787506104, "step": 8665} {"train_info/time_between_train_steps": 0.003333568572998047, "step": 8665} {"info/global_step": 8666, "train_info/time_within_train_step": 2.7587413787841797, "step": 8666} {"train_info/time_between_train_steps": 0.0033261775970458984, "step": 8666} {"info/global_step": 8667, "train_info/time_within_train_step": 2.757361888885498, "step": 8667} {"train_info/time_between_train_steps": 0.003314495086669922, "step": 8667} {"info/global_step": 8668, "train_info/time_within_train_step": 2.757338285446167, "step": 8668} {"train_info/time_between_train_steps": 0.003300189971923828, "step": 8668} {"info/global_step": 8669, "train_info/time_within_train_step": 2.7579007148742676, "step": 8669} {"train_info/time_between_train_steps": 0.0037751197814941406, "step": 8669} {"info/global_step": 8670, "train_info/time_within_train_step": 2.757525682449341, "step": 8670} {"train_info/time_between_train_steps": 0.003320455551147461, "step": 8670} {"info/global_step": 8671, "train_info/time_within_train_step": 2.757235288619995, "step": 8671} {"train_info/time_between_train_steps": 0.0032901763916015625, "step": 8671} {"info/global_step": 8672, "train_info/time_within_train_step": 2.7581088542938232, "step": 8672} {"train_info/time_between_train_steps": 0.0034029483795166016, "step": 8672} {"info/global_step": 8673, "train_info/time_within_train_step": 2.758674383163452, "step": 8673} {"train_info/time_between_train_steps": 0.003392934799194336, "step": 8673} {"info/global_step": 8674, "train_info/time_within_train_step": 2.7578556537628174, "step": 8674} {"train_info/time_between_train_steps": 0.0033288002014160156, "step": 8674} {"info/global_step": 8675, "train_info/time_within_train_step": 2.7567269802093506, "step": 8675} {"train_info/time_between_train_steps": 0.0033965110778808594, "step": 8675} {"info/global_step": 8676, "train_info/time_within_train_step": 2.758061647415161, "step": 8676} {"train_info/time_between_train_steps": 0.003333568572998047, "step": 8676} {"info/global_step": 8677, "train_info/time_within_train_step": 2.75636625289917, "step": 8677} {"train_info/time_between_train_steps": 0.0034716129302978516, "step": 8677} {"info/global_step": 8678, "train_info/time_within_train_step": 2.757631778717041, "step": 8678} {"train_info/time_between_train_steps": 0.003360748291015625, "step": 8678} {"info/global_step": 8679, "train_info/time_within_train_step": 2.7575531005859375, "step": 8679} {"train_info/time_between_train_steps": 0.003317594528198242, "step": 8679} {"info/global_step": 8680, "train_info/time_within_train_step": 2.755997657775879, "step": 8680} {"train_info/time_between_train_steps": 0.0033121109008789062, "step": 8680} {"info/global_step": 8681, "train_info/time_within_train_step": 2.7568860054016113, "step": 8681} {"train_info/time_between_train_steps": 0.003324747085571289, "step": 8681} {"info/global_step": 8682, "train_info/time_within_train_step": 2.755826950073242, "step": 8682} {"train_info/time_between_train_steps": 0.003332853317260742, "step": 8682} {"info/global_step": 8683, "train_info/time_within_train_step": 2.7565383911132812, "step": 8683} {"train_info/time_between_train_steps": 0.0033082962036132812, "step": 8683} {"info/global_step": 8684, "train_info/time_within_train_step": 2.7566819190979004, "step": 8684} {"train_info/time_between_train_steps": 0.0033257007598876953, "step": 8684} {"info/global_step": 8685, "train_info/time_within_train_step": 2.756897211074829, "step": 8685} {"train_info/time_between_train_steps": 0.0034477710723876953, "step": 8685} {"info/global_step": 8686, "train_info/time_within_train_step": 2.7560601234436035, "step": 8686} {"train_info/time_between_train_steps": 0.006464481353759766, "step": 8686} {"info/global_step": 8687, "train_info/time_within_train_step": 2.7584753036499023, "step": 8687} {"train_info/time_between_train_steps": 0.006472349166870117, "step": 8687} {"info/global_step": 8688, "train_info/time_within_train_step": 2.759544610977173, "step": 8688} {"train_info/time_between_train_steps": 0.006428718566894531, "step": 8688} {"info/global_step": 8689, "train_info/time_within_train_step": 2.7583649158477783, "step": 8689} {"train_info/time_between_train_steps": 0.006443500518798828, "step": 8689} {"info/global_step": 8690, "train_info/time_within_train_step": 2.759373188018799, "step": 8690} {"train_info/time_between_train_steps": 0.006437063217163086, "step": 8690} {"info/global_step": 8691, "train_info/time_within_train_step": 2.7600300312042236, "step": 8691} {"train_info/time_between_train_steps": 0.0064394474029541016, "step": 8691} {"info/global_step": 8692, "train_info/time_within_train_step": 2.760344982147217, "step": 8692} {"train_info/time_between_train_steps": 0.0064699649810791016, "step": 8692} {"info/global_step": 8693, "train_info/time_within_train_step": 2.7595529556274414, "step": 8693} {"train_info/time_between_train_steps": 0.0064029693603515625, "step": 8693} {"info/global_step": 8694, "train_info/time_within_train_step": 2.7581262588500977, "step": 8694} {"train_info/time_between_train_steps": 0.006396770477294922, "step": 8694} {"info/global_step": 8695, "train_info/time_within_train_step": 2.759315252304077, "step": 8695} {"train_info/time_between_train_steps": 0.0065305233001708984, "step": 8695} {"info/global_step": 8696, "train_info/time_within_train_step": 2.759005546569824, "step": 8696} {"train_info/time_between_train_steps": 0.0064563751220703125, "step": 8696} {"info/global_step": 8697, "train_info/time_within_train_step": 2.7593016624450684, "step": 8697} {"train_info/time_between_train_steps": 0.00650334358215332, "step": 8697} {"info/global_step": 8698, "train_info/time_within_train_step": 3.0047104358673096, "step": 8698} {"train_info/time_between_train_steps": 0.006491899490356445, "step": 8698} {"info/global_step": 8699, "train_info/time_within_train_step": 2.7590582370758057, "step": 8699} {"train_info/time_between_train_steps": 0.0064432621002197266, "step": 8699} {"info/global_step": 8700, "train_info/time_within_train_step": 2.7587883472442627, "step": 8700} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746591088, "_runtime": 25097}, "step": 8700} {"logs": {"train/loss": 3.0044, "train/learning_rate": 8.666666666666665e-05, "train/epoch": 10.02, "_timestamp": 1746591088, "_runtime": 25097}, "step": 8700} {"train_info/time_between_train_steps": 0.01125788688659668, "step": 8700} {"info/global_step": 8701, "train_info/time_within_train_step": 2.75726580619812, "step": 8701} {"train_info/time_between_train_steps": 0.0065081119537353516, "step": 8701} {"info/global_step": 8702, "train_info/time_within_train_step": 2.7593092918395996, "step": 8702} {"train_info/time_between_train_steps": 0.0064427852630615234, "step": 8702} {"info/global_step": 8703, "train_info/time_within_train_step": 2.759546995162964, "step": 8703} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 8703} {"info/global_step": 8704, "train_info/time_within_train_step": 2.7549355030059814, "step": 8704} {"train_info/time_between_train_steps": 0.0031638145446777344, "step": 8704} {"info/global_step": 8705, "train_info/time_within_train_step": 2.7549188137054443, "step": 8705} {"train_info/time_between_train_steps": 0.0031473636627197266, "step": 8705} {"info/global_step": 8706, "train_info/time_within_train_step": 2.7557168006896973, "step": 8706} {"train_info/time_between_train_steps": 0.003183603286743164, "step": 8706} {"info/global_step": 8707, "train_info/time_within_train_step": 2.756206750869751, "step": 8707} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 8707} {"info/global_step": 8708, "train_info/time_within_train_step": 2.7544937133789062, "step": 8708} {"train_info/time_between_train_steps": 0.0031909942626953125, "step": 8708} {"info/global_step": 8709, "train_info/time_within_train_step": 2.75649356842041, "step": 8709} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 8709} {"info/global_step": 8710, "train_info/time_within_train_step": 2.7559423446655273, "step": 8710} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 8710} {"info/global_step": 8711, "train_info/time_within_train_step": 2.7552742958068848, "step": 8711} {"train_info/time_between_train_steps": 0.003133535385131836, "step": 8711} {"info/global_step": 8712, "train_info/time_within_train_step": 2.75703501701355, "step": 8712} {"train_info/time_between_train_steps": 0.006497621536254883, "step": 8712} {"info/global_step": 8713, "train_info/time_within_train_step": 2.7584567070007324, "step": 8713} {"train_info/time_between_train_steps": 0.006392478942871094, "step": 8713} {"info/global_step": 8714, "train_info/time_within_train_step": 2.759263515472412, "step": 8714} {"train_info/time_between_train_steps": 0.0064487457275390625, "step": 8714} {"info/global_step": 8715, "train_info/time_within_train_step": 2.759042501449585, "step": 8715} {"train_info/time_between_train_steps": 0.006556510925292969, "step": 8715} {"info/global_step": 8716, "train_info/time_within_train_step": 2.758798599243164, "step": 8716} {"train_info/time_between_train_steps": 0.0065038204193115234, "step": 8716} {"info/global_step": 8717, "train_info/time_within_train_step": 2.7598609924316406, "step": 8717} {"train_info/time_between_train_steps": 0.006378889083862305, "step": 8717} {"info/global_step": 8718, "train_info/time_within_train_step": 2.8838367462158203, "step": 8718} {"train_info/time_between_train_steps": 0.006466388702392578, "step": 8718} {"info/global_step": 8719, "train_info/time_within_train_step": 2.759284496307373, "step": 8719} {"train_info/time_between_train_steps": 0.003372669219970703, "step": 8719} {"info/global_step": 8720, "train_info/time_within_train_step": 2.7542836666107178, "step": 8720} {"train_info/time_between_train_steps": 0.003364086151123047, "step": 8720} {"info/global_step": 8721, "train_info/time_within_train_step": 2.7569992542266846, "step": 8721} {"train_info/time_between_train_steps": 0.0033326148986816406, "step": 8721} {"info/global_step": 8722, "train_info/time_within_train_step": 2.755850076675415, "step": 8722} {"train_info/time_between_train_steps": 0.003407716751098633, "step": 8722} {"info/global_step": 8723, "train_info/time_within_train_step": 2.756200075149536, "step": 8723} {"train_info/time_between_train_steps": 0.003309011459350586, "step": 8723} {"info/global_step": 8724, "train_info/time_within_train_step": 2.755140542984009, "step": 8724} {"train_info/time_between_train_steps": 0.0033266544342041016, "step": 8724} {"info/global_step": 8725, "train_info/time_within_train_step": 2.7571003437042236, "step": 8725} {"train_info/time_between_train_steps": 0.0033130645751953125, "step": 8725} {"info/global_step": 8726, "train_info/time_within_train_step": 2.75665020942688, "step": 8726} {"train_info/time_between_train_steps": 0.003305196762084961, "step": 8726} {"info/global_step": 8727, "train_info/time_within_train_step": 2.7561347484588623, "step": 8727} {"train_info/time_between_train_steps": 0.0033888816833496094, "step": 8727} {"info/global_step": 8728, "train_info/time_within_train_step": 2.757293462753296, "step": 8728} {"train_info/time_between_train_steps": 0.00334930419921875, "step": 8728} {"info/global_step": 8729, "train_info/time_within_train_step": 2.7578678131103516, "step": 8729} {"train_info/time_between_train_steps": 0.003373861312866211, "step": 8729} {"info/global_step": 8730, "train_info/time_within_train_step": 2.758368492126465, "step": 8730} {"train_info/time_between_train_steps": 0.0034415721893310547, "step": 8730} {"info/global_step": 8731, "train_info/time_within_train_step": 2.758342742919922, "step": 8731} {"train_info/time_between_train_steps": 0.0033066272735595703, "step": 8731} {"info/global_step": 8732, "train_info/time_within_train_step": 2.757802724838257, "step": 8732} {"train_info/time_between_train_steps": 0.003336191177368164, "step": 8732} {"info/global_step": 8733, "train_info/time_within_train_step": 2.7555737495422363, "step": 8733} {"train_info/time_between_train_steps": 0.003351449966430664, "step": 8733} {"info/global_step": 8734, "train_info/time_within_train_step": 2.756415605545044, "step": 8734} {"train_info/time_between_train_steps": 0.0033292770385742188, "step": 8734} {"info/global_step": 8735, "train_info/time_within_train_step": 2.7561838626861572, "step": 8735} {"train_info/time_between_train_steps": 0.0033485889434814453, "step": 8735} {"info/global_step": 8736, "train_info/time_within_train_step": 2.756932258605957, "step": 8736} {"train_info/time_between_train_steps": 0.003320932388305664, "step": 8736} {"info/global_step": 8737, "train_info/time_within_train_step": 2.7571356296539307, "step": 8737} {"train_info/time_between_train_steps": 0.003320455551147461, "step": 8737} {"info/global_step": 8738, "train_info/time_within_train_step": 2.7563629150390625, "step": 8738} {"train_info/time_between_train_steps": 0.003467082977294922, "step": 8738} {"info/global_step": 8739, "train_info/time_within_train_step": 2.757249116897583, "step": 8739} {"train_info/time_between_train_steps": 0.003312826156616211, "step": 8739} {"info/global_step": 8740, "train_info/time_within_train_step": 2.7537693977355957, "step": 8740} {"train_info/time_between_train_steps": 0.003145933151245117, "step": 8740} {"info/global_step": 8741, "train_info/time_within_train_step": 2.754744052886963, "step": 8741} {"train_info/time_between_train_steps": 0.003216981887817383, "step": 8741} {"info/global_step": 8742, "train_info/time_within_train_step": 2.7549984455108643, "step": 8742} {"train_info/time_between_train_steps": 0.0031557083129882812, "step": 8742} {"info/global_step": 8743, "train_info/time_within_train_step": 2.7560572624206543, "step": 8743} {"train_info/time_between_train_steps": 0.0033097267150878906, "step": 8743} {"info/global_step": 8744, "train_info/time_within_train_step": 2.7567989826202393, "step": 8744} {"train_info/time_between_train_steps": 0.003326416015625, "step": 8744} {"info/global_step": 8745, "train_info/time_within_train_step": 3.333453893661499, "step": 8745} {"train_info/time_between_train_steps": 0.003375530242919922, "step": 8745} {"info/global_step": 8746, "train_info/time_within_train_step": 2.7536041736602783, "step": 8746} {"train_info/time_between_train_steps": 0.003347158432006836, "step": 8746} {"info/global_step": 8747, "train_info/time_within_train_step": 2.7567176818847656, "step": 8747} {"train_info/time_between_train_steps": 0.003309965133666992, "step": 8747} {"info/global_step": 8748, "train_info/time_within_train_step": 2.7572717666625977, "step": 8748} {"train_info/time_between_train_steps": 0.003360271453857422, "step": 8748} {"info/global_step": 8749, "train_info/time_within_train_step": 2.7568557262420654, "step": 8749} {"train_info/time_between_train_steps": 0.0033273696899414062, "step": 8749} {"info/global_step": 8750, "train_info/time_within_train_step": 2.7573728561401367, "step": 8750} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746591227, "_runtime": 25236}, "step": 8750} {"logs": {"train/loss": 2.9891, "train/learning_rate": 8.333333333333333e-05, "train/epoch": 10.02, "_timestamp": 1746591227, "_runtime": 25236}, "step": 8750} {"train_info/time_between_train_steps": 0.00716400146484375, "step": 8750} {"info/global_step": 8751, "train_info/time_within_train_step": 2.757627010345459, "step": 8751} {"train_info/time_between_train_steps": 0.0032987594604492188, "step": 8751} {"info/global_step": 8752, "train_info/time_within_train_step": 2.7555389404296875, "step": 8752} {"train_info/time_between_train_steps": 0.003345966339111328, "step": 8752} {"info/global_step": 8753, "train_info/time_within_train_step": 2.7557926177978516, "step": 8753} {"train_info/time_between_train_steps": 0.0033805370330810547, "step": 8753} {"info/global_step": 8754, "train_info/time_within_train_step": 2.7571330070495605, "step": 8754} {"train_info/time_between_train_steps": 0.0037670135498046875, "step": 8754} {"info/global_step": 8755, "train_info/time_within_train_step": 3.0054726600646973, "step": 8755} {"train_info/time_between_train_steps": 0.003292083740234375, "step": 8755} {"info/global_step": 8756, "train_info/time_within_train_step": 2.756953001022339, "step": 8756} {"train_info/time_between_train_steps": 0.0033104419708251953, "step": 8756} {"info/global_step": 8757, "train_info/time_within_train_step": 2.757310390472412, "step": 8757} {"train_info/time_between_train_steps": 0.0033409595489501953, "step": 8757} {"info/global_step": 8758, "train_info/time_within_train_step": 2.756063461303711, "step": 8758} {"train_info/time_between_train_steps": 0.003307819366455078, "step": 8758} {"info/global_step": 8759, "train_info/time_within_train_step": 2.7572362422943115, "step": 8759} {"train_info/time_between_train_steps": 0.0033402442932128906, "step": 8759} {"info/global_step": 8760, "train_info/time_within_train_step": 2.75801420211792, "step": 8760} {"train_info/time_between_train_steps": 0.0033447742462158203, "step": 8760} {"info/global_step": 8761, "train_info/time_within_train_step": 2.75728440284729, "step": 8761} {"train_info/time_between_train_steps": 0.0033135414123535156, "step": 8761} {"info/global_step": 8762, "train_info/time_within_train_step": 2.756927728652954, "step": 8762} {"train_info/time_between_train_steps": 0.0032663345336914062, "step": 8762} {"info/global_step": 8763, "train_info/time_within_train_step": 2.758157968521118, "step": 8763} {"train_info/time_between_train_steps": 0.0033032894134521484, "step": 8763} {"info/global_step": 8764, "train_info/time_within_train_step": 2.7575736045837402, "step": 8764} {"train_info/time_between_train_steps": 0.0033807754516601562, "step": 8764} {"info/global_step": 8765, "train_info/time_within_train_step": 2.756861448287964, "step": 8765} {"train_info/time_between_train_steps": 0.0032994747161865234, "step": 8765} {"info/global_step": 8766, "train_info/time_within_train_step": 2.757434368133545, "step": 8766} {"train_info/time_between_train_steps": 0.0034096240997314453, "step": 8766} {"info/global_step": 8767, "train_info/time_within_train_step": 2.756133794784546, "step": 8767} {"train_info/time_between_train_steps": 0.003129243850708008, "step": 8767} {"info/global_step": 8768, "train_info/time_within_train_step": 2.7546567916870117, "step": 8768} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 8768} {"info/global_step": 8769, "train_info/time_within_train_step": 2.7545440196990967, "step": 8769} {"train_info/time_between_train_steps": 0.003100156784057617, "step": 8769} {"info/global_step": 8770, "train_info/time_within_train_step": 2.754915237426758, "step": 8770} {"train_info/time_between_train_steps": 0.0031638145446777344, "step": 8770} {"info/global_step": 8771, "train_info/time_within_train_step": 2.754486322402954, "step": 8771} {"train_info/time_between_train_steps": 0.003127574920654297, "step": 8771} {"info/global_step": 8772, "train_info/time_within_train_step": 2.7551262378692627, "step": 8772} {"train_info/time_between_train_steps": 0.0031456947326660156, "step": 8772} {"info/global_step": 8773, "train_info/time_within_train_step": 2.7552733421325684, "step": 8773} {"train_info/time_between_train_steps": 0.0031409263610839844, "step": 8773} {"info/global_step": 8774, "train_info/time_within_train_step": 2.7554047107696533, "step": 8774} {"train_info/time_between_train_steps": 0.0031232833862304688, "step": 8774} {"info/global_step": 8775, "train_info/time_within_train_step": 2.755234479904175, "step": 8775} {"train_info/time_between_train_steps": 0.0031402111053466797, "step": 8775} {"info/global_step": 8776, "train_info/time_within_train_step": 2.7558975219726562, "step": 8776} {"train_info/time_between_train_steps": 0.0031309127807617188, "step": 8776} {"info/global_step": 8777, "train_info/time_within_train_step": 2.7555415630340576, "step": 8777} {"train_info/time_between_train_steps": 0.0031766891479492188, "step": 8777} {"info/global_step": 8778, "train_info/time_within_train_step": 2.7554099559783936, "step": 8778} {"train_info/time_between_train_steps": 0.0031585693359375, "step": 8778} {"info/global_step": 8779, "train_info/time_within_train_step": 2.754884719848633, "step": 8779} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 8779} {"info/global_step": 8780, "train_info/time_within_train_step": 2.7563140392303467, "step": 8780} {"train_info/time_between_train_steps": 0.1287841796875, "step": 8780} {"info/global_step": 8781, "train_info/time_within_train_step": 2.7799055576324463, "step": 8781} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 8781} {"info/global_step": 8782, "train_info/time_within_train_step": 2.7565605640411377, "step": 8782} {"train_info/time_between_train_steps": 0.0031435489654541016, "step": 8782} {"info/global_step": 8783, "train_info/time_within_train_step": 2.754450559616089, "step": 8783} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 8783} {"info/global_step": 8784, "train_info/time_within_train_step": 2.7551801204681396, "step": 8784} {"train_info/time_between_train_steps": 0.0032134056091308594, "step": 8784} {"info/global_step": 8785, "train_info/time_within_train_step": 2.7549095153808594, "step": 8785} {"train_info/time_between_train_steps": 0.003142833709716797, "step": 8785} {"info/global_step": 8786, "train_info/time_within_train_step": 2.754481792449951, "step": 8786} {"train_info/time_between_train_steps": 0.0031690597534179688, "step": 8786} {"info/global_step": 8787, "train_info/time_within_train_step": 2.754455327987671, "step": 8787} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 8787} {"info/global_step": 8788, "train_info/time_within_train_step": 2.7565231323242188, "step": 8788} {"train_info/time_between_train_steps": 0.003374814987182617, "step": 8788} {"info/global_step": 8789, "train_info/time_within_train_step": 2.7574849128723145, "step": 8789} {"train_info/time_between_train_steps": 0.003330707550048828, "step": 8789} {"info/global_step": 8790, "train_info/time_within_train_step": 2.7570018768310547, "step": 8790} {"train_info/time_between_train_steps": 0.003382444381713867, "step": 8790} {"info/global_step": 8791, "train_info/time_within_train_step": 2.7566120624542236, "step": 8791} {"train_info/time_between_train_steps": 0.0032982826232910156, "step": 8791} {"info/global_step": 8792, "train_info/time_within_train_step": 2.757251262664795, "step": 8792} {"train_info/time_between_train_steps": 0.0034034252166748047, "step": 8792} {"info/global_step": 8793, "train_info/time_within_train_step": 2.757260799407959, "step": 8793} {"train_info/time_between_train_steps": 0.003316640853881836, "step": 8793} {"info/global_step": 8794, "train_info/time_within_train_step": 2.757092237472534, "step": 8794} {"train_info/time_between_train_steps": 0.003381013870239258, "step": 8794} {"info/global_step": 8795, "train_info/time_within_train_step": 2.756866455078125, "step": 8795} {"train_info/time_between_train_steps": 0.0033371448516845703, "step": 8795} {"info/global_step": 8796, "train_info/time_within_train_step": 3.0075018405914307, "step": 8796} {"train_info/time_between_train_steps": 0.0032923221588134766, "step": 8796} {"info/global_step": 8797, "train_info/time_within_train_step": 2.7573084831237793, "step": 8797} {"train_info/time_between_train_steps": 0.0033140182495117188, "step": 8797} {"info/global_step": 8798, "train_info/time_within_train_step": 2.755612373352051, "step": 8798} {"train_info/time_between_train_steps": 0.003175973892211914, "step": 8798} {"info/global_step": 8799, "train_info/time_within_train_step": 2.7549266815185547, "step": 8799} {"train_info/time_between_train_steps": 0.0031244754791259766, "step": 8799} {"info/global_step": 8800, "train_info/time_within_train_step": 2.75561785697937, "step": 8800} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746591366, "_runtime": 25375}, "step": 8800} {"logs": {"train/loss": 2.9796, "train/learning_rate": 7.999999999999999e-05, "train/epoch": 10.03, "_timestamp": 1746591366, "_runtime": 25375}, "step": 8800} {"train_info/time_between_train_steps": 13.418513536453247, "step": 8800} {"info/global_step": 8801, "train_info/time_within_train_step": 2.5387063026428223, "step": 8801} {"train_info/time_between_train_steps": 0.003161907196044922, "step": 8801} {"info/global_step": 8802, "train_info/time_within_train_step": 2.6169016361236572, "step": 8802} {"train_info/time_between_train_steps": 0.003206491470336914, "step": 8802} {"info/global_step": 8803, "train_info/time_within_train_step": 2.723553419113159, "step": 8803} {"train_info/time_between_train_steps": 0.0031731128692626953, "step": 8803} {"info/global_step": 8804, "train_info/time_within_train_step": 2.748406410217285, "step": 8804} {"train_info/time_between_train_steps": 0.003159761428833008, "step": 8804} {"info/global_step": 8805, "train_info/time_within_train_step": 2.750516414642334, "step": 8805} {"train_info/time_between_train_steps": 0.0031790733337402344, "step": 8805} {"info/global_step": 8806, "train_info/time_within_train_step": 2.7548272609710693, "step": 8806} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 8806} {"info/global_step": 8807, "train_info/time_within_train_step": 2.7541747093200684, "step": 8807} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 8807} {"info/global_step": 8808, "train_info/time_within_train_step": 2.7554216384887695, "step": 8808} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 8808} {"info/global_step": 8809, "train_info/time_within_train_step": 2.754884958267212, "step": 8809} {"train_info/time_between_train_steps": 0.003203868865966797, "step": 8809} {"info/global_step": 8810, "train_info/time_within_train_step": 2.7562196254730225, "step": 8810} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 8810} {"info/global_step": 8811, "train_info/time_within_train_step": 2.7556636333465576, "step": 8811} {"train_info/time_between_train_steps": 0.0031816959381103516, "step": 8811} {"info/global_step": 8812, "train_info/time_within_train_step": 2.755282402038574, "step": 8812} {"train_info/time_between_train_steps": 0.0032198429107666016, "step": 8812} {"info/global_step": 8813, "train_info/time_within_train_step": 2.753436803817749, "step": 8813} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 8813} {"info/global_step": 8814, "train_info/time_within_train_step": 2.7562246322631836, "step": 8814} {"train_info/time_between_train_steps": 0.003184080123901367, "step": 8814} {"info/global_step": 8815, "train_info/time_within_train_step": 2.7558093070983887, "step": 8815} {"train_info/time_between_train_steps": 0.0032134056091308594, "step": 8815} {"info/global_step": 8816, "train_info/time_within_train_step": 2.755950450897217, "step": 8816} {"train_info/time_between_train_steps": 0.003146648406982422, "step": 8816} {"info/global_step": 8817, "train_info/time_within_train_step": 2.755962371826172, "step": 8817} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 8817} {"info/global_step": 8818, "train_info/time_within_train_step": 2.755354642868042, "step": 8818} {"train_info/time_between_train_steps": 0.0031545162200927734, "step": 8818} {"info/global_step": 8819, "train_info/time_within_train_step": 2.7559690475463867, "step": 8819} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 8819} {"info/global_step": 8820, "train_info/time_within_train_step": 2.7558493614196777, "step": 8820} {"train_info/time_between_train_steps": 0.0031936168670654297, "step": 8820} {"info/global_step": 8821, "train_info/time_within_train_step": 2.755966901779175, "step": 8821} {"train_info/time_between_train_steps": 0.0031452178955078125, "step": 8821} {"info/global_step": 8822, "train_info/time_within_train_step": 2.7557756900787354, "step": 8822} {"train_info/time_between_train_steps": 0.0032231807708740234, "step": 8822} {"info/global_step": 8823, "train_info/time_within_train_step": 2.754916191101074, "step": 8823} {"train_info/time_between_train_steps": 0.003150463104248047, "step": 8823} {"info/global_step": 8824, "train_info/time_within_train_step": 2.7557342052459717, "step": 8824} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 8824} {"info/global_step": 8825, "train_info/time_within_train_step": 2.756091594696045, "step": 8825} {"train_info/time_between_train_steps": 0.0032324790954589844, "step": 8825} {"info/global_step": 8826, "train_info/time_within_train_step": 2.7555675506591797, "step": 8826} {"train_info/time_between_train_steps": 0.0032308101654052734, "step": 8826} {"info/global_step": 8827, "train_info/time_within_train_step": 2.7565667629241943, "step": 8827} {"train_info/time_between_train_steps": 0.0031490325927734375, "step": 8827} {"info/global_step": 8828, "train_info/time_within_train_step": 2.756448268890381, "step": 8828} {"train_info/time_between_train_steps": 0.0031685829162597656, "step": 8828} {"info/global_step": 8829, "train_info/time_within_train_step": 2.7565815448760986, "step": 8829} {"train_info/time_between_train_steps": 0.003223419189453125, "step": 8829} {"info/global_step": 8830, "train_info/time_within_train_step": 2.7568511962890625, "step": 8830} {"train_info/time_between_train_steps": 0.0031480789184570312, "step": 8830} {"info/global_step": 8831, "train_info/time_within_train_step": 2.755948305130005, "step": 8831} {"train_info/time_between_train_steps": 0.003180265426635742, "step": 8831} {"info/global_step": 8832, "train_info/time_within_train_step": 2.7562015056610107, "step": 8832} {"train_info/time_between_train_steps": 0.003204345703125, "step": 8832} {"info/global_step": 8833, "train_info/time_within_train_step": 2.756340265274048, "step": 8833} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 8833} {"info/global_step": 8834, "train_info/time_within_train_step": 2.755906105041504, "step": 8834} {"train_info/time_between_train_steps": 0.0031354427337646484, "step": 8834} {"info/global_step": 8835, "train_info/time_within_train_step": 2.7547760009765625, "step": 8835} {"train_info/time_between_train_steps": 0.0031249523162841797, "step": 8835} {"info/global_step": 8836, "train_info/time_within_train_step": 2.754782199859619, "step": 8836} {"train_info/time_between_train_steps": 0.003125905990600586, "step": 8836} {"info/global_step": 8837, "train_info/time_within_train_step": 2.7559823989868164, "step": 8837} {"train_info/time_between_train_steps": 0.003156900405883789, "step": 8837} {"info/global_step": 8838, "train_info/time_within_train_step": 2.75542950630188, "step": 8838} {"train_info/time_between_train_steps": 0.0033075809478759766, "step": 8838} {"info/global_step": 8839, "train_info/time_within_train_step": 2.757209062576294, "step": 8839} {"train_info/time_between_train_steps": 0.003359556198120117, "step": 8839} {"info/global_step": 8840, "train_info/time_within_train_step": 2.756072998046875, "step": 8840} {"train_info/time_between_train_steps": 0.003378629684448242, "step": 8840} {"info/global_step": 8841, "train_info/time_within_train_step": 2.7563037872314453, "step": 8841} {"train_info/time_between_train_steps": 0.0034911632537841797, "step": 8841} {"info/global_step": 8842, "train_info/time_within_train_step": 2.7564213275909424, "step": 8842} {"train_info/time_between_train_steps": 0.003282308578491211, "step": 8842} {"info/global_step": 8843, "train_info/time_within_train_step": 2.882927417755127, "step": 8843} {"train_info/time_between_train_steps": 0.003400564193725586, "step": 8843} {"info/global_step": 8844, "train_info/time_within_train_step": 2.757128953933716, "step": 8844} {"train_info/time_between_train_steps": 0.003373384475708008, "step": 8844} {"info/global_step": 8845, "train_info/time_within_train_step": 2.757098913192749, "step": 8845} {"train_info/time_between_train_steps": 0.003331899642944336, "step": 8845} {"info/global_step": 8846, "train_info/time_within_train_step": 2.757176399230957, "step": 8846} {"train_info/time_between_train_steps": 0.0033693313598632812, "step": 8846} {"info/global_step": 8847, "train_info/time_within_train_step": 2.758448362350464, "step": 8847} {"train_info/time_between_train_steps": 0.0033235549926757812, "step": 8847} {"info/global_step": 8848, "train_info/time_within_train_step": 2.7573704719543457, "step": 8848} {"train_info/time_between_train_steps": 0.0033295154571533203, "step": 8848} {"info/global_step": 8849, "train_info/time_within_train_step": 2.7579236030578613, "step": 8849} {"train_info/time_between_train_steps": 0.0033757686614990234, "step": 8849} {"info/global_step": 8850, "train_info/time_within_train_step": 2.7576282024383545, "step": 8850} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746591517, "_runtime": 25526}, "step": 8850} {"logs": {"train/loss": 2.9743, "train/learning_rate": 7.666666666666666e-05, "train/epoch": 10.03, "_timestamp": 1746591517, "_runtime": 25526}, "step": 8850} {"train_info/time_between_train_steps": 0.0071849822998046875, "step": 8850} {"info/global_step": 8851, "train_info/time_within_train_step": 2.7585573196411133, "step": 8851} {"train_info/time_between_train_steps": 0.0033838748931884766, "step": 8851} {"info/global_step": 8852, "train_info/time_within_train_step": 2.7577645778656006, "step": 8852} {"train_info/time_between_train_steps": 0.003361940383911133, "step": 8852} {"info/global_step": 8853, "train_info/time_within_train_step": 3.0157315731048584, "step": 8853} {"train_info/time_between_train_steps": 0.003199338912963867, "step": 8853} {"info/global_step": 8854, "train_info/time_within_train_step": 2.755023956298828, "step": 8854} {"train_info/time_between_train_steps": 0.0033884048461914062, "step": 8854} {"info/global_step": 8855, "train_info/time_within_train_step": 2.7572364807128906, "step": 8855} {"train_info/time_between_train_steps": 0.003390073776245117, "step": 8855} {"info/global_step": 8856, "train_info/time_within_train_step": 2.7559421062469482, "step": 8856} {"train_info/time_between_train_steps": 0.003339052200317383, "step": 8856} {"info/global_step": 8857, "train_info/time_within_train_step": 2.7562501430511475, "step": 8857} {"train_info/time_between_train_steps": 0.003332853317260742, "step": 8857} {"info/global_step": 8858, "train_info/time_within_train_step": 2.7568864822387695, "step": 8858} {"train_info/time_between_train_steps": 0.003351449966430664, "step": 8858} {"info/global_step": 8859, "train_info/time_within_train_step": 2.756619930267334, "step": 8859} {"train_info/time_between_train_steps": 0.0032889842987060547, "step": 8859} {"info/global_step": 8860, "train_info/time_within_train_step": 2.7575531005859375, "step": 8860} {"train_info/time_between_train_steps": 0.0033159255981445312, "step": 8860} {"info/global_step": 8861, "train_info/time_within_train_step": 2.756031036376953, "step": 8861} {"train_info/time_between_train_steps": 0.0033228397369384766, "step": 8861} {"info/global_step": 8862, "train_info/time_within_train_step": 2.7563858032226562, "step": 8862} {"train_info/time_between_train_steps": 0.003312826156616211, "step": 8862} {"info/global_step": 8863, "train_info/time_within_train_step": 2.7575838565826416, "step": 8863} {"train_info/time_between_train_steps": 0.003356456756591797, "step": 8863} {"info/global_step": 8864, "train_info/time_within_train_step": 2.757397174835205, "step": 8864} {"train_info/time_between_train_steps": 0.003301382064819336, "step": 8864} {"info/global_step": 8865, "train_info/time_within_train_step": 2.7559499740600586, "step": 8865} {"train_info/time_between_train_steps": 0.0034682750701904297, "step": 8865} {"info/global_step": 8866, "train_info/time_within_train_step": 2.7573461532592773, "step": 8866} {"train_info/time_between_train_steps": 0.0033538341522216797, "step": 8866} {"info/global_step": 8867, "train_info/time_within_train_step": 2.756965398788452, "step": 8867} {"train_info/time_between_train_steps": 0.003281831741333008, "step": 8867} {"info/global_step": 8868, "train_info/time_within_train_step": 2.757537364959717, "step": 8868} {"train_info/time_between_train_steps": 0.003325939178466797, "step": 8868} {"info/global_step": 8869, "train_info/time_within_train_step": 2.7568721771240234, "step": 8869} {"train_info/time_between_train_steps": 0.0033118724822998047, "step": 8869} {"info/global_step": 8870, "train_info/time_within_train_step": 2.756514072418213, "step": 8870} {"train_info/time_between_train_steps": 0.0033104419708251953, "step": 8870} {"info/global_step": 8871, "train_info/time_within_train_step": 2.757134437561035, "step": 8871} {"train_info/time_between_train_steps": 0.0033588409423828125, "step": 8871} {"info/global_step": 8872, "train_info/time_within_train_step": 2.7557477951049805, "step": 8872} {"train_info/time_between_train_steps": 0.003355264663696289, "step": 8872} {"info/global_step": 8873, "train_info/time_within_train_step": 2.7575926780700684, "step": 8873} {"train_info/time_between_train_steps": 0.003290891647338867, "step": 8873} {"info/global_step": 8874, "train_info/time_within_train_step": 2.757054567337036, "step": 8874} {"train_info/time_between_train_steps": 0.003421306610107422, "step": 8874} {"info/global_step": 8875, "train_info/time_within_train_step": 2.756627321243286, "step": 8875} {"train_info/time_between_train_steps": 0.0033750534057617188, "step": 8875} {"info/global_step": 8876, "train_info/time_within_train_step": 2.7571418285369873, "step": 8876} {"train_info/time_between_train_steps": 0.003331422805786133, "step": 8876} {"info/global_step": 8877, "train_info/time_within_train_step": 2.756967782974243, "step": 8877} {"train_info/time_between_train_steps": 0.0033674240112304688, "step": 8877} {"info/global_step": 8878, "train_info/time_within_train_step": 2.7571768760681152, "step": 8878} {"train_info/time_between_train_steps": 0.003313779830932617, "step": 8878} {"info/global_step": 8879, "train_info/time_within_train_step": 2.7581770420074463, "step": 8879} {"train_info/time_between_train_steps": 0.003329753875732422, "step": 8879} {"info/global_step": 8880, "train_info/time_within_train_step": 2.757397413253784, "step": 8880} {"train_info/time_between_train_steps": 0.0033414363861083984, "step": 8880} {"info/global_step": 8881, "train_info/time_within_train_step": 2.757012367248535, "step": 8881} {"train_info/time_between_train_steps": 0.0033233165740966797, "step": 8881} {"info/global_step": 8882, "train_info/time_within_train_step": 2.7569615840911865, "step": 8882} {"train_info/time_between_train_steps": 0.0033071041107177734, "step": 8882} {"info/global_step": 8883, "train_info/time_within_train_step": 2.7567338943481445, "step": 8883} {"train_info/time_between_train_steps": 0.003341197967529297, "step": 8883} {"info/global_step": 8884, "train_info/time_within_train_step": 2.7575812339782715, "step": 8884} {"train_info/time_between_train_steps": 0.003326892852783203, "step": 8884} {"info/global_step": 8885, "train_info/time_within_train_step": 2.7570433616638184, "step": 8885} {"train_info/time_between_train_steps": 0.003308534622192383, "step": 8885} {"info/global_step": 8886, "train_info/time_within_train_step": 2.7557194232940674, "step": 8886} {"train_info/time_between_train_steps": 0.003339052200317383, "step": 8886} {"info/global_step": 8887, "train_info/time_within_train_step": 2.7571353912353516, "step": 8887} {"train_info/time_between_train_steps": 0.0033445358276367188, "step": 8887} {"info/global_step": 8888, "train_info/time_within_train_step": 2.7554101943969727, "step": 8888} {"train_info/time_between_train_steps": 0.003369569778442383, "step": 8888} {"info/global_step": 8889, "train_info/time_within_train_step": 2.7567150592803955, "step": 8889} {"train_info/time_between_train_steps": 0.003351449966430664, "step": 8889} {"info/global_step": 8890, "train_info/time_within_train_step": 2.756361246109009, "step": 8890} {"train_info/time_between_train_steps": 0.003319978713989258, "step": 8890} {"info/global_step": 8891, "train_info/time_within_train_step": 2.7563116550445557, "step": 8891} {"train_info/time_between_train_steps": 0.003314971923828125, "step": 8891} {"info/global_step": 8892, "train_info/time_within_train_step": 2.7555296421051025, "step": 8892} {"train_info/time_between_train_steps": 0.0033676624298095703, "step": 8892} {"info/global_step": 8893, "train_info/time_within_train_step": 2.756376266479492, "step": 8893} {"train_info/time_between_train_steps": 0.003343820571899414, "step": 8893} {"info/global_step": 8894, "train_info/time_within_train_step": 2.756579875946045, "step": 8894} {"train_info/time_between_train_steps": 0.003324747085571289, "step": 8894} {"info/global_step": 8895, "train_info/time_within_train_step": 3.016239881515503, "step": 8895} {"train_info/time_between_train_steps": 0.0033223628997802734, "step": 8895} {"info/global_step": 8896, "train_info/time_within_train_step": 2.7581465244293213, "step": 8896} {"train_info/time_between_train_steps": 0.0033359527587890625, "step": 8896} {"info/global_step": 8897, "train_info/time_within_train_step": 2.7565362453460693, "step": 8897} {"train_info/time_between_train_steps": 0.003348827362060547, "step": 8897} {"info/global_step": 8898, "train_info/time_within_train_step": 2.7569074630737305, "step": 8898} {"train_info/time_between_train_steps": 0.0033316612243652344, "step": 8898} {"info/global_step": 8899, "train_info/time_within_train_step": 2.756969690322876, "step": 8899} {"train_info/time_between_train_steps": 0.0033121109008789062, "step": 8899} {"info/global_step": 8900, "train_info/time_within_train_step": 2.757991313934326, "step": 8900} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746591656, "_runtime": 25665}, "step": 8900} {"logs": {"train/loss": 2.9805, "train/learning_rate": 7.333333333333332e-05, "train/epoch": 10.04, "_timestamp": 1746591656, "_runtime": 25665}, "step": 8900} {"train_info/time_between_train_steps": 0.006757020950317383, "step": 8900} {"info/global_step": 8901, "train_info/time_within_train_step": 2.7570295333862305, "step": 8901} {"train_info/time_between_train_steps": 0.0033028125762939453, "step": 8901} {"info/global_step": 8902, "train_info/time_within_train_step": 2.756852388381958, "step": 8902} {"train_info/time_between_train_steps": 0.0032927989959716797, "step": 8902} {"info/global_step": 8903, "train_info/time_within_train_step": 2.7564945220947266, "step": 8903} {"train_info/time_between_train_steps": 0.003368854522705078, "step": 8903} {"info/global_step": 8904, "train_info/time_within_train_step": 2.7578985691070557, "step": 8904} {"train_info/time_between_train_steps": 0.0033164024353027344, "step": 8904} {"info/global_step": 8905, "train_info/time_within_train_step": 2.7562294006347656, "step": 8905} {"train_info/time_between_train_steps": 0.12971282005310059, "step": 8905} {"info/global_step": 8906, "train_info/time_within_train_step": 2.7564914226531982, "step": 8906} {"train_info/time_between_train_steps": 0.003392934799194336, "step": 8906} {"info/global_step": 8907, "train_info/time_within_train_step": 2.756030797958374, "step": 8907} {"train_info/time_between_train_steps": 0.003305196762084961, "step": 8907} {"info/global_step": 8908, "train_info/time_within_train_step": 2.756906270980835, "step": 8908} {"train_info/time_between_train_steps": 0.0033538341522216797, "step": 8908} {"info/global_step": 8909, "train_info/time_within_train_step": 2.7572755813598633, "step": 8909} {"train_info/time_between_train_steps": 0.003321409225463867, "step": 8909} {"info/global_step": 8910, "train_info/time_within_train_step": 2.7561545372009277, "step": 8910} {"train_info/time_between_train_steps": 0.0033037662506103516, "step": 8910} {"info/global_step": 8911, "train_info/time_within_train_step": 2.757627248764038, "step": 8911} {"train_info/time_between_train_steps": 0.003312349319458008, "step": 8911} {"info/global_step": 8912, "train_info/time_within_train_step": 2.756889581680298, "step": 8912} {"train_info/time_between_train_steps": 0.0033447742462158203, "step": 8912} {"info/global_step": 8913, "train_info/time_within_train_step": 2.7569923400878906, "step": 8913} {"train_info/time_between_train_steps": 0.003312826156616211, "step": 8913} {"info/global_step": 8914, "train_info/time_within_train_step": 2.757866382598877, "step": 8914} {"train_info/time_between_train_steps": 0.0033597946166992188, "step": 8914} {"info/global_step": 8915, "train_info/time_within_train_step": 2.757533073425293, "step": 8915} {"train_info/time_between_train_steps": 0.003342866897583008, "step": 8915} {"info/global_step": 8916, "train_info/time_within_train_step": 2.7570881843566895, "step": 8916} {"train_info/time_between_train_steps": 0.003572225570678711, "step": 8916} {"info/global_step": 8917, "train_info/time_within_train_step": 2.7567853927612305, "step": 8917} {"train_info/time_between_train_steps": 0.003373861312866211, "step": 8917} {"info/global_step": 8918, "train_info/time_within_train_step": 2.7562668323516846, "step": 8918} {"train_info/time_between_train_steps": 0.0033719539642333984, "step": 8918} {"info/global_step": 8919, "train_info/time_within_train_step": 2.7570953369140625, "step": 8919} {"train_info/time_between_train_steps": 0.003370046615600586, "step": 8919} {"info/global_step": 8920, "train_info/time_within_train_step": 2.7570993900299072, "step": 8920} {"train_info/time_between_train_steps": 0.0033617019653320312, "step": 8920} {"info/global_step": 8921, "train_info/time_within_train_step": 2.7573142051696777, "step": 8921} {"train_info/time_between_train_steps": 0.003481626510620117, "step": 8921} {"info/global_step": 8922, "train_info/time_within_train_step": 2.757341146469116, "step": 8922} {"train_info/time_between_train_steps": 0.0032987594604492188, "step": 8922} {"info/global_step": 8923, "train_info/time_within_train_step": 2.7572433948516846, "step": 8923} {"train_info/time_between_train_steps": 0.003334522247314453, "step": 8923} {"info/global_step": 8924, "train_info/time_within_train_step": 2.7578299045562744, "step": 8924} {"train_info/time_between_train_steps": 0.0033235549926757812, "step": 8924} {"info/global_step": 8925, "train_info/time_within_train_step": 2.756852626800537, "step": 8925} {"train_info/time_between_train_steps": 0.0033097267150878906, "step": 8925} {"info/global_step": 8926, "train_info/time_within_train_step": 2.7570433616638184, "step": 8926} {"train_info/time_between_train_steps": 0.003374338150024414, "step": 8926} {"info/global_step": 8927, "train_info/time_within_train_step": 2.7563247680664062, "step": 8927} {"train_info/time_between_train_steps": 0.0033364295959472656, "step": 8927} {"info/global_step": 8928, "train_info/time_within_train_step": 2.756319522857666, "step": 8928} {"train_info/time_between_train_steps": 0.003359556198120117, "step": 8928} {"info/global_step": 8929, "train_info/time_within_train_step": 2.757512331008911, "step": 8929} {"train_info/time_between_train_steps": 0.0033082962036132812, "step": 8929} {"info/global_step": 8930, "train_info/time_within_train_step": 2.7557969093322754, "step": 8930} {"train_info/time_between_train_steps": 0.0033266544342041016, "step": 8930} {"info/global_step": 8931, "train_info/time_within_train_step": 2.756453275680542, "step": 8931} {"train_info/time_between_train_steps": 0.0033152103424072266, "step": 8931} {"info/global_step": 8932, "train_info/time_within_train_step": 2.7572195529937744, "step": 8932} {"train_info/time_between_train_steps": 0.003342866897583008, "step": 8932} {"info/global_step": 8933, "train_info/time_within_train_step": 2.758146047592163, "step": 8933} {"train_info/time_between_train_steps": 0.0033028125762939453, "step": 8933} {"info/global_step": 8934, "train_info/time_within_train_step": 2.757486343383789, "step": 8934} {"train_info/time_between_train_steps": 0.0033349990844726562, "step": 8934} {"info/global_step": 8935, "train_info/time_within_train_step": 2.757150173187256, "step": 8935} {"train_info/time_between_train_steps": 0.0033783912658691406, "step": 8935} {"info/global_step": 8936, "train_info/time_within_train_step": 3.018730878829956, "step": 8936} {"train_info/time_between_train_steps": 0.0032799243927001953, "step": 8936} {"info/global_step": 8937, "train_info/time_within_train_step": 2.7575488090515137, "step": 8937} {"train_info/time_between_train_steps": 0.0033364295959472656, "step": 8937} {"info/global_step": 8938, "train_info/time_within_train_step": 2.7571403980255127, "step": 8938} {"train_info/time_between_train_steps": 0.0032770633697509766, "step": 8938} {"info/global_step": 8939, "train_info/time_within_train_step": 2.7575581073760986, "step": 8939} {"train_info/time_between_train_steps": 0.003325939178466797, "step": 8939} {"info/global_step": 8940, "train_info/time_within_train_step": 2.7574808597564697, "step": 8940} {"train_info/time_between_train_steps": 0.0033364295959472656, "step": 8940} {"info/global_step": 8941, "train_info/time_within_train_step": 2.7558016777038574, "step": 8941} {"train_info/time_between_train_steps": 0.0033185482025146484, "step": 8941} {"info/global_step": 8942, "train_info/time_within_train_step": 2.7566514015197754, "step": 8942} {"train_info/time_between_train_steps": 0.0033402442932128906, "step": 8942} {"info/global_step": 8943, "train_info/time_within_train_step": 2.756460428237915, "step": 8943} {"train_info/time_between_train_steps": 0.003349781036376953, "step": 8943} {"info/global_step": 8944, "train_info/time_within_train_step": 2.7568650245666504, "step": 8944} {"train_info/time_between_train_steps": 0.0033266544342041016, "step": 8944} {"info/global_step": 8945, "train_info/time_within_train_step": 2.756490468978882, "step": 8945} {"train_info/time_between_train_steps": 0.003289461135864258, "step": 8945} {"info/global_step": 8946, "train_info/time_within_train_step": 2.756260871887207, "step": 8946} {"train_info/time_between_train_steps": 0.0033271312713623047, "step": 8946} {"info/global_step": 8947, "train_info/time_within_train_step": 2.7556300163269043, "step": 8947} {"train_info/time_between_train_steps": 0.0033266544342041016, "step": 8947} {"info/global_step": 8948, "train_info/time_within_train_step": 2.7561793327331543, "step": 8948} {"train_info/time_between_train_steps": 0.003395557403564453, "step": 8948} {"info/global_step": 8949, "train_info/time_within_train_step": 2.7574713230133057, "step": 8949} {"train_info/time_between_train_steps": 0.003368854522705078, "step": 8949} {"info/global_step": 8950, "train_info/time_within_train_step": 2.756528377532959, "step": 8950} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746591794, "_runtime": 25803}, "step": 8950} {"logs": {"train/loss": 2.9763, "train/learning_rate": 7e-05, "train/epoch": 10.04, "_timestamp": 1746591794, "_runtime": 25803}, "step": 8950} {"train_info/time_between_train_steps": 0.007064342498779297, "step": 8950} {"info/global_step": 8951, "train_info/time_within_train_step": 2.7568397521972656, "step": 8951} {"train_info/time_between_train_steps": 0.0033059120178222656, "step": 8951} {"info/global_step": 8952, "train_info/time_within_train_step": 2.7571260929107666, "step": 8952} {"train_info/time_between_train_steps": 0.0033168792724609375, "step": 8952} {"info/global_step": 8953, "train_info/time_within_train_step": 2.757028102874756, "step": 8953} {"train_info/time_between_train_steps": 0.0033369064331054688, "step": 8953} {"info/global_step": 8954, "train_info/time_within_train_step": 2.756403684616089, "step": 8954} {"train_info/time_between_train_steps": 0.003294229507446289, "step": 8954} {"info/global_step": 8955, "train_info/time_within_train_step": 2.7570173740386963, "step": 8955} {"train_info/time_between_train_steps": 0.0032935142517089844, "step": 8955} {"info/global_step": 8956, "train_info/time_within_train_step": 2.7566232681274414, "step": 8956} {"train_info/time_between_train_steps": 0.0033178329467773438, "step": 8956} {"info/global_step": 8957, "train_info/time_within_train_step": 2.7581911087036133, "step": 8957} {"train_info/time_between_train_steps": 0.0033304691314697266, "step": 8957} {"info/global_step": 8958, "train_info/time_within_train_step": 2.7572526931762695, "step": 8958} {"train_info/time_between_train_steps": 0.003326416015625, "step": 8958} {"info/global_step": 8959, "train_info/time_within_train_step": 2.7576911449432373, "step": 8959} {"train_info/time_between_train_steps": 0.0033376216888427734, "step": 8959} {"info/global_step": 8960, "train_info/time_within_train_step": 2.7569327354431152, "step": 8960} {"train_info/time_between_train_steps": 0.003346681594848633, "step": 8960} {"info/global_step": 8961, "train_info/time_within_train_step": 2.7556982040405273, "step": 8961} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 8961} {"info/global_step": 8962, "train_info/time_within_train_step": 2.754399061203003, "step": 8962} {"train_info/time_between_train_steps": 0.003124713897705078, "step": 8962} {"info/global_step": 8963, "train_info/time_within_train_step": 2.754946708679199, "step": 8963} {"train_info/time_between_train_steps": 0.0032057762145996094, "step": 8963} {"info/global_step": 8964, "train_info/time_within_train_step": 2.7546627521514893, "step": 8964} {"train_info/time_between_train_steps": 0.0031585693359375, "step": 8964} {"info/global_step": 8965, "train_info/time_within_train_step": 2.754939556121826, "step": 8965} {"train_info/time_between_train_steps": 0.0031354427337646484, "step": 8965} {"info/global_step": 8966, "train_info/time_within_train_step": 2.7555956840515137, "step": 8966} {"train_info/time_between_train_steps": 0.0031442642211914062, "step": 8966} {"info/global_step": 8967, "train_info/time_within_train_step": 2.755023717880249, "step": 8967} {"train_info/time_between_train_steps": 0.0031609535217285156, "step": 8967} {"info/global_step": 8968, "train_info/time_within_train_step": 2.8812096118927, "step": 8968} {"train_info/time_between_train_steps": 0.0031566619873046875, "step": 8968} {"info/global_step": 8969, "train_info/time_within_train_step": 2.754516363143921, "step": 8969} {"train_info/time_between_train_steps": 0.0031883716583251953, "step": 8969} {"info/global_step": 8970, "train_info/time_within_train_step": 2.756047010421753, "step": 8970} {"train_info/time_between_train_steps": 0.0032393932342529297, "step": 8970} {"info/global_step": 8971, "train_info/time_within_train_step": 2.7560317516326904, "step": 8971} {"train_info/time_between_train_steps": 0.0031843185424804688, "step": 8971} {"info/global_step": 8972, "train_info/time_within_train_step": 2.755183696746826, "step": 8972} {"train_info/time_between_train_steps": 0.0032281875610351562, "step": 8972} {"info/global_step": 8973, "train_info/time_within_train_step": 2.7547764778137207, "step": 8973} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 8973} {"info/global_step": 8974, "train_info/time_within_train_step": 2.755164623260498, "step": 8974} {"train_info/time_between_train_steps": 0.0031633377075195312, "step": 8974} {"info/global_step": 8975, "train_info/time_within_train_step": 2.7550811767578125, "step": 8975} {"train_info/time_between_train_steps": 0.0032134056091308594, "step": 8975} {"info/global_step": 8976, "train_info/time_within_train_step": 2.7559967041015625, "step": 8976} {"train_info/time_between_train_steps": 0.0031845569610595703, "step": 8976} {"info/global_step": 8977, "train_info/time_within_train_step": 2.755704402923584, "step": 8977} {"train_info/time_between_train_steps": 0.003319263458251953, "step": 8977} {"info/global_step": 8978, "train_info/time_within_train_step": 2.7570533752441406, "step": 8978} {"train_info/time_between_train_steps": 0.003336191177368164, "step": 8978} {"info/global_step": 8979, "train_info/time_within_train_step": 2.7572340965270996, "step": 8979} {"train_info/time_between_train_steps": 0.0033416748046875, "step": 8979} {"info/global_step": 8980, "train_info/time_within_train_step": 2.756880760192871, "step": 8980} {"train_info/time_between_train_steps": 0.003358125686645508, "step": 8980} {"info/global_step": 8981, "train_info/time_within_train_step": 2.7568535804748535, "step": 8981} {"train_info/time_between_train_steps": 0.0034177303314208984, "step": 8981} {"info/global_step": 8982, "train_info/time_within_train_step": 2.7583553791046143, "step": 8982} {"train_info/time_between_train_steps": 0.003334522247314453, "step": 8982} {"info/global_step": 8983, "train_info/time_within_train_step": 2.7576708793640137, "step": 8983} {"train_info/time_between_train_steps": 0.0033855438232421875, "step": 8983} {"info/global_step": 8984, "train_info/time_within_train_step": 2.7575104236602783, "step": 8984} {"train_info/time_between_train_steps": 0.0033462047576904297, "step": 8984} {"info/global_step": 8985, "train_info/time_within_train_step": 2.7574880123138428, "step": 8985} {"train_info/time_between_train_steps": 0.003299713134765625, "step": 8985} {"info/global_step": 8986, "train_info/time_within_train_step": 2.7564172744750977, "step": 8986} {"train_info/time_between_train_steps": 0.0033843517303466797, "step": 8986} {"info/global_step": 8987, "train_info/time_within_train_step": 2.755458354949951, "step": 8987} {"train_info/time_between_train_steps": 0.0033676624298095703, "step": 8987} {"info/global_step": 8988, "train_info/time_within_train_step": 2.757564067840576, "step": 8988} {"train_info/time_between_train_steps": 0.0033397674560546875, "step": 8988} {"info/global_step": 8989, "train_info/time_within_train_step": 2.757434129714966, "step": 8989} {"train_info/time_between_train_steps": 0.003343820571899414, "step": 8989} {"info/global_step": 8990, "train_info/time_within_train_step": 2.7564547061920166, "step": 8990} {"train_info/time_between_train_steps": 0.0034580230712890625, "step": 8990} {"info/global_step": 8991, "train_info/time_within_train_step": 2.7576470375061035, "step": 8991} {"train_info/time_between_train_steps": 0.0033485889434814453, "step": 8991} {"info/global_step": 8992, "train_info/time_within_train_step": 2.7579305171966553, "step": 8992} {"train_info/time_between_train_steps": 0.0034012794494628906, "step": 8992} {"info/global_step": 8993, "train_info/time_within_train_step": 2.7581658363342285, "step": 8993} {"train_info/time_between_train_steps": 0.0033578872680664062, "step": 8993} {"info/global_step": 8994, "train_info/time_within_train_step": 2.756718158721924, "step": 8994} {"train_info/time_between_train_steps": 0.003385305404663086, "step": 8994} {"info/global_step": 8995, "train_info/time_within_train_step": 3.333460569381714, "step": 8995} {"train_info/time_between_train_steps": 0.003360271453857422, "step": 8995} {"info/global_step": 8996, "train_info/time_within_train_step": 2.7524943351745605, "step": 8996} {"train_info/time_between_train_steps": 0.0034024715423583984, "step": 8996} {"info/global_step": 8997, "train_info/time_within_train_step": 2.7556965351104736, "step": 8997} {"train_info/time_between_train_steps": 0.0033416748046875, "step": 8997} {"info/global_step": 8998, "train_info/time_within_train_step": 2.7548983097076416, "step": 8998} {"train_info/time_between_train_steps": 0.0031762123107910156, "step": 8998} {"info/global_step": 8999, "train_info/time_within_train_step": 2.7552149295806885, "step": 8999} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 8999} {"info/global_step": 9000, "train_info/time_within_train_step": 2.75575852394104, "step": 9000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746591933, "_runtime": 25942}, "step": 9000} {"logs": {"train/loss": 2.9634, "train/learning_rate": 6.666666666666666e-05, "train/epoch": 10.05, "_timestamp": 1746591933, "_runtime": 25942}, "step": 9000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746591938, "_runtime": 25947}, "step": 9000} {"logs": {"eval/loss": 4.856907367706299, "eval/runtime": 5.1267, "eval/samples_per_second": 37.061, "eval/steps_per_second": 1.17, "train/epoch": 10.05, "_timestamp": 1746591938, "_runtime": 25947}, "step": 9000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746591938, "_runtime": 25947}, "step": 9000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.856907367706299, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 128.6257940755881, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1267, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 37.061, "train/epoch": 10.05, "_timestamp": 1746591938, "_runtime": 25947}, "step": 9000} {"train_info/time_between_train_steps": 18.315775156021118, "step": 9000} {"info/global_step": 9001, "train_info/time_within_train_step": 2.536684989929199, "step": 9001} {"train_info/time_between_train_steps": 0.003378629684448242, "step": 9001} {"info/global_step": 9002, "train_info/time_within_train_step": 2.5731453895568848, "step": 9002} {"train_info/time_between_train_steps": 0.0032079219818115234, "step": 9002} {"info/global_step": 9003, "train_info/time_within_train_step": 2.701124668121338, "step": 9003} {"train_info/time_between_train_steps": 0.0033235549926757812, "step": 9003} {"info/global_step": 9004, "train_info/time_within_train_step": 2.7508480548858643, "step": 9004} {"train_info/time_between_train_steps": 0.003314495086669922, "step": 9004} {"info/global_step": 9005, "train_info/time_within_train_step": 2.750889778137207, "step": 9005} {"train_info/time_between_train_steps": 0.0037288665771484375, "step": 9005} {"info/global_step": 9006, "train_info/time_within_train_step": 2.754603624343872, "step": 9006} {"train_info/time_between_train_steps": 0.003808259963989258, "step": 9006} {"info/global_step": 9007, "train_info/time_within_train_step": 2.7569327354431152, "step": 9007} {"train_info/time_between_train_steps": 0.003194093704223633, "step": 9007} {"info/global_step": 9008, "train_info/time_within_train_step": 2.7555713653564453, "step": 9008} {"train_info/time_between_train_steps": 0.0032112598419189453, "step": 9008} {"info/global_step": 9009, "train_info/time_within_train_step": 2.7544631958007812, "step": 9009} {"train_info/time_between_train_steps": 0.003193378448486328, "step": 9009} {"info/global_step": 9010, "train_info/time_within_train_step": 2.7580087184906006, "step": 9010} {"train_info/time_between_train_steps": 0.0034410953521728516, "step": 9010} {"info/global_step": 9011, "train_info/time_within_train_step": 2.7564806938171387, "step": 9011} {"train_info/time_between_train_steps": 0.0033445358276367188, "step": 9011} {"info/global_step": 9012, "train_info/time_within_train_step": 2.7566001415252686, "step": 9012} {"train_info/time_between_train_steps": 0.0032453536987304688, "step": 9012} {"info/global_step": 9013, "train_info/time_within_train_step": 2.75765323638916, "step": 9013} {"train_info/time_between_train_steps": 0.0033447742462158203, "step": 9013} {"info/global_step": 9014, "train_info/time_within_train_step": 2.7567834854125977, "step": 9014} {"train_info/time_between_train_steps": 0.0032842159271240234, "step": 9014} {"info/global_step": 9015, "train_info/time_within_train_step": 2.7580230236053467, "step": 9015} {"train_info/time_between_train_steps": 0.003734588623046875, "step": 9015} {"info/global_step": 9016, "train_info/time_within_train_step": 3.0503246784210205, "step": 9016} {"train_info/time_between_train_steps": 0.0033292770385742188, "step": 9016} {"info/global_step": 9017, "train_info/time_within_train_step": 2.759174346923828, "step": 9017} {"train_info/time_between_train_steps": 0.0034093856811523438, "step": 9017} {"info/global_step": 9018, "train_info/time_within_train_step": 2.7593917846679688, "step": 9018} {"train_info/time_between_train_steps": 0.003378629684448242, "step": 9018} {"info/global_step": 9019, "train_info/time_within_train_step": 2.75974178314209, "step": 9019} {"train_info/time_between_train_steps": 0.004026889801025391, "step": 9019} {"info/global_step": 9020, "train_info/time_within_train_step": 2.7584080696105957, "step": 9020} {"train_info/time_between_train_steps": 0.003440380096435547, "step": 9020} {"info/global_step": 9021, "train_info/time_within_train_step": 2.7584519386291504, "step": 9021} {"train_info/time_between_train_steps": 0.003539562225341797, "step": 9021} {"info/global_step": 9022, "train_info/time_within_train_step": 2.758570432662964, "step": 9022} {"train_info/time_between_train_steps": 0.0034651756286621094, "step": 9022} {"info/global_step": 9023, "train_info/time_within_train_step": 2.7584822177886963, "step": 9023} {"train_info/time_between_train_steps": 0.0032396316528320312, "step": 9023} {"info/global_step": 9024, "train_info/time_within_train_step": 2.756944179534912, "step": 9024} {"train_info/time_between_train_steps": 0.003402233123779297, "step": 9024} {"info/global_step": 9025, "train_info/time_within_train_step": 2.7575247287750244, "step": 9025} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 9025} {"info/global_step": 9026, "train_info/time_within_train_step": 2.7570302486419678, "step": 9026} {"train_info/time_between_train_steps": 0.003396749496459961, "step": 9026} {"info/global_step": 9027, "train_info/time_within_train_step": 2.7580618858337402, "step": 9027} {"train_info/time_between_train_steps": 0.003268003463745117, "step": 9027} {"info/global_step": 9028, "train_info/time_within_train_step": 2.757246971130371, "step": 9028} {"train_info/time_between_train_steps": 0.003271341323852539, "step": 9028} {"info/global_step": 9029, "train_info/time_within_train_step": 2.7582778930664062, "step": 9029} {"train_info/time_between_train_steps": 0.003270864486694336, "step": 9029} {"info/global_step": 9030, "train_info/time_within_train_step": 2.758810520172119, "step": 9030} {"train_info/time_between_train_steps": 0.10239291191101074, "step": 9030} {"info/global_step": 9031, "train_info/time_within_train_step": 2.765071392059326, "step": 9031} {"train_info/time_between_train_steps": 0.0032918453216552734, "step": 9031} {"info/global_step": 9032, "train_info/time_within_train_step": 2.7568256855010986, "step": 9032} {"train_info/time_between_train_steps": 0.003201723098754883, "step": 9032} {"info/global_step": 9033, "train_info/time_within_train_step": 2.757899522781372, "step": 9033} {"train_info/time_between_train_steps": 0.003214597702026367, "step": 9033} {"info/global_step": 9034, "train_info/time_within_train_step": 2.758077383041382, "step": 9034} {"train_info/time_between_train_steps": 0.0034918785095214844, "step": 9034} {"info/global_step": 9035, "train_info/time_within_train_step": 2.7574737071990967, "step": 9035} {"train_info/time_between_train_steps": 0.003350973129272461, "step": 9035} {"info/global_step": 9036, "train_info/time_within_train_step": 2.756701707839966, "step": 9036} {"train_info/time_between_train_steps": 0.003290891647338867, "step": 9036} {"info/global_step": 9037, "train_info/time_within_train_step": 2.756596565246582, "step": 9037} {"train_info/time_between_train_steps": 0.0032591819763183594, "step": 9037} {"info/global_step": 9038, "train_info/time_within_train_step": 2.7570953369140625, "step": 9038} {"train_info/time_between_train_steps": 0.0033283233642578125, "step": 9038} {"info/global_step": 9039, "train_info/time_within_train_step": 2.756288766860962, "step": 9039} {"train_info/time_between_train_steps": 0.0033299922943115234, "step": 9039} {"info/global_step": 9040, "train_info/time_within_train_step": 2.7564287185668945, "step": 9040} {"train_info/time_between_train_steps": 0.0032808780670166016, "step": 9040} {"info/global_step": 9041, "train_info/time_within_train_step": 2.7566444873809814, "step": 9041} {"train_info/time_between_train_steps": 0.003269672393798828, "step": 9041} {"info/global_step": 9042, "train_info/time_within_train_step": 2.7553608417510986, "step": 9042} {"train_info/time_between_train_steps": 0.0033245086669921875, "step": 9042} {"info/global_step": 9043, "train_info/time_within_train_step": 2.7561092376708984, "step": 9043} {"train_info/time_between_train_steps": 0.0033316612243652344, "step": 9043} {"info/global_step": 9044, "train_info/time_within_train_step": 2.7565407752990723, "step": 9044} {"train_info/time_between_train_steps": 0.0033180713653564453, "step": 9044} {"info/global_step": 9045, "train_info/time_within_train_step": 2.7570433616638184, "step": 9045} {"train_info/time_between_train_steps": 0.0033524036407470703, "step": 9045} {"info/global_step": 9046, "train_info/time_within_train_step": 2.756706714630127, "step": 9046} {"train_info/time_between_train_steps": 0.003347635269165039, "step": 9046} {"info/global_step": 9047, "train_info/time_within_train_step": 2.7559094429016113, "step": 9047} {"train_info/time_between_train_steps": 0.003389596939086914, "step": 9047} {"info/global_step": 9048, "train_info/time_within_train_step": 2.756925582885742, "step": 9048} {"train_info/time_between_train_steps": 0.003385305404663086, "step": 9048} {"info/global_step": 9049, "train_info/time_within_train_step": 2.7565624713897705, "step": 9049} {"train_info/time_between_train_steps": 0.0033173561096191406, "step": 9049} {"info/global_step": 9050, "train_info/time_within_train_step": 2.756704330444336, "step": 9050} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746592090, "_runtime": 26099}, "step": 9050} {"logs": {"train/loss": 2.9559, "train/learning_rate": 6.333333333333333e-05, "train/epoch": 10.05, "_timestamp": 1746592090, "_runtime": 26099}, "step": 9050} {"train_info/time_between_train_steps": 0.007457733154296875, "step": 9050} {"info/global_step": 9051, "train_info/time_within_train_step": 2.756842851638794, "step": 9051} {"train_info/time_between_train_steps": 0.0033464431762695312, "step": 9051} {"info/global_step": 9052, "train_info/time_within_train_step": 2.7569031715393066, "step": 9052} {"train_info/time_between_train_steps": 0.0032813549041748047, "step": 9052} {"info/global_step": 9053, "train_info/time_within_train_step": 2.756664276123047, "step": 9053} {"train_info/time_between_train_steps": 0.0032837390899658203, "step": 9053} {"info/global_step": 9054, "train_info/time_within_train_step": 2.7565231323242188, "step": 9054} {"train_info/time_between_train_steps": 0.0032825469970703125, "step": 9054} {"info/global_step": 9055, "train_info/time_within_train_step": 2.7563958168029785, "step": 9055} {"train_info/time_between_train_steps": 0.003317594528198242, "step": 9055} {"info/global_step": 9056, "train_info/time_within_train_step": 2.7556207180023193, "step": 9056} {"train_info/time_between_train_steps": 0.0033104419708251953, "step": 9056} {"info/global_step": 9057, "train_info/time_within_train_step": 2.7559404373168945, "step": 9057} {"train_info/time_between_train_steps": 0.0033025741577148438, "step": 9057} {"info/global_step": 9058, "train_info/time_within_train_step": 2.7560818195343018, "step": 9058} {"train_info/time_between_train_steps": 0.003315448760986328, "step": 9058} {"info/global_step": 9059, "train_info/time_within_train_step": 2.756619453430176, "step": 9059} {"train_info/time_between_train_steps": 0.003728151321411133, "step": 9059} {"info/global_step": 9060, "train_info/time_within_train_step": 2.755721092224121, "step": 9060} {"train_info/time_between_train_steps": 0.003229379653930664, "step": 9060} {"info/global_step": 9061, "train_info/time_within_train_step": 2.755502223968506, "step": 9061} {"train_info/time_between_train_steps": 0.0032858848571777344, "step": 9061} {"info/global_step": 9062, "train_info/time_within_train_step": 2.7556774616241455, "step": 9062} {"train_info/time_between_train_steps": 0.003459453582763672, "step": 9062} {"info/global_step": 9063, "train_info/time_within_train_step": 2.755746364593506, "step": 9063} {"train_info/time_between_train_steps": 0.0032880306243896484, "step": 9063} {"info/global_step": 9064, "train_info/time_within_train_step": 2.7560155391693115, "step": 9064} {"train_info/time_between_train_steps": 0.0033016204833984375, "step": 9064} {"info/global_step": 9065, "train_info/time_within_train_step": 2.755966901779175, "step": 9065} {"train_info/time_between_train_steps": 0.003289461135864258, "step": 9065} {"info/global_step": 9066, "train_info/time_within_train_step": 2.755688428878784, "step": 9066} {"train_info/time_between_train_steps": 0.003265380859375, "step": 9066} {"info/global_step": 9067, "train_info/time_within_train_step": 2.754169225692749, "step": 9067} {"train_info/time_between_train_steps": 0.0032663345336914062, "step": 9067} {"info/global_step": 9068, "train_info/time_within_train_step": 2.7552449703216553, "step": 9068} {"train_info/time_between_train_steps": 0.003239870071411133, "step": 9068} {"info/global_step": 9069, "train_info/time_within_train_step": 2.7561516761779785, "step": 9069} {"train_info/time_between_train_steps": 0.003369569778442383, "step": 9069} {"info/global_step": 9070, "train_info/time_within_train_step": 2.7557528018951416, "step": 9070} {"train_info/time_between_train_steps": 0.003404378890991211, "step": 9070} {"info/global_step": 9071, "train_info/time_within_train_step": 2.755492925643921, "step": 9071} {"train_info/time_between_train_steps": 0.02089715003967285, "step": 9071} {"info/global_step": 9072, "train_info/time_within_train_step": 2.7545533180236816, "step": 9072} {"train_info/time_between_train_steps": 0.0029249191284179688, "step": 9072} {"info/global_step": 9073, "train_info/time_within_train_step": 2.7547855377197266, "step": 9073} {"train_info/time_between_train_steps": 0.0029401779174804688, "step": 9073} {"info/global_step": 9074, "train_info/time_within_train_step": 3.0196404457092285, "step": 9074} {"train_info/time_between_train_steps": 0.0029201507568359375, "step": 9074} {"info/global_step": 9075, "train_info/time_within_train_step": 2.755460500717163, "step": 9075} {"train_info/time_between_train_steps": 0.002923727035522461, "step": 9075} {"info/global_step": 9076, "train_info/time_within_train_step": 2.75439715385437, "step": 9076} {"train_info/time_between_train_steps": 0.0029044151306152344, "step": 9076} {"info/global_step": 9077, "train_info/time_within_train_step": 2.751558542251587, "step": 9077} {"train_info/time_between_train_steps": 0.0029287338256835938, "step": 9077} {"info/global_step": 9078, "train_info/time_within_train_step": 2.754788875579834, "step": 9078} {"train_info/time_between_train_steps": 0.0028984546661376953, "step": 9078} {"info/global_step": 9079, "train_info/time_within_train_step": 2.7551300525665283, "step": 9079} {"train_info/time_between_train_steps": 0.0029282569885253906, "step": 9079} {"info/global_step": 9080, "train_info/time_within_train_step": 2.75512957572937, "step": 9080} {"train_info/time_between_train_steps": 0.002971649169921875, "step": 9080} {"info/global_step": 9081, "train_info/time_within_train_step": 2.75610613822937, "step": 9081} {"train_info/time_between_train_steps": 0.0029969215393066406, "step": 9081} {"info/global_step": 9082, "train_info/time_within_train_step": 2.7550745010375977, "step": 9082} {"train_info/time_between_train_steps": 0.003015279769897461, "step": 9082} {"info/global_step": 9083, "train_info/time_within_train_step": 2.754971981048584, "step": 9083} {"train_info/time_between_train_steps": 0.0030400753021240234, "step": 9083} {"info/global_step": 9084, "train_info/time_within_train_step": 2.7560434341430664, "step": 9084} {"train_info/time_between_train_steps": 0.002997159957885742, "step": 9084} {"info/global_step": 9085, "train_info/time_within_train_step": 2.7553622722625732, "step": 9085} {"train_info/time_between_train_steps": 0.0029609203338623047, "step": 9085} {"info/global_step": 9086, "train_info/time_within_train_step": 2.75555419921875, "step": 9086} {"train_info/time_between_train_steps": 0.0029942989349365234, "step": 9086} {"info/global_step": 9087, "train_info/time_within_train_step": 2.755800724029541, "step": 9087} {"train_info/time_between_train_steps": 0.0029828548431396484, "step": 9087} {"info/global_step": 9088, "train_info/time_within_train_step": 2.7562081813812256, "step": 9088} {"train_info/time_between_train_steps": 0.0029969215393066406, "step": 9088} {"info/global_step": 9089, "train_info/time_within_train_step": 2.761963367462158, "step": 9089} {"train_info/time_between_train_steps": 0.002866506576538086, "step": 9089} {"info/global_step": 9090, "train_info/time_within_train_step": 2.7559080123901367, "step": 9090} {"train_info/time_between_train_steps": 0.002957582473754883, "step": 9090} {"info/global_step": 9091, "train_info/time_within_train_step": 2.7556989192962646, "step": 9091} {"train_info/time_between_train_steps": 0.0029213428497314453, "step": 9091} {"info/global_step": 9092, "train_info/time_within_train_step": 2.7552664279937744, "step": 9092} {"train_info/time_between_train_steps": 0.0029609203338623047, "step": 9092} {"info/global_step": 9093, "train_info/time_within_train_step": 2.753762722015381, "step": 9093} {"train_info/time_between_train_steps": 0.0028777122497558594, "step": 9093} {"info/global_step": 9094, "train_info/time_within_train_step": 2.75526762008667, "step": 9094} {"train_info/time_between_train_steps": 0.002884387969970703, "step": 9094} {"info/global_step": 9095, "train_info/time_within_train_step": 2.754822015762329, "step": 9095} {"train_info/time_between_train_steps": 0.002888917922973633, "step": 9095} {"info/global_step": 9096, "train_info/time_within_train_step": 2.7547390460968018, "step": 9096} {"train_info/time_between_train_steps": 0.0029015541076660156, "step": 9096} {"info/global_step": 9097, "train_info/time_within_train_step": 2.7546956539154053, "step": 9097} {"train_info/time_between_train_steps": 0.0029180049896240234, "step": 9097} {"info/global_step": 9098, "train_info/time_within_train_step": 2.7542407512664795, "step": 9098} {"train_info/time_between_train_steps": 0.0029141902923583984, "step": 9098} {"info/global_step": 9099, "train_info/time_within_train_step": 2.7541189193725586, "step": 9099} {"train_info/time_between_train_steps": 0.002928018569946289, "step": 9099} {"info/global_step": 9100, "train_info/time_within_train_step": 2.7548859119415283, "step": 9100} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746592228, "_runtime": 26237}, "step": 9100} {"logs": {"train/loss": 2.9528, "train/learning_rate": 5.9999999999999995e-05, "train/epoch": 10.06, "_timestamp": 1746592228, "_runtime": 26237}, "step": 9100} {"train_info/time_between_train_steps": 0.006616115570068359, "step": 9100} {"info/global_step": 9101, "train_info/time_within_train_step": 2.7546043395996094, "step": 9101} {"train_info/time_between_train_steps": 0.0028769969940185547, "step": 9101} {"info/global_step": 9102, "train_info/time_within_train_step": 2.754101276397705, "step": 9102} {"train_info/time_between_train_steps": 0.0029273033142089844, "step": 9102} {"info/global_step": 9103, "train_info/time_within_train_step": 2.7548341751098633, "step": 9103} {"train_info/time_between_train_steps": 0.002960681915283203, "step": 9103} {"info/global_step": 9104, "train_info/time_within_train_step": 2.7556161880493164, "step": 9104} {"train_info/time_between_train_steps": 0.002917051315307617, "step": 9104} {"info/global_step": 9105, "train_info/time_within_train_step": 2.756376028060913, "step": 9105} {"train_info/time_between_train_steps": 0.0029344558715820312, "step": 9105} {"info/global_step": 9106, "train_info/time_within_train_step": 2.7620582580566406, "step": 9106} {"train_info/time_between_train_steps": 0.003954887390136719, "step": 9106} {"info/global_step": 9107, "train_info/time_within_train_step": 2.75610613822937, "step": 9107} {"train_info/time_between_train_steps": 0.0029823780059814453, "step": 9107} {"info/global_step": 9108, "train_info/time_within_train_step": 2.7573463916778564, "step": 9108} {"train_info/time_between_train_steps": 0.0035071372985839844, "step": 9108} {"info/global_step": 9109, "train_info/time_within_train_step": 2.7578976154327393, "step": 9109} {"train_info/time_between_train_steps": 0.002922534942626953, "step": 9109} {"info/global_step": 9110, "train_info/time_within_train_step": 2.7557461261749268, "step": 9110} {"train_info/time_between_train_steps": 0.0029273033142089844, "step": 9110} {"info/global_step": 9111, "train_info/time_within_train_step": 2.7546072006225586, "step": 9111} {"train_info/time_between_train_steps": 0.0028769969940185547, "step": 9111} {"info/global_step": 9112, "train_info/time_within_train_step": 2.754537343978882, "step": 9112} {"train_info/time_between_train_steps": 0.0029048919677734375, "step": 9112} {"info/global_step": 9113, "train_info/time_within_train_step": 2.754676580429077, "step": 9113} {"train_info/time_between_train_steps": 0.0029103755950927734, "step": 9113} {"info/global_step": 9114, "train_info/time_within_train_step": 2.754993438720703, "step": 9114} {"train_info/time_between_train_steps": 0.002916574478149414, "step": 9114} {"info/global_step": 9115, "train_info/time_within_train_step": 2.755387306213379, "step": 9115} {"train_info/time_between_train_steps": 0.002892732620239258, "step": 9115} {"info/global_step": 9116, "train_info/time_within_train_step": 2.755413055419922, "step": 9116} {"train_info/time_between_train_steps": 0.0029015541076660156, "step": 9116} {"info/global_step": 9117, "train_info/time_within_train_step": 2.7545180320739746, "step": 9117} {"train_info/time_between_train_steps": 0.0029103755950927734, "step": 9117} {"info/global_step": 9118, "train_info/time_within_train_step": 2.7551701068878174, "step": 9118} {"train_info/time_between_train_steps": 0.002890348434448242, "step": 9118} {"info/global_step": 9119, "train_info/time_within_train_step": 2.951674699783325, "step": 9119} {"train_info/time_between_train_steps": 0.0029337406158447266, "step": 9119} {"info/global_step": 9120, "train_info/time_within_train_step": 2.755563735961914, "step": 9120} {"train_info/time_between_train_steps": 0.0028967857360839844, "step": 9120} {"info/global_step": 9121, "train_info/time_within_train_step": 2.7563700675964355, "step": 9121} {"train_info/time_between_train_steps": 0.0029075145721435547, "step": 9121} {"info/global_step": 9122, "train_info/time_within_train_step": 2.7558538913726807, "step": 9122} {"train_info/time_between_train_steps": 0.002899169921875, "step": 9122} {"info/global_step": 9123, "train_info/time_within_train_step": 2.755397081375122, "step": 9123} {"train_info/time_between_train_steps": 0.003353118896484375, "step": 9123} {"info/global_step": 9124, "train_info/time_within_train_step": 2.7549474239349365, "step": 9124} {"train_info/time_between_train_steps": 0.0028760433197021484, "step": 9124} {"info/global_step": 9125, "train_info/time_within_train_step": 2.7549283504486084, "step": 9125} {"train_info/time_between_train_steps": 0.002912759780883789, "step": 9125} {"info/global_step": 9126, "train_info/time_within_train_step": 2.756220579147339, "step": 9126} {"train_info/time_between_train_steps": 0.0029807090759277344, "step": 9126} {"info/global_step": 9127, "train_info/time_within_train_step": 2.7569937705993652, "step": 9127} {"train_info/time_between_train_steps": 0.0029723644256591797, "step": 9127} {"info/global_step": 9128, "train_info/time_within_train_step": 2.756103515625, "step": 9128} {"train_info/time_between_train_steps": 0.0030031204223632812, "step": 9128} {"info/global_step": 9129, "train_info/time_within_train_step": 2.7566006183624268, "step": 9129} {"train_info/time_between_train_steps": 0.0029692649841308594, "step": 9129} {"info/global_step": 9130, "train_info/time_within_train_step": 2.7568185329437256, "step": 9130} {"train_info/time_between_train_steps": 0.0030040740966796875, "step": 9130} {"info/global_step": 9131, "train_info/time_within_train_step": 2.755789041519165, "step": 9131} {"train_info/time_between_train_steps": 0.0030183792114257812, "step": 9131} {"info/global_step": 9132, "train_info/time_within_train_step": 2.75535249710083, "step": 9132} {"train_info/time_between_train_steps": 0.0029926300048828125, "step": 9132} {"info/global_step": 9133, "train_info/time_within_train_step": 2.7557835578918457, "step": 9133} {"train_info/time_between_train_steps": 0.0029823780059814453, "step": 9133} {"info/global_step": 9134, "train_info/time_within_train_step": 2.7568492889404297, "step": 9134} {"train_info/time_between_train_steps": 0.002970457077026367, "step": 9134} {"info/global_step": 9135, "train_info/time_within_train_step": 2.7572407722473145, "step": 9135} {"train_info/time_between_train_steps": 0.003004312515258789, "step": 9135} {"info/global_step": 9136, "train_info/time_within_train_step": 2.7566587924957275, "step": 9136} {"train_info/time_between_train_steps": 0.0030164718627929688, "step": 9136} {"info/global_step": 9137, "train_info/time_within_train_step": 2.756972312927246, "step": 9137} {"train_info/time_between_train_steps": 0.002991914749145508, "step": 9137} {"info/global_step": 9138, "train_info/time_within_train_step": 2.756726026535034, "step": 9138} {"train_info/time_between_train_steps": 0.0029888153076171875, "step": 9138} {"info/global_step": 9139, "train_info/time_within_train_step": 2.7556211948394775, "step": 9139} {"train_info/time_between_train_steps": 0.0029044151306152344, "step": 9139} {"info/global_step": 9140, "train_info/time_within_train_step": 2.7553870677948, "step": 9140} {"train_info/time_between_train_steps": 0.0028905868530273438, "step": 9140} {"info/global_step": 9141, "train_info/time_within_train_step": 2.7560019493103027, "step": 9141} {"train_info/time_between_train_steps": 0.002937793731689453, "step": 9141} {"info/global_step": 9142, "train_info/time_within_train_step": 2.754533052444458, "step": 9142} {"train_info/time_between_train_steps": 0.0029144287109375, "step": 9142} {"info/global_step": 9143, "train_info/time_within_train_step": 2.756352663040161, "step": 9143} {"train_info/time_between_train_steps": 0.002935171127319336, "step": 9143} {"info/global_step": 9144, "train_info/time_within_train_step": 2.7546842098236084, "step": 9144} {"train_info/time_between_train_steps": 0.0028836727142333984, "step": 9144} {"info/global_step": 9145, "train_info/time_within_train_step": 2.7542977333068848, "step": 9145} {"train_info/time_between_train_steps": 0.0029501914978027344, "step": 9145} {"info/global_step": 9146, "train_info/time_within_train_step": 2.7545154094696045, "step": 9146} {"train_info/time_between_train_steps": 0.002900362014770508, "step": 9146} {"info/global_step": 9147, "train_info/time_within_train_step": 2.755498170852661, "step": 9147} {"train_info/time_between_train_steps": 0.0028913021087646484, "step": 9147} {"info/global_step": 9148, "train_info/time_within_train_step": 2.755042791366577, "step": 9148} {"train_info/time_between_train_steps": 0.002894878387451172, "step": 9148} {"info/global_step": 9149, "train_info/time_within_train_step": 2.7560153007507324, "step": 9149} {"train_info/time_between_train_steps": 0.002994060516357422, "step": 9149} {"info/global_step": 9150, "train_info/time_within_train_step": 2.756927251815796, "step": 9150} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746592366, "_runtime": 26375}, "step": 9150} {"logs": {"train/loss": 2.95, "train/learning_rate": 5.666666666666666e-05, "train/epoch": 10.06, "_timestamp": 1746592366, "_runtime": 26375}, "step": 9150} {"train_info/time_between_train_steps": 0.006599903106689453, "step": 9150} {"info/global_step": 9151, "train_info/time_within_train_step": 2.756436824798584, "step": 9151} {"train_info/time_between_train_steps": 0.0029838085174560547, "step": 9151} {"info/global_step": 9152, "train_info/time_within_train_step": 2.757225275039673, "step": 9152} {"train_info/time_between_train_steps": 0.0034189224243164062, "step": 9152} {"info/global_step": 9153, "train_info/time_within_train_step": 2.756822109222412, "step": 9153} {"train_info/time_between_train_steps": 0.003040313720703125, "step": 9153} {"info/global_step": 9154, "train_info/time_within_train_step": 2.7562971115112305, "step": 9154} {"train_info/time_between_train_steps": 0.0030059814453125, "step": 9154} {"info/global_step": 9155, "train_info/time_within_train_step": 2.7559258937835693, "step": 9155} {"train_info/time_between_train_steps": 0.003012418746948242, "step": 9155} {"info/global_step": 9156, "train_info/time_within_train_step": 2.756340265274048, "step": 9156} {"train_info/time_between_train_steps": 0.0030078887939453125, "step": 9156} {"info/global_step": 9157, "train_info/time_within_train_step": 2.755223512649536, "step": 9157} {"train_info/time_between_train_steps": 0.0029032230377197266, "step": 9157} {"info/global_step": 9158, "train_info/time_within_train_step": 2.755523204803467, "step": 9158} {"train_info/time_between_train_steps": 0.0028998851776123047, "step": 9158} {"info/global_step": 9159, "train_info/time_within_train_step": 2.755286455154419, "step": 9159} {"train_info/time_between_train_steps": 0.002917051315307617, "step": 9159} {"info/global_step": 9160, "train_info/time_within_train_step": 2.753950834274292, "step": 9160} {"train_info/time_between_train_steps": 0.002883434295654297, "step": 9160} {"info/global_step": 9161, "train_info/time_within_train_step": 2.754932403564453, "step": 9161} {"train_info/time_between_train_steps": 0.0028917789459228516, "step": 9161} {"info/global_step": 9162, "train_info/time_within_train_step": 2.7556064128875732, "step": 9162} {"train_info/time_between_train_steps": 0.0029861927032470703, "step": 9162} {"info/global_step": 9163, "train_info/time_within_train_step": 2.7554500102996826, "step": 9163} {"train_info/time_between_train_steps": 0.0029463768005371094, "step": 9163} {"info/global_step": 9164, "train_info/time_within_train_step": 2.754507064819336, "step": 9164} {"train_info/time_between_train_steps": 0.0028831958770751953, "step": 9164} {"info/global_step": 9165, "train_info/time_within_train_step": 2.755939245223999, "step": 9165} {"train_info/time_between_train_steps": 0.0029032230377197266, "step": 9165} {"info/global_step": 9166, "train_info/time_within_train_step": 2.754655361175537, "step": 9166} {"train_info/time_between_train_steps": 0.0029256343841552734, "step": 9166} {"info/global_step": 9167, "train_info/time_within_train_step": 2.7546677589416504, "step": 9167} {"train_info/time_between_train_steps": 0.00296783447265625, "step": 9167} {"info/global_step": 9168, "train_info/time_within_train_step": 2.755598545074463, "step": 9168} {"train_info/time_between_train_steps": 0.0029382705688476562, "step": 9168} {"info/global_step": 9169, "train_info/time_within_train_step": 2.7566168308258057, "step": 9169} {"train_info/time_between_train_steps": 0.0029020309448242188, "step": 9169} {"info/global_step": 9170, "train_info/time_within_train_step": 2.7549517154693604, "step": 9170} {"train_info/time_between_train_steps": 0.002875804901123047, "step": 9170} {"info/global_step": 9171, "train_info/time_within_train_step": 2.755732774734497, "step": 9171} {"train_info/time_between_train_steps": 0.002931833267211914, "step": 9171} {"info/global_step": 9172, "train_info/time_within_train_step": 2.7557334899902344, "step": 9172} {"train_info/time_between_train_steps": 0.0029168128967285156, "step": 9172} {"info/global_step": 9173, "train_info/time_within_train_step": 2.755464553833008, "step": 9173} {"train_info/time_between_train_steps": 0.0029134750366210938, "step": 9173} {"info/global_step": 9174, "train_info/time_within_train_step": 2.755645513534546, "step": 9174} {"train_info/time_between_train_steps": 0.0029397010803222656, "step": 9174} {"info/global_step": 9175, "train_info/time_within_train_step": 2.7551307678222656, "step": 9175} {"train_info/time_between_train_steps": 0.0029120445251464844, "step": 9175} {"info/global_step": 9176, "train_info/time_within_train_step": 2.7553822994232178, "step": 9176} {"train_info/time_between_train_steps": 0.00290679931640625, "step": 9176} {"info/global_step": 9177, "train_info/time_within_train_step": 2.752653121948242, "step": 9177} {"train_info/time_between_train_steps": 0.0029382705688476562, "step": 9177} {"info/global_step": 9178, "train_info/time_within_train_step": 2.754589319229126, "step": 9178} {"train_info/time_between_train_steps": 0.002900362014770508, "step": 9178} {"info/global_step": 9179, "train_info/time_within_train_step": 2.7562663555145264, "step": 9179} {"train_info/time_between_train_steps": 0.0029044151306152344, "step": 9179} {"info/global_step": 9180, "train_info/time_within_train_step": 2.7557907104492188, "step": 9180} {"train_info/time_between_train_steps": 0.0028688907623291016, "step": 9180} {"info/global_step": 9181, "train_info/time_within_train_step": 2.7561798095703125, "step": 9181} {"train_info/time_between_train_steps": 0.0028595924377441406, "step": 9181} {"info/global_step": 9182, "train_info/time_within_train_step": 2.7561912536621094, "step": 9182} {"train_info/time_between_train_steps": 0.0028676986694335938, "step": 9182} {"info/global_step": 9183, "train_info/time_within_train_step": 2.7561419010162354, "step": 9183} {"train_info/time_between_train_steps": 0.002931356430053711, "step": 9183} {"info/global_step": 9184, "train_info/time_within_train_step": 2.7561521530151367, "step": 9184} {"train_info/time_between_train_steps": 0.0029153823852539062, "step": 9184} {"info/global_step": 9185, "train_info/time_within_train_step": 2.7551870346069336, "step": 9185} {"train_info/time_between_train_steps": 0.002926349639892578, "step": 9185} {"info/global_step": 9186, "train_info/time_within_train_step": 2.7573094367980957, "step": 9186} {"train_info/time_between_train_steps": 0.002916097640991211, "step": 9186} {"info/global_step": 9187, "train_info/time_within_train_step": 2.7558517456054688, "step": 9187} {"train_info/time_between_train_steps": 0.0029015541076660156, "step": 9187} {"info/global_step": 9188, "train_info/time_within_train_step": 2.7564687728881836, "step": 9188} {"train_info/time_between_train_steps": 0.0029191970825195312, "step": 9188} {"info/global_step": 9189, "train_info/time_within_train_step": 2.7549729347229004, "step": 9189} {"train_info/time_between_train_steps": 0.002933979034423828, "step": 9189} {"info/global_step": 9190, "train_info/time_within_train_step": 2.7542943954467773, "step": 9190} {"train_info/time_between_train_steps": 0.0029032230377197266, "step": 9190} {"info/global_step": 9191, "train_info/time_within_train_step": 2.7551205158233643, "step": 9191} {"train_info/time_between_train_steps": 0.002977609634399414, "step": 9191} {"info/global_step": 9192, "train_info/time_within_train_step": 2.7553162574768066, "step": 9192} {"train_info/time_between_train_steps": 0.0029048919677734375, "step": 9192} {"info/global_step": 9193, "train_info/time_within_train_step": 2.7559571266174316, "step": 9193} {"train_info/time_between_train_steps": 0.002920866012573242, "step": 9193} {"info/global_step": 9194, "train_info/time_within_train_step": 2.7549867630004883, "step": 9194} {"train_info/time_between_train_steps": 0.0029544830322265625, "step": 9194} {"info/global_step": 9195, "train_info/time_within_train_step": 2.7554452419281006, "step": 9195} {"train_info/time_between_train_steps": 0.0029578208923339844, "step": 9195} {"info/global_step": 9196, "train_info/time_within_train_step": 2.755784749984741, "step": 9196} {"train_info/time_between_train_steps": 0.0028972625732421875, "step": 9196} {"info/global_step": 9197, "train_info/time_within_train_step": 2.756486177444458, "step": 9197} {"train_info/time_between_train_steps": 0.002908945083618164, "step": 9197} {"info/global_step": 9198, "train_info/time_within_train_step": 2.75386905670166, "step": 9198} {"train_info/time_between_train_steps": 0.0029320716857910156, "step": 9198} {"info/global_step": 9199, "train_info/time_within_train_step": 2.7553980350494385, "step": 9199} {"train_info/time_between_train_steps": 0.0029015541076660156, "step": 9199} {"info/global_step": 9200, "train_info/time_within_train_step": 2.75504732131958, "step": 9200} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746592504, "_runtime": 26513}, "step": 9200} {"logs": {"train/loss": 2.9388, "train/learning_rate": 5.333333333333333e-05, "train/epoch": 10.07, "_timestamp": 1746592504, "_runtime": 26513}, "step": 9200} {"train_info/time_between_train_steps": 13.404761552810669, "step": 9200} {"info/global_step": 9201, "train_info/time_within_train_step": 2.5324816703796387, "step": 9201} {"train_info/time_between_train_steps": 0.0029947757720947266, "step": 9201} {"info/global_step": 9202, "train_info/time_within_train_step": 2.6181087493896484, "step": 9202} {"train_info/time_between_train_steps": 0.003032684326171875, "step": 9202} {"info/global_step": 9203, "train_info/time_within_train_step": 2.734400987625122, "step": 9203} {"train_info/time_between_train_steps": 0.0029942989349365234, "step": 9203} {"info/global_step": 9204, "train_info/time_within_train_step": 2.751145124435425, "step": 9204} {"train_info/time_between_train_steps": 0.0029840469360351562, "step": 9204} {"info/global_step": 9205, "train_info/time_within_train_step": 2.7540407180786133, "step": 9205} {"train_info/time_between_train_steps": 0.0030248165130615234, "step": 9205} {"info/global_step": 9206, "train_info/time_within_train_step": 2.756591558456421, "step": 9206} {"train_info/time_between_train_steps": 0.0030257701873779297, "step": 9206} {"info/global_step": 9207, "train_info/time_within_train_step": 2.755854606628418, "step": 9207} {"train_info/time_between_train_steps": 0.002969503402709961, "step": 9207} {"info/global_step": 9208, "train_info/time_within_train_step": 2.75673246383667, "step": 9208} {"train_info/time_between_train_steps": 0.0029878616333007812, "step": 9208} {"info/global_step": 9209, "train_info/time_within_train_step": 2.7552542686462402, "step": 9209} {"train_info/time_between_train_steps": 0.0030133724212646484, "step": 9209} {"info/global_step": 9210, "train_info/time_within_train_step": 2.756380319595337, "step": 9210} {"train_info/time_between_train_steps": 0.0029802322387695312, "step": 9210} {"info/global_step": 9211, "train_info/time_within_train_step": 2.7567198276519775, "step": 9211} {"train_info/time_between_train_steps": 0.0030443668365478516, "step": 9211} {"info/global_step": 9212, "train_info/time_within_train_step": 2.903552293777466, "step": 9212} {"train_info/time_between_train_steps": 0.0029578208923339844, "step": 9212} {"info/global_step": 9213, "train_info/time_within_train_step": 2.7578306198120117, "step": 9213} {"train_info/time_between_train_steps": 0.0029375553131103516, "step": 9213} {"info/global_step": 9214, "train_info/time_within_train_step": 2.757309913635254, "step": 9214} {"train_info/time_between_train_steps": 0.002968311309814453, "step": 9214} {"info/global_step": 9215, "train_info/time_within_train_step": 2.7553467750549316, "step": 9215} {"train_info/time_between_train_steps": 0.0029757022857666016, "step": 9215} {"info/global_step": 9216, "train_info/time_within_train_step": 2.757134199142456, "step": 9216} {"train_info/time_between_train_steps": 0.002973794937133789, "step": 9216} {"info/global_step": 9217, "train_info/time_within_train_step": 2.7580368518829346, "step": 9217} {"train_info/time_between_train_steps": 0.0029506683349609375, "step": 9217} {"info/global_step": 9218, "train_info/time_within_train_step": 2.7572336196899414, "step": 9218} {"train_info/time_between_train_steps": 0.0030450820922851562, "step": 9218} {"info/global_step": 9219, "train_info/time_within_train_step": 2.757244110107422, "step": 9219} {"train_info/time_between_train_steps": 0.002998828887939453, "step": 9219} {"info/global_step": 9220, "train_info/time_within_train_step": 2.7575900554656982, "step": 9220} {"train_info/time_between_train_steps": 0.0030002593994140625, "step": 9220} {"info/global_step": 9221, "train_info/time_within_train_step": 2.7557785511016846, "step": 9221} {"train_info/time_between_train_steps": 0.002959728240966797, "step": 9221} {"info/global_step": 9222, "train_info/time_within_train_step": 2.7563555240631104, "step": 9222} {"train_info/time_between_train_steps": 0.002969026565551758, "step": 9222} {"info/global_step": 9223, "train_info/time_within_train_step": 2.7567427158355713, "step": 9223} {"train_info/time_between_train_steps": 0.003000497817993164, "step": 9223} {"info/global_step": 9224, "train_info/time_within_train_step": 2.7572438716888428, "step": 9224} {"train_info/time_between_train_steps": 0.002943754196166992, "step": 9224} {"info/global_step": 9225, "train_info/time_within_train_step": 2.7566843032836914, "step": 9225} {"train_info/time_between_train_steps": 0.002985715866088867, "step": 9225} {"info/global_step": 9226, "train_info/time_within_train_step": 2.757305383682251, "step": 9226} {"train_info/time_between_train_steps": 0.0029740333557128906, "step": 9226} {"info/global_step": 9227, "train_info/time_within_train_step": 2.759105682373047, "step": 9227} {"train_info/time_between_train_steps": 0.0029401779174804688, "step": 9227} {"info/global_step": 9228, "train_info/time_within_train_step": 2.757828950881958, "step": 9228} {"train_info/time_between_train_steps": 0.0030024051666259766, "step": 9228} {"info/global_step": 9229, "train_info/time_within_train_step": 2.7571864128112793, "step": 9229} {"train_info/time_between_train_steps": 0.0029916763305664062, "step": 9229} {"info/global_step": 9230, "train_info/time_within_train_step": 2.757120370864868, "step": 9230} {"train_info/time_between_train_steps": 0.0029358863830566406, "step": 9230} {"info/global_step": 9231, "train_info/time_within_train_step": 2.7573282718658447, "step": 9231} {"train_info/time_between_train_steps": 0.0029506683349609375, "step": 9231} {"info/global_step": 9232, "train_info/time_within_train_step": 2.758402109146118, "step": 9232} {"train_info/time_between_train_steps": 0.0030171871185302734, "step": 9232} {"info/global_step": 9233, "train_info/time_within_train_step": 2.7573015689849854, "step": 9233} {"train_info/time_between_train_steps": 0.003022432327270508, "step": 9233} {"info/global_step": 9234, "train_info/time_within_train_step": 2.756737232208252, "step": 9234} {"train_info/time_between_train_steps": 0.0030329227447509766, "step": 9234} {"info/global_step": 9235, "train_info/time_within_train_step": 2.7563672065734863, "step": 9235} {"train_info/time_between_train_steps": 0.0029702186584472656, "step": 9235} {"info/global_step": 9236, "train_info/time_within_train_step": 2.7568206787109375, "step": 9236} {"train_info/time_between_train_steps": 0.002978086471557617, "step": 9236} {"info/global_step": 9237, "train_info/time_within_train_step": 2.7569267749786377, "step": 9237} {"train_info/time_between_train_steps": 0.0029747486114501953, "step": 9237} {"info/global_step": 9238, "train_info/time_within_train_step": 2.757699489593506, "step": 9238} {"train_info/time_between_train_steps": 0.002969503402709961, "step": 9238} {"info/global_step": 9239, "train_info/time_within_train_step": 2.7569990158081055, "step": 9239} {"train_info/time_between_train_steps": 0.0029144287109375, "step": 9239} {"info/global_step": 9240, "train_info/time_within_train_step": 2.7557411193847656, "step": 9240} {"train_info/time_between_train_steps": 0.0028977394104003906, "step": 9240} {"info/global_step": 9241, "train_info/time_within_train_step": 2.7554996013641357, "step": 9241} {"train_info/time_between_train_steps": 0.0028848648071289062, "step": 9241} {"info/global_step": 9242, "train_info/time_within_train_step": 2.754502296447754, "step": 9242} {"train_info/time_between_train_steps": 0.0029480457305908203, "step": 9242} {"info/global_step": 9243, "train_info/time_within_train_step": 2.7552576065063477, "step": 9243} {"train_info/time_between_train_steps": 0.0029277801513671875, "step": 9243} {"info/global_step": 9244, "train_info/time_within_train_step": 2.755969285964966, "step": 9244} {"train_info/time_between_train_steps": 0.0028924942016601562, "step": 9244} {"info/global_step": 9245, "train_info/time_within_train_step": 3.3486382961273193, "step": 9245} {"train_info/time_between_train_steps": 0.0029277801513671875, "step": 9245} {"info/global_step": 9246, "train_info/time_within_train_step": 2.755662441253662, "step": 9246} {"train_info/time_between_train_steps": 0.002971649169921875, "step": 9246} {"info/global_step": 9247, "train_info/time_within_train_step": 2.7559330463409424, "step": 9247} {"train_info/time_between_train_steps": 0.0029098987579345703, "step": 9247} {"info/global_step": 9248, "train_info/time_within_train_step": 2.7557976245880127, "step": 9248} {"train_info/time_between_train_steps": 0.0030052661895751953, "step": 9248} {"info/global_step": 9249, "train_info/time_within_train_step": 2.75546932220459, "step": 9249} {"train_info/time_between_train_steps": 0.002911090850830078, "step": 9249} {"info/global_step": 9250, "train_info/time_within_train_step": 2.755181074142456, "step": 9250} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746592656, "_runtime": 26665}, "step": 9250} {"logs": {"train/loss": 2.9366, "train/learning_rate": 4.9999999999999996e-05, "train/epoch": 10.07, "_timestamp": 1746592656, "_runtime": 26665}, "step": 9250} {"train_info/time_between_train_steps": 0.00655817985534668, "step": 9250} {"info/global_step": 9251, "train_info/time_within_train_step": 2.7552847862243652, "step": 9251} {"train_info/time_between_train_steps": 0.0029535293579101562, "step": 9251} {"info/global_step": 9252, "train_info/time_within_train_step": 2.7558658123016357, "step": 9252} {"train_info/time_between_train_steps": 0.0029144287109375, "step": 9252} {"info/global_step": 9253, "train_info/time_within_train_step": 2.755044460296631, "step": 9253} {"train_info/time_between_train_steps": 0.002920866012573242, "step": 9253} {"info/global_step": 9254, "train_info/time_within_train_step": 2.75484561920166, "step": 9254} {"train_info/time_between_train_steps": 0.002964019775390625, "step": 9254} {"info/global_step": 9255, "train_info/time_within_train_step": 2.7552428245544434, "step": 9255} {"train_info/time_between_train_steps": 0.0029366016387939453, "step": 9255} {"info/global_step": 9256, "train_info/time_within_train_step": 2.7553369998931885, "step": 9256} {"train_info/time_between_train_steps": 0.0029518604278564453, "step": 9256} {"info/global_step": 9257, "train_info/time_within_train_step": 2.7556276321411133, "step": 9257} {"train_info/time_between_train_steps": 0.0029218196868896484, "step": 9257} {"info/global_step": 9258, "train_info/time_within_train_step": 2.7555580139160156, "step": 9258} {"train_info/time_between_train_steps": 0.002974987030029297, "step": 9258} {"info/global_step": 9259, "train_info/time_within_train_step": 2.7557668685913086, "step": 9259} {"train_info/time_between_train_steps": 0.002888917922973633, "step": 9259} {"info/global_step": 9260, "train_info/time_within_train_step": 2.7549428939819336, "step": 9260} {"train_info/time_between_train_steps": 0.0029327869415283203, "step": 9260} {"info/global_step": 9261, "train_info/time_within_train_step": 2.754694700241089, "step": 9261} {"train_info/time_between_train_steps": 0.0029680728912353516, "step": 9261} {"info/global_step": 9262, "train_info/time_within_train_step": 2.75594425201416, "step": 9262} {"train_info/time_between_train_steps": 0.002920389175415039, "step": 9262} {"info/global_step": 9263, "train_info/time_within_train_step": 2.754178524017334, "step": 9263} {"train_info/time_between_train_steps": 0.002978086471557617, "step": 9263} {"info/global_step": 9264, "train_info/time_within_train_step": 2.7546348571777344, "step": 9264} {"train_info/time_between_train_steps": 0.0029098987579345703, "step": 9264} {"info/global_step": 9265, "train_info/time_within_train_step": 2.7555623054504395, "step": 9265} {"train_info/time_between_train_steps": 0.003071308135986328, "step": 9265} {"info/global_step": 9266, "train_info/time_within_train_step": 2.7566864490509033, "step": 9266} {"train_info/time_between_train_steps": 0.003003358840942383, "step": 9266} {"info/global_step": 9267, "train_info/time_within_train_step": 2.757253646850586, "step": 9267} {"train_info/time_between_train_steps": 0.0031180381774902344, "step": 9267} {"info/global_step": 9268, "train_info/time_within_train_step": 2.755680799484253, "step": 9268} {"train_info/time_between_train_steps": 0.0030059814453125, "step": 9268} {"info/global_step": 9269, "train_info/time_within_train_step": 2.756638526916504, "step": 9269} {"train_info/time_between_train_steps": 0.0029785633087158203, "step": 9269} {"info/global_step": 9270, "train_info/time_within_train_step": 2.7561349868774414, "step": 9270} {"train_info/time_between_train_steps": 0.0029959678649902344, "step": 9270} {"info/global_step": 9271, "train_info/time_within_train_step": 2.756202459335327, "step": 9271} {"train_info/time_between_train_steps": 0.0030105113983154297, "step": 9271} {"info/global_step": 9272, "train_info/time_within_train_step": 2.7573082447052, "step": 9272} {"train_info/time_between_train_steps": 0.003031492233276367, "step": 9272} {"info/global_step": 9273, "train_info/time_within_train_step": 2.7568273544311523, "step": 9273} {"train_info/time_between_train_steps": 0.002985239028930664, "step": 9273} {"info/global_step": 9274, "train_info/time_within_train_step": 2.756065845489502, "step": 9274} {"train_info/time_between_train_steps": 0.0030405521392822266, "step": 9274} {"info/global_step": 9275, "train_info/time_within_train_step": 2.7564024925231934, "step": 9275} {"train_info/time_between_train_steps": 0.002984285354614258, "step": 9275} {"info/global_step": 9276, "train_info/time_within_train_step": 2.756258726119995, "step": 9276} {"train_info/time_between_train_steps": 0.0030231475830078125, "step": 9276} {"info/global_step": 9277, "train_info/time_within_train_step": 2.7578067779541016, "step": 9277} {"train_info/time_between_train_steps": 0.003010272979736328, "step": 9277} {"info/global_step": 9278, "train_info/time_within_train_step": 2.7553389072418213, "step": 9278} {"train_info/time_between_train_steps": 0.0030274391174316406, "step": 9278} {"info/global_step": 9279, "train_info/time_within_train_step": 2.7543749809265137, "step": 9279} {"train_info/time_between_train_steps": 0.0030596256256103516, "step": 9279} {"info/global_step": 9280, "train_info/time_within_train_step": 2.7563962936401367, "step": 9280} {"train_info/time_between_train_steps": 0.005934953689575195, "step": 9280} {"info/global_step": 9281, "train_info/time_within_train_step": 2.7581353187561035, "step": 9281} {"train_info/time_between_train_steps": 0.005944728851318359, "step": 9281} {"info/global_step": 9282, "train_info/time_within_train_step": 2.7566444873809814, "step": 9282} {"train_info/time_between_train_steps": 0.005928754806518555, "step": 9282} {"info/global_step": 9283, "train_info/time_within_train_step": 2.7591018676757812, "step": 9283} {"train_info/time_between_train_steps": 0.00304412841796875, "step": 9283} {"info/global_step": 9284, "train_info/time_within_train_step": 2.756610155105591, "step": 9284} {"train_info/time_between_train_steps": 0.005856752395629883, "step": 9284} {"info/global_step": 9285, "train_info/time_within_train_step": 2.75909161567688, "step": 9285} {"train_info/time_between_train_steps": 0.005856990814208984, "step": 9285} {"info/global_step": 9286, "train_info/time_within_train_step": 2.75829815864563, "step": 9286} {"train_info/time_between_train_steps": 0.005846738815307617, "step": 9286} {"info/global_step": 9287, "train_info/time_within_train_step": 2.756512403488159, "step": 9287} {"train_info/time_between_train_steps": 0.006018161773681641, "step": 9287} {"info/global_step": 9288, "train_info/time_within_train_step": 2.758310079574585, "step": 9288} {"train_info/time_between_train_steps": 0.006025552749633789, "step": 9288} {"info/global_step": 9289, "train_info/time_within_train_step": 2.758402109146118, "step": 9289} {"train_info/time_between_train_steps": 0.0058917999267578125, "step": 9289} {"info/global_step": 9290, "train_info/time_within_train_step": 2.758605480194092, "step": 9290} {"train_info/time_between_train_steps": 0.005826234817504883, "step": 9290} {"info/global_step": 9291, "train_info/time_within_train_step": 2.7583534717559814, "step": 9291} {"train_info/time_between_train_steps": 0.00596165657043457, "step": 9291} {"info/global_step": 9292, "train_info/time_within_train_step": 2.7596497535705566, "step": 9292} {"train_info/time_between_train_steps": 0.006072282791137695, "step": 9292} {"info/global_step": 9293, "train_info/time_within_train_step": 2.758607864379883, "step": 9293} {"train_info/time_between_train_steps": 0.005934715270996094, "step": 9293} {"info/global_step": 9294, "train_info/time_within_train_step": 2.7580959796905518, "step": 9294} {"train_info/time_between_train_steps": 0.006022453308105469, "step": 9294} {"info/global_step": 9295, "train_info/time_within_train_step": 2.7604315280914307, "step": 9295} {"train_info/time_between_train_steps": 0.005955934524536133, "step": 9295} {"info/global_step": 9296, "train_info/time_within_train_step": 2.759033679962158, "step": 9296} {"train_info/time_between_train_steps": 0.0060312747955322266, "step": 9296} {"info/global_step": 9297, "train_info/time_within_train_step": 2.7588441371917725, "step": 9297} {"train_info/time_between_train_steps": 0.005891323089599609, "step": 9297} {"info/global_step": 9298, "train_info/time_within_train_step": 2.75913667678833, "step": 9298} {"train_info/time_between_train_steps": 0.005944252014160156, "step": 9298} {"info/global_step": 9299, "train_info/time_within_train_step": 2.758969306945801, "step": 9299} {"train_info/time_between_train_steps": 0.005934238433837891, "step": 9299} {"info/global_step": 9300, "train_info/time_within_train_step": 2.7607123851776123, "step": 9300} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746592795, "_runtime": 26804}, "step": 9300} {"logs": {"train/loss": 2.9265, "train/learning_rate": 4.6666666666666665e-05, "train/epoch": 10.08, "_timestamp": 1746592795, "_runtime": 26804}, "step": 9300} {"train_info/time_between_train_steps": 0.010603904724121094, "step": 9300} {"info/global_step": 9301, "train_info/time_within_train_step": 2.7570207118988037, "step": 9301} {"train_info/time_between_train_steps": 0.005910158157348633, "step": 9301} {"info/global_step": 9302, "train_info/time_within_train_step": 2.75866436958313, "step": 9302} {"train_info/time_between_train_steps": 0.002978086471557617, "step": 9302} {"info/global_step": 9303, "train_info/time_within_train_step": 2.755993366241455, "step": 9303} {"train_info/time_between_train_steps": 0.003001689910888672, "step": 9303} {"info/global_step": 9304, "train_info/time_within_train_step": 2.756739377975464, "step": 9304} {"train_info/time_between_train_steps": 0.002972126007080078, "step": 9304} {"info/global_step": 9305, "train_info/time_within_train_step": 2.756600856781006, "step": 9305} {"train_info/time_between_train_steps": 0.0030412673950195312, "step": 9305} {"info/global_step": 9306, "train_info/time_within_train_step": 2.757124900817871, "step": 9306} {"train_info/time_between_train_steps": 0.003000497817993164, "step": 9306} {"info/global_step": 9307, "train_info/time_within_train_step": 2.756012439727783, "step": 9307} {"train_info/time_between_train_steps": 0.0030128955841064453, "step": 9307} {"info/global_step": 9308, "train_info/time_within_train_step": 2.7558743953704834, "step": 9308} {"train_info/time_between_train_steps": 0.00299072265625, "step": 9308} {"info/global_step": 9309, "train_info/time_within_train_step": 2.7554049491882324, "step": 9309} {"train_info/time_between_train_steps": 0.00590205192565918, "step": 9309} {"info/global_step": 9310, "train_info/time_within_train_step": 2.757802963256836, "step": 9310} {"train_info/time_between_train_steps": 0.005882978439331055, "step": 9310} {"info/global_step": 9311, "train_info/time_within_train_step": 2.757693290710449, "step": 9311} {"train_info/time_between_train_steps": 0.005934476852416992, "step": 9311} {"info/global_step": 9312, "train_info/time_within_train_step": 2.7579164505004883, "step": 9312} {"train_info/time_between_train_steps": 0.005905628204345703, "step": 9312} {"info/global_step": 9313, "train_info/time_within_train_step": 2.7580270767211914, "step": 9313} {"train_info/time_between_train_steps": 0.005899667739868164, "step": 9313} {"info/global_step": 9314, "train_info/time_within_train_step": 2.757549285888672, "step": 9314} {"train_info/time_between_train_steps": 0.006026029586791992, "step": 9314} {"info/global_step": 9315, "train_info/time_within_train_step": 2.757007122039795, "step": 9315} {"train_info/time_between_train_steps": 0.00601959228515625, "step": 9315} {"info/global_step": 9316, "train_info/time_within_train_step": 2.757628917694092, "step": 9316} {"train_info/time_between_train_steps": 0.005997180938720703, "step": 9316} {"info/global_step": 9317, "train_info/time_within_train_step": 2.758622169494629, "step": 9317} {"train_info/time_between_train_steps": 0.006279945373535156, "step": 9317} {"info/global_step": 9318, "train_info/time_within_train_step": 2.840528726577759, "step": 9318} {"train_info/time_between_train_steps": 0.006010532379150391, "step": 9318} {"info/global_step": 9319, "train_info/time_within_train_step": 2.7581467628479004, "step": 9319} {"train_info/time_between_train_steps": 0.005995273590087891, "step": 9319} {"info/global_step": 9320, "train_info/time_within_train_step": 2.7558419704437256, "step": 9320} {"train_info/time_between_train_steps": 0.005950212478637695, "step": 9320} {"info/global_step": 9321, "train_info/time_within_train_step": 2.757777452468872, "step": 9321} {"train_info/time_between_train_steps": 0.005948305130004883, "step": 9321} {"info/global_step": 9322, "train_info/time_within_train_step": 2.7575342655181885, "step": 9322} {"train_info/time_between_train_steps": 0.005858182907104492, "step": 9322} {"info/global_step": 9323, "train_info/time_within_train_step": 2.7567825317382812, "step": 9323} {"train_info/time_between_train_steps": 0.005903482437133789, "step": 9323} {"info/global_step": 9324, "train_info/time_within_train_step": 2.757211446762085, "step": 9324} {"train_info/time_between_train_steps": 0.0058863162994384766, "step": 9324} {"info/global_step": 9325, "train_info/time_within_train_step": 2.7574732303619385, "step": 9325} {"train_info/time_between_train_steps": 0.005995273590087891, "step": 9325} {"info/global_step": 9326, "train_info/time_within_train_step": 2.75711727142334, "step": 9326} {"train_info/time_between_train_steps": 0.005941629409790039, "step": 9326} {"info/global_step": 9327, "train_info/time_within_train_step": 2.7552034854888916, "step": 9327} {"train_info/time_between_train_steps": 0.005963325500488281, "step": 9327} {"info/global_step": 9328, "train_info/time_within_train_step": 2.7574756145477295, "step": 9328} {"train_info/time_between_train_steps": 0.002980947494506836, "step": 9328} {"info/global_step": 9329, "train_info/time_within_train_step": 2.75536847114563, "step": 9329} {"train_info/time_between_train_steps": 0.0029213428497314453, "step": 9329} {"info/global_step": 9330, "train_info/time_within_train_step": 2.7546327114105225, "step": 9330} {"train_info/time_between_train_steps": 0.002936124801635742, "step": 9330} {"info/global_step": 9331, "train_info/time_within_train_step": 2.7538623809814453, "step": 9331} {"train_info/time_between_train_steps": 0.0029497146606445312, "step": 9331} {"info/global_step": 9332, "train_info/time_within_train_step": 2.754415988922119, "step": 9332} {"train_info/time_between_train_steps": 0.0029296875, "step": 9332} {"info/global_step": 9333, "train_info/time_within_train_step": 2.7549889087677, "step": 9333} {"train_info/time_between_train_steps": 0.002856731414794922, "step": 9333} {"info/global_step": 9334, "train_info/time_within_train_step": 2.754415988922119, "step": 9334} {"train_info/time_between_train_steps": 0.0029306411743164062, "step": 9334} {"info/global_step": 9335, "train_info/time_within_train_step": 2.7536325454711914, "step": 9335} {"train_info/time_between_train_steps": 0.002920866012573242, "step": 9335} {"info/global_step": 9336, "train_info/time_within_train_step": 2.754448175430298, "step": 9336} {"train_info/time_between_train_steps": 0.002941131591796875, "step": 9336} {"info/global_step": 9337, "train_info/time_within_train_step": 2.754317045211792, "step": 9337} {"train_info/time_between_train_steps": 0.0029380321502685547, "step": 9337} {"info/global_step": 9338, "train_info/time_within_train_step": 2.754002094268799, "step": 9338} {"train_info/time_between_train_steps": 0.002953767776489258, "step": 9338} {"info/global_step": 9339, "train_info/time_within_train_step": 2.754241704940796, "step": 9339} {"train_info/time_between_train_steps": 0.0029489994049072266, "step": 9339} {"info/global_step": 9340, "train_info/time_within_train_step": 2.7536940574645996, "step": 9340} {"train_info/time_between_train_steps": 0.002925872802734375, "step": 9340} {"info/global_step": 9341, "train_info/time_within_train_step": 2.754319667816162, "step": 9341} {"train_info/time_between_train_steps": 0.002953767776489258, "step": 9341} {"info/global_step": 9342, "train_info/time_within_train_step": 2.754643678665161, "step": 9342} {"train_info/time_between_train_steps": 0.0029022693634033203, "step": 9342} {"info/global_step": 9343, "train_info/time_within_train_step": 2.754734516143799, "step": 9343} {"train_info/time_between_train_steps": 0.0028781890869140625, "step": 9343} {"info/global_step": 9344, "train_info/time_within_train_step": 2.7560765743255615, "step": 9344} {"train_info/time_between_train_steps": 0.003134489059448242, "step": 9344} {"info/global_step": 9345, "train_info/time_within_train_step": 2.756723403930664, "step": 9345} {"train_info/time_between_train_steps": 0.002977609634399414, "step": 9345} {"info/global_step": 9346, "train_info/time_within_train_step": 2.7560789585113525, "step": 9346} {"train_info/time_between_train_steps": 0.0030221939086914062, "step": 9346} {"info/global_step": 9347, "train_info/time_within_train_step": 2.7572953701019287, "step": 9347} {"train_info/time_between_train_steps": 0.003063201904296875, "step": 9347} {"info/global_step": 9348, "train_info/time_within_train_step": 2.7571027278900146, "step": 9348} {"train_info/time_between_train_steps": 0.0030672550201416016, "step": 9348} {"info/global_step": 9349, "train_info/time_within_train_step": 2.7553021907806396, "step": 9349} {"train_info/time_between_train_steps": 0.002946615219116211, "step": 9349} {"info/global_step": 9350, "train_info/time_within_train_step": 2.755453586578369, "step": 9350} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746592933, "_runtime": 26942}, "step": 9350} {"logs": {"train/loss": 2.9112, "train/learning_rate": 4.333333333333333e-05, "train/epoch": 10.08, "_timestamp": 1746592933, "_runtime": 26942}, "step": 9350} {"train_info/time_between_train_steps": 0.006689786911010742, "step": 9350} {"info/global_step": 9351, "train_info/time_within_train_step": 2.755866527557373, "step": 9351} {"train_info/time_between_train_steps": 0.0030434131622314453, "step": 9351} {"info/global_step": 9352, "train_info/time_within_train_step": 2.7559561729431152, "step": 9352} {"train_info/time_between_train_steps": 0.003021717071533203, "step": 9352} {"info/global_step": 9353, "train_info/time_within_train_step": 2.7556726932525635, "step": 9353} {"train_info/time_between_train_steps": 0.003052234649658203, "step": 9353} {"info/global_step": 9354, "train_info/time_within_train_step": 2.7555510997772217, "step": 9354} {"train_info/time_between_train_steps": 0.0029113292694091797, "step": 9354} {"info/global_step": 9355, "train_info/time_within_train_step": 2.75553035736084, "step": 9355} {"train_info/time_between_train_steps": 0.0029304027557373047, "step": 9355} {"info/global_step": 9356, "train_info/time_within_train_step": 2.7544472217559814, "step": 9356} {"train_info/time_between_train_steps": 0.002981901168823242, "step": 9356} {"info/global_step": 9357, "train_info/time_within_train_step": 2.7549257278442383, "step": 9357} {"train_info/time_between_train_steps": 0.0030579566955566406, "step": 9357} {"info/global_step": 9358, "train_info/time_within_train_step": 2.7558460235595703, "step": 9358} {"train_info/time_between_train_steps": 0.0029125213623046875, "step": 9358} {"info/global_step": 9359, "train_info/time_within_train_step": 2.755298376083374, "step": 9359} {"train_info/time_between_train_steps": 0.0029420852661132812, "step": 9359} {"info/global_step": 9360, "train_info/time_within_train_step": 2.7560572624206543, "step": 9360} {"train_info/time_between_train_steps": 0.0029425621032714844, "step": 9360} {"info/global_step": 9361, "train_info/time_within_train_step": 2.756026029586792, "step": 9361} {"train_info/time_between_train_steps": 0.0030603408813476562, "step": 9361} {"info/global_step": 9362, "train_info/time_within_train_step": 2.755225896835327, "step": 9362} {"train_info/time_between_train_steps": 0.0029206275939941406, "step": 9362} {"info/global_step": 9363, "train_info/time_within_train_step": 2.755850076675415, "step": 9363} {"train_info/time_between_train_steps": 0.0029709339141845703, "step": 9363} {"info/global_step": 9364, "train_info/time_within_train_step": 2.7562763690948486, "step": 9364} {"train_info/time_between_train_steps": 0.003069162368774414, "step": 9364} {"info/global_step": 9365, "train_info/time_within_train_step": 2.7555885314941406, "step": 9365} {"train_info/time_between_train_steps": 0.002950429916381836, "step": 9365} {"info/global_step": 9366, "train_info/time_within_train_step": 2.755979537963867, "step": 9366} {"train_info/time_between_train_steps": 0.0030498504638671875, "step": 9366} {"info/global_step": 9367, "train_info/time_within_train_step": 2.7551939487457275, "step": 9367} {"train_info/time_between_train_steps": 0.0031194686889648438, "step": 9367} {"info/global_step": 9368, "train_info/time_within_train_step": 2.7553982734680176, "step": 9368} {"train_info/time_between_train_steps": 0.003225088119506836, "step": 9368} {"info/global_step": 9369, "train_info/time_within_train_step": 2.756218671798706, "step": 9369} {"train_info/time_between_train_steps": 0.0031518936157226562, "step": 9369} {"info/global_step": 9370, "train_info/time_within_train_step": 2.756196975708008, "step": 9370} {"train_info/time_between_train_steps": 0.003151416778564453, "step": 9370} {"info/global_step": 9371, "train_info/time_within_train_step": 2.755842685699463, "step": 9371} {"train_info/time_between_train_steps": 0.0030503273010253906, "step": 9371} {"info/global_step": 9372, "train_info/time_within_train_step": 2.7561936378479004, "step": 9372} {"train_info/time_between_train_steps": 0.0031020641326904297, "step": 9372} {"info/global_step": 9373, "train_info/time_within_train_step": 2.7567293643951416, "step": 9373} {"train_info/time_between_train_steps": 0.0031366348266601562, "step": 9373} {"info/global_step": 9374, "train_info/time_within_train_step": 2.7567505836486816, "step": 9374} {"train_info/time_between_train_steps": 0.0032765865325927734, "step": 9374} {"info/global_step": 9375, "train_info/time_within_train_step": 2.8011510372161865, "step": 9375} {"train_info/time_between_train_steps": 0.003141641616821289, "step": 9375} {"info/global_step": 9376, "train_info/time_within_train_step": 2.757749080657959, "step": 9376} {"train_info/time_between_train_steps": 0.0030710697174072266, "step": 9376} {"info/global_step": 9377, "train_info/time_within_train_step": 2.7560946941375732, "step": 9377} {"train_info/time_between_train_steps": 0.0031561851501464844, "step": 9377} {"info/global_step": 9378, "train_info/time_within_train_step": 2.7581236362457275, "step": 9378} {"train_info/time_between_train_steps": 0.0034258365631103516, "step": 9378} {"info/global_step": 9379, "train_info/time_within_train_step": 2.7564382553100586, "step": 9379} {"train_info/time_between_train_steps": 0.0033140182495117188, "step": 9379} {"info/global_step": 9380, "train_info/time_within_train_step": 2.757619619369507, "step": 9380} {"train_info/time_between_train_steps": 0.003221750259399414, "step": 9380} {"info/global_step": 9381, "train_info/time_within_train_step": 2.7583932876586914, "step": 9381} {"train_info/time_between_train_steps": 0.003220081329345703, "step": 9381} {"info/global_step": 9382, "train_info/time_within_train_step": 2.757469892501831, "step": 9382} {"train_info/time_between_train_steps": 0.0031578540802001953, "step": 9382} {"info/global_step": 9383, "train_info/time_within_train_step": 2.7582554817199707, "step": 9383} {"train_info/time_between_train_steps": 0.0033943653106689453, "step": 9383} {"train_info/time_between_train_steps": 3.0653371810913086, "step": 9383} {"info/global_step": 9384, "train_info/time_within_train_step": 2.699782133102417, "step": 9384} {"train_info/time_between_train_steps": 0.0031528472900390625, "step": 9384} {"info/global_step": 9385, "train_info/time_within_train_step": 2.7558493614196777, "step": 9385} {"train_info/time_between_train_steps": 0.003202676773071289, "step": 9385} {"info/global_step": 9386, "train_info/time_within_train_step": 2.7555460929870605, "step": 9386} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 9386} {"info/global_step": 9387, "train_info/time_within_train_step": 2.7562670707702637, "step": 9387} {"train_info/time_between_train_steps": 0.0031235218048095703, "step": 9387} {"info/global_step": 9388, "train_info/time_within_train_step": 2.756639242172241, "step": 9388} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 9388} {"info/global_step": 9389, "train_info/time_within_train_step": 2.984891414642334, "step": 9389} {"train_info/time_between_train_steps": 0.003131389617919922, "step": 9389} {"info/global_step": 9390, "train_info/time_within_train_step": 2.7568647861480713, "step": 9390} {"train_info/time_between_train_steps": 0.0032224655151367188, "step": 9390} {"info/global_step": 9391, "train_info/time_within_train_step": 2.7554092407226562, "step": 9391} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 9391} {"info/global_step": 9392, "train_info/time_within_train_step": 2.756681442260742, "step": 9392} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 9392} {"info/global_step": 9393, "train_info/time_within_train_step": 2.7566139698028564, "step": 9393} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 9393} {"info/global_step": 9394, "train_info/time_within_train_step": 2.7562241554260254, "step": 9394} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 9394} {"info/global_step": 9395, "train_info/time_within_train_step": 2.756045341491699, "step": 9395} {"train_info/time_between_train_steps": 0.0031876564025878906, "step": 9395} {"info/global_step": 9396, "train_info/time_within_train_step": 2.7558979988098145, "step": 9396} {"train_info/time_between_train_steps": 0.0032072067260742188, "step": 9396} {"info/global_step": 9397, "train_info/time_within_train_step": 2.7553396224975586, "step": 9397} {"train_info/time_between_train_steps": 0.0031347274780273438, "step": 9397} {"info/global_step": 9398, "train_info/time_within_train_step": 2.7572407722473145, "step": 9398} {"train_info/time_between_train_steps": 0.0031561851501464844, "step": 9398} {"info/global_step": 9399, "train_info/time_within_train_step": 2.756204605102539, "step": 9399} {"train_info/time_between_train_steps": 0.003195047378540039, "step": 9399} {"info/global_step": 9400, "train_info/time_within_train_step": 2.755653142929077, "step": 9400} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746593074, "_runtime": 27083}, "step": 9400} {"logs": {"train/loss": 2.9589, "train/learning_rate": 3.9999999999999996e-05, "train/epoch": 11.0, "_timestamp": 1746593074, "_runtime": 27083}, "step": 9400} {"train_info/time_between_train_steps": 13.276172399520874, "step": 9400} {"info/global_step": 9401, "train_info/time_within_train_step": 2.537187337875366, "step": 9401} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 9401} {"info/global_step": 9402, "train_info/time_within_train_step": 2.584266424179077, "step": 9402} {"train_info/time_between_train_steps": 0.0032129287719726562, "step": 9402} {"info/global_step": 9403, "train_info/time_within_train_step": 2.73030424118042, "step": 9403} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 9403} {"info/global_step": 9404, "train_info/time_within_train_step": 2.753101110458374, "step": 9404} {"train_info/time_between_train_steps": 0.0031311511993408203, "step": 9404} {"info/global_step": 9405, "train_info/time_within_train_step": 2.754957675933838, "step": 9405} {"train_info/time_between_train_steps": 0.0032019615173339844, "step": 9405} {"info/global_step": 9406, "train_info/time_within_train_step": 2.7556521892547607, "step": 9406} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 9406} {"info/global_step": 9407, "train_info/time_within_train_step": 2.7559797763824463, "step": 9407} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 9407} {"info/global_step": 9408, "train_info/time_within_train_step": 2.756108283996582, "step": 9408} {"train_info/time_between_train_steps": 0.003145456314086914, "step": 9408} {"info/global_step": 9409, "train_info/time_within_train_step": 2.7564830780029297, "step": 9409} {"train_info/time_between_train_steps": 0.0031549930572509766, "step": 9409} {"info/global_step": 9410, "train_info/time_within_train_step": 2.7564339637756348, "step": 9410} {"train_info/time_between_train_steps": 0.003350496292114258, "step": 9410} {"info/global_step": 9411, "train_info/time_within_train_step": 2.755178928375244, "step": 9411} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 9411} {"info/global_step": 9412, "train_info/time_within_train_step": 2.7566518783569336, "step": 9412} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 9412} {"info/global_step": 9413, "train_info/time_within_train_step": 2.755821704864502, "step": 9413} {"train_info/time_between_train_steps": 0.0032281875610351562, "step": 9413} {"info/global_step": 9414, "train_info/time_within_train_step": 2.7554538249969482, "step": 9414} {"train_info/time_between_train_steps": 0.003112316131591797, "step": 9414} {"info/global_step": 9415, "train_info/time_within_train_step": 2.7555017471313477, "step": 9415} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 9415} {"info/global_step": 9416, "train_info/time_within_train_step": 2.7578465938568115, "step": 9416} {"train_info/time_between_train_steps": 0.003313779830932617, "step": 9416} {"info/global_step": 9417, "train_info/time_within_train_step": 2.7579727172851562, "step": 9417} {"train_info/time_between_train_steps": 0.003381490707397461, "step": 9417} {"info/global_step": 9418, "train_info/time_within_train_step": 2.757518768310547, "step": 9418} {"train_info/time_between_train_steps": 0.003195524215698242, "step": 9418} {"info/global_step": 9419, "train_info/time_within_train_step": 2.7566356658935547, "step": 9419} {"train_info/time_between_train_steps": 0.0031511783599853516, "step": 9419} {"info/global_step": 9420, "train_info/time_within_train_step": 2.756791114807129, "step": 9420} {"train_info/time_between_train_steps": 0.0031554698944091797, "step": 9420} {"info/global_step": 9421, "train_info/time_within_train_step": 2.7590694427490234, "step": 9421} {"train_info/time_between_train_steps": 0.0032973289489746094, "step": 9421} {"info/global_step": 9422, "train_info/time_within_train_step": 2.7580573558807373, "step": 9422} {"train_info/time_between_train_steps": 0.0033233165740966797, "step": 9422} {"info/global_step": 9423, "train_info/time_within_train_step": 2.758214235305786, "step": 9423} {"train_info/time_between_train_steps": 0.0033559799194335938, "step": 9423} {"info/global_step": 9424, "train_info/time_within_train_step": 2.7581233978271484, "step": 9424} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 9424} {"info/global_step": 9425, "train_info/time_within_train_step": 2.7574071884155273, "step": 9425} {"train_info/time_between_train_steps": 0.003242015838623047, "step": 9425} {"info/global_step": 9426, "train_info/time_within_train_step": 2.757577657699585, "step": 9426} {"train_info/time_between_train_steps": 0.003192424774169922, "step": 9426} {"info/global_step": 9427, "train_info/time_within_train_step": 2.757883071899414, "step": 9427} {"train_info/time_between_train_steps": 0.003179788589477539, "step": 9427} {"info/global_step": 9428, "train_info/time_within_train_step": 2.757000207901001, "step": 9428} {"train_info/time_between_train_steps": 0.0032122135162353516, "step": 9428} {"info/global_step": 9429, "train_info/time_within_train_step": 2.756253480911255, "step": 9429} {"train_info/time_between_train_steps": 0.003160238265991211, "step": 9429} {"info/global_step": 9430, "train_info/time_within_train_step": 2.7577288150787354, "step": 9430} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 9430} {"info/global_step": 9431, "train_info/time_within_train_step": 2.7563188076019287, "step": 9431} {"train_info/time_between_train_steps": 0.003181934356689453, "step": 9431} {"info/global_step": 9432, "train_info/time_within_train_step": 2.756622791290283, "step": 9432} {"train_info/time_between_train_steps": 0.0031669139862060547, "step": 9432} {"info/global_step": 9433, "train_info/time_within_train_step": 2.755354404449463, "step": 9433} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 9433} {"info/global_step": 9434, "train_info/time_within_train_step": 2.75662899017334, "step": 9434} {"train_info/time_between_train_steps": 0.003152608871459961, "step": 9434} {"info/global_step": 9435, "train_info/time_within_train_step": 2.756415367126465, "step": 9435} {"train_info/time_between_train_steps": 0.0031790733337402344, "step": 9435} {"info/global_step": 9436, "train_info/time_within_train_step": 2.7564167976379395, "step": 9436} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 9436} {"info/global_step": 9437, "train_info/time_within_train_step": 2.755748987197876, "step": 9437} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 9437} {"info/global_step": 9438, "train_info/time_within_train_step": 2.7564663887023926, "step": 9438} {"train_info/time_between_train_steps": 0.0031316280364990234, "step": 9438} {"info/global_step": 9439, "train_info/time_within_train_step": 2.756256580352783, "step": 9439} {"train_info/time_between_train_steps": 0.003215789794921875, "step": 9439} {"info/global_step": 9440, "train_info/time_within_train_step": 2.756589412689209, "step": 9440} {"train_info/time_between_train_steps": 0.0031681060791015625, "step": 9440} {"info/global_step": 9441, "train_info/time_within_train_step": 2.755218744277954, "step": 9441} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 9441} {"info/global_step": 9442, "train_info/time_within_train_step": 2.756906270980835, "step": 9442} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 9442} {"info/global_step": 9443, "train_info/time_within_train_step": 2.756196975708008, "step": 9443} {"train_info/time_between_train_steps": 0.003395557403564453, "step": 9443} {"info/global_step": 9444, "train_info/time_within_train_step": 2.756218194961548, "step": 9444} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 9444} {"info/global_step": 9445, "train_info/time_within_train_step": 2.756261110305786, "step": 9445} {"train_info/time_between_train_steps": 0.0033893585205078125, "step": 9445} {"info/global_step": 9446, "train_info/time_within_train_step": 2.8832573890686035, "step": 9446} {"train_info/time_between_train_steps": 0.0031900405883789062, "step": 9446} {"info/global_step": 9447, "train_info/time_within_train_step": 2.7552905082702637, "step": 9447} {"train_info/time_between_train_steps": 0.00319671630859375, "step": 9447} {"info/global_step": 9448, "train_info/time_within_train_step": 2.756345510482788, "step": 9448} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 9448} {"info/global_step": 9449, "train_info/time_within_train_step": 2.7556869983673096, "step": 9449} {"train_info/time_between_train_steps": 0.0031807422637939453, "step": 9449} {"info/global_step": 9450, "train_info/time_within_train_step": 2.756298065185547, "step": 9450} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746593225, "_runtime": 27234}, "step": 9450} {"logs": {"train/loss": 2.9153, "train/learning_rate": 3.666666666666666e-05, "train/epoch": 11.01, "_timestamp": 1746593225, "_runtime": 27234}, "step": 9450} {"train_info/time_between_train_steps": 0.00693202018737793, "step": 9450} {"info/global_step": 9451, "train_info/time_within_train_step": 2.754695177078247, "step": 9451} {"train_info/time_between_train_steps": 0.0031785964965820312, "step": 9451} {"info/global_step": 9452, "train_info/time_within_train_step": 2.756417989730835, "step": 9452} {"train_info/time_between_train_steps": 0.0032091140747070312, "step": 9452} {"info/global_step": 9453, "train_info/time_within_train_step": 2.7564806938171387, "step": 9453} {"train_info/time_between_train_steps": 0.003273487091064453, "step": 9453} {"info/global_step": 9454, "train_info/time_within_train_step": 2.756610155105591, "step": 9454} {"train_info/time_between_train_steps": 0.003206014633178711, "step": 9454} {"info/global_step": 9455, "train_info/time_within_train_step": 2.756516933441162, "step": 9455} {"train_info/time_between_train_steps": 0.003190755844116211, "step": 9455} {"info/global_step": 9456, "train_info/time_within_train_step": 2.7568442821502686, "step": 9456} {"train_info/time_between_train_steps": 0.0032052993774414062, "step": 9456} {"info/global_step": 9457, "train_info/time_within_train_step": 2.7558510303497314, "step": 9457} {"train_info/time_between_train_steps": 0.0031766891479492188, "step": 9457} {"info/global_step": 9458, "train_info/time_within_train_step": 2.75635027885437, "step": 9458} {"train_info/time_between_train_steps": 0.003185749053955078, "step": 9458} {"info/global_step": 9459, "train_info/time_within_train_step": 2.7561779022216797, "step": 9459} {"train_info/time_between_train_steps": 0.0032625198364257812, "step": 9459} {"info/global_step": 9460, "train_info/time_within_train_step": 2.7564120292663574, "step": 9460} {"train_info/time_between_train_steps": 0.0032243728637695312, "step": 9460} {"info/global_step": 9461, "train_info/time_within_train_step": 2.756385564804077, "step": 9461} {"train_info/time_between_train_steps": 0.003215789794921875, "step": 9461} {"info/global_step": 9462, "train_info/time_within_train_step": 2.7552614212036133, "step": 9462} {"train_info/time_between_train_steps": 0.003197908401489258, "step": 9462} {"info/global_step": 9463, "train_info/time_within_train_step": 2.756153106689453, "step": 9463} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 9463} {"info/global_step": 9464, "train_info/time_within_train_step": 2.7553138732910156, "step": 9464} {"train_info/time_between_train_steps": 0.0031659603118896484, "step": 9464} {"info/global_step": 9465, "train_info/time_within_train_step": 2.754476308822632, "step": 9465} {"train_info/time_between_train_steps": 0.0031981468200683594, "step": 9465} {"info/global_step": 9466, "train_info/time_within_train_step": 2.7558999061584473, "step": 9466} {"train_info/time_between_train_steps": 0.003187894821166992, "step": 9466} {"info/global_step": 9467, "train_info/time_within_train_step": 2.756324291229248, "step": 9467} {"train_info/time_between_train_steps": 0.003215312957763672, "step": 9467} {"info/global_step": 9468, "train_info/time_within_train_step": 2.755418539047241, "step": 9468} {"train_info/time_between_train_steps": 0.0031671524047851562, "step": 9468} {"info/global_step": 9469, "train_info/time_within_train_step": 2.756455421447754, "step": 9469} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 9469} {"info/global_step": 9470, "train_info/time_within_train_step": 2.7571518421173096, "step": 9470} {"train_info/time_between_train_steps": 0.003238201141357422, "step": 9470} {"info/global_step": 9471, "train_info/time_within_train_step": 2.7566394805908203, "step": 9471} {"train_info/time_between_train_steps": 0.003222227096557617, "step": 9471} {"info/global_step": 9472, "train_info/time_within_train_step": 2.7564384937286377, "step": 9472} {"train_info/time_between_train_steps": 0.0032231807708740234, "step": 9472} {"info/global_step": 9473, "train_info/time_within_train_step": 2.7564401626586914, "step": 9473} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 9473} {"info/global_step": 9474, "train_info/time_within_train_step": 2.756052017211914, "step": 9474} {"train_info/time_between_train_steps": 0.0032265186309814453, "step": 9474} {"info/global_step": 9475, "train_info/time_within_train_step": 3.008810043334961, "step": 9475} {"train_info/time_between_train_steps": 0.0031986236572265625, "step": 9475} {"info/global_step": 9476, "train_info/time_within_train_step": 2.7559428215026855, "step": 9476} {"train_info/time_between_train_steps": 0.0031905174255371094, "step": 9476} {"info/global_step": 9477, "train_info/time_within_train_step": 2.755202054977417, "step": 9477} {"train_info/time_between_train_steps": 0.003197908401489258, "step": 9477} {"info/global_step": 9478, "train_info/time_within_train_step": 2.755145788192749, "step": 9478} {"train_info/time_between_train_steps": 0.003170013427734375, "step": 9478} {"info/global_step": 9479, "train_info/time_within_train_step": 2.756152629852295, "step": 9479} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 9479} {"info/global_step": 9480, "train_info/time_within_train_step": 2.7555530071258545, "step": 9480} {"train_info/time_between_train_steps": 0.0032088756561279297, "step": 9480} {"info/global_step": 9481, "train_info/time_within_train_step": 2.7536888122558594, "step": 9481} {"train_info/time_between_train_steps": 0.0031740665435791016, "step": 9481} {"info/global_step": 9482, "train_info/time_within_train_step": 2.7560153007507324, "step": 9482} {"train_info/time_between_train_steps": 0.003324747085571289, "step": 9482} {"info/global_step": 9483, "train_info/time_within_train_step": 2.7557146549224854, "step": 9483} {"train_info/time_between_train_steps": 0.003336191177368164, "step": 9483} {"info/global_step": 9484, "train_info/time_within_train_step": 2.757577896118164, "step": 9484} {"train_info/time_between_train_steps": 0.003299713134765625, "step": 9484} {"info/global_step": 9485, "train_info/time_within_train_step": 2.758094310760498, "step": 9485} {"train_info/time_between_train_steps": 0.0033082962036132812, "step": 9485} {"info/global_step": 9486, "train_info/time_within_train_step": 2.75679612159729, "step": 9486} {"train_info/time_between_train_steps": 0.003312826156616211, "step": 9486} {"info/global_step": 9487, "train_info/time_within_train_step": 2.755988121032715, "step": 9487} {"train_info/time_between_train_steps": 0.0032761096954345703, "step": 9487} {"info/global_step": 9488, "train_info/time_within_train_step": 2.7577052116394043, "step": 9488} {"train_info/time_between_train_steps": 0.0033082962036132812, "step": 9488} {"info/global_step": 9489, "train_info/time_within_train_step": 2.7581944465637207, "step": 9489} {"train_info/time_between_train_steps": 0.0033063888549804688, "step": 9489} {"info/global_step": 9490, "train_info/time_within_train_step": 2.7571229934692383, "step": 9490} {"train_info/time_between_train_steps": 0.003364086151123047, "step": 9490} {"info/global_step": 9491, "train_info/time_within_train_step": 2.755570888519287, "step": 9491} {"train_info/time_between_train_steps": 0.0031495094299316406, "step": 9491} {"info/global_step": 9492, "train_info/time_within_train_step": 2.7553484439849854, "step": 9492} {"train_info/time_between_train_steps": 0.0032155513763427734, "step": 9492} {"info/global_step": 9493, "train_info/time_within_train_step": 2.7554776668548584, "step": 9493} {"train_info/time_between_train_steps": 0.0031752586364746094, "step": 9493} {"info/global_step": 9494, "train_info/time_within_train_step": 2.755699634552002, "step": 9494} {"train_info/time_between_train_steps": 0.0032110214233398438, "step": 9494} {"info/global_step": 9495, "train_info/time_within_train_step": 3.3302674293518066, "step": 9495} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 9495} {"info/global_step": 9496, "train_info/time_within_train_step": 2.755479335784912, "step": 9496} {"train_info/time_between_train_steps": 0.0032012462615966797, "step": 9496} {"info/global_step": 9497, "train_info/time_within_train_step": 2.7554807662963867, "step": 9497} {"train_info/time_between_train_steps": 0.0031599998474121094, "step": 9497} {"info/global_step": 9498, "train_info/time_within_train_step": 2.755680799484253, "step": 9498} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 9498} {"info/global_step": 9499, "train_info/time_within_train_step": 2.7553045749664307, "step": 9499} {"train_info/time_between_train_steps": 0.003168344497680664, "step": 9499} {"info/global_step": 9500, "train_info/time_within_train_step": 2.755711793899536, "step": 9500} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746593364, "_runtime": 27373}, "step": 9500} {"logs": {"train/loss": 2.9087, "train/learning_rate": 3.333333333333333e-05, "train/epoch": 11.01, "_timestamp": 1746593364, "_runtime": 27373}, "step": 9500} {"train_info/time_between_train_steps": 0.007644176483154297, "step": 9500} {"info/global_step": 9501, "train_info/time_within_train_step": 2.756286382675171, "step": 9501} {"train_info/time_between_train_steps": 0.003173828125, "step": 9501} {"info/global_step": 9502, "train_info/time_within_train_step": 2.756239891052246, "step": 9502} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 9502} {"info/global_step": 9503, "train_info/time_within_train_step": 2.7561399936676025, "step": 9503} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 9503} {"info/global_step": 9504, "train_info/time_within_train_step": 2.756228446960449, "step": 9504} {"train_info/time_between_train_steps": 0.0031862258911132812, "step": 9504} {"info/global_step": 9505, "train_info/time_within_train_step": 2.755953311920166, "step": 9505} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 9505} {"info/global_step": 9506, "train_info/time_within_train_step": 2.755795478820801, "step": 9506} {"train_info/time_between_train_steps": 0.0031533241271972656, "step": 9506} {"info/global_step": 9507, "train_info/time_within_train_step": 2.756047010421753, "step": 9507} {"train_info/time_between_train_steps": 0.003227710723876953, "step": 9507} {"info/global_step": 9508, "train_info/time_within_train_step": 2.756216526031494, "step": 9508} {"train_info/time_between_train_steps": 0.13337230682373047, "step": 9508} {"info/global_step": 9509, "train_info/time_within_train_step": 2.7563416957855225, "step": 9509} {"train_info/time_between_train_steps": 0.0032088756561279297, "step": 9509} {"info/global_step": 9510, "train_info/time_within_train_step": 2.7557904720306396, "step": 9510} {"train_info/time_between_train_steps": 0.003256559371948242, "step": 9510} {"info/global_step": 9511, "train_info/time_within_train_step": 2.7552669048309326, "step": 9511} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 9511} {"info/global_step": 9512, "train_info/time_within_train_step": 2.7538750171661377, "step": 9512} {"train_info/time_between_train_steps": 0.0031926631927490234, "step": 9512} {"info/global_step": 9513, "train_info/time_within_train_step": 2.7550692558288574, "step": 9513} {"train_info/time_between_train_steps": 0.003217458724975586, "step": 9513} {"info/global_step": 9514, "train_info/time_within_train_step": 2.7558579444885254, "step": 9514} {"train_info/time_between_train_steps": 0.003194570541381836, "step": 9514} {"info/global_step": 9515, "train_info/time_within_train_step": 2.756232500076294, "step": 9515} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 9515} {"info/global_step": 9516, "train_info/time_within_train_step": 2.755838394165039, "step": 9516} {"train_info/time_between_train_steps": 0.0032074451446533203, "step": 9516} {"info/global_step": 9517, "train_info/time_within_train_step": 2.755803346633911, "step": 9517} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 9517} {"info/global_step": 9518, "train_info/time_within_train_step": 2.7555902004241943, "step": 9518} {"train_info/time_between_train_steps": 0.003165721893310547, "step": 9518} {"info/global_step": 9519, "train_info/time_within_train_step": 2.755476236343384, "step": 9519} {"train_info/time_between_train_steps": 0.003177165985107422, "step": 9519} {"info/global_step": 9520, "train_info/time_within_train_step": 2.755204677581787, "step": 9520} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 9520} {"info/global_step": 9521, "train_info/time_within_train_step": 2.7569825649261475, "step": 9521} {"train_info/time_between_train_steps": 0.0032227039337158203, "step": 9521} {"info/global_step": 9522, "train_info/time_within_train_step": 2.755352735519409, "step": 9522} {"train_info/time_between_train_steps": 0.003211498260498047, "step": 9522} {"info/global_step": 9523, "train_info/time_within_train_step": 2.755463123321533, "step": 9523} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 9523} {"info/global_step": 9524, "train_info/time_within_train_step": 2.7568976879119873, "step": 9524} {"train_info/time_between_train_steps": 0.0032155513763427734, "step": 9524} {"info/global_step": 9525, "train_info/time_within_train_step": 2.757416248321533, "step": 9525} {"train_info/time_between_train_steps": 0.0032379627227783203, "step": 9525} {"info/global_step": 9526, "train_info/time_within_train_step": 2.7558679580688477, "step": 9526} {"train_info/time_between_train_steps": 0.003176450729370117, "step": 9526} {"info/global_step": 9527, "train_info/time_within_train_step": 2.75555157661438, "step": 9527} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 9527} {"info/global_step": 9528, "train_info/time_within_train_step": 2.7559943199157715, "step": 9528} {"train_info/time_between_train_steps": 0.003175020217895508, "step": 9528} {"info/global_step": 9529, "train_info/time_within_train_step": 2.7556238174438477, "step": 9529} {"train_info/time_between_train_steps": 0.003183126449584961, "step": 9529} {"info/global_step": 9530, "train_info/time_within_train_step": 2.7559714317321777, "step": 9530} {"train_info/time_between_train_steps": 0.0031888484954833984, "step": 9530} {"info/global_step": 9531, "train_info/time_within_train_step": 2.7558867931365967, "step": 9531} {"train_info/time_between_train_steps": 0.003202199935913086, "step": 9531} {"info/global_step": 9532, "train_info/time_within_train_step": 3.0060226917266846, "step": 9532} {"train_info/time_between_train_steps": 0.0032057762145996094, "step": 9532} {"info/global_step": 9533, "train_info/time_within_train_step": 2.7552011013031006, "step": 9533} {"train_info/time_between_train_steps": 0.0032613277435302734, "step": 9533} {"info/global_step": 9534, "train_info/time_within_train_step": 2.75508451461792, "step": 9534} {"train_info/time_between_train_steps": 0.003226757049560547, "step": 9534} {"info/global_step": 9535, "train_info/time_within_train_step": 2.755946636199951, "step": 9535} {"train_info/time_between_train_steps": 0.0031714439392089844, "step": 9535} {"info/global_step": 9536, "train_info/time_within_train_step": 2.7556450366973877, "step": 9536} {"train_info/time_between_train_steps": 0.0032591819763183594, "step": 9536} {"info/global_step": 9537, "train_info/time_within_train_step": 2.7555184364318848, "step": 9537} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 9537} {"info/global_step": 9538, "train_info/time_within_train_step": 2.755854845046997, "step": 9538} {"train_info/time_between_train_steps": 0.0031862258911132812, "step": 9538} {"info/global_step": 9539, "train_info/time_within_train_step": 2.756037712097168, "step": 9539} {"train_info/time_between_train_steps": 0.0031943321228027344, "step": 9539} {"info/global_step": 9540, "train_info/time_within_train_step": 2.756833076477051, "step": 9540} {"train_info/time_between_train_steps": 0.0031659603118896484, "step": 9540} {"info/global_step": 9541, "train_info/time_within_train_step": 2.7555792331695557, "step": 9541} {"train_info/time_between_train_steps": 0.003178119659423828, "step": 9541} {"info/global_step": 9542, "train_info/time_within_train_step": 2.7559664249420166, "step": 9542} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 9542} {"info/global_step": 9543, "train_info/time_within_train_step": 2.7573866844177246, "step": 9543} {"train_info/time_between_train_steps": 0.0032138824462890625, "step": 9543} {"info/global_step": 9544, "train_info/time_within_train_step": 2.756605863571167, "step": 9544} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 9544} {"info/global_step": 9545, "train_info/time_within_train_step": 2.7562875747680664, "step": 9545} {"train_info/time_between_train_steps": 0.0031659603118896484, "step": 9545} {"info/global_step": 9546, "train_info/time_within_train_step": 2.7555806636810303, "step": 9546} {"train_info/time_between_train_steps": 0.003169536590576172, "step": 9546} {"info/global_step": 9547, "train_info/time_within_train_step": 2.7548696994781494, "step": 9547} {"train_info/time_between_train_steps": 0.0032224655151367188, "step": 9547} {"info/global_step": 9548, "train_info/time_within_train_step": 2.755462646484375, "step": 9548} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 9548} {"info/global_step": 9549, "train_info/time_within_train_step": 2.7545223236083984, "step": 9549} {"train_info/time_between_train_steps": 0.0031676292419433594, "step": 9549} {"info/global_step": 9550, "train_info/time_within_train_step": 2.7550222873687744, "step": 9550} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746593503, "_runtime": 27512}, "step": 9550} {"logs": {"train/loss": 2.9057, "train/learning_rate": 2.9999999999999997e-05, "train/epoch": 11.02, "_timestamp": 1746593503, "_runtime": 27512}, "step": 9550} {"train_info/time_between_train_steps": 0.00686955451965332, "step": 9550} {"info/global_step": 9551, "train_info/time_within_train_step": 2.7560577392578125, "step": 9551} {"train_info/time_between_train_steps": 0.003147125244140625, "step": 9551} {"info/global_step": 9552, "train_info/time_within_train_step": 2.7558562755584717, "step": 9552} {"train_info/time_between_train_steps": 0.003131866455078125, "step": 9552} {"info/global_step": 9553, "train_info/time_within_train_step": 2.755758285522461, "step": 9553} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 9553} {"info/global_step": 9554, "train_info/time_within_train_step": 2.7552502155303955, "step": 9554} {"train_info/time_between_train_steps": 0.003230571746826172, "step": 9554} {"info/global_step": 9555, "train_info/time_within_train_step": 2.75602388381958, "step": 9555} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 9555} {"info/global_step": 9556, "train_info/time_within_train_step": 2.7556605339050293, "step": 9556} {"train_info/time_between_train_steps": 0.0031833648681640625, "step": 9556} {"info/global_step": 9557, "train_info/time_within_train_step": 2.7564010620117188, "step": 9557} {"train_info/time_between_train_steps": 0.0031685829162597656, "step": 9557} {"info/global_step": 9558, "train_info/time_within_train_step": 2.755582332611084, "step": 9558} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 9558} {"info/global_step": 9559, "train_info/time_within_train_step": 2.7549524307250977, "step": 9559} {"train_info/time_between_train_steps": 0.003212451934814453, "step": 9559} {"info/global_step": 9560, "train_info/time_within_train_step": 2.7574851512908936, "step": 9560} {"train_info/time_between_train_steps": 0.003167867660522461, "step": 9560} {"info/global_step": 9561, "train_info/time_within_train_step": 2.756767511367798, "step": 9561} {"train_info/time_between_train_steps": 0.0031740665435791016, "step": 9561} {"info/global_step": 9562, "train_info/time_within_train_step": 2.7563321590423584, "step": 9562} {"train_info/time_between_train_steps": 0.0031502246856689453, "step": 9562} {"info/global_step": 9563, "train_info/time_within_train_step": 2.7555742263793945, "step": 9563} {"train_info/time_between_train_steps": 0.003131866455078125, "step": 9563} {"info/global_step": 9564, "train_info/time_within_train_step": 2.75543212890625, "step": 9564} {"train_info/time_between_train_steps": 0.00313568115234375, "step": 9564} {"info/global_step": 9565, "train_info/time_within_train_step": 2.7543914318084717, "step": 9565} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 9565} {"info/global_step": 9566, "train_info/time_within_train_step": 2.754378318786621, "step": 9566} {"train_info/time_between_train_steps": 0.003172636032104492, "step": 9566} {"info/global_step": 9567, "train_info/time_within_train_step": 2.755310297012329, "step": 9567} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 9567} {"info/global_step": 9568, "train_info/time_within_train_step": 2.755228042602539, "step": 9568} {"train_info/time_between_train_steps": 0.0031692981719970703, "step": 9568} {"info/global_step": 9569, "train_info/time_within_train_step": 2.756610870361328, "step": 9569} {"train_info/time_between_train_steps": 0.003209352493286133, "step": 9569} {"info/global_step": 9570, "train_info/time_within_train_step": 2.7556755542755127, "step": 9570} {"train_info/time_between_train_steps": 0.0031588077545166016, "step": 9570} {"info/global_step": 9571, "train_info/time_within_train_step": 2.886406421661377, "step": 9571} {"train_info/time_between_train_steps": 0.003201007843017578, "step": 9571} {"info/global_step": 9572, "train_info/time_within_train_step": 2.756056070327759, "step": 9572} {"train_info/time_between_train_steps": 0.003189563751220703, "step": 9572} {"info/global_step": 9573, "train_info/time_within_train_step": 3.012033700942993, "step": 9573} {"train_info/time_between_train_steps": 0.0031957626342773438, "step": 9573} {"info/global_step": 9574, "train_info/time_within_train_step": 2.757061004638672, "step": 9574} {"train_info/time_between_train_steps": 0.003184795379638672, "step": 9574} {"info/global_step": 9575, "train_info/time_within_train_step": 2.754777193069458, "step": 9575} {"train_info/time_between_train_steps": 0.0031714439392089844, "step": 9575} {"info/global_step": 9576, "train_info/time_within_train_step": 2.7554330825805664, "step": 9576} {"train_info/time_between_train_steps": 0.003242015838623047, "step": 9576} {"info/global_step": 9577, "train_info/time_within_train_step": 2.7551558017730713, "step": 9577} {"train_info/time_between_train_steps": 0.0032057762145996094, "step": 9577} {"info/global_step": 9578, "train_info/time_within_train_step": 2.755202054977417, "step": 9578} {"train_info/time_between_train_steps": 0.003206968307495117, "step": 9578} {"info/global_step": 9579, "train_info/time_within_train_step": 2.754714250564575, "step": 9579} {"train_info/time_between_train_steps": 0.0031800270080566406, "step": 9579} {"info/global_step": 9580, "train_info/time_within_train_step": 2.755316972732544, "step": 9580} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 9580} {"info/global_step": 9581, "train_info/time_within_train_step": 2.7549538612365723, "step": 9581} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 9581} {"info/global_step": 9582, "train_info/time_within_train_step": 2.75469708442688, "step": 9582} {"train_info/time_between_train_steps": 0.003196239471435547, "step": 9582} {"info/global_step": 9583, "train_info/time_within_train_step": 2.7552666664123535, "step": 9583} {"train_info/time_between_train_steps": 0.0031719207763671875, "step": 9583} {"info/global_step": 9584, "train_info/time_within_train_step": 2.7555527687072754, "step": 9584} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 9584} {"info/global_step": 9585, "train_info/time_within_train_step": 2.755214214324951, "step": 9585} {"train_info/time_between_train_steps": 0.0031654834747314453, "step": 9585} {"info/global_step": 9586, "train_info/time_within_train_step": 2.756192922592163, "step": 9586} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 9586} {"info/global_step": 9587, "train_info/time_within_train_step": 2.7566075325012207, "step": 9587} {"train_info/time_between_train_steps": 0.0032057762145996094, "step": 9587} {"info/global_step": 9588, "train_info/time_within_train_step": 2.756762981414795, "step": 9588} {"train_info/time_between_train_steps": 0.0031783580780029297, "step": 9588} {"info/global_step": 9589, "train_info/time_within_train_step": 2.7570462226867676, "step": 9589} {"train_info/time_between_train_steps": 0.0031938552856445312, "step": 9589} {"info/global_step": 9590, "train_info/time_within_train_step": 2.7573201656341553, "step": 9590} {"train_info/time_between_train_steps": 0.0031964778900146484, "step": 9590} {"info/global_step": 9591, "train_info/time_within_train_step": 2.754976272583008, "step": 9591} {"train_info/time_between_train_steps": 0.003198385238647461, "step": 9591} {"info/global_step": 9592, "train_info/time_within_train_step": 2.756741762161255, "step": 9592} {"train_info/time_between_train_steps": 0.003174304962158203, "step": 9592} {"info/global_step": 9593, "train_info/time_within_train_step": 2.7555737495422363, "step": 9593} {"train_info/time_between_train_steps": 0.0031723976135253906, "step": 9593} {"info/global_step": 9594, "train_info/time_within_train_step": 2.7558512687683105, "step": 9594} {"train_info/time_between_train_steps": 0.003153562545776367, "step": 9594} {"info/global_step": 9595, "train_info/time_within_train_step": 2.756563425064087, "step": 9595} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 9595} {"info/global_step": 9596, "train_info/time_within_train_step": 2.7552576065063477, "step": 9596} {"train_info/time_between_train_steps": 0.0031871795654296875, "step": 9596} {"info/global_step": 9597, "train_info/time_within_train_step": 2.757011651992798, "step": 9597} {"train_info/time_between_train_steps": 0.003220796585083008, "step": 9597} {"info/global_step": 9598, "train_info/time_within_train_step": 2.7556345462799072, "step": 9598} {"train_info/time_between_train_steps": 0.0031974315643310547, "step": 9598} {"info/global_step": 9599, "train_info/time_within_train_step": 2.756319046020508, "step": 9599} {"train_info/time_between_train_steps": 0.00316619873046875, "step": 9599} {"info/global_step": 9600, "train_info/time_within_train_step": 2.755455493927002, "step": 9600} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746593641, "_runtime": 27650}, "step": 9600} {"logs": {"train/loss": 2.89, "train/learning_rate": 2.6666666666666667e-05, "train/epoch": 11.02, "_timestamp": 1746593641, "_runtime": 27650}, "step": 9600} {"train_info/time_between_train_steps": 13.151220321655273, "step": 9600} {"info/global_step": 9601, "train_info/time_within_train_step": 2.5381505489349365, "step": 9601} {"train_info/time_between_train_steps": 0.006415367126464844, "step": 9601} {"info/global_step": 9602, "train_info/time_within_train_step": 2.612501621246338, "step": 9602} {"train_info/time_between_train_steps": 0.006559133529663086, "step": 9602} {"info/global_step": 9603, "train_info/time_within_train_step": 2.7428689002990723, "step": 9603} {"train_info/time_between_train_steps": 0.006312131881713867, "step": 9603} {"info/global_step": 9604, "train_info/time_within_train_step": 2.754626750946045, "step": 9604} {"train_info/time_between_train_steps": 0.006397724151611328, "step": 9604} {"info/global_step": 9605, "train_info/time_within_train_step": 2.757934808731079, "step": 9605} {"train_info/time_between_train_steps": 0.006489753723144531, "step": 9605} {"info/global_step": 9606, "train_info/time_within_train_step": 2.759312868118286, "step": 9606} {"train_info/time_between_train_steps": 0.006487846374511719, "step": 9606} {"info/global_step": 9607, "train_info/time_within_train_step": 2.758885622024536, "step": 9607} {"train_info/time_between_train_steps": 0.006482362747192383, "step": 9607} {"info/global_step": 9608, "train_info/time_within_train_step": 2.759812116622925, "step": 9608} {"train_info/time_between_train_steps": 0.0065343379974365234, "step": 9608} {"info/global_step": 9609, "train_info/time_within_train_step": 2.7598061561584473, "step": 9609} {"train_info/time_between_train_steps": 0.006510734558105469, "step": 9609} {"info/global_step": 9610, "train_info/time_within_train_step": 2.7589471340179443, "step": 9610} {"train_info/time_between_train_steps": 0.006491899490356445, "step": 9610} {"info/global_step": 9611, "train_info/time_within_train_step": 2.7595720291137695, "step": 9611} {"train_info/time_between_train_steps": 0.006455898284912109, "step": 9611} {"info/global_step": 9612, "train_info/time_within_train_step": 2.7602384090423584, "step": 9612} {"train_info/time_between_train_steps": 0.006554603576660156, "step": 9612} {"info/global_step": 9613, "train_info/time_within_train_step": 2.759612560272217, "step": 9613} {"train_info/time_between_train_steps": 0.006531953811645508, "step": 9613} {"info/global_step": 9614, "train_info/time_within_train_step": 2.760235548019409, "step": 9614} {"train_info/time_between_train_steps": 0.006531238555908203, "step": 9614} {"info/global_step": 9615, "train_info/time_within_train_step": 2.760786771774292, "step": 9615} {"train_info/time_between_train_steps": 0.006438493728637695, "step": 9615} {"info/global_step": 9616, "train_info/time_within_train_step": 2.7597830295562744, "step": 9616} {"train_info/time_between_train_steps": 0.0065190792083740234, "step": 9616} {"info/global_step": 9617, "train_info/time_within_train_step": 2.7589433193206787, "step": 9617} {"train_info/time_between_train_steps": 0.006507158279418945, "step": 9617} {"info/global_step": 9618, "train_info/time_within_train_step": 2.7593932151794434, "step": 9618} {"train_info/time_between_train_steps": 0.006479024887084961, "step": 9618} {"info/global_step": 9619, "train_info/time_within_train_step": 2.7593045234680176, "step": 9619} {"train_info/time_between_train_steps": 0.0065767765045166016, "step": 9619} {"info/global_step": 9620, "train_info/time_within_train_step": 2.7583484649658203, "step": 9620} {"train_info/time_between_train_steps": 0.0031425952911376953, "step": 9620} {"info/global_step": 9621, "train_info/time_within_train_step": 2.7564375400543213, "step": 9621} {"train_info/time_between_train_steps": 0.0031805038452148438, "step": 9621} {"info/global_step": 9622, "train_info/time_within_train_step": 2.7565202713012695, "step": 9622} {"train_info/time_between_train_steps": 0.0031576156616210938, "step": 9622} {"info/global_step": 9623, "train_info/time_within_train_step": 2.7571723461151123, "step": 9623} {"train_info/time_between_train_steps": 0.0031998157501220703, "step": 9623} {"info/global_step": 9624, "train_info/time_within_train_step": 2.7563984394073486, "step": 9624} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 9624} {"info/global_step": 9625, "train_info/time_within_train_step": 2.7573401927948, "step": 9625} {"train_info/time_between_train_steps": 0.003144979476928711, "step": 9625} {"info/global_step": 9626, "train_info/time_within_train_step": 2.755145788192749, "step": 9626} {"train_info/time_between_train_steps": 0.0031485557556152344, "step": 9626} {"info/global_step": 9627, "train_info/time_within_train_step": 2.7566304206848145, "step": 9627} {"train_info/time_between_train_steps": 0.0031626224517822266, "step": 9627} {"info/global_step": 9628, "train_info/time_within_train_step": 2.758678913116455, "step": 9628} {"train_info/time_between_train_steps": 0.003153085708618164, "step": 9628} {"info/global_step": 9629, "train_info/time_within_train_step": 3.0164926052093506, "step": 9629} {"train_info/time_between_train_steps": 0.003207683563232422, "step": 9629} {"info/global_step": 9630, "train_info/time_within_train_step": 2.7576961517333984, "step": 9630} {"train_info/time_between_train_steps": 0.0064220428466796875, "step": 9630} {"info/global_step": 9631, "train_info/time_within_train_step": 2.759765625, "step": 9631} {"train_info/time_between_train_steps": 0.006481647491455078, "step": 9631} {"info/global_step": 9632, "train_info/time_within_train_step": 2.7600643634796143, "step": 9632} {"train_info/time_between_train_steps": 0.0065419673919677734, "step": 9632} {"info/global_step": 9633, "train_info/time_within_train_step": 2.759775400161743, "step": 9633} {"train_info/time_between_train_steps": 0.13381671905517578, "step": 9633} {"info/global_step": 9634, "train_info/time_within_train_step": 2.7585089206695557, "step": 9634} {"train_info/time_between_train_steps": 0.006493091583251953, "step": 9634} {"info/global_step": 9635, "train_info/time_within_train_step": 2.760923385620117, "step": 9635} {"train_info/time_between_train_steps": 0.006504535675048828, "step": 9635} {"info/global_step": 9636, "train_info/time_within_train_step": 2.759870767593384, "step": 9636} {"train_info/time_between_train_steps": 0.006476402282714844, "step": 9636} {"info/global_step": 9637, "train_info/time_within_train_step": 2.7606375217437744, "step": 9637} {"train_info/time_between_train_steps": 0.0033266544342041016, "step": 9637} {"info/global_step": 9638, "train_info/time_within_train_step": 2.757654905319214, "step": 9638} {"train_info/time_between_train_steps": 0.0033512115478515625, "step": 9638} {"info/global_step": 9639, "train_info/time_within_train_step": 2.757528305053711, "step": 9639} {"train_info/time_between_train_steps": 0.003227710723876953, "step": 9639} {"info/global_step": 9640, "train_info/time_within_train_step": 2.7563257217407227, "step": 9640} {"train_info/time_between_train_steps": 0.003648519515991211, "step": 9640} {"info/global_step": 9641, "train_info/time_within_train_step": 2.7556183338165283, "step": 9641} {"train_info/time_between_train_steps": 0.003252267837524414, "step": 9641} {"info/global_step": 9642, "train_info/time_within_train_step": 2.7547671794891357, "step": 9642} {"train_info/time_between_train_steps": 0.0031976699829101562, "step": 9642} {"info/global_step": 9643, "train_info/time_within_train_step": 2.756819725036621, "step": 9643} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 9643} {"info/global_step": 9644, "train_info/time_within_train_step": 2.7560994625091553, "step": 9644} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 9644} {"info/global_step": 9645, "train_info/time_within_train_step": 2.7547707557678223, "step": 9645} {"train_info/time_between_train_steps": 0.0032320022583007812, "step": 9645} {"info/global_step": 9646, "train_info/time_within_train_step": 2.755425214767456, "step": 9646} {"train_info/time_between_train_steps": 0.0031807422637939453, "step": 9646} {"info/global_step": 9647, "train_info/time_within_train_step": 2.7557222843170166, "step": 9647} {"train_info/time_between_train_steps": 0.00323486328125, "step": 9647} {"info/global_step": 9648, "train_info/time_within_train_step": 2.755810499191284, "step": 9648} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 9648} {"info/global_step": 9649, "train_info/time_within_train_step": 2.7557754516601562, "step": 9649} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 9649} {"info/global_step": 9650, "train_info/time_within_train_step": 2.7552547454833984, "step": 9650} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746593793, "_runtime": 27802}, "step": 9650} {"logs": {"train/loss": 2.8844, "train/learning_rate": 2.3333333333333332e-05, "train/epoch": 11.03, "_timestamp": 1746593793, "_runtime": 27802}, "step": 9650} {"train_info/time_between_train_steps": 0.007314205169677734, "step": 9650} {"info/global_step": 9651, "train_info/time_within_train_step": 2.754971504211426, "step": 9651} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 9651} {"info/global_step": 9652, "train_info/time_within_train_step": 2.755589246749878, "step": 9652} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 9652} {"info/global_step": 9653, "train_info/time_within_train_step": 2.75486159324646, "step": 9653} {"train_info/time_between_train_steps": 0.003396749496459961, "step": 9653} {"info/global_step": 9654, "train_info/time_within_train_step": 2.7565815448760986, "step": 9654} {"train_info/time_between_train_steps": 0.003245830535888672, "step": 9654} {"info/global_step": 9655, "train_info/time_within_train_step": 2.75642728805542, "step": 9655} {"train_info/time_between_train_steps": 0.0032029151916503906, "step": 9655} {"info/global_step": 9656, "train_info/time_within_train_step": 2.7544589042663574, "step": 9656} {"train_info/time_between_train_steps": 0.0032052993774414062, "step": 9656} {"info/global_step": 9657, "train_info/time_within_train_step": 2.7558538913726807, "step": 9657} {"train_info/time_between_train_steps": 0.0032019615173339844, "step": 9657} {"info/global_step": 9658, "train_info/time_within_train_step": 2.7562942504882812, "step": 9658} {"train_info/time_between_train_steps": 0.003179311752319336, "step": 9658} {"info/global_step": 9659, "train_info/time_within_train_step": 2.7547435760498047, "step": 9659} {"train_info/time_between_train_steps": 0.0031952857971191406, "step": 9659} {"info/global_step": 9660, "train_info/time_within_train_step": 2.7534713745117188, "step": 9660} {"train_info/time_between_train_steps": 0.003177165985107422, "step": 9660} {"info/global_step": 9661, "train_info/time_within_train_step": 2.7561066150665283, "step": 9661} {"train_info/time_between_train_steps": 0.0032024383544921875, "step": 9661} {"info/global_step": 9662, "train_info/time_within_train_step": 2.756510019302368, "step": 9662} {"train_info/time_between_train_steps": 0.003195524215698242, "step": 9662} {"info/global_step": 9663, "train_info/time_within_train_step": 2.7551891803741455, "step": 9663} {"train_info/time_between_train_steps": 0.0032405853271484375, "step": 9663} {"info/global_step": 9664, "train_info/time_within_train_step": 2.7555832862854004, "step": 9664} {"train_info/time_between_train_steps": 0.003240823745727539, "step": 9664} {"info/global_step": 9665, "train_info/time_within_train_step": 2.7548530101776123, "step": 9665} {"train_info/time_between_train_steps": 0.003224611282348633, "step": 9665} {"info/global_step": 9666, "train_info/time_within_train_step": 2.7543437480926514, "step": 9666} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 9666} {"info/global_step": 9667, "train_info/time_within_train_step": 2.7554943561553955, "step": 9667} {"train_info/time_between_train_steps": 0.0032377243041992188, "step": 9667} {"info/global_step": 9668, "train_info/time_within_train_step": 2.754931926727295, "step": 9668} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 9668} {"info/global_step": 9669, "train_info/time_within_train_step": 2.7557129859924316, "step": 9669} {"train_info/time_between_train_steps": 0.0036306381225585938, "step": 9669} {"info/global_step": 9670, "train_info/time_within_train_step": 2.7554819583892822, "step": 9670} {"train_info/time_between_train_steps": 0.0032515525817871094, "step": 9670} {"info/global_step": 9671, "train_info/time_within_train_step": 2.7552502155303955, "step": 9671} {"train_info/time_between_train_steps": 0.0032324790954589844, "step": 9671} {"info/global_step": 9672, "train_info/time_within_train_step": 2.7559051513671875, "step": 9672} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 9672} {"info/global_step": 9673, "train_info/time_within_train_step": 2.7541849613189697, "step": 9673} {"train_info/time_between_train_steps": 0.003186464309692383, "step": 9673} {"info/global_step": 9674, "train_info/time_within_train_step": 2.756321668624878, "step": 9674} {"train_info/time_between_train_steps": 0.0031859874725341797, "step": 9674} {"info/global_step": 9675, "train_info/time_within_train_step": 2.7538158893585205, "step": 9675} {"train_info/time_between_train_steps": 0.0031960010528564453, "step": 9675} {"info/global_step": 9676, "train_info/time_within_train_step": 2.7550153732299805, "step": 9676} {"train_info/time_between_train_steps": 0.0031931400299072266, "step": 9676} {"info/global_step": 9677, "train_info/time_within_train_step": 2.753185987472534, "step": 9677} {"train_info/time_between_train_steps": 0.0031778812408447266, "step": 9677} {"info/global_step": 9678, "train_info/time_within_train_step": 2.75557541847229, "step": 9678} {"train_info/time_between_train_steps": 0.0032172203063964844, "step": 9678} {"info/global_step": 9679, "train_info/time_within_train_step": 2.7562177181243896, "step": 9679} {"train_info/time_between_train_steps": 0.0032014846801757812, "step": 9679} {"info/global_step": 9680, "train_info/time_within_train_step": 2.756748914718628, "step": 9680} {"train_info/time_between_train_steps": 0.003197908401489258, "step": 9680} {"info/global_step": 9681, "train_info/time_within_train_step": 2.7546753883361816, "step": 9681} {"train_info/time_between_train_steps": 0.0032041072845458984, "step": 9681} {"info/global_step": 9682, "train_info/time_within_train_step": 2.7549309730529785, "step": 9682} {"train_info/time_between_train_steps": 0.0032160282135009766, "step": 9682} {"info/global_step": 9683, "train_info/time_within_train_step": 2.7561583518981934, "step": 9683} {"train_info/time_between_train_steps": 0.0031647682189941406, "step": 9683} {"info/global_step": 9684, "train_info/time_within_train_step": 2.753817558288574, "step": 9684} {"train_info/time_between_train_steps": 0.0031583309173583984, "step": 9684} {"info/global_step": 9685, "train_info/time_within_train_step": 2.75434947013855, "step": 9685} {"train_info/time_between_train_steps": 0.0032646656036376953, "step": 9685} {"info/global_step": 9686, "train_info/time_within_train_step": 2.7549312114715576, "step": 9686} {"train_info/time_between_train_steps": 0.0031838417053222656, "step": 9686} {"info/global_step": 9687, "train_info/time_within_train_step": 2.75413179397583, "step": 9687} {"train_info/time_between_train_steps": 0.0031616687774658203, "step": 9687} {"info/global_step": 9688, "train_info/time_within_train_step": 2.754652976989746, "step": 9688} {"train_info/time_between_train_steps": 0.0031969547271728516, "step": 9688} {"info/global_step": 9689, "train_info/time_within_train_step": 2.754135847091675, "step": 9689} {"train_info/time_between_train_steps": 0.00319671630859375, "step": 9689} {"info/global_step": 9690, "train_info/time_within_train_step": 2.755279541015625, "step": 9690} {"train_info/time_between_train_steps": 0.00319671630859375, "step": 9690} {"info/global_step": 9691, "train_info/time_within_train_step": 2.756027936935425, "step": 9691} {"train_info/time_between_train_steps": 0.003152132034301758, "step": 9691} {"info/global_step": 9692, "train_info/time_within_train_step": 2.7555623054504395, "step": 9692} {"train_info/time_between_train_steps": 0.003210783004760742, "step": 9692} {"info/global_step": 9693, "train_info/time_within_train_step": 2.755689859390259, "step": 9693} {"train_info/time_between_train_steps": 0.003196239471435547, "step": 9693} {"info/global_step": 9694, "train_info/time_within_train_step": 2.755667209625244, "step": 9694} {"train_info/time_between_train_steps": 0.0032079219818115234, "step": 9694} {"info/global_step": 9695, "train_info/time_within_train_step": 2.755547523498535, "step": 9695} {"train_info/time_between_train_steps": 0.003138303756713867, "step": 9695} {"info/global_step": 9696, "train_info/time_within_train_step": 2.8896069526672363, "step": 9696} {"train_info/time_between_train_steps": 0.0032432079315185547, "step": 9696} {"info/global_step": 9697, "train_info/time_within_train_step": 2.756098747253418, "step": 9697} {"train_info/time_between_train_steps": 0.003229856491088867, "step": 9697} {"info/global_step": 9698, "train_info/time_within_train_step": 2.7546772956848145, "step": 9698} {"train_info/time_between_train_steps": 0.003167390823364258, "step": 9698} {"info/global_step": 9699, "train_info/time_within_train_step": 2.7551822662353516, "step": 9699} {"train_info/time_between_train_steps": 0.003224611282348633, "step": 9699} {"info/global_step": 9700, "train_info/time_within_train_step": 2.7545487880706787, "step": 9700} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746593931, "_runtime": 27940}, "step": 9700} {"logs": {"train/loss": 2.8821, "train/learning_rate": 1.9999999999999998e-05, "train/epoch": 11.03, "_timestamp": 1746593931, "_runtime": 27940}, "step": 9700} {"train_info/time_between_train_steps": 0.007299184799194336, "step": 9700} {"info/global_step": 9701, "train_info/time_within_train_step": 2.753908395767212, "step": 9701} {"train_info/time_between_train_steps": 0.0032045841217041016, "step": 9701} {"info/global_step": 9702, "train_info/time_within_train_step": 2.756071090698242, "step": 9702} {"train_info/time_between_train_steps": 0.003188610076904297, "step": 9702} {"info/global_step": 9703, "train_info/time_within_train_step": 2.754899024963379, "step": 9703} {"train_info/time_between_train_steps": 0.003191709518432617, "step": 9703} {"info/global_step": 9704, "train_info/time_within_train_step": 2.754631757736206, "step": 9704} {"train_info/time_between_train_steps": 0.0031642913818359375, "step": 9704} {"info/global_step": 9705, "train_info/time_within_train_step": 2.7542524337768555, "step": 9705} {"train_info/time_between_train_steps": 0.0032205581665039062, "step": 9705} {"info/global_step": 9706, "train_info/time_within_train_step": 2.7545437812805176, "step": 9706} {"train_info/time_between_train_steps": 0.0032329559326171875, "step": 9706} {"info/global_step": 9707, "train_info/time_within_train_step": 2.7550997734069824, "step": 9707} {"train_info/time_between_train_steps": 0.0031898021697998047, "step": 9707} {"info/global_step": 9708, "train_info/time_within_train_step": 2.7549641132354736, "step": 9708} {"train_info/time_between_train_steps": 0.0031850337982177734, "step": 9708} {"info/global_step": 9709, "train_info/time_within_train_step": 2.754570484161377, "step": 9709} {"train_info/time_between_train_steps": 0.0031774044036865234, "step": 9709} {"info/global_step": 9710, "train_info/time_within_train_step": 2.755871534347534, "step": 9710} {"train_info/time_between_train_steps": 0.003161191940307617, "step": 9710} {"info/global_step": 9711, "train_info/time_within_train_step": 2.756834030151367, "step": 9711} {"train_info/time_between_train_steps": 0.003365755081176758, "step": 9711} {"info/global_step": 9712, "train_info/time_within_train_step": 2.7569150924682617, "step": 9712} {"train_info/time_between_train_steps": 0.003350496292114258, "step": 9712} {"info/global_step": 9713, "train_info/time_within_train_step": 2.756192922592163, "step": 9713} {"train_info/time_between_train_steps": 0.0033271312713623047, "step": 9713} {"info/global_step": 9714, "train_info/time_within_train_step": 2.7565412521362305, "step": 9714} {"train_info/time_between_train_steps": 0.0033190250396728516, "step": 9714} {"info/global_step": 9715, "train_info/time_within_train_step": 2.7563860416412354, "step": 9715} {"train_info/time_between_train_steps": 0.0033164024353027344, "step": 9715} {"info/global_step": 9716, "train_info/time_within_train_step": 2.755415678024292, "step": 9716} {"train_info/time_between_train_steps": 0.003321409225463867, "step": 9716} {"info/global_step": 9717, "train_info/time_within_train_step": 2.7558035850524902, "step": 9717} {"train_info/time_between_train_steps": 0.0033521652221679688, "step": 9717} {"info/global_step": 9718, "train_info/time_within_train_step": 2.756596326828003, "step": 9718} {"train_info/time_between_train_steps": 0.0033063888549804688, "step": 9718} {"info/global_step": 9719, "train_info/time_within_train_step": 2.7565903663635254, "step": 9719} {"train_info/time_between_train_steps": 0.0033338069915771484, "step": 9719} {"info/global_step": 9720, "train_info/time_within_train_step": 2.7570526599884033, "step": 9720} {"train_info/time_between_train_steps": 0.003413677215576172, "step": 9720} {"info/global_step": 9721, "train_info/time_within_train_step": 2.7551708221435547, "step": 9721} {"train_info/time_between_train_steps": 0.003303050994873047, "step": 9721} {"info/global_step": 9722, "train_info/time_within_train_step": 3.030914545059204, "step": 9722} {"train_info/time_between_train_steps": 0.0033349990844726562, "step": 9722} {"info/global_step": 9723, "train_info/time_within_train_step": 2.755669593811035, "step": 9723} {"train_info/time_between_train_steps": 0.0033333301544189453, "step": 9723} {"info/global_step": 9724, "train_info/time_within_train_step": 2.757154941558838, "step": 9724} {"train_info/time_between_train_steps": 0.0033521652221679688, "step": 9724} {"info/global_step": 9725, "train_info/time_within_train_step": 2.7566535472869873, "step": 9725} {"train_info/time_between_train_steps": 0.003343343734741211, "step": 9725} {"info/global_step": 9726, "train_info/time_within_train_step": 2.756330728530884, "step": 9726} {"train_info/time_between_train_steps": 0.003331422805786133, "step": 9726} {"info/global_step": 9727, "train_info/time_within_train_step": 2.756312847137451, "step": 9727} {"train_info/time_between_train_steps": 0.003316164016723633, "step": 9727} {"info/global_step": 9728, "train_info/time_within_train_step": 2.757228136062622, "step": 9728} {"train_info/time_between_train_steps": 0.003342151641845703, "step": 9728} {"info/global_step": 9729, "train_info/time_within_train_step": 2.756761074066162, "step": 9729} {"train_info/time_between_train_steps": 0.0033159255981445312, "step": 9729} {"info/global_step": 9730, "train_info/time_within_train_step": 2.757364273071289, "step": 9730} {"train_info/time_between_train_steps": 0.0034112930297851562, "step": 9730} {"info/global_step": 9731, "train_info/time_within_train_step": 2.75624680519104, "step": 9731} {"train_info/time_between_train_steps": 0.003360271453857422, "step": 9731} {"info/global_step": 9732, "train_info/time_within_train_step": 2.757035732269287, "step": 9732} {"train_info/time_between_train_steps": 0.0033478736877441406, "step": 9732} {"info/global_step": 9733, "train_info/time_within_train_step": 2.7560880184173584, "step": 9733} {"train_info/time_between_train_steps": 0.0032999515533447266, "step": 9733} {"info/global_step": 9734, "train_info/time_within_train_step": 2.755803108215332, "step": 9734} {"train_info/time_between_train_steps": 0.003359556198120117, "step": 9734} {"info/global_step": 9735, "train_info/time_within_train_step": 2.7557144165039062, "step": 9735} {"train_info/time_between_train_steps": 0.003364086151123047, "step": 9735} {"info/global_step": 9736, "train_info/time_within_train_step": 2.7543766498565674, "step": 9736} {"train_info/time_between_train_steps": 0.003337383270263672, "step": 9736} {"info/global_step": 9737, "train_info/time_within_train_step": 2.756362199783325, "step": 9737} {"train_info/time_between_train_steps": 0.003379344940185547, "step": 9737} {"info/global_step": 9738, "train_info/time_within_train_step": 2.7559471130371094, "step": 9738} {"train_info/time_between_train_steps": 0.0033092498779296875, "step": 9738} {"info/global_step": 9739, "train_info/time_within_train_step": 2.7575249671936035, "step": 9739} {"train_info/time_between_train_steps": 0.003343820571899414, "step": 9739} {"info/global_step": 9740, "train_info/time_within_train_step": 2.7570934295654297, "step": 9740} {"train_info/time_between_train_steps": 0.003325223922729492, "step": 9740} {"info/global_step": 9741, "train_info/time_within_train_step": 2.7561159133911133, "step": 9741} {"train_info/time_between_train_steps": 0.003316164016723633, "step": 9741} {"info/global_step": 9742, "train_info/time_within_train_step": 2.7572014331817627, "step": 9742} {"train_info/time_between_train_steps": 0.003322124481201172, "step": 9742} {"info/global_step": 9743, "train_info/time_within_train_step": 2.755704402923584, "step": 9743} {"train_info/time_between_train_steps": 0.003362417221069336, "step": 9743} {"info/global_step": 9744, "train_info/time_within_train_step": 2.7550160884857178, "step": 9744} {"train_info/time_between_train_steps": 0.0033605098724365234, "step": 9744} {"info/global_step": 9745, "train_info/time_within_train_step": 3.3243801593780518, "step": 9745} {"train_info/time_between_train_steps": 0.0033416748046875, "step": 9745} {"info/global_step": 9746, "train_info/time_within_train_step": 2.756540298461914, "step": 9746} {"train_info/time_between_train_steps": 0.003370046615600586, "step": 9746} {"info/global_step": 9747, "train_info/time_within_train_step": 2.7553763389587402, "step": 9747} {"train_info/time_between_train_steps": 0.003362894058227539, "step": 9747} {"info/global_step": 9748, "train_info/time_within_train_step": 2.756248950958252, "step": 9748} {"train_info/time_between_train_steps": 0.003310680389404297, "step": 9748} {"info/global_step": 9749, "train_info/time_within_train_step": 2.756622076034546, "step": 9749} {"train_info/time_between_train_steps": 0.0033104419708251953, "step": 9749} {"info/global_step": 9750, "train_info/time_within_train_step": 2.756376266479492, "step": 9750} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746594070, "_runtime": 28079}, "step": 9750} {"logs": {"train/loss": 2.8918, "train/learning_rate": 1.6666666666666664e-05, "train/epoch": 11.04, "_timestamp": 1746594070, "_runtime": 28079}, "step": 9750} {"train_info/time_between_train_steps": 0.00712275505065918, "step": 9750} {"info/global_step": 9751, "train_info/time_within_train_step": 2.7569661140441895, "step": 9751} {"train_info/time_between_train_steps": 0.0033636093139648438, "step": 9751} {"info/global_step": 9752, "train_info/time_within_train_step": 2.7564573287963867, "step": 9752} {"train_info/time_between_train_steps": 0.003303050994873047, "step": 9752} {"info/global_step": 9753, "train_info/time_within_train_step": 2.7560057640075684, "step": 9753} {"train_info/time_between_train_steps": 0.0033817291259765625, "step": 9753} {"info/global_step": 9754, "train_info/time_within_train_step": 2.7570345401763916, "step": 9754} {"train_info/time_between_train_steps": 0.003302335739135742, "step": 9754} {"info/global_step": 9755, "train_info/time_within_train_step": 2.756796360015869, "step": 9755} {"train_info/time_between_train_steps": 0.003278017044067383, "step": 9755} {"info/global_step": 9756, "train_info/time_within_train_step": 2.757295608520508, "step": 9756} {"train_info/time_between_train_steps": 0.00335693359375, "step": 9756} {"info/global_step": 9757, "train_info/time_within_train_step": 2.7548794746398926, "step": 9757} {"train_info/time_between_train_steps": 0.0034165382385253906, "step": 9757} {"info/global_step": 9758, "train_info/time_within_train_step": 2.756500244140625, "step": 9758} {"train_info/time_between_train_steps": 0.13520359992980957, "step": 9758} {"info/global_step": 9759, "train_info/time_within_train_step": 2.755455732345581, "step": 9759} {"train_info/time_between_train_steps": 0.0032083988189697266, "step": 9759} {"info/global_step": 9760, "train_info/time_within_train_step": 2.7553932666778564, "step": 9760} {"train_info/time_between_train_steps": 0.0031507015228271484, "step": 9760} {"info/global_step": 9761, "train_info/time_within_train_step": 2.755664348602295, "step": 9761} {"train_info/time_between_train_steps": 0.003186941146850586, "step": 9761} {"info/global_step": 9762, "train_info/time_within_train_step": 2.7541916370391846, "step": 9762} {"train_info/time_between_train_steps": 0.0032393932342529297, "step": 9762} {"info/global_step": 9763, "train_info/time_within_train_step": 2.754544258117676, "step": 9763} {"train_info/time_between_train_steps": 0.0033583641052246094, "step": 9763} {"info/global_step": 9764, "train_info/time_within_train_step": 2.7567975521087646, "step": 9764} {"train_info/time_between_train_steps": 0.0033364295959472656, "step": 9764} {"info/global_step": 9765, "train_info/time_within_train_step": 2.7568047046661377, "step": 9765} {"train_info/time_between_train_steps": 0.0033638477325439453, "step": 9765} {"info/global_step": 9766, "train_info/time_within_train_step": 2.756348133087158, "step": 9766} {"train_info/time_between_train_steps": 0.0033385753631591797, "step": 9766} {"info/global_step": 9767, "train_info/time_within_train_step": 2.757038116455078, "step": 9767} {"train_info/time_between_train_steps": 0.0033385753631591797, "step": 9767} {"info/global_step": 9768, "train_info/time_within_train_step": 2.7567903995513916, "step": 9768} {"train_info/time_between_train_steps": 0.0033752918243408203, "step": 9768} {"info/global_step": 9769, "train_info/time_within_train_step": 2.7569074630737305, "step": 9769} {"train_info/time_between_train_steps": 0.0033388137817382812, "step": 9769} {"info/global_step": 9770, "train_info/time_within_train_step": 2.75718355178833, "step": 9770} {"train_info/time_between_train_steps": 0.003347158432006836, "step": 9770} {"info/global_step": 9771, "train_info/time_within_train_step": 2.757755994796753, "step": 9771} {"train_info/time_between_train_steps": 0.0034041404724121094, "step": 9771} {"info/global_step": 9772, "train_info/time_within_train_step": 2.757660388946533, "step": 9772} {"train_info/time_between_train_steps": 0.0034568309783935547, "step": 9772} {"info/global_step": 9773, "train_info/time_within_train_step": 2.7573442459106445, "step": 9773} {"train_info/time_between_train_steps": 0.0033969879150390625, "step": 9773} {"info/global_step": 9774, "train_info/time_within_train_step": 2.757786750793457, "step": 9774} {"train_info/time_between_train_steps": 0.00336456298828125, "step": 9774} {"info/global_step": 9775, "train_info/time_within_train_step": 2.757169246673584, "step": 9775} {"train_info/time_between_train_steps": 0.003408670425415039, "step": 9775} {"info/global_step": 9776, "train_info/time_within_train_step": 2.756366014480591, "step": 9776} {"train_info/time_between_train_steps": 0.0033588409423828125, "step": 9776} {"info/global_step": 9777, "train_info/time_within_train_step": 2.75602126121521, "step": 9777} {"train_info/time_between_train_steps": 0.0033407211303710938, "step": 9777} {"info/global_step": 9778, "train_info/time_within_train_step": 2.756232500076294, "step": 9778} {"train_info/time_between_train_steps": 0.0033621788024902344, "step": 9778} {"info/global_step": 9779, "train_info/time_within_train_step": 3.0373213291168213, "step": 9779} {"train_info/time_between_train_steps": 0.0033135414123535156, "step": 9779} {"info/global_step": 9780, "train_info/time_within_train_step": 2.7571654319763184, "step": 9780} {"train_info/time_between_train_steps": 0.0033414363861083984, "step": 9780} {"info/global_step": 9781, "train_info/time_within_train_step": 2.7564072608947754, "step": 9781} {"train_info/time_between_train_steps": 0.003329038619995117, "step": 9781} {"info/global_step": 9782, "train_info/time_within_train_step": 2.756570816040039, "step": 9782} {"train_info/time_between_train_steps": 0.0033254623413085938, "step": 9782} {"info/global_step": 9783, "train_info/time_within_train_step": 2.7570390701293945, "step": 9783} {"train_info/time_between_train_steps": 0.003316640853881836, "step": 9783} {"info/global_step": 9784, "train_info/time_within_train_step": 2.757685422897339, "step": 9784} {"train_info/time_between_train_steps": 0.003385782241821289, "step": 9784} {"info/global_step": 9785, "train_info/time_within_train_step": 2.7567391395568848, "step": 9785} {"train_info/time_between_train_steps": 0.003353118896484375, "step": 9785} {"info/global_step": 9786, "train_info/time_within_train_step": 2.7564456462860107, "step": 9786} {"train_info/time_between_train_steps": 0.003375530242919922, "step": 9786} {"info/global_step": 9787, "train_info/time_within_train_step": 2.755866765975952, "step": 9787} {"train_info/time_between_train_steps": 0.003320932388305664, "step": 9787} {"info/global_step": 9788, "train_info/time_within_train_step": 2.756575584411621, "step": 9788} {"train_info/time_between_train_steps": 0.0033659934997558594, "step": 9788} {"info/global_step": 9789, "train_info/time_within_train_step": 2.7559561729431152, "step": 9789} {"train_info/time_between_train_steps": 0.003325223922729492, "step": 9789} {"info/global_step": 9790, "train_info/time_within_train_step": 2.7571170330047607, "step": 9790} {"train_info/time_between_train_steps": 0.003392934799194336, "step": 9790} {"info/global_step": 9791, "train_info/time_within_train_step": 2.7563464641571045, "step": 9791} {"train_info/time_between_train_steps": 0.0033724308013916016, "step": 9791} {"info/global_step": 9792, "train_info/time_within_train_step": 2.7557387351989746, "step": 9792} {"train_info/time_between_train_steps": 0.0033211708068847656, "step": 9792} {"info/global_step": 9793, "train_info/time_within_train_step": 2.7563629150390625, "step": 9793} {"train_info/time_between_train_steps": 0.0033321380615234375, "step": 9793} {"info/global_step": 9794, "train_info/time_within_train_step": 2.756276845932007, "step": 9794} {"train_info/time_between_train_steps": 0.003339529037475586, "step": 9794} {"info/global_step": 9795, "train_info/time_within_train_step": 2.756185531616211, "step": 9795} {"train_info/time_between_train_steps": 0.003377676010131836, "step": 9795} {"info/global_step": 9796, "train_info/time_within_train_step": 2.756427049636841, "step": 9796} {"train_info/time_between_train_steps": 0.003353118896484375, "step": 9796} {"info/global_step": 9797, "train_info/time_within_train_step": 2.7572500705718994, "step": 9797} {"train_info/time_between_train_steps": 0.0033750534057617188, "step": 9797} {"info/global_step": 9798, "train_info/time_within_train_step": 2.756382465362549, "step": 9798} {"train_info/time_between_train_steps": 0.0033288002014160156, "step": 9798} {"info/global_step": 9799, "train_info/time_within_train_step": 2.7559096813201904, "step": 9799} {"train_info/time_between_train_steps": 0.003325939178466797, "step": 9799} {"info/global_step": 9800, "train_info/time_within_train_step": 2.757068634033203, "step": 9800} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746594208, "_runtime": 28217}, "step": 9800} {"logs": {"train/loss": 2.8863, "train/learning_rate": 1.3333333333333333e-05, "train/epoch": 11.04, "_timestamp": 1746594208, "_runtime": 28217}, "step": 9800} {"train_info/time_between_train_steps": 13.117829084396362, "step": 9800} {"info/global_step": 9801, "train_info/time_within_train_step": 2.5366435050964355, "step": 9801} {"train_info/time_between_train_steps": 0.003210783004760742, "step": 9801} {"info/global_step": 9802, "train_info/time_within_train_step": 2.575658082962036, "step": 9802} {"train_info/time_between_train_steps": 0.0031948089599609375, "step": 9802} {"info/global_step": 9803, "train_info/time_within_train_step": 2.718106269836426, "step": 9803} {"train_info/time_between_train_steps": 0.003165006637573242, "step": 9803} {"info/global_step": 9804, "train_info/time_within_train_step": 2.7500834465026855, "step": 9804} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 9804} {"info/global_step": 9805, "train_info/time_within_train_step": 2.751918077468872, "step": 9805} {"train_info/time_between_train_steps": 0.0031571388244628906, "step": 9805} {"info/global_step": 9806, "train_info/time_within_train_step": 2.755439281463623, "step": 9806} {"train_info/time_between_train_steps": 0.003143787384033203, "step": 9806} {"info/global_step": 9807, "train_info/time_within_train_step": 2.7557501792907715, "step": 9807} {"train_info/time_between_train_steps": 0.003229379653930664, "step": 9807} {"info/global_step": 9808, "train_info/time_within_train_step": 2.7549703121185303, "step": 9808} {"train_info/time_between_train_steps": 0.0031914710998535156, "step": 9808} {"info/global_step": 9809, "train_info/time_within_train_step": 2.7554636001586914, "step": 9809} {"train_info/time_between_train_steps": 0.0032210350036621094, "step": 9809} {"info/global_step": 9810, "train_info/time_within_train_step": 2.7617595195770264, "step": 9810} {"train_info/time_between_train_steps": 0.003163576126098633, "step": 9810} {"info/global_step": 9811, "train_info/time_within_train_step": 2.7559056282043457, "step": 9811} {"train_info/time_between_train_steps": 0.0031890869140625, "step": 9811} {"info/global_step": 9812, "train_info/time_within_train_step": 2.7567949295043945, "step": 9812} {"train_info/time_between_train_steps": 0.0032885074615478516, "step": 9812} {"info/global_step": 9813, "train_info/time_within_train_step": 2.7567331790924072, "step": 9813} {"train_info/time_between_train_steps": 0.003227710723876953, "step": 9813} {"info/global_step": 9814, "train_info/time_within_train_step": 2.7560930252075195, "step": 9814} {"train_info/time_between_train_steps": 0.0032091140747070312, "step": 9814} {"info/global_step": 9815, "train_info/time_within_train_step": 2.7560949325561523, "step": 9815} {"train_info/time_between_train_steps": 0.0031995773315429688, "step": 9815} {"info/global_step": 9816, "train_info/time_within_train_step": 2.7561750411987305, "step": 9816} {"train_info/time_between_train_steps": 0.0031898021697998047, "step": 9816} {"info/global_step": 9817, "train_info/time_within_train_step": 2.7560744285583496, "step": 9817} {"train_info/time_between_train_steps": 0.003178834915161133, "step": 9817} {"info/global_step": 9818, "train_info/time_within_train_step": 2.7557461261749268, "step": 9818} {"train_info/time_between_train_steps": 0.003221273422241211, "step": 9818} {"info/global_step": 9819, "train_info/time_within_train_step": 2.7562062740325928, "step": 9819} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 9819} {"info/global_step": 9820, "train_info/time_within_train_step": 2.7564444541931152, "step": 9820} {"train_info/time_between_train_steps": 0.0032196044921875, "step": 9820} {"info/global_step": 9821, "train_info/time_within_train_step": 2.893099784851074, "step": 9821} {"train_info/time_between_train_steps": 0.003205537796020508, "step": 9821} {"info/global_step": 9822, "train_info/time_within_train_step": 2.755714178085327, "step": 9822} {"train_info/time_between_train_steps": 0.0031664371490478516, "step": 9822} {"info/global_step": 9823, "train_info/time_within_train_step": 2.75603985786438, "step": 9823} {"train_info/time_between_train_steps": 0.003164052963256836, "step": 9823} {"info/global_step": 9824, "train_info/time_within_train_step": 2.7566311359405518, "step": 9824} {"train_info/time_between_train_steps": 0.003203153610229492, "step": 9824} {"info/global_step": 9825, "train_info/time_within_train_step": 2.756868600845337, "step": 9825} {"train_info/time_between_train_steps": 0.0032019615173339844, "step": 9825} {"info/global_step": 9826, "train_info/time_within_train_step": 2.7568042278289795, "step": 9826} {"train_info/time_between_train_steps": 0.0032036304473876953, "step": 9826} {"info/global_step": 9827, "train_info/time_within_train_step": 2.7570085525512695, "step": 9827} {"train_info/time_between_train_steps": 0.003175497055053711, "step": 9827} {"info/global_step": 9828, "train_info/time_within_train_step": 3.038937568664551, "step": 9828} {"train_info/time_between_train_steps": 0.0031867027282714844, "step": 9828} {"info/global_step": 9829, "train_info/time_within_train_step": 2.7556211948394775, "step": 9829} {"train_info/time_between_train_steps": 0.003257274627685547, "step": 9829} {"info/global_step": 9830, "train_info/time_within_train_step": 2.756077766418457, "step": 9830} {"train_info/time_between_train_steps": 0.0032143592834472656, "step": 9830} {"info/global_step": 9831, "train_info/time_within_train_step": 2.75649094581604, "step": 9831} {"train_info/time_between_train_steps": 0.0032148361206054688, "step": 9831} {"info/global_step": 9832, "train_info/time_within_train_step": 2.75551700592041, "step": 9832} {"train_info/time_between_train_steps": 0.003213167190551758, "step": 9832} {"info/global_step": 9833, "train_info/time_within_train_step": 2.755624771118164, "step": 9833} {"train_info/time_between_train_steps": 0.0031893253326416016, "step": 9833} {"info/global_step": 9834, "train_info/time_within_train_step": 2.7561399936676025, "step": 9834} {"train_info/time_between_train_steps": 0.003251314163208008, "step": 9834} {"info/global_step": 9835, "train_info/time_within_train_step": 2.7567689418792725, "step": 9835} {"train_info/time_between_train_steps": 0.003208160400390625, "step": 9835} {"info/global_step": 9836, "train_info/time_within_train_step": 2.756711959838867, "step": 9836} {"train_info/time_between_train_steps": 0.0031816959381103516, "step": 9836} {"info/global_step": 9837, "train_info/time_within_train_step": 2.7563982009887695, "step": 9837} {"train_info/time_between_train_steps": 0.003171682357788086, "step": 9837} {"info/global_step": 9838, "train_info/time_within_train_step": 2.7564311027526855, "step": 9838} {"train_info/time_between_train_steps": 0.0031690597534179688, "step": 9838} {"info/global_step": 9839, "train_info/time_within_train_step": 2.757176160812378, "step": 9839} {"train_info/time_between_train_steps": 0.0033495426177978516, "step": 9839} {"info/global_step": 9840, "train_info/time_within_train_step": 2.7582192420959473, "step": 9840} {"train_info/time_between_train_steps": 0.0035123825073242188, "step": 9840} {"info/global_step": 9841, "train_info/time_within_train_step": 2.7574942111968994, "step": 9841} {"train_info/time_between_train_steps": 0.0033648014068603516, "step": 9841} {"info/global_step": 9842, "train_info/time_within_train_step": 2.7591402530670166, "step": 9842} {"train_info/time_between_train_steps": 0.003368377685546875, "step": 9842} {"info/global_step": 9843, "train_info/time_within_train_step": 2.7569327354431152, "step": 9843} {"train_info/time_between_train_steps": 0.0033485889434814453, "step": 9843} {"info/global_step": 9844, "train_info/time_within_train_step": 2.7571582794189453, "step": 9844} {"train_info/time_between_train_steps": 0.003363370895385742, "step": 9844} {"info/global_step": 9845, "train_info/time_within_train_step": 2.7578134536743164, "step": 9845} {"train_info/time_between_train_steps": 0.0033185482025146484, "step": 9845} {"info/global_step": 9846, "train_info/time_within_train_step": 2.756088972091675, "step": 9846} {"train_info/time_between_train_steps": 0.0031845569610595703, "step": 9846} {"info/global_step": 9847, "train_info/time_within_train_step": 2.75610613822937, "step": 9847} {"train_info/time_between_train_steps": 0.0032050609588623047, "step": 9847} {"info/global_step": 9848, "train_info/time_within_train_step": 2.7559337615966797, "step": 9848} {"train_info/time_between_train_steps": 0.0031747817993164062, "step": 9848} {"info/global_step": 9849, "train_info/time_within_train_step": 2.754966974258423, "step": 9849} {"train_info/time_between_train_steps": 0.003182649612426758, "step": 9849} {"info/global_step": 9850, "train_info/time_within_train_step": 2.755337953567505, "step": 9850} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746594360, "_runtime": 28369}, "step": 9850} {"logs": {"train/loss": 2.8801, "train/learning_rate": 9.999999999999999e-06, "train/epoch": 11.05, "_timestamp": 1746594360, "_runtime": 28369}, "step": 9850} {"train_info/time_between_train_steps": 0.007240772247314453, "step": 9850} {"info/global_step": 9851, "train_info/time_within_train_step": 2.7555508613586426, "step": 9851} {"train_info/time_between_train_steps": 0.0032193660736083984, "step": 9851} {"info/global_step": 9852, "train_info/time_within_train_step": 2.7553818225860596, "step": 9852} {"train_info/time_between_train_steps": 0.003164529800415039, "step": 9852} {"info/global_step": 9853, "train_info/time_within_train_step": 2.7555947303771973, "step": 9853} {"train_info/time_between_train_steps": 0.0033893585205078125, "step": 9853} {"info/global_step": 9854, "train_info/time_within_train_step": 2.7572736740112305, "step": 9854} {"train_info/time_between_train_steps": 0.003359079360961914, "step": 9854} {"info/global_step": 9855, "train_info/time_within_train_step": 2.756498336791992, "step": 9855} {"train_info/time_between_train_steps": 0.0033273696899414062, "step": 9855} {"info/global_step": 9856, "train_info/time_within_train_step": 2.7562506198883057, "step": 9856} {"train_info/time_between_train_steps": 0.003345012664794922, "step": 9856} {"info/global_step": 9857, "train_info/time_within_train_step": 2.7565183639526367, "step": 9857} {"train_info/time_between_train_steps": 0.003361225128173828, "step": 9857} {"info/global_step": 9858, "train_info/time_within_train_step": 2.757610321044922, "step": 9858} {"train_info/time_between_train_steps": 0.0033578872680664062, "step": 9858} {"info/global_step": 9859, "train_info/time_within_train_step": 2.757448673248291, "step": 9859} {"train_info/time_between_train_steps": 0.0033440589904785156, "step": 9859} {"info/global_step": 9860, "train_info/time_within_train_step": 2.7568624019622803, "step": 9860} {"train_info/time_between_train_steps": 0.003333568572998047, "step": 9860} {"info/global_step": 9861, "train_info/time_within_train_step": 2.7563586235046387, "step": 9861} {"train_info/time_between_train_steps": 0.0033261775970458984, "step": 9861} {"info/global_step": 9862, "train_info/time_within_train_step": 2.7562873363494873, "step": 9862} {"train_info/time_between_train_steps": 0.0033621788024902344, "step": 9862} {"info/global_step": 9863, "train_info/time_within_train_step": 2.7574243545532227, "step": 9863} {"train_info/time_between_train_steps": 0.0033113956451416016, "step": 9863} {"info/global_step": 9864, "train_info/time_within_train_step": 2.7568583488464355, "step": 9864} {"train_info/time_between_train_steps": 0.003391742706298828, "step": 9864} {"info/global_step": 9865, "train_info/time_within_train_step": 2.7578887939453125, "step": 9865} {"train_info/time_between_train_steps": 0.0033173561096191406, "step": 9865} {"info/global_step": 9866, "train_info/time_within_train_step": 2.7571773529052734, "step": 9866} {"train_info/time_between_train_steps": 0.003308534622192383, "step": 9866} {"info/global_step": 9867, "train_info/time_within_train_step": 2.7568886280059814, "step": 9867} {"train_info/time_between_train_steps": 0.0033245086669921875, "step": 9867} {"info/global_step": 9868, "train_info/time_within_train_step": 2.7583205699920654, "step": 9868} {"train_info/time_between_train_steps": 0.003371000289916992, "step": 9868} {"info/global_step": 9869, "train_info/time_within_train_step": 3.031621217727661, "step": 9869} {"train_info/time_between_train_steps": 0.0032939910888671875, "step": 9869} {"info/global_step": 9870, "train_info/time_within_train_step": 2.757835865020752, "step": 9870} {"train_info/time_between_train_steps": 0.003427267074584961, "step": 9870} {"info/global_step": 9871, "train_info/time_within_train_step": 2.7572596073150635, "step": 9871} {"train_info/time_between_train_steps": 0.003309488296508789, "step": 9871} {"info/global_step": 9872, "train_info/time_within_train_step": 2.758014678955078, "step": 9872} {"train_info/time_between_train_steps": 0.0033452510833740234, "step": 9872} {"info/global_step": 9873, "train_info/time_within_train_step": 2.757002353668213, "step": 9873} {"train_info/time_between_train_steps": 0.0034096240997314453, "step": 9873} {"info/global_step": 9874, "train_info/time_within_train_step": 2.7565855979919434, "step": 9874} {"train_info/time_between_train_steps": 0.0033686161041259766, "step": 9874} {"info/global_step": 9875, "train_info/time_within_train_step": 2.763214588165283, "step": 9875} {"train_info/time_between_train_steps": 0.003370046615600586, "step": 9875} {"info/global_step": 9876, "train_info/time_within_train_step": 2.756715774536133, "step": 9876} {"train_info/time_between_train_steps": 0.0033409595489501953, "step": 9876} {"info/global_step": 9877, "train_info/time_within_train_step": 2.7566111087799072, "step": 9877} {"train_info/time_between_train_steps": 0.003336668014526367, "step": 9877} {"info/global_step": 9878, "train_info/time_within_train_step": 2.7560839653015137, "step": 9878} {"train_info/time_between_train_steps": 0.0033774375915527344, "step": 9878} {"info/global_step": 9879, "train_info/time_within_train_step": 2.7558486461639404, "step": 9879} {"train_info/time_between_train_steps": 0.0033583641052246094, "step": 9879} {"info/global_step": 9880, "train_info/time_within_train_step": 2.756162643432617, "step": 9880} {"train_info/time_between_train_steps": 0.0033316612243652344, "step": 9880} {"info/global_step": 9881, "train_info/time_within_train_step": 2.757824420928955, "step": 9881} {"train_info/time_between_train_steps": 0.0033867359161376953, "step": 9881} {"info/global_step": 9882, "train_info/time_within_train_step": 2.7570667266845703, "step": 9882} {"train_info/time_between_train_steps": 0.003305196762084961, "step": 9882} {"info/global_step": 9883, "train_info/time_within_train_step": 2.7568552494049072, "step": 9883} {"train_info/time_between_train_steps": 0.09716296195983887, "step": 9883} {"info/global_step": 9884, "train_info/time_within_train_step": 2.758521795272827, "step": 9884} {"train_info/time_between_train_steps": 0.003404855728149414, "step": 9884} {"info/global_step": 9885, "train_info/time_within_train_step": 2.757359027862549, "step": 9885} {"train_info/time_between_train_steps": 0.00336456298828125, "step": 9885} {"info/global_step": 9886, "train_info/time_within_train_step": 2.7557711601257324, "step": 9886} {"train_info/time_between_train_steps": 0.0032296180725097656, "step": 9886} {"info/global_step": 9887, "train_info/time_within_train_step": 2.757599353790283, "step": 9887} {"train_info/time_between_train_steps": 0.0033669471740722656, "step": 9887} {"info/global_step": 9888, "train_info/time_within_train_step": 2.7572269439697266, "step": 9888} {"train_info/time_between_train_steps": 0.0033316612243652344, "step": 9888} {"info/global_step": 9889, "train_info/time_within_train_step": 2.7559077739715576, "step": 9889} {"train_info/time_between_train_steps": 0.003351926803588867, "step": 9889} {"info/global_step": 9890, "train_info/time_within_train_step": 2.7580714225769043, "step": 9890} {"train_info/time_between_train_steps": 0.0033562183380126953, "step": 9890} {"info/global_step": 9891, "train_info/time_within_train_step": 2.7565507888793945, "step": 9891} {"train_info/time_between_train_steps": 0.003362417221069336, "step": 9891} {"info/global_step": 9892, "train_info/time_within_train_step": 2.7571518421173096, "step": 9892} {"train_info/time_between_train_steps": 0.0033626556396484375, "step": 9892} {"info/global_step": 9893, "train_info/time_within_train_step": 2.757490634918213, "step": 9893} {"train_info/time_between_train_steps": 0.003337860107421875, "step": 9893} {"info/global_step": 9894, "train_info/time_within_train_step": 2.7574706077575684, "step": 9894} {"train_info/time_between_train_steps": 0.003329753875732422, "step": 9894} {"info/global_step": 9895, "train_info/time_within_train_step": 2.7571449279785156, "step": 9895} {"train_info/time_between_train_steps": 0.003366708755493164, "step": 9895} {"info/global_step": 9896, "train_info/time_within_train_step": 2.7563984394073486, "step": 9896} {"train_info/time_between_train_steps": 0.003396272659301758, "step": 9896} {"info/global_step": 9897, "train_info/time_within_train_step": 2.75788950920105, "step": 9897} {"train_info/time_between_train_steps": 0.0036711692810058594, "step": 9897} {"info/global_step": 9898, "train_info/time_within_train_step": 2.75732159614563, "step": 9898} {"train_info/time_between_train_steps": 0.003692626953125, "step": 9898} {"info/global_step": 9899, "train_info/time_within_train_step": 2.7566778659820557, "step": 9899} {"train_info/time_between_train_steps": 0.0037126541137695312, "step": 9899} {"info/global_step": 9900, "train_info/time_within_train_step": 2.7570345401763916, "step": 9900} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746594498, "_runtime": 28507}, "step": 9900} {"logs": {"train/loss": 2.8767, "train/learning_rate": 6.666666666666667e-06, "train/epoch": 11.05, "_timestamp": 1746594498, "_runtime": 28507}, "step": 9900} {"train_info/time_between_train_steps": 0.007578849792480469, "step": 9900} {"info/global_step": 9901, "train_info/time_within_train_step": 2.757800579071045, "step": 9901} {"train_info/time_between_train_steps": 0.0037384033203125, "step": 9901} {"info/global_step": 9902, "train_info/time_within_train_step": 2.757739305496216, "step": 9902} {"train_info/time_between_train_steps": 0.0037212371826171875, "step": 9902} {"info/global_step": 9903, "train_info/time_within_train_step": 2.7586324214935303, "step": 9903} {"train_info/time_between_train_steps": 0.0036573410034179688, "step": 9903} {"info/global_step": 9904, "train_info/time_within_train_step": 2.757720708847046, "step": 9904} {"train_info/time_between_train_steps": 0.0037186145782470703, "step": 9904} {"info/global_step": 9905, "train_info/time_within_train_step": 2.757244348526001, "step": 9905} {"train_info/time_between_train_steps": 0.003792285919189453, "step": 9905} {"info/global_step": 9906, "train_info/time_within_train_step": 2.75869083404541, "step": 9906} {"train_info/time_between_train_steps": 0.0036301612854003906, "step": 9906} {"info/global_step": 9907, "train_info/time_within_train_step": 2.7586214542388916, "step": 9907} {"train_info/time_between_train_steps": 0.0036439895629882812, "step": 9907} {"info/global_step": 9908, "train_info/time_within_train_step": 2.75825834274292, "step": 9908} {"train_info/time_between_train_steps": 0.0037276744842529297, "step": 9908} {"info/global_step": 9909, "train_info/time_within_train_step": 2.757689952850342, "step": 9909} {"train_info/time_between_train_steps": 0.003628253936767578, "step": 9909} {"info/global_step": 9910, "train_info/time_within_train_step": 2.757974624633789, "step": 9910} {"train_info/time_between_train_steps": 0.0035905838012695312, "step": 9910} {"info/global_step": 9911, "train_info/time_within_train_step": 2.7580983638763428, "step": 9911} {"train_info/time_between_train_steps": 0.003618478775024414, "step": 9911} {"info/global_step": 9912, "train_info/time_within_train_step": 2.7582485675811768, "step": 9912} {"train_info/time_between_train_steps": 0.0035886764526367188, "step": 9912} {"info/global_step": 9913, "train_info/time_within_train_step": 2.7574782371520996, "step": 9913} {"train_info/time_between_train_steps": 0.0036094188690185547, "step": 9913} {"info/global_step": 9914, "train_info/time_within_train_step": 2.757185459136963, "step": 9914} {"train_info/time_between_train_steps": 0.00359344482421875, "step": 9914} {"info/global_step": 9915, "train_info/time_within_train_step": 2.757356643676758, "step": 9915} {"train_info/time_between_train_steps": 0.003508329391479492, "step": 9915} {"info/global_step": 9916, "train_info/time_within_train_step": 2.757167100906372, "step": 9916} {"train_info/time_between_train_steps": 0.0036287307739257812, "step": 9916} {"info/global_step": 9917, "train_info/time_within_train_step": 2.7583372592926025, "step": 9917} {"train_info/time_between_train_steps": 0.003716707229614258, "step": 9917} {"info/global_step": 9918, "train_info/time_within_train_step": 2.757995367050171, "step": 9918} {"train_info/time_between_train_steps": 0.0035974979400634766, "step": 9918} {"info/global_step": 9919, "train_info/time_within_train_step": 2.757655143737793, "step": 9919} {"train_info/time_between_train_steps": 0.003701448440551758, "step": 9919} {"info/global_step": 9920, "train_info/time_within_train_step": 2.7577457427978516, "step": 9920} {"train_info/time_between_train_steps": 0.0036318302154541016, "step": 9920} {"info/global_step": 9921, "train_info/time_within_train_step": 2.757540464401245, "step": 9921} {"train_info/time_between_train_steps": 0.0036177635192871094, "step": 9921} {"info/global_step": 9922, "train_info/time_within_train_step": 2.7566816806793213, "step": 9922} {"train_info/time_between_train_steps": 0.00362396240234375, "step": 9922} {"info/global_step": 9923, "train_info/time_within_train_step": 2.756587028503418, "step": 9923} {"train_info/time_between_train_steps": 0.0036470890045166016, "step": 9923} {"info/global_step": 9924, "train_info/time_within_train_step": 2.7566776275634766, "step": 9924} {"train_info/time_between_train_steps": 0.027233123779296875, "step": 9924} {"info/global_step": 9925, "train_info/time_within_train_step": 2.757293224334717, "step": 9925} {"train_info/time_between_train_steps": 0.0031228065490722656, "step": 9925} {"info/global_step": 9926, "train_info/time_within_train_step": 2.756688356399536, "step": 9926} {"train_info/time_between_train_steps": 0.0031185150146484375, "step": 9926} {"info/global_step": 9927, "train_info/time_within_train_step": 2.755765199661255, "step": 9927} {"train_info/time_between_train_steps": 0.0032079219818115234, "step": 9927} {"info/global_step": 9928, "train_info/time_within_train_step": 2.757383346557617, "step": 9928} {"train_info/time_between_train_steps": 0.0031359195709228516, "step": 9928} {"info/global_step": 9929, "train_info/time_within_train_step": 2.756063461303711, "step": 9929} {"train_info/time_between_train_steps": 0.0030891895294189453, "step": 9929} {"info/global_step": 9930, "train_info/time_within_train_step": 2.7565207481384277, "step": 9930} {"train_info/time_between_train_steps": 0.0031549930572509766, "step": 9930} {"info/global_step": 9931, "train_info/time_within_train_step": 2.75640869140625, "step": 9931} {"train_info/time_between_train_steps": 0.00315093994140625, "step": 9931} {"info/global_step": 9932, "train_info/time_within_train_step": 2.7568628787994385, "step": 9932} {"train_info/time_between_train_steps": 0.0031347274780273438, "step": 9932} {"info/global_step": 9933, "train_info/time_within_train_step": 2.7573883533477783, "step": 9933} {"train_info/time_between_train_steps": 0.003100872039794922, "step": 9933} {"info/global_step": 9934, "train_info/time_within_train_step": 2.7563228607177734, "step": 9934} {"train_info/time_between_train_steps": 0.0030908584594726562, "step": 9934} {"info/global_step": 9935, "train_info/time_within_train_step": 2.75679087638855, "step": 9935} {"train_info/time_between_train_steps": 0.003200054168701172, "step": 9935} {"info/global_step": 9936, "train_info/time_within_train_step": 2.7567334175109863, "step": 9936} {"train_info/time_between_train_steps": 0.003124237060546875, "step": 9936} {"info/global_step": 9937, "train_info/time_within_train_step": 2.756527900695801, "step": 9937} {"train_info/time_between_train_steps": 0.0031027793884277344, "step": 9937} {"info/global_step": 9938, "train_info/time_within_train_step": 2.7559385299682617, "step": 9938} {"train_info/time_between_train_steps": 0.003129720687866211, "step": 9938} {"info/global_step": 9939, "train_info/time_within_train_step": 2.755882978439331, "step": 9939} {"train_info/time_between_train_steps": 0.0030841827392578125, "step": 9939} {"info/global_step": 9940, "train_info/time_within_train_step": 2.756556272506714, "step": 9940} {"train_info/time_between_train_steps": 0.003080129623413086, "step": 9940} {"info/global_step": 9941, "train_info/time_within_train_step": 2.75553035736084, "step": 9941} {"train_info/time_between_train_steps": 0.0030951499938964844, "step": 9941} {"info/global_step": 9942, "train_info/time_within_train_step": 2.7564797401428223, "step": 9942} {"train_info/time_between_train_steps": 0.003072977066040039, "step": 9942} {"info/global_step": 9943, "train_info/time_within_train_step": 2.7567949295043945, "step": 9943} {"train_info/time_between_train_steps": 0.0030961036682128906, "step": 9943} {"info/global_step": 9944, "train_info/time_within_train_step": 2.756443738937378, "step": 9944} {"train_info/time_between_train_steps": 0.003060579299926758, "step": 9944} {"info/global_step": 9945, "train_info/time_within_train_step": 2.7568562030792236, "step": 9945} {"train_info/time_between_train_steps": 0.0031032562255859375, "step": 9945} {"info/global_step": 9946, "train_info/time_within_train_step": 2.7570183277130127, "step": 9946} {"train_info/time_between_train_steps": 0.0030145645141601562, "step": 9946} {"info/global_step": 9947, "train_info/time_within_train_step": 2.756174087524414, "step": 9947} {"train_info/time_between_train_steps": 0.003098011016845703, "step": 9947} {"info/global_step": 9948, "train_info/time_within_train_step": 2.756566286087036, "step": 9948} {"train_info/time_between_train_steps": 0.003130674362182617, "step": 9948} {"info/global_step": 9949, "train_info/time_within_train_step": 2.756929874420166, "step": 9949} {"train_info/time_between_train_steps": 0.0030584335327148438, "step": 9949} {"info/global_step": 9950, "train_info/time_within_train_step": 2.7554261684417725, "step": 9950} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746594637, "_runtime": 28646}, "step": 9950} {"logs": {"train/loss": 2.8772, "train/learning_rate": 3.3333333333333333e-06, "train/epoch": 11.06, "_timestamp": 1746594637, "_runtime": 28646}, "step": 9950} {"train_info/time_between_train_steps": 0.006770133972167969, "step": 9950} {"info/global_step": 9951, "train_info/time_within_train_step": 2.7555806636810303, "step": 9951} {"train_info/time_between_train_steps": 0.0030510425567626953, "step": 9951} {"info/global_step": 9952, "train_info/time_within_train_step": 2.755908966064453, "step": 9952} {"train_info/time_between_train_steps": 0.003086090087890625, "step": 9952} {"info/global_step": 9953, "train_info/time_within_train_step": 2.756885528564453, "step": 9953} {"train_info/time_between_train_steps": 0.003029346466064453, "step": 9953} {"info/global_step": 9954, "train_info/time_within_train_step": 2.7561914920806885, "step": 9954} {"train_info/time_between_train_steps": 0.0030422210693359375, "step": 9954} {"info/global_step": 9955, "train_info/time_within_train_step": 2.75606369972229, "step": 9955} {"train_info/time_between_train_steps": 0.003056764602661133, "step": 9955} {"info/global_step": 9956, "train_info/time_within_train_step": 2.7568366527557373, "step": 9956} {"train_info/time_between_train_steps": 0.00308990478515625, "step": 9956} {"info/global_step": 9957, "train_info/time_within_train_step": 2.757838010787964, "step": 9957} {"train_info/time_between_train_steps": 0.0030231475830078125, "step": 9957} {"info/global_step": 9958, "train_info/time_within_train_step": 2.7557783126831055, "step": 9958} {"train_info/time_between_train_steps": 0.0030624866485595703, "step": 9958} {"info/global_step": 9959, "train_info/time_within_train_step": 2.7554569244384766, "step": 9959} {"train_info/time_between_train_steps": 0.00301361083984375, "step": 9959} {"info/global_step": 9960, "train_info/time_within_train_step": 2.755962371826172, "step": 9960} {"train_info/time_between_train_steps": 0.0030171871185302734, "step": 9960} {"info/global_step": 9961, "train_info/time_within_train_step": 2.7561421394348145, "step": 9961} {"train_info/time_between_train_steps": 0.003063678741455078, "step": 9961} {"info/global_step": 9962, "train_info/time_within_train_step": 2.7574284076690674, "step": 9962} {"train_info/time_between_train_steps": 0.003046751022338867, "step": 9962} {"info/global_step": 9963, "train_info/time_within_train_step": 2.757205009460449, "step": 9963} {"train_info/time_between_train_steps": 0.0031054019927978516, "step": 9963} {"info/global_step": 9964, "train_info/time_within_train_step": 2.757319688796997, "step": 9964} {"train_info/time_between_train_steps": 0.003003835678100586, "step": 9964} {"info/global_step": 9965, "train_info/time_within_train_step": 2.7574360370635986, "step": 9965} {"train_info/time_between_train_steps": 0.0030128955841064453, "step": 9965} {"info/global_step": 9966, "train_info/time_within_train_step": 2.997797966003418, "step": 9966} {"train_info/time_between_train_steps": 0.0029883384704589844, "step": 9966} {"info/global_step": 9967, "train_info/time_within_train_step": 2.7555506229400635, "step": 9967} {"train_info/time_between_train_steps": 0.0029821395874023438, "step": 9967} {"info/global_step": 9968, "train_info/time_within_train_step": 2.7543587684631348, "step": 9968} {"train_info/time_between_train_steps": 0.0029997825622558594, "step": 9968} {"info/global_step": 9969, "train_info/time_within_train_step": 2.7554078102111816, "step": 9969} {"train_info/time_between_train_steps": 0.002967357635498047, "step": 9969} {"info/global_step": 9970, "train_info/time_within_train_step": 2.755239725112915, "step": 9970} {"train_info/time_between_train_steps": 0.002969980239868164, "step": 9970} {"info/global_step": 9971, "train_info/time_within_train_step": 2.7546072006225586, "step": 9971} {"train_info/time_between_train_steps": 0.002973318099975586, "step": 9971} {"info/global_step": 9972, "train_info/time_within_train_step": 2.755275249481201, "step": 9972} {"train_info/time_between_train_steps": 0.0030133724212646484, "step": 9972} {"info/global_step": 9973, "train_info/time_within_train_step": 2.7554707527160645, "step": 9973} {"train_info/time_between_train_steps": 0.002972126007080078, "step": 9973} {"info/global_step": 9974, "train_info/time_within_train_step": 2.7552547454833984, "step": 9974} {"train_info/time_between_train_steps": 0.0030193328857421875, "step": 9974} {"info/global_step": 9975, "train_info/time_within_train_step": 2.7555201053619385, "step": 9975} {"train_info/time_between_train_steps": 0.0030095577239990234, "step": 9975} {"info/global_step": 9976, "train_info/time_within_train_step": 2.755164623260498, "step": 9976} {"train_info/time_between_train_steps": 0.0029609203338623047, "step": 9976} {"info/global_step": 9977, "train_info/time_within_train_step": 2.7559309005737305, "step": 9977} {"train_info/time_between_train_steps": 0.0029993057250976562, "step": 9977} {"info/global_step": 9978, "train_info/time_within_train_step": 2.7556357383728027, "step": 9978} {"train_info/time_between_train_steps": 0.0030105113983154297, "step": 9978} {"info/global_step": 9979, "train_info/time_within_train_step": 2.755458354949951, "step": 9979} {"train_info/time_between_train_steps": 0.0029821395874023438, "step": 9979} {"info/global_step": 9980, "train_info/time_within_train_step": 2.7551825046539307, "step": 9980} {"train_info/time_between_train_steps": 0.0029916763305664062, "step": 9980} {"info/global_step": 9981, "train_info/time_within_train_step": 2.75517201423645, "step": 9981} {"train_info/time_between_train_steps": 0.002988100051879883, "step": 9981} {"info/global_step": 9982, "train_info/time_within_train_step": 2.7562990188598633, "step": 9982} {"train_info/time_between_train_steps": 0.0029621124267578125, "step": 9982} {"info/global_step": 9983, "train_info/time_within_train_step": 2.7553505897521973, "step": 9983} {"train_info/time_between_train_steps": 0.0029942989349365234, "step": 9983} {"info/global_step": 9984, "train_info/time_within_train_step": 2.7550604343414307, "step": 9984} {"train_info/time_between_train_steps": 0.0029938220977783203, "step": 9984} {"info/global_step": 9985, "train_info/time_within_train_step": 2.755791425704956, "step": 9985} {"train_info/time_between_train_steps": 0.0030219554901123047, "step": 9985} {"info/global_step": 9986, "train_info/time_within_train_step": 2.75382924079895, "step": 9986} {"train_info/time_between_train_steps": 0.0029222965240478516, "step": 9986} {"info/global_step": 9987, "train_info/time_within_train_step": 2.754375457763672, "step": 9987} {"train_info/time_between_train_steps": 0.002879619598388672, "step": 9987} {"info/global_step": 9988, "train_info/time_within_train_step": 2.752779722213745, "step": 9988} {"train_info/time_between_train_steps": 0.002922534942626953, "step": 9988} {"info/global_step": 9989, "train_info/time_within_train_step": 2.7528235912323, "step": 9989} {"train_info/time_between_train_steps": 0.0029222965240478516, "step": 9989} {"info/global_step": 9990, "train_info/time_within_train_step": 2.754581928253174, "step": 9990} {"train_info/time_between_train_steps": 0.0028896331787109375, "step": 9990} {"info/global_step": 9991, "train_info/time_within_train_step": 2.755241632461548, "step": 9991} {"train_info/time_between_train_steps": 0.00290679931640625, "step": 9991} {"info/global_step": 9992, "train_info/time_within_train_step": 2.7541275024414062, "step": 9992} {"train_info/time_between_train_steps": 0.002907276153564453, "step": 9992} {"info/global_step": 9993, "train_info/time_within_train_step": 2.7538270950317383, "step": 9993} {"train_info/time_between_train_steps": 0.002921581268310547, "step": 9993} {"info/global_step": 9994, "train_info/time_within_train_step": 2.7540345191955566, "step": 9994} {"train_info/time_between_train_steps": 0.0029327869415283203, "step": 9994} {"info/global_step": 9995, "train_info/time_within_train_step": 3.310509443283081, "step": 9995} {"train_info/time_between_train_steps": 0.002917051315307617, "step": 9995} {"info/global_step": 9996, "train_info/time_within_train_step": 2.755645751953125, "step": 9996} {"train_info/time_between_train_steps": 0.0029134750366210938, "step": 9996} {"info/global_step": 9997, "train_info/time_within_train_step": 2.7537381649017334, "step": 9997} {"train_info/time_between_train_steps": 0.0028853416442871094, "step": 9997} {"info/global_step": 9998, "train_info/time_within_train_step": 2.7541775703430176, "step": 9998} {"train_info/time_between_train_steps": 0.0028634071350097656, "step": 9998} {"info/global_step": 9999, "train_info/time_within_train_step": 2.7542247772216797, "step": 9999} {"train_info/time_between_train_steps": 0.002958536148071289, "step": 9999} {"info/global_step": 10000, "train_info/time_within_train_step": 2.7550435066223145, "step": 10000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746594775, "_runtime": 28784}, "step": 10000} {"logs": {"train/loss": 2.8778, "train/learning_rate": 0.0, "train/epoch": 11.06, "_timestamp": 1746594775, "_runtime": 28784}, "step": 10000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746594781, "_runtime": 28790}, "step": 10000} {"logs": {"eval/loss": 4.8722100257873535, "eval/runtime": 5.1248, "eval/samples_per_second": 37.075, "eval/steps_per_second": 1.171, "train/epoch": 11.06, "_timestamp": 1746594781, "_runtime": 28790}, "step": 10000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746594781, "_runtime": 28790}, "step": 10000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.8722100257873535, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 130.6092479756358, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1248, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 37.075, "train/epoch": 11.06, "_timestamp": 1746594781, "_runtime": 28790}, "step": 10000} {"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746594794, "_runtime": 28803}, "step": 10000} {"logs": {"train/train_runtime": 28803.5753, "train/train_samples_per_second": 22.219, "train/train_steps_per_second": 0.347, "train/total_flos": 8.3659437637632e+16, "train/train_loss": 3.844178419303894, "train/epoch": 11.06, "_timestamp": 1746594794, "_runtime": 28803}, "step": 10000} {"train_info": {"train_info/memory_allocated": 1681.771484375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746594804, "_runtime": 28813}, "step": 10000} {"logs": {"eval/loss": 4.8722100257873535, "eval/runtime": 4.8095, "eval/samples_per_second": 39.505, "eval/steps_per_second": 1.248, "train/epoch": 11.06, "_timestamp": 1746594804, "_runtime": 28813}, "step": 10000} {"train_info": {"train_info/memory_allocated": 1681.771484375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746594804, "_runtime": 28813}, "step": 10000} {"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.8722100257873535, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 130.6092479756358, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 4.8095, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 39.505, "train/epoch": 11.06, "_timestamp": 1746594804, "_runtime": 28813}, "step": 10000}