{"current_steps": 5, "total_steps": 38160, "loss": 5.087, "lr": 1.0482180293501048e-06, "epoch": 0.002620545073375262, "percentage": 0.01, "elapsed_time": "0:00:01", "remaining_time": "3:17:09", "throughput": 2415.21, "total_tokens": 3744} {"current_steps": 10, "total_steps": 38160, "loss": 4.7413, "lr": 2.358490566037736e-06, "epoch": 0.005241090146750524, "percentage": 0.03, "elapsed_time": "0:00:02", "remaining_time": "2:27:50", "throughput": 3220.27, "total_tokens": 7488} {"current_steps": 15, "total_steps": 38160, "loss": 4.8611, "lr": 3.668763102725367e-06, "epoch": 0.007861635220125786, "percentage": 0.04, "elapsed_time": "0:00:03", "remaining_time": "2:07:54", "throughput": 3467.3, "total_tokens": 10464} {"current_steps": 20, "total_steps": 38160, "loss": 4.1091, "lr": 4.979035639412998e-06, "epoch": 0.010482180293501049, "percentage": 0.05, "elapsed_time": "0:00:03", "remaining_time": "1:57:56", "throughput": 3647.59, "total_tokens": 13536} {"current_steps": 25, "total_steps": 38160, "loss": 2.8262, "lr": 6.289308176100629e-06, "epoch": 0.01310272536687631, "percentage": 0.07, "elapsed_time": "0:00:04", "remaining_time": "1:57:11", "throughput": 3942.94, "total_tokens": 18176} {"current_steps": 30, "total_steps": 38160, "loss": 1.9392, "lr": 7.59958071278826e-06, "epoch": 0.015723270440251572, "percentage": 0.08, "elapsed_time": "0:00:05", "remaining_time": "1:52:30", "throughput": 3988.81, "total_tokens": 21184} {"current_steps": 35, "total_steps": 38160, "loss": 1.1864, "lr": 8.90985324947589e-06, "epoch": 0.018343815513626835, "percentage": 0.09, "elapsed_time": "0:00:05", "remaining_time": "1:48:21", "throughput": 4015.78, "total_tokens": 23968} {"current_steps": 40, "total_steps": 38160, "loss": 0.8954, "lr": 1.0220125786163522e-05, "epoch": 0.020964360587002098, "percentage": 0.1, "elapsed_time": "0:00:06", "remaining_time": "1:47:14", "throughput": 4104.42, "total_tokens": 27712} {"current_steps": 45, "total_steps": 38160, "loss": 0.974, "lr": 1.1530398322851153e-05, "epoch": 0.02358490566037736, "percentage": 0.12, "elapsed_time": "0:00:07", "remaining_time": "1:44:56", "throughput": 4114.98, "total_tokens": 30592} {"current_steps": 50, "total_steps": 38160, "loss": 0.8576, "lr": 1.2840670859538784e-05, "epoch": 0.02620545073375262, "percentage": 0.13, "elapsed_time": "0:00:08", "remaining_time": "1:43:02", "throughput": 4122.51, "total_tokens": 33440} {"current_steps": 55, "total_steps": 38160, "loss": 1.0613, "lr": 1.4150943396226415e-05, "epoch": 0.028825995807127882, "percentage": 0.14, "elapsed_time": "0:00:08", "remaining_time": "1:42:54", "throughput": 4190.21, "total_tokens": 37344} {"current_steps": 60, "total_steps": 38160, "loss": 0.8696, "lr": 1.5461215932914046e-05, "epoch": 0.031446540880503145, "percentage": 0.16, "elapsed_time": "0:00:09", "remaining_time": "1:42:24", "throughput": 4236.15, "total_tokens": 40992} {"current_steps": 65, "total_steps": 38160, "loss": 0.6031, "lr": 1.6771488469601677e-05, "epoch": 0.034067085953878404, "percentage": 0.17, "elapsed_time": "0:00:10", "remaining_time": "1:40:54", "throughput": 4224.92, "total_tokens": 43648} {"current_steps": 70, "total_steps": 38160, "loss": 0.6284, "lr": 1.8081761006289308e-05, "epoch": 0.03668763102725367, "percentage": 0.18, "elapsed_time": "0:00:11", "remaining_time": "1:40:16", "throughput": 4248.67, "total_tokens": 46976} {"current_steps": 75, "total_steps": 38160, "loss": 0.6625, "lr": 1.9392033542976942e-05, "epoch": 0.03930817610062893, "percentage": 0.2, "elapsed_time": "0:00:11", "remaining_time": "1:39:52", "throughput": 4278.72, "total_tokens": 50496} {"current_steps": 80, "total_steps": 38160, "loss": 0.6551, "lr": 2.070230607966457e-05, "epoch": 0.041928721174004195, "percentage": 0.21, "elapsed_time": "0:00:12", "remaining_time": "1:39:09", "throughput": 4280.66, "total_tokens": 53504} {"current_steps": 85, "total_steps": 38160, "loss": 0.6627, "lr": 2.20125786163522e-05, "epoch": 0.044549266247379454, "percentage": 0.22, "elapsed_time": "0:00:13", "remaining_time": "1:38:00", "throughput": 4268.28, "total_tokens": 56032} {"current_steps": 90, "total_steps": 38160, "loss": 0.6161, "lr": 2.3322851153039832e-05, "epoch": 0.04716981132075472, "percentage": 0.24, "elapsed_time": "0:00:13", "remaining_time": "1:37:44", "throughput": 4283.97, "total_tokens": 59392} {"current_steps": 95, "total_steps": 38160, "loss": 0.5914, "lr": 2.4633123689727463e-05, "epoch": 0.04979035639412998, "percentage": 0.25, "elapsed_time": "0:00:14", "remaining_time": "1:37:37", "throughput": 4305.46, "total_tokens": 62944} {"current_steps": 100, "total_steps": 38160, "loss": 0.4944, "lr": 2.5943396226415097e-05, "epoch": 0.05241090146750524, "percentage": 0.26, "elapsed_time": "0:00:15", "remaining_time": "1:37:30", "throughput": 4322.03, "total_tokens": 66432} {"current_steps": 105, "total_steps": 38160, "loss": 0.7286, "lr": 2.7253668763102725e-05, "epoch": 0.055031446540880505, "percentage": 0.28, "elapsed_time": "0:00:16", "remaining_time": "1:36:54", "throughput": 4318.03, "total_tokens": 69280} {"current_steps": 110, "total_steps": 38160, "loss": 0.5197, "lr": 2.8563941299790356e-05, "epoch": 0.057651991614255764, "percentage": 0.29, "elapsed_time": "0:00:16", "remaining_time": "1:37:00", "throughput": 4343.78, "total_tokens": 73088} {"current_steps": 115, "total_steps": 38160, "loss": 0.7644, "lr": 2.987421383647799e-05, "epoch": 0.06027253668763103, "percentage": 0.3, "elapsed_time": "0:00:17", "remaining_time": "1:36:25", "throughput": 4336.5, "total_tokens": 75840} {"current_steps": 120, "total_steps": 38160, "loss": 0.4954, "lr": 3.118448637316562e-05, "epoch": 0.06289308176100629, "percentage": 0.31, "elapsed_time": "0:00:18", "remaining_time": "1:36:07", "throughput": 4342.46, "total_tokens": 79008} {"current_steps": 125, "total_steps": 38160, "loss": 0.5742, "lr": 3.2494758909853245e-05, "epoch": 0.06551362683438156, "percentage": 0.33, "elapsed_time": "0:00:18", "remaining_time": "1:35:39", "throughput": 4339.72, "total_tokens": 81856} {"current_steps": 130, "total_steps": 38160, "loss": 0.472, "lr": 3.380503144654088e-05, "epoch": 0.06813417190775681, "percentage": 0.34, "elapsed_time": "0:00:19", "remaining_time": "1:35:30", "throughput": 4345.62, "total_tokens": 85120} {"current_steps": 135, "total_steps": 38160, "loss": 0.6883, "lr": 3.5115303983228514e-05, "epoch": 0.07075471698113207, "percentage": 0.35, "elapsed_time": "0:00:20", "remaining_time": "1:35:07", "throughput": 4344.09, "total_tokens": 88032} {"current_steps": 140, "total_steps": 38160, "loss": 0.4858, "lr": 3.642557651991614e-05, "epoch": 0.07337526205450734, "percentage": 0.37, "elapsed_time": "0:00:20", "remaining_time": "1:34:52", "throughput": 4346.14, "total_tokens": 91104} {"current_steps": 145, "total_steps": 38160, "loss": 0.5975, "lr": 3.7735849056603776e-05, "epoch": 0.0759958071278826, "percentage": 0.38, "elapsed_time": "0:00:21", "remaining_time": "1:34:33", "throughput": 4343.37, "total_tokens": 93984} {"current_steps": 150, "total_steps": 38160, "loss": 0.5246, "lr": 3.90461215932914e-05, "epoch": 0.07861635220125786, "percentage": 0.39, "elapsed_time": "0:00:22", "remaining_time": "1:34:11", "throughput": 4343.52, "total_tokens": 96864} {"current_steps": 155, "total_steps": 38160, "loss": 0.5665, "lr": 4.035639412997904e-05, "epoch": 0.08123689727463312, "percentage": 0.41, "elapsed_time": "0:00:22", "remaining_time": "1:33:49", "throughput": 4339.94, "total_tokens": 99648} {"current_steps": 160, "total_steps": 38160, "loss": 1.0498, "lr": 4.1666666666666665e-05, "epoch": 0.08385744234800839, "percentage": 0.42, "elapsed_time": "0:00:23", "remaining_time": "1:33:44", "throughput": 4345.72, "total_tokens": 102912} {"current_steps": 165, "total_steps": 38160, "loss": 0.5317, "lr": 4.29769392033543e-05, "epoch": 0.08647798742138364, "percentage": 0.43, "elapsed_time": "0:00:24", "remaining_time": "1:33:20", "throughput": 4340.22, "total_tokens": 105568} {"current_steps": 170, "total_steps": 38160, "loss": 0.6695, "lr": 4.4287211740041934e-05, "epoch": 0.08909853249475891, "percentage": 0.45, "elapsed_time": "0:00:24", "remaining_time": "1:33:01", "throughput": 4338.37, "total_tokens": 108352} {"current_steps": 175, "total_steps": 38160, "loss": 0.6232, "lr": 4.5597484276729555e-05, "epoch": 0.09171907756813417, "percentage": 0.46, "elapsed_time": "0:00:25", "remaining_time": "1:32:41", "throughput": 4331.09, "total_tokens": 110976} {"current_steps": 180, "total_steps": 38160, "loss": 0.4586, "lr": 4.690775681341719e-05, "epoch": 0.09433962264150944, "percentage": 0.47, "elapsed_time": "0:00:26", "remaining_time": "1:32:35", "throughput": 4336.7, "total_tokens": 114176} {"current_steps": 185, "total_steps": 38160, "loss": 0.5218, "lr": 4.8218029350104823e-05, "epoch": 0.09696016771488469, "percentage": 0.48, "elapsed_time": "0:00:27", "remaining_time": "1:32:24", "throughput": 4334.02, "total_tokens": 117056} {"current_steps": 190, "total_steps": 38160, "loss": 0.5845, "lr": 4.952830188679246e-05, "epoch": 0.09958071278825996, "percentage": 0.5, "elapsed_time": "0:00:27", "remaining_time": "1:32:23", "throughput": 4339.93, "total_tokens": 120384} {"current_steps": 195, "total_steps": 38160, "loss": 0.6016, "lr": 5.0838574423480085e-05, "epoch": 0.10220125786163523, "percentage": 0.51, "elapsed_time": "0:00:28", "remaining_time": "1:32:16", "throughput": 4341.69, "total_tokens": 123456} {"current_steps": 200, "total_steps": 38160, "loss": 0.4651, "lr": 5.214884696016771e-05, "epoch": 0.10482180293501048, "percentage": 0.52, "elapsed_time": "0:00:29", "remaining_time": "1:31:56", "throughput": 4334.76, "total_tokens": 125984} {"current_steps": 205, "total_steps": 38160, "loss": 0.7034, "lr": 5.345911949685535e-05, "epoch": 0.10744234800838574, "percentage": 0.54, "elapsed_time": "0:00:29", "remaining_time": "1:31:57", "throughput": 4338.01, "total_tokens": 129280} {"current_steps": 210, "total_steps": 38160, "loss": 0.6468, "lr": 5.4769392033542975e-05, "epoch": 0.11006289308176101, "percentage": 0.55, "elapsed_time": "0:00:30", "remaining_time": "1:31:45", "throughput": 4336.27, "total_tokens": 132096} {"current_steps": 215, "total_steps": 38160, "loss": 0.5377, "lr": 5.607966457023061e-05, "epoch": 0.11268343815513626, "percentage": 0.56, "elapsed_time": "0:00:31", "remaining_time": "1:31:33", "throughput": 4333.18, "total_tokens": 134880} {"current_steps": 220, "total_steps": 38160, "loss": 0.5866, "lr": 5.7389937106918244e-05, "epoch": 0.11530398322851153, "percentage": 0.58, "elapsed_time": "0:00:31", "remaining_time": "1:31:26", "throughput": 4332.33, "total_tokens": 137824} {"current_steps": 225, "total_steps": 38160, "loss": 0.52, "lr": 5.870020964360587e-05, "epoch": 0.1179245283018868, "percentage": 0.59, "elapsed_time": "0:00:32", "remaining_time": "1:31:21", "throughput": 4332.04, "total_tokens": 140832} {"current_steps": 230, "total_steps": 38160, "loss": 0.4795, "lr": 6.00104821802935e-05, "epoch": 0.12054507337526206, "percentage": 0.6, "elapsed_time": "0:00:33", "remaining_time": "1:31:32", "throughput": 4344.37, "total_tokens": 144704} {"current_steps": 235, "total_steps": 38160, "loss": 0.5782, "lr": 6.132075471698113e-05, "epoch": 0.12316561844863731, "percentage": 0.62, "elapsed_time": "0:00:33", "remaining_time": "1:31:23", "throughput": 4342.16, "total_tokens": 147552} {"current_steps": 240, "total_steps": 38160, "loss": 0.6854, "lr": 6.263102725366875e-05, "epoch": 0.12578616352201258, "percentage": 0.63, "elapsed_time": "0:00:34", "remaining_time": "1:31:25", "throughput": 4346.71, "total_tokens": 150912} {"current_steps": 245, "total_steps": 38160, "loss": 0.5103, "lr": 6.39412997903564e-05, "epoch": 0.12840670859538783, "percentage": 0.64, "elapsed_time": "0:00:35", "remaining_time": "1:31:18", "throughput": 4345.28, "total_tokens": 153824} {"current_steps": 250, "total_steps": 38160, "loss": 0.5253, "lr": 6.525157232704402e-05, "epoch": 0.1310272536687631, "percentage": 0.66, "elapsed_time": "0:00:36", "remaining_time": "1:31:14", "throughput": 4346.64, "total_tokens": 156928} {"current_steps": 255, "total_steps": 38160, "loss": 0.4905, "lr": 6.656184486373166e-05, "epoch": 0.13364779874213836, "percentage": 0.67, "elapsed_time": "0:00:36", "remaining_time": "1:31:25", "throughput": 4361.05, "total_tokens": 160928} {"current_steps": 260, "total_steps": 38160, "loss": 0.3949, "lr": 6.787211740041929e-05, "epoch": 0.13626834381551362, "percentage": 0.68, "elapsed_time": "0:00:37", "remaining_time": "1:31:23", "throughput": 4362.48, "total_tokens": 164096} {"current_steps": 265, "total_steps": 38160, "loss": 0.5952, "lr": 6.918238993710691e-05, "epoch": 0.1388888888888889, "percentage": 0.69, "elapsed_time": "0:00:38", "remaining_time": "1:31:21", "throughput": 4363.58, "total_tokens": 167264} {"current_steps": 270, "total_steps": 38160, "loss": 0.5757, "lr": 7.049266247379455e-05, "epoch": 0.14150943396226415, "percentage": 0.71, "elapsed_time": "0:00:39", "remaining_time": "1:31:18", "throughput": 4364.71, "total_tokens": 170400} {"current_steps": 275, "total_steps": 38160, "loss": 0.5771, "lr": 7.180293501048218e-05, "epoch": 0.1441299790356394, "percentage": 0.72, "elapsed_time": "0:00:39", "remaining_time": "1:31:23", "throughput": 4371.44, "total_tokens": 173984} {"current_steps": 280, "total_steps": 38160, "loss": 0.463, "lr": 7.311320754716982e-05, "epoch": 0.14675052410901468, "percentage": 0.73, "elapsed_time": "0:00:40", "remaining_time": "1:31:13", "throughput": 4367.19, "total_tokens": 176704} {"current_steps": 285, "total_steps": 38160, "loss": 0.4607, "lr": 7.442348008385745e-05, "epoch": 0.14937106918238993, "percentage": 0.75, "elapsed_time": "0:00:41", "remaining_time": "1:31:06", "throughput": 4366.59, "total_tokens": 179616} {"current_steps": 290, "total_steps": 38160, "loss": 0.5602, "lr": 7.573375262054507e-05, "epoch": 0.1519916142557652, "percentage": 0.76, "elapsed_time": "0:00:41", "remaining_time": "1:31:03", "throughput": 4364.82, "total_tokens": 182624} {"current_steps": 295, "total_steps": 38160, "loss": 0.4618, "lr": 7.70440251572327e-05, "epoch": 0.15461215932914046, "percentage": 0.77, "elapsed_time": "0:00:42", "remaining_time": "1:30:59", "throughput": 4363.39, "total_tokens": 185600} {"current_steps": 300, "total_steps": 38160, "loss": 0.5899, "lr": 7.835429769392034e-05, "epoch": 0.15723270440251572, "percentage": 0.79, "elapsed_time": "0:00:43", "remaining_time": "1:31:13", "throughput": 4374.72, "total_tokens": 189728} {"current_steps": 305, "total_steps": 38160, "loss": 0.6022, "lr": 7.966457023060797e-05, "epoch": 0.159853249475891, "percentage": 0.8, "elapsed_time": "0:00:44", "remaining_time": "1:31:12", "throughput": 4378.32, "total_tokens": 193056} {"current_steps": 310, "total_steps": 38160, "loss": 0.5924, "lr": 8.09748427672956e-05, "epoch": 0.16247379454926625, "percentage": 0.81, "elapsed_time": "0:00:44", "remaining_time": "1:31:13", "throughput": 4380.9, "total_tokens": 196384} {"current_steps": 315, "total_steps": 38160, "loss": 0.5828, "lr": 8.228511530398323e-05, "epoch": 0.1650943396226415, "percentage": 0.83, "elapsed_time": "0:00:45", "remaining_time": "1:31:23", "throughput": 4387.08, "total_tokens": 200224} {"current_steps": 320, "total_steps": 38160, "loss": 0.4643, "lr": 8.359538784067086e-05, "epoch": 0.16771488469601678, "percentage": 0.84, "elapsed_time": "0:00:46", "remaining_time": "1:31:24", "throughput": 4389.54, "total_tokens": 203584} {"current_steps": 325, "total_steps": 38160, "loss": 0.419, "lr": 8.490566037735848e-05, "epoch": 0.17033542976939203, "percentage": 0.85, "elapsed_time": "0:00:47", "remaining_time": "1:31:13", "throughput": 4385.55, "total_tokens": 206208} {"current_steps": 330, "total_steps": 38160, "loss": 0.4865, "lr": 8.621593291404613e-05, "epoch": 0.17295597484276728, "percentage": 0.86, "elapsed_time": "0:00:47", "remaining_time": "1:31:23", "throughput": 4391.56, "total_tokens": 210048} {"current_steps": 335, "total_steps": 38160, "loss": 0.5182, "lr": 8.752620545073375e-05, "epoch": 0.17557651991614256, "percentage": 0.88, "elapsed_time": "0:00:48", "remaining_time": "1:31:24", "throughput": 4395.09, "total_tokens": 213472} {"current_steps": 340, "total_steps": 38160, "loss": 0.6853, "lr": 8.883647798742137e-05, "epoch": 0.17819706498951782, "percentage": 0.89, "elapsed_time": "0:00:49", "remaining_time": "1:31:30", "throughput": 4402.63, "total_tokens": 217312} {"current_steps": 345, "total_steps": 38160, "loss": 0.5153, "lr": 9.014675052410902e-05, "epoch": 0.18081761006289307, "percentage": 0.9, "elapsed_time": "0:00:50", "remaining_time": "1:31:24", "throughput": 4400.97, "total_tokens": 220224} {"current_steps": 350, "total_steps": 38160, "loss": 0.4777, "lr": 9.145702306079664e-05, "epoch": 0.18343815513626835, "percentage": 0.92, "elapsed_time": "0:00:50", "remaining_time": "1:31:26", "throughput": 4403.65, "total_tokens": 223648} {"current_steps": 355, "total_steps": 38160, "loss": 0.5687, "lr": 9.276729559748428e-05, "epoch": 0.1860587002096436, "percentage": 0.93, "elapsed_time": "0:00:51", "remaining_time": "1:31:17", "throughput": 4400.62, "total_tokens": 226336} {"current_steps": 360, "total_steps": 38160, "loss": 0.4275, "lr": 9.407756813417191e-05, "epoch": 0.18867924528301888, "percentage": 0.94, "elapsed_time": "0:00:52", "remaining_time": "1:31:06", "throughput": 4395.58, "total_tokens": 228832} {"current_steps": 365, "total_steps": 38160, "loss": 0.7019, "lr": 9.538784067085953e-05, "epoch": 0.19129979035639413, "percentage": 0.96, "elapsed_time": "0:00:52", "remaining_time": "1:31:04", "throughput": 4395.95, "total_tokens": 231968} {"current_steps": 370, "total_steps": 38160, "loss": 0.54, "lr": 9.669811320754718e-05, "epoch": 0.19392033542976939, "percentage": 0.97, "elapsed_time": "0:00:53", "remaining_time": "1:31:13", "throughput": 4403.49, "total_tokens": 236000} {"current_steps": 375, "total_steps": 38160, "loss": 0.7747, "lr": 9.80083857442348e-05, "epoch": 0.19654088050314467, "percentage": 0.98, "elapsed_time": "0:00:54", "remaining_time": "1:31:15", "throughput": 4404.66, "total_tokens": 239360} {"current_steps": 380, "total_steps": 38160, "loss": 0.6216, "lr": 9.931865828092243e-05, "epoch": 0.19916142557651992, "percentage": 1.0, "elapsed_time": "0:00:55", "remaining_time": "1:31:21", "throughput": 4410.22, "total_tokens": 243168} {"current_steps": 385, "total_steps": 38160, "loss": 0.4984, "lr": 0.00010062893081761007, "epoch": 0.20178197064989517, "percentage": 1.01, "elapsed_time": "0:00:55", "remaining_time": "1:31:29", "throughput": 4417.74, "total_tokens": 247168} {"current_steps": 390, "total_steps": 38160, "loss": 0.5427, "lr": 0.0001019392033542977, "epoch": 0.20440251572327045, "percentage": 1.02, "elapsed_time": "0:00:56", "remaining_time": "1:31:28", "throughput": 4418.19, "total_tokens": 250400} {"current_steps": 395, "total_steps": 38160, "loss": 0.4951, "lr": 0.00010324947589098532, "epoch": 0.2070230607966457, "percentage": 1.04, "elapsed_time": "0:00:57", "remaining_time": "1:31:24", "throughput": 4417.26, "total_tokens": 253376} {"current_steps": 400, "total_steps": 38160, "loss": 0.687, "lr": 0.00010455974842767296, "epoch": 0.20964360587002095, "percentage": 1.05, "elapsed_time": "0:00:58", "remaining_time": "1:31:21", "throughput": 4416.61, "total_tokens": 256448} {"current_steps": 405, "total_steps": 38160, "loss": 0.6679, "lr": 0.00010587002096436059, "epoch": 0.21226415094339623, "percentage": 1.06, "elapsed_time": "0:00:58", "remaining_time": "1:31:28", "throughput": 4422.81, "total_tokens": 260384} {"current_steps": 410, "total_steps": 38160, "loss": 0.6014, "lr": 0.00010718029350104821, "epoch": 0.2148846960167715, "percentage": 1.07, "elapsed_time": "0:00:59", "remaining_time": "1:31:23", "throughput": 4420.85, "total_tokens": 263264} {"current_steps": 415, "total_steps": 38160, "loss": 0.4912, "lr": 0.00010849056603773586, "epoch": 0.21750524109014674, "percentage": 1.09, "elapsed_time": "0:01:00", "remaining_time": "1:31:21", "throughput": 4420.05, "total_tokens": 266400} {"current_steps": 420, "total_steps": 38160, "loss": 0.462, "lr": 0.00010980083857442348, "epoch": 0.22012578616352202, "percentage": 1.1, "elapsed_time": "0:01:00", "remaining_time": "1:31:20", "throughput": 4420.66, "total_tokens": 269600} {"current_steps": 425, "total_steps": 38160, "loss": 0.4315, "lr": 0.0001111111111111111, "epoch": 0.22274633123689727, "percentage": 1.11, "elapsed_time": "0:01:01", "remaining_time": "1:31:20", "throughput": 4422.96, "total_tokens": 272992} {"current_steps": 430, "total_steps": 38160, "loss": 0.5666, "lr": 0.00011242138364779875, "epoch": 0.22536687631027252, "percentage": 1.13, "elapsed_time": "0:01:02", "remaining_time": "1:31:28", "throughput": 4429.34, "total_tokens": 277056} {"current_steps": 435, "total_steps": 38160, "loss": 0.553, "lr": 0.00011373165618448637, "epoch": 0.2279874213836478, "percentage": 1.14, "elapsed_time": "0:01:03", "remaining_time": "1:31:23", "throughput": 4427.62, "total_tokens": 279968} {"current_steps": 440, "total_steps": 38160, "loss": 0.4713, "lr": 0.00011504192872117402, "epoch": 0.23060796645702306, "percentage": 1.15, "elapsed_time": "0:01:03", "remaining_time": "1:31:16", "throughput": 4424.11, "total_tokens": 282624} {"current_steps": 445, "total_steps": 38160, "loss": 0.5849, "lr": 0.00011635220125786164, "epoch": 0.23322851153039834, "percentage": 1.17, "elapsed_time": "0:01:04", "remaining_time": "1:31:08", "throughput": 4420.67, "total_tokens": 285248} {"current_steps": 450, "total_steps": 38160, "loss": 0.5078, "lr": 0.00011766247379454926, "epoch": 0.2358490566037736, "percentage": 1.18, "elapsed_time": "0:01:05", "remaining_time": "1:30:58", "throughput": 4415.85, "total_tokens": 287648} {"current_steps": 455, "total_steps": 38160, "loss": 0.8014, "lr": 0.00011897274633123691, "epoch": 0.23846960167714884, "percentage": 1.19, "elapsed_time": "0:01:05", "remaining_time": "1:30:49", "throughput": 4410.61, "total_tokens": 290048} {"current_steps": 460, "total_steps": 38160, "loss": 0.6081, "lr": 0.00012028301886792453, "epoch": 0.24109014675052412, "percentage": 1.21, "elapsed_time": "0:01:06", "remaining_time": "1:30:45", "throughput": 4409.9, "total_tokens": 293024} {"current_steps": 465, "total_steps": 38160, "loss": 0.5142, "lr": 0.00012159329140461216, "epoch": 0.24371069182389937, "percentage": 1.22, "elapsed_time": "0:01:07", "remaining_time": "1:30:52", "throughput": 4415.04, "total_tokens": 296960} {"current_steps": 470, "total_steps": 38160, "loss": 0.4685, "lr": 0.0001229035639412998, "epoch": 0.24633123689727462, "percentage": 1.23, "elapsed_time": "0:01:07", "remaining_time": "1:30:48", "throughput": 4414.24, "total_tokens": 299936} {"current_steps": 475, "total_steps": 38160, "loss": 0.4175, "lr": 0.00012421383647798743, "epoch": 0.2489517819706499, "percentage": 1.24, "elapsed_time": "0:01:08", "remaining_time": "1:30:45", "throughput": 4414.03, "total_tokens": 302976} {"current_steps": 480, "total_steps": 38160, "loss": 0.5388, "lr": 0.00012552410901467507, "epoch": 0.25157232704402516, "percentage": 1.26, "elapsed_time": "0:01:09", "remaining_time": "1:30:40", "throughput": 4412.48, "total_tokens": 305792} {"current_steps": 485, "total_steps": 38160, "loss": 0.6229, "lr": 0.00012683438155136267, "epoch": 0.25419287211740044, "percentage": 1.27, "elapsed_time": "0:01:10", "remaining_time": "1:31:22", "throughput": 4434.23, "total_tokens": 312960} {"current_steps": 490, "total_steps": 38160, "loss": 0.6136, "lr": 0.0001281446540880503, "epoch": 0.25681341719077566, "percentage": 1.28, "elapsed_time": "0:01:11", "remaining_time": "1:31:27", "throughput": 4438.7, "total_tokens": 316832} {"current_steps": 495, "total_steps": 38160, "loss": 0.497, "lr": 0.00012945492662473794, "epoch": 0.25943396226415094, "percentage": 1.3, "elapsed_time": "0:01:12", "remaining_time": "1:31:25", "throughput": 4438.45, "total_tokens": 319968} {"current_steps": 500, "total_steps": 38160, "loss": 0.4552, "lr": 0.00013076519916142558, "epoch": 0.2620545073375262, "percentage": 1.31, "elapsed_time": "0:01:12", "remaining_time": "1:31:20", "throughput": 4436.58, "total_tokens": 322816} {"current_steps": 505, "total_steps": 38160, "loss": 0.6453, "lr": 0.0001320754716981132, "epoch": 0.26467505241090145, "percentage": 1.32, "elapsed_time": "0:01:13", "remaining_time": "1:31:15", "throughput": 4434.67, "total_tokens": 325664} {"current_steps": 510, "total_steps": 38160, "loss": 0.5846, "lr": 0.00013338574423480085, "epoch": 0.2672955974842767, "percentage": 1.34, "elapsed_time": "0:01:14", "remaining_time": "1:31:14", "throughput": 4435.69, "total_tokens": 328960} {"current_steps": 515, "total_steps": 38160, "loss": 0.4266, "lr": 0.00013469601677148845, "epoch": 0.269916142557652, "percentage": 1.35, "elapsed_time": "0:01:14", "remaining_time": "1:31:17", "throughput": 4438.55, "total_tokens": 332608} {"current_steps": 520, "total_steps": 38160, "loss": 0.7158, "lr": 0.0001360062893081761, "epoch": 0.27253668763102723, "percentage": 1.36, "elapsed_time": "0:01:15", "remaining_time": "1:31:13", "throughput": 4437.83, "total_tokens": 335552} {"current_steps": 525, "total_steps": 38160, "loss": 0.5216, "lr": 0.00013731656184486375, "epoch": 0.2751572327044025, "percentage": 1.38, "elapsed_time": "0:01:16", "remaining_time": "1:31:25", "throughput": 4446.31, "total_tokens": 340256} {"current_steps": 530, "total_steps": 38160, "loss": 0.5294, "lr": 0.00013862683438155136, "epoch": 0.2777777777777778, "percentage": 1.39, "elapsed_time": "0:01:17", "remaining_time": "1:31:18", "throughput": 4442.94, "total_tokens": 342848} {"current_steps": 535, "total_steps": 38160, "loss": 0.5951, "lr": 0.000139937106918239, "epoch": 0.280398322851153, "percentage": 1.4, "elapsed_time": "0:01:17", "remaining_time": "1:31:09", "throughput": 4438.78, "total_tokens": 345184} {"current_steps": 540, "total_steps": 38160, "loss": 0.5517, "lr": 0.00014124737945492663, "epoch": 0.2830188679245283, "percentage": 1.42, "elapsed_time": "0:01:18", "remaining_time": "1:31:09", "throughput": 4440.1, "total_tokens": 348608} {"current_steps": 545, "total_steps": 38160, "loss": 0.4835, "lr": 0.00014255765199161423, "epoch": 0.2856394129979036, "percentage": 1.43, "elapsed_time": "0:01:19", "remaining_time": "1:31:06", "throughput": 4439.88, "total_tokens": 351648} {"current_steps": 550, "total_steps": 38160, "loss": 0.6725, "lr": 0.0001438679245283019, "epoch": 0.2882599580712788, "percentage": 1.44, "elapsed_time": "0:01:19", "remaining_time": "1:31:01", "throughput": 4438.2, "total_tokens": 354464} {"current_steps": 555, "total_steps": 38160, "loss": 0.5991, "lr": 0.00014517819706498953, "epoch": 0.2908805031446541, "percentage": 1.45, "elapsed_time": "0:01:20", "remaining_time": "1:31:04", "throughput": 4442.02, "total_tokens": 358240} {"current_steps": 560, "total_steps": 38160, "loss": 0.4813, "lr": 0.00014648846960167716, "epoch": 0.29350104821802936, "percentage": 1.47, "elapsed_time": "0:01:21", "remaining_time": "1:31:04", "throughput": 4442.94, "total_tokens": 361600} {"current_steps": 565, "total_steps": 38160, "loss": 0.4577, "lr": 0.00014779874213836477, "epoch": 0.29612159329140464, "percentage": 1.48, "elapsed_time": "0:01:22", "remaining_time": "1:31:00", "throughput": 4441.13, "total_tokens": 364448} {"current_steps": 570, "total_steps": 38160, "loss": 0.4637, "lr": 0.00014910901467505243, "epoch": 0.29874213836477986, "percentage": 1.49, "elapsed_time": "0:01:22", "remaining_time": "1:30:56", "throughput": 4440.75, "total_tokens": 367424} {"current_steps": 575, "total_steps": 38160, "loss": 0.5578, "lr": 0.00015041928721174007, "epoch": 0.30136268343815514, "percentage": 1.51, "elapsed_time": "0:01:23", "remaining_time": "1:30:50", "throughput": 4438.19, "total_tokens": 370112} {"current_steps": 580, "total_steps": 38160, "loss": 0.6093, "lr": 0.00015172955974842767, "epoch": 0.3039832285115304, "percentage": 1.52, "elapsed_time": "0:01:24", "remaining_time": "1:30:43", "throughput": 4434.91, "total_tokens": 372608} {"current_steps": 585, "total_steps": 38160, "loss": 0.5404, "lr": 0.0001530398322851153, "epoch": 0.30660377358490565, "percentage": 1.53, "elapsed_time": "0:01:24", "remaining_time": "1:30:40", "throughput": 4434.21, "total_tokens": 375584} {"current_steps": 590, "total_steps": 38160, "loss": 0.5763, "lr": 0.00015435010482180294, "epoch": 0.30922431865828093, "percentage": 1.55, "elapsed_time": "0:01:25", "remaining_time": "1:30:38", "throughput": 4434.42, "total_tokens": 378752} {"current_steps": 595, "total_steps": 38160, "loss": 0.4131, "lr": 0.00015566037735849058, "epoch": 0.3118448637316562, "percentage": 1.56, "elapsed_time": "0:01:26", "remaining_time": "1:30:41", "throughput": 4437.26, "total_tokens": 382432} {"current_steps": 600, "total_steps": 38160, "loss": 0.5704, "lr": 0.0001569706498951782, "epoch": 0.31446540880503143, "percentage": 1.57, "elapsed_time": "0:01:26", "remaining_time": "1:30:37", "throughput": 4436.48, "total_tokens": 385344} {"current_steps": 605, "total_steps": 38160, "loss": 0.4817, "lr": 0.00015828092243186584, "epoch": 0.3170859538784067, "percentage": 1.59, "elapsed_time": "0:01:27", "remaining_time": "1:30:38", "throughput": 4438.38, "total_tokens": 388832} {"current_steps": 610, "total_steps": 38160, "loss": 0.5249, "lr": 0.00015959119496855345, "epoch": 0.319706498951782, "percentage": 1.6, "elapsed_time": "0:01:28", "remaining_time": "1:30:41", "throughput": 4441.77, "total_tokens": 392640} {"current_steps": 615, "total_steps": 38160, "loss": 0.564, "lr": 0.00016090146750524109, "epoch": 0.3223270440251572, "percentage": 1.61, "elapsed_time": "0:01:29", "remaining_time": "1:30:54", "throughput": 4449.72, "total_tokens": 397568} {"current_steps": 620, "total_steps": 38160, "loss": 0.4337, "lr": 0.00016221174004192875, "epoch": 0.3249475890985325, "percentage": 1.62, "elapsed_time": "0:01:30", "remaining_time": "1:30:51", "throughput": 4448.68, "total_tokens": 400512} {"current_steps": 625, "total_steps": 38160, "loss": 0.4983, "lr": 0.00016352201257861635, "epoch": 0.3275681341719078, "percentage": 1.64, "elapsed_time": "0:01:30", "remaining_time": "1:30:47", "throughput": 4448.25, "total_tokens": 403520} {"current_steps": 630, "total_steps": 38160, "loss": 0.4935, "lr": 0.000164832285115304, "epoch": 0.330188679245283, "percentage": 1.65, "elapsed_time": "0:01:31", "remaining_time": "1:30:49", "throughput": 4450.13, "total_tokens": 407072} {"current_steps": 635, "total_steps": 38160, "loss": 0.5046, "lr": 0.00016614255765199162, "epoch": 0.3328092243186583, "percentage": 1.66, "elapsed_time": "0:01:32", "remaining_time": "1:31:01", "throughput": 4456.91, "total_tokens": 411872} {"current_steps": 640, "total_steps": 38160, "loss": 0.4818, "lr": 0.00016745283018867923, "epoch": 0.33542976939203356, "percentage": 1.68, "elapsed_time": "0:01:33", "remaining_time": "1:30:57", "throughput": 4455.56, "total_tokens": 414784} {"current_steps": 645, "total_steps": 38160, "loss": 0.5976, "lr": 0.0001687631027253669, "epoch": 0.3380503144654088, "percentage": 1.69, "elapsed_time": "0:01:33", "remaining_time": "1:31:00", "throughput": 4459.04, "total_tokens": 418656} {"current_steps": 650, "total_steps": 38160, "loss": 0.6086, "lr": 0.00017007337526205453, "epoch": 0.34067085953878407, "percentage": 1.7, "elapsed_time": "0:01:34", "remaining_time": "1:30:59", "throughput": 4458.96, "total_tokens": 421824} {"current_steps": 655, "total_steps": 38160, "loss": 0.6018, "lr": 0.00017138364779874213, "epoch": 0.34329140461215935, "percentage": 1.72, "elapsed_time": "0:01:35", "remaining_time": "1:31:02", "throughput": 4461.73, "total_tokens": 425632} {"current_steps": 660, "total_steps": 38160, "loss": 0.4711, "lr": 0.00017269392033542977, "epoch": 0.34591194968553457, "percentage": 1.73, "elapsed_time": "0:01:36", "remaining_time": "1:31:00", "throughput": 4462.23, "total_tokens": 428864} {"current_steps": 665, "total_steps": 38160, "loss": 0.402, "lr": 0.0001740041928721174, "epoch": 0.34853249475890985, "percentage": 1.74, "elapsed_time": "0:01:36", "remaining_time": "1:30:52", "throughput": 4457.85, "total_tokens": 431104} {"current_steps": 670, "total_steps": 38160, "loss": 0.5488, "lr": 0.00017531446540880504, "epoch": 0.35115303983228513, "percentage": 1.76, "elapsed_time": "0:01:37", "remaining_time": "1:30:51", "throughput": 4457.35, "total_tokens": 434240} {"current_steps": 675, "total_steps": 38160, "loss": 0.5394, "lr": 0.00017662473794549267, "epoch": 0.35377358490566035, "percentage": 1.77, "elapsed_time": "0:01:38", "remaining_time": "1:30:52", "throughput": 4458.73, "total_tokens": 437792} {"current_steps": 680, "total_steps": 38160, "loss": 0.6147, "lr": 0.0001779350104821803, "epoch": 0.35639412997903563, "percentage": 1.78, "elapsed_time": "0:01:38", "remaining_time": "1:30:53", "throughput": 4460.26, "total_tokens": 441280} {"current_steps": 685, "total_steps": 38160, "loss": 0.4846, "lr": 0.0001792452830188679, "epoch": 0.3590146750524109, "percentage": 1.8, "elapsed_time": "0:01:39", "remaining_time": "1:30:55", "throughput": 4463.47, "total_tokens": 445120} {"current_steps": 690, "total_steps": 38160, "loss": 0.483, "lr": 0.00018055555555555555, "epoch": 0.36163522012578614, "percentage": 1.81, "elapsed_time": "0:01:40", "remaining_time": "1:31:03", "throughput": 4469.01, "total_tokens": 449600} {"current_steps": 695, "total_steps": 38160, "loss": 0.4768, "lr": 0.0001818658280922432, "epoch": 0.3642557651991614, "percentage": 1.82, "elapsed_time": "0:01:41", "remaining_time": "1:31:04", "throughput": 4470.16, "total_tokens": 453120} {"current_steps": 700, "total_steps": 38160, "loss": 0.5398, "lr": 0.00018317610062893082, "epoch": 0.3668763102725367, "percentage": 1.83, "elapsed_time": "0:01:42", "remaining_time": "1:31:08", "throughput": 4474.48, "total_tokens": 457216} {"current_steps": 705, "total_steps": 38160, "loss": 0.4478, "lr": 0.00018448637316561845, "epoch": 0.3694968553459119, "percentage": 1.85, "elapsed_time": "0:01:42", "remaining_time": "1:31:11", "throughput": 4477.75, "total_tokens": 461152} {"current_steps": 710, "total_steps": 38160, "loss": 0.6427, "lr": 0.00018579664570230608, "epoch": 0.3721174004192872, "percentage": 1.86, "elapsed_time": "0:01:43", "remaining_time": "1:31:10", "throughput": 4478.19, "total_tokens": 464480} {"current_steps": 715, "total_steps": 38160, "loss": 0.525, "lr": 0.0001871069182389937, "epoch": 0.3747379454926625, "percentage": 1.87, "elapsed_time": "0:01:44", "remaining_time": "1:31:09", "throughput": 4478.47, "total_tokens": 467744} {"current_steps": 720, "total_steps": 38160, "loss": 0.4655, "lr": 0.00018841719077568135, "epoch": 0.37735849056603776, "percentage": 1.89, "elapsed_time": "0:01:45", "remaining_time": "1:31:06", "throughput": 4477.09, "total_tokens": 470656} {"current_steps": 725, "total_steps": 38160, "loss": 0.4892, "lr": 0.000189727463312369, "epoch": 0.379979035639413, "percentage": 1.9, "elapsed_time": "0:01:45", "remaining_time": "1:31:06", "throughput": 4478.04, "total_tokens": 474048} {"current_steps": 730, "total_steps": 38160, "loss": 0.5115, "lr": 0.00019103773584905662, "epoch": 0.38259958071278827, "percentage": 1.91, "elapsed_time": "0:01:46", "remaining_time": "1:31:04", "throughput": 4477.68, "total_tokens": 477184} {"current_steps": 735, "total_steps": 38160, "loss": 0.4589, "lr": 0.00019234800838574423, "epoch": 0.38522012578616355, "percentage": 1.93, "elapsed_time": "0:01:47", "remaining_time": "1:31:00", "throughput": 4477.09, "total_tokens": 480160} {"current_steps": 740, "total_steps": 38160, "loss": 0.3785, "lr": 0.00019365828092243186, "epoch": 0.38784067085953877, "percentage": 1.94, "elapsed_time": "0:01:48", "remaining_time": "1:31:19", "throughput": 4486.28, "total_tokens": 486144} {"current_steps": 745, "total_steps": 38160, "loss": 0.5479, "lr": 0.00019496855345911953, "epoch": 0.39046121593291405, "percentage": 1.95, "elapsed_time": "0:01:49", "remaining_time": "1:31:21", "throughput": 4488.54, "total_tokens": 489920} {"current_steps": 750, "total_steps": 38160, "loss": 0.4804, "lr": 0.00019627882599580713, "epoch": 0.39308176100628933, "percentage": 1.97, "elapsed_time": "0:01:49", "remaining_time": "1:31:24", "throughput": 4490.23, "total_tokens": 493728} {"current_steps": 755, "total_steps": 38160, "loss": 0.502, "lr": 0.00019758909853249477, "epoch": 0.39570230607966456, "percentage": 1.98, "elapsed_time": "0:01:50", "remaining_time": "1:31:19", "throughput": 4488.18, "total_tokens": 496416} {"current_steps": 760, "total_steps": 38160, "loss": 0.503, "lr": 0.0001988993710691824, "epoch": 0.39832285115303984, "percentage": 1.99, "elapsed_time": "0:01:51", "remaining_time": "1:31:23", "throughput": 4490.31, "total_tokens": 500320} {"current_steps": 765, "total_steps": 38160, "loss": 0.4651, "lr": 0.00020020964360587, "epoch": 0.4009433962264151, "percentage": 2.0, "elapsed_time": "0:01:52", "remaining_time": "1:31:21", "throughput": 4490.19, "total_tokens": 503520} {"current_steps": 770, "total_steps": 38160, "loss": 0.4948, "lr": 0.00020151991614255767, "epoch": 0.40356394129979034, "percentage": 2.02, "elapsed_time": "0:01:52", "remaining_time": "1:31:19", "throughput": 4489.84, "total_tokens": 506656} {"current_steps": 775, "total_steps": 38160, "loss": 0.545, "lr": 0.0002028301886792453, "epoch": 0.4061844863731656, "percentage": 2.03, "elapsed_time": "0:01:53", "remaining_time": "1:31:16", "throughput": 4488.77, "total_tokens": 509568} {"current_steps": 780, "total_steps": 38160, "loss": 0.4408, "lr": 0.0002041404612159329, "epoch": 0.4088050314465409, "percentage": 2.04, "elapsed_time": "0:01:54", "remaining_time": "1:31:11", "throughput": 4486.2, "total_tokens": 512160} {"current_steps": 785, "total_steps": 38160, "loss": 0.4051, "lr": 0.00020545073375262055, "epoch": 0.4114255765199161, "percentage": 2.06, "elapsed_time": "0:01:54", "remaining_time": "1:31:12", "throughput": 4488.04, "total_tokens": 515872} {"current_steps": 790, "total_steps": 38160, "loss": 0.5233, "lr": 0.00020676100628930818, "epoch": 0.4140461215932914, "percentage": 2.07, "elapsed_time": "0:01:55", "remaining_time": "1:31:11", "throughput": 4488.75, "total_tokens": 519232} {"current_steps": 795, "total_steps": 38160, "loss": 0.343, "lr": 0.00020807127882599581, "epoch": 0.4166666666666667, "percentage": 2.08, "elapsed_time": "0:01:56", "remaining_time": "1:31:10", "throughput": 4488.62, "total_tokens": 522464} {"current_steps": 800, "total_steps": 38160, "loss": 0.5028, "lr": 0.00020938155136268345, "epoch": 0.4192872117400419, "percentage": 2.1, "elapsed_time": "0:01:57", "remaining_time": "1:31:09", "throughput": 4488.29, "total_tokens": 525664} {"current_steps": 805, "total_steps": 38160, "loss": 0.6085, "lr": 0.00021069182389937108, "epoch": 0.4219077568134172, "percentage": 2.11, "elapsed_time": "0:01:57", "remaining_time": "1:31:10", "throughput": 4488.91, "total_tokens": 529216} {"current_steps": 810, "total_steps": 38160, "loss": 0.5685, "lr": 0.0002120020964360587, "epoch": 0.42452830188679247, "percentage": 2.12, "elapsed_time": "0:01:58", "remaining_time": "1:31:14", "throughput": 4492.6, "total_tokens": 533376} {"current_steps": 815, "total_steps": 38160, "loss": 0.5844, "lr": 0.00021331236897274632, "epoch": 0.4271488469601677, "percentage": 2.14, "elapsed_time": "0:01:59", "remaining_time": "1:31:10", "throughput": 4491.01, "total_tokens": 536192} {"current_steps": 820, "total_steps": 38160, "loss": 0.472, "lr": 0.00021462264150943399, "epoch": 0.429769392033543, "percentage": 2.15, "elapsed_time": "0:02:00", "remaining_time": "1:31:08", "throughput": 4491.25, "total_tokens": 539392} {"current_steps": 825, "total_steps": 38160, "loss": 0.4573, "lr": 0.0002159329140461216, "epoch": 0.43238993710691825, "percentage": 2.16, "elapsed_time": "0:02:00", "remaining_time": "1:31:07", "throughput": 4491.49, "total_tokens": 542656} {"current_steps": 830, "total_steps": 38160, "loss": 0.2961, "lr": 0.00021724318658280923, "epoch": 0.4350104821802935, "percentage": 2.18, "elapsed_time": "0:02:01", "remaining_time": "1:31:19", "throughput": 4498.57, "total_tokens": 548064} {"current_steps": 835, "total_steps": 38160, "loss": 0.5164, "lr": 0.00021855345911949686, "epoch": 0.43763102725366876, "percentage": 2.19, "elapsed_time": "0:02:02", "remaining_time": "1:31:16", "throughput": 4498.09, "total_tokens": 551104} {"current_steps": 840, "total_steps": 38160, "loss": 0.7053, "lr": 0.00021986373165618447, "epoch": 0.44025157232704404, "percentage": 2.2, "elapsed_time": "0:02:03", "remaining_time": "1:31:23", "throughput": 4502.08, "total_tokens": 555680} {"current_steps": 845, "total_steps": 38160, "loss": 0.3938, "lr": 0.00022117400419287213, "epoch": 0.44287211740041926, "percentage": 2.21, "elapsed_time": "0:02:04", "remaining_time": "1:31:17", "throughput": 4499.52, "total_tokens": 558144} {"current_steps": 850, "total_steps": 38160, "loss": 0.5376, "lr": 0.00022248427672955977, "epoch": 0.44549266247379454, "percentage": 2.23, "elapsed_time": "0:02:04", "remaining_time": "1:31:10", "throughput": 4496.21, "total_tokens": 560384} {"current_steps": 855, "total_steps": 38160, "loss": 0.502, "lr": 0.00022379454926624737, "epoch": 0.4481132075471698, "percentage": 2.24, "elapsed_time": "0:02:05", "remaining_time": "1:31:06", "throughput": 4494.39, "total_tokens": 563072} {"current_steps": 860, "total_steps": 38160, "loss": 0.5916, "lr": 0.000225104821802935, "epoch": 0.45073375262054505, "percentage": 2.25, "elapsed_time": "0:02:05", "remaining_time": "1:31:02", "throughput": 4492.59, "total_tokens": 565792} {"current_steps": 865, "total_steps": 38160, "loss": 0.3766, "lr": 0.00022641509433962264, "epoch": 0.4533542976939203, "percentage": 2.27, "elapsed_time": "0:02:06", "remaining_time": "1:30:56", "throughput": 4489.42, "total_tokens": 568160} {"current_steps": 870, "total_steps": 38160, "loss": 0.5778, "lr": 0.00022772536687631028, "epoch": 0.4559748427672956, "percentage": 2.28, "elapsed_time": "0:02:07", "remaining_time": "1:30:56", "throughput": 4489.84, "total_tokens": 571584} {"current_steps": 875, "total_steps": 38160, "loss": 0.4738, "lr": 0.0002290356394129979, "epoch": 0.4585953878406709, "percentage": 2.29, "elapsed_time": "0:02:08", "remaining_time": "1:31:03", "throughput": 4494.47, "total_tokens": 576288} {"current_steps": 880, "total_steps": 38160, "loss": 0.5048, "lr": 0.00023034591194968554, "epoch": 0.4612159329140461, "percentage": 2.31, "elapsed_time": "0:02:08", "remaining_time": "1:31:01", "throughput": 4494.39, "total_tokens": 579456} {"current_steps": 885, "total_steps": 38160, "loss": 0.6095, "lr": 0.00023165618448637318, "epoch": 0.4638364779874214, "percentage": 2.32, "elapsed_time": "0:02:09", "remaining_time": "1:31:06", "throughput": 4497.5, "total_tokens": 583680} {"current_steps": 890, "total_steps": 38160, "loss": 0.5889, "lr": 0.00023296645702306079, "epoch": 0.46645702306079667, "percentage": 2.33, "elapsed_time": "0:02:10", "remaining_time": "1:31:05", "throughput": 4497.98, "total_tokens": 587040} {"current_steps": 895, "total_steps": 38160, "loss": 0.3633, "lr": 0.00023427672955974845, "epoch": 0.4690775681341719, "percentage": 2.35, "elapsed_time": "0:02:11", "remaining_time": "1:31:02", "throughput": 4496.7, "total_tokens": 589952} {"current_steps": 900, "total_steps": 38160, "loss": 0.5763, "lr": 0.00023558700209643608, "epoch": 0.4716981132075472, "percentage": 2.36, "elapsed_time": "0:02:11", "remaining_time": "1:31:03", "throughput": 4498.09, "total_tokens": 593600} {"current_steps": 905, "total_steps": 38160, "loss": 0.4922, "lr": 0.0002368972746331237, "epoch": 0.47431865828092246, "percentage": 2.37, "elapsed_time": "0:02:12", "remaining_time": "1:31:03", "throughput": 4499.48, "total_tokens": 597216} {"current_steps": 910, "total_steps": 38160, "loss": 0.6615, "lr": 0.00023820754716981132, "epoch": 0.4769392033542977, "percentage": 2.38, "elapsed_time": "0:02:13", "remaining_time": "1:31:03", "throughput": 4499.75, "total_tokens": 600576} {"current_steps": 915, "total_steps": 38160, "loss": 0.4774, "lr": 0.00023951781970649896, "epoch": 0.47955974842767296, "percentage": 2.4, "elapsed_time": "0:02:14", "remaining_time": "1:31:03", "throughput": 4499.9, "total_tokens": 603936} {"current_steps": 920, "total_steps": 38160, "loss": 0.5874, "lr": 0.0002408280922431866, "epoch": 0.48218029350104824, "percentage": 2.41, "elapsed_time": "0:02:14", "remaining_time": "1:30:59", "throughput": 4498.96, "total_tokens": 606816} {"current_steps": 925, "total_steps": 38160, "loss": 0.4446, "lr": 0.00024213836477987423, "epoch": 0.48480083857442346, "percentage": 2.42, "elapsed_time": "0:02:15", "remaining_time": "1:30:58", "throughput": 4499.03, "total_tokens": 610112} {"current_steps": 930, "total_steps": 38160, "loss": 0.4771, "lr": 0.00024344863731656186, "epoch": 0.48742138364779874, "percentage": 2.44, "elapsed_time": "0:02:16", "remaining_time": "1:30:56", "throughput": 4498.55, "total_tokens": 613216} {"current_steps": 935, "total_steps": 38160, "loss": 0.5798, "lr": 0.00024475890985324947, "epoch": 0.490041928721174, "percentage": 2.45, "elapsed_time": "0:02:16", "remaining_time": "1:30:53", "throughput": 4496.56, "total_tokens": 615904} {"current_steps": 940, "total_steps": 38160, "loss": 0.6769, "lr": 0.0002460691823899371, "epoch": 0.49266247379454925, "percentage": 2.46, "elapsed_time": "0:02:17", "remaining_time": "1:30:53", "throughput": 4497.25, "total_tokens": 619456} {"current_steps": 945, "total_steps": 38160, "loss": 0.5178, "lr": 0.00024737945492662474, "epoch": 0.49528301886792453, "percentage": 2.48, "elapsed_time": "0:02:18", "remaining_time": "1:30:52", "throughput": 4497.01, "total_tokens": 622656} {"current_steps": 950, "total_steps": 38160, "loss": 0.5536, "lr": 0.00024868972746331237, "epoch": 0.4979035639412998, "percentage": 2.49, "elapsed_time": "0:02:19", "remaining_time": "1:30:52", "throughput": 4497.18, "total_tokens": 626016} {"current_steps": 955, "total_steps": 38160, "loss": 0.4922, "lr": 0.00025, "epoch": 0.500524109014675, "percentage": 2.5, "elapsed_time": "0:02:19", "remaining_time": "1:30:50", "throughput": 4496.85, "total_tokens": 629120} {"current_steps": 960, "total_steps": 38160, "loss": 0.539, "lr": 0.00025131027253668764, "epoch": 0.5031446540880503, "percentage": 2.52, "elapsed_time": "0:02:20", "remaining_time": "1:30:48", "throughput": 4496.25, "total_tokens": 632160} {"current_steps": 965, "total_steps": 38160, "loss": 0.4622, "lr": 0.0002526205450733753, "epoch": 0.5057651991614256, "percentage": 2.53, "elapsed_time": "0:02:21", "remaining_time": "1:30:43", "throughput": 4494.45, "total_tokens": 634784} {"current_steps": 970, "total_steps": 38160, "loss": 0.5827, "lr": 0.0002539308176100629, "epoch": 0.5083857442348009, "percentage": 2.54, "elapsed_time": "0:02:21", "remaining_time": "1:30:41", "throughput": 4493.72, "total_tokens": 637792} {"current_steps": 975, "total_steps": 38160, "loss": 0.4433, "lr": 0.0002552410901467505, "epoch": 0.5110062893081762, "percentage": 2.56, "elapsed_time": "0:02:22", "remaining_time": "1:30:42", "throughput": 4494.24, "total_tokens": 641312} {"current_steps": 980, "total_steps": 38160, "loss": 0.5475, "lr": 0.0002565513626834381, "epoch": 0.5136268343815513, "percentage": 2.57, "elapsed_time": "0:02:23", "remaining_time": "1:30:42", "throughput": 4495.11, "total_tokens": 644832} {"current_steps": 985, "total_steps": 38160, "loss": 0.6165, "lr": 0.0002578616352201258, "epoch": 0.5162473794549266, "percentage": 2.58, "elapsed_time": "0:02:24", "remaining_time": "1:30:40", "throughput": 4494.7, "total_tokens": 647904} {"current_steps": 990, "total_steps": 38160, "loss": 0.5711, "lr": 0.00025917190775681345, "epoch": 0.5188679245283019, "percentage": 2.59, "elapsed_time": "0:02:24", "remaining_time": "1:30:36", "throughput": 4493.09, "total_tokens": 650624} {"current_steps": 995, "total_steps": 38160, "loss": 0.5352, "lr": 0.0002604821802935011, "epoch": 0.5214884696016772, "percentage": 2.61, "elapsed_time": "0:02:25", "remaining_time": "1:30:32", "throughput": 4491.14, "total_tokens": 653248} {"current_steps": 1000, "total_steps": 38160, "loss": 0.567, "lr": 0.0002617924528301887, "epoch": 0.5241090146750524, "percentage": 2.62, "elapsed_time": "0:02:26", "remaining_time": "1:30:29", "throughput": 4489.64, "total_tokens": 655936} {"current_steps": 1005, "total_steps": 38160, "loss": 0.438, "lr": 0.0002631027253668763, "epoch": 0.5267295597484277, "percentage": 2.63, "elapsed_time": "0:02:27", "remaining_time": "1:30:42", "throughput": 4495.96, "total_tokens": 661888} {"current_steps": 1010, "total_steps": 38160, "loss": 0.5353, "lr": 0.00026441299790356393, "epoch": 0.5293501048218029, "percentage": 2.65, "elapsed_time": "0:02:27", "remaining_time": "1:30:38", "throughput": 4494.24, "total_tokens": 664512} {"current_steps": 1015, "total_steps": 38160, "loss": 0.3974, "lr": 0.00026572327044025156, "epoch": 0.5319706498951782, "percentage": 2.66, "elapsed_time": "0:02:28", "remaining_time": "1:30:38", "throughput": 4495.35, "total_tokens": 668096} {"current_steps": 1020, "total_steps": 38160, "loss": 0.7355, "lr": 0.0002670335429769392, "epoch": 0.5345911949685535, "percentage": 2.67, "elapsed_time": "0:02:29", "remaining_time": "1:30:40", "throughput": 4495.99, "total_tokens": 671744} {"current_steps": 1025, "total_steps": 38160, "loss": 0.4028, "lr": 0.00026834381551362683, "epoch": 0.5372117400419287, "percentage": 2.69, "elapsed_time": "0:02:30", "remaining_time": "1:30:35", "throughput": 4493.61, "total_tokens": 674144} {"current_steps": 1030, "total_steps": 38160, "loss": 0.7217, "lr": 0.0002696540880503145, "epoch": 0.539832285115304, "percentage": 2.7, "elapsed_time": "0:02:30", "remaining_time": "1:30:33", "throughput": 4493.79, "total_tokens": 677312} {"current_steps": 1035, "total_steps": 38160, "loss": 0.4206, "lr": 0.0002709643605870021, "epoch": 0.5424528301886793, "percentage": 2.71, "elapsed_time": "0:02:31", "remaining_time": "1:30:30", "throughput": 4493.05, "total_tokens": 680256} {"current_steps": 1040, "total_steps": 38160, "loss": 0.4244, "lr": 0.00027227463312368973, "epoch": 0.5450733752620545, "percentage": 2.73, "elapsed_time": "0:02:32", "remaining_time": "1:30:30", "throughput": 4493.75, "total_tokens": 683744} {"current_steps": 1045, "total_steps": 38160, "loss": 0.5124, "lr": 0.00027358490566037737, "epoch": 0.5476939203354297, "percentage": 2.74, "elapsed_time": "0:02:32", "remaining_time": "1:30:32", "throughput": 4495.53, "total_tokens": 687616} {"current_steps": 1050, "total_steps": 38160, "loss": 0.5329, "lr": 0.000274895178197065, "epoch": 0.550314465408805, "percentage": 2.75, "elapsed_time": "0:02:33", "remaining_time": "1:30:34", "throughput": 4496.72, "total_tokens": 691392} {"current_steps": 1055, "total_steps": 38160, "loss": 0.5519, "lr": 0.00027620545073375264, "epoch": 0.5529350104821803, "percentage": 2.76, "elapsed_time": "0:02:34", "remaining_time": "1:30:38", "throughput": 4500.17, "total_tokens": 695904} {"current_steps": 1060, "total_steps": 38160, "loss": 0.4415, "lr": 0.00027751572327044027, "epoch": 0.5555555555555556, "percentage": 2.78, "elapsed_time": "0:02:35", "remaining_time": "1:30:34", "throughput": 4498.26, "total_tokens": 698496} {"current_steps": 1065, "total_steps": 38160, "loss": 0.5836, "lr": 0.00027882599580712785, "epoch": 0.5581761006289309, "percentage": 2.79, "elapsed_time": "0:02:35", "remaining_time": "1:30:31", "throughput": 4497.22, "total_tokens": 701344} {"current_steps": 1070, "total_steps": 38160, "loss": 0.5231, "lr": 0.0002801362683438155, "epoch": 0.560796645702306, "percentage": 2.8, "elapsed_time": "0:02:36", "remaining_time": "1:30:27", "throughput": 4495.66, "total_tokens": 703968} {"current_steps": 1075, "total_steps": 38160, "loss": 0.4473, "lr": 0.0002814465408805031, "epoch": 0.5634171907756813, "percentage": 2.82, "elapsed_time": "0:02:37", "remaining_time": "1:30:25", "throughput": 4495.4, "total_tokens": 707040} {"current_steps": 1080, "total_steps": 38160, "loss": 0.4794, "lr": 0.0002827568134171908, "epoch": 0.5660377358490566, "percentage": 2.83, "elapsed_time": "0:02:37", "remaining_time": "1:30:20", "throughput": 4492.6, "total_tokens": 709280} {"current_steps": 1085, "total_steps": 38160, "loss": 0.4386, "lr": 0.00028406708595387844, "epoch": 0.5686582809224319, "percentage": 2.84, "elapsed_time": "0:02:38", "remaining_time": "1:30:24", "throughput": 4496.38, "total_tokens": 713792} {"current_steps": 1090, "total_steps": 38160, "loss": 0.7812, "lr": 0.0002853773584905661, "epoch": 0.5712788259958071, "percentage": 2.86, "elapsed_time": "0:02:39", "remaining_time": "1:30:21", "throughput": 4494.82, "total_tokens": 716480} {"current_steps": 1095, "total_steps": 38160, "loss": 0.476, "lr": 0.00028668763102725366, "epoch": 0.5738993710691824, "percentage": 2.87, "elapsed_time": "0:02:40", "remaining_time": "1:30:17", "throughput": 4493.4, "total_tokens": 719136} {"current_steps": 1100, "total_steps": 38160, "loss": 0.446, "lr": 0.0002879979035639413, "epoch": 0.5765199161425576, "percentage": 2.88, "elapsed_time": "0:02:40", "remaining_time": "1:30:18", "throughput": 4494.21, "total_tokens": 722752} {"current_steps": 1105, "total_steps": 38160, "loss": 0.6234, "lr": 0.00028930817610062893, "epoch": 0.5791404612159329, "percentage": 2.9, "elapsed_time": "0:02:41", "remaining_time": "1:30:16", "throughput": 4494.29, "total_tokens": 725920} {"current_steps": 1110, "total_steps": 38160, "loss": 0.4598, "lr": 0.00029061844863731656, "epoch": 0.5817610062893082, "percentage": 2.91, "elapsed_time": "0:02:42", "remaining_time": "1:30:13", "throughput": 4493.06, "total_tokens": 728736} {"current_steps": 1115, "total_steps": 38160, "loss": 0.5175, "lr": 0.0002919287211740042, "epoch": 0.5843815513626834, "percentage": 2.92, "elapsed_time": "0:02:42", "remaining_time": "1:30:12", "throughput": 4492.35, "total_tokens": 731776} {"current_steps": 1120, "total_steps": 38160, "loss": 0.493, "lr": 0.00029323899371069183, "epoch": 0.5870020964360587, "percentage": 2.94, "elapsed_time": "0:02:43", "remaining_time": "1:30:09", "throughput": 4491.78, "total_tokens": 734784} {"current_steps": 1125, "total_steps": 38160, "loss": 0.5541, "lr": 0.00029454926624737946, "epoch": 0.589622641509434, "percentage": 2.95, "elapsed_time": "0:02:44", "remaining_time": "1:30:08", "throughput": 4491.54, "total_tokens": 737888} {"current_steps": 1130, "total_steps": 38160, "loss": 0.3686, "lr": 0.0002958595387840671, "epoch": 0.5922431865828093, "percentage": 2.96, "elapsed_time": "0:02:45", "remaining_time": "1:30:10", "throughput": 4493.32, "total_tokens": 741824} {"current_steps": 1135, "total_steps": 38160, "loss": 0.4942, "lr": 0.00029716981132075473, "epoch": 0.5948637316561844, "percentage": 2.97, "elapsed_time": "0:02:45", "remaining_time": "1:30:05", "throughput": 4491.39, "total_tokens": 744288} {"current_steps": 1140, "total_steps": 38160, "loss": 0.4932, "lr": 0.00029848008385744237, "epoch": 0.5974842767295597, "percentage": 2.99, "elapsed_time": "0:02:46", "remaining_time": "1:30:05", "throughput": 4491.39, "total_tokens": 747648} {"current_steps": 1145, "total_steps": 38160, "loss": 0.5235, "lr": 0.00029979035639413, "epoch": 0.600104821802935, "percentage": 3.0, "elapsed_time": "0:02:47", "remaining_time": "1:30:06", "throughput": 4491.93, "total_tokens": 751168} {"current_steps": 1150, "total_steps": 38160, "loss": 0.4722, "lr": 0.00030110062893081764, "epoch": 0.6027253668763103, "percentage": 3.01, "elapsed_time": "0:02:47", "remaining_time": "1:30:05", "throughput": 4492.29, "total_tokens": 754528} {"current_steps": 1155, "total_steps": 38160, "loss": 0.5785, "lr": 0.00030241090146750527, "epoch": 0.6053459119496856, "percentage": 3.03, "elapsed_time": "0:02:48", "remaining_time": "1:30:02", "throughput": 4490.59, "total_tokens": 757152} {"current_steps": 1160, "total_steps": 38160, "loss": 0.6139, "lr": 0.00030372117400419285, "epoch": 0.6079664570230608, "percentage": 3.04, "elapsed_time": "0:02:49", "remaining_time": "1:29:59", "throughput": 4489.85, "total_tokens": 760064} {"current_steps": 1165, "total_steps": 38160, "loss": 0.4821, "lr": 0.0003050314465408805, "epoch": 0.610587002096436, "percentage": 3.05, "elapsed_time": "0:02:49", "remaining_time": "1:29:57", "throughput": 4488.98, "total_tokens": 762976} {"current_steps": 1170, "total_steps": 38160, "loss": 0.4645, "lr": 0.0003063417190775681, "epoch": 0.6132075471698113, "percentage": 3.07, "elapsed_time": "0:02:50", "remaining_time": "1:29:53", "throughput": 4487.57, "total_tokens": 765600} {"current_steps": 1175, "total_steps": 38160, "loss": 0.5225, "lr": 0.00030765199161425575, "epoch": 0.6158280922431866, "percentage": 3.08, "elapsed_time": "0:02:51", "remaining_time": "1:29:50", "throughput": 4486.26, "total_tokens": 768320} {"current_steps": 1180, "total_steps": 38160, "loss": 0.5035, "lr": 0.00030896226415094344, "epoch": 0.6184486373165619, "percentage": 3.09, "elapsed_time": "0:02:51", "remaining_time": "1:29:49", "throughput": 4485.86, "total_tokens": 771392} {"current_steps": 1185, "total_steps": 38160, "loss": 0.4519, "lr": 0.0003102725366876311, "epoch": 0.6210691823899371, "percentage": 3.11, "elapsed_time": "0:02:52", "remaining_time": "1:29:46", "throughput": 4484.29, "total_tokens": 774080} {"current_steps": 1190, "total_steps": 38160, "loss": 0.5028, "lr": 0.00031158280922431866, "epoch": 0.6236897274633124, "percentage": 3.12, "elapsed_time": "0:02:53", "remaining_time": "1:29:44", "throughput": 4483.81, "total_tokens": 777184} {"current_steps": 1195, "total_steps": 38160, "loss": 0.5188, "lr": 0.0003128930817610063, "epoch": 0.6263102725366876, "percentage": 3.13, "elapsed_time": "0:02:54", "remaining_time": "1:29:44", "throughput": 4485.0, "total_tokens": 780768} {"current_steps": 1200, "total_steps": 38160, "loss": 0.6431, "lr": 0.0003142033542976939, "epoch": 0.6289308176100629, "percentage": 3.14, "elapsed_time": "0:02:54", "remaining_time": "1:29:44", "throughput": 4485.14, "total_tokens": 784128} {"current_steps": 1205, "total_steps": 38160, "loss": 0.5443, "lr": 0.00031551362683438156, "epoch": 0.6315513626834381, "percentage": 3.16, "elapsed_time": "0:02:55", "remaining_time": "1:29:43", "throughput": 4484.52, "total_tokens": 787200} {"current_steps": 1210, "total_steps": 38160, "loss": 0.4501, "lr": 0.0003168238993710692, "epoch": 0.6341719077568134, "percentage": 3.17, "elapsed_time": "0:02:56", "remaining_time": "1:29:41", "throughput": 4483.75, "total_tokens": 790176} {"current_steps": 1215, "total_steps": 38160, "loss": 0.5331, "lr": 0.00031813417190775683, "epoch": 0.6367924528301887, "percentage": 3.18, "elapsed_time": "0:02:57", "remaining_time": "1:29:44", "throughput": 4485.94, "total_tokens": 794368} {"current_steps": 1220, "total_steps": 38160, "loss": 0.5395, "lr": 0.0003194444444444444, "epoch": 0.639412997903564, "percentage": 3.2, "elapsed_time": "0:02:57", "remaining_time": "1:29:41", "throughput": 4484.79, "total_tokens": 797120} {"current_steps": 1225, "total_steps": 38160, "loss": 0.4325, "lr": 0.00032075471698113204, "epoch": 0.6420335429769392, "percentage": 3.21, "elapsed_time": "0:02:58", "remaining_time": "1:29:43", "throughput": 4486.7, "total_tokens": 801088} {"current_steps": 1230, "total_steps": 38160, "loss": 0.5181, "lr": 0.00032206498951781973, "epoch": 0.6446540880503144, "percentage": 3.22, "elapsed_time": "0:02:59", "remaining_time": "1:29:43", "throughput": 4487.88, "total_tokens": 804704} {"current_steps": 1235, "total_steps": 38160, "loss": 0.6132, "lr": 0.00032337526205450737, "epoch": 0.6472746331236897, "percentage": 3.24, "elapsed_time": "0:03:00", "remaining_time": "1:29:42", "throughput": 4488.14, "total_tokens": 808000} {"current_steps": 1240, "total_steps": 38160, "loss": 0.5488, "lr": 0.000324685534591195, "epoch": 0.649895178197065, "percentage": 3.25, "elapsed_time": "0:03:00", "remaining_time": "1:29:40", "throughput": 4487.15, "total_tokens": 810848} {"current_steps": 1245, "total_steps": 38160, "loss": 0.5863, "lr": 0.00032599580712788263, "epoch": 0.6525157232704403, "percentage": 3.26, "elapsed_time": "0:03:01", "remaining_time": "1:29:38", "throughput": 4486.29, "total_tokens": 813728} {"current_steps": 1250, "total_steps": 38160, "loss": 0.4873, "lr": 0.0003273060796645702, "epoch": 0.6551362683438156, "percentage": 3.28, "elapsed_time": "0:03:02", "remaining_time": "1:29:36", "throughput": 4486.59, "total_tokens": 816992} {"current_steps": 1255, "total_steps": 38160, "loss": 0.4592, "lr": 0.00032861635220125785, "epoch": 0.6577568134171907, "percentage": 3.29, "elapsed_time": "0:03:02", "remaining_time": "1:29:33", "throughput": 4485.21, "total_tokens": 819584} {"current_steps": 1260, "total_steps": 38160, "loss": 0.5736, "lr": 0.0003299266247379455, "epoch": 0.660377358490566, "percentage": 3.3, "elapsed_time": "0:03:03", "remaining_time": "1:29:31", "throughput": 4484.66, "total_tokens": 822560} {"current_steps": 1265, "total_steps": 38160, "loss": 0.6482, "lr": 0.0003312368972746331, "epoch": 0.6629979035639413, "percentage": 3.31, "elapsed_time": "0:03:04", "remaining_time": "1:29:30", "throughput": 4484.56, "total_tokens": 825792} {"current_steps": 1270, "total_steps": 38160, "loss": 0.4976, "lr": 0.00033254716981132075, "epoch": 0.6656184486373166, "percentage": 3.33, "elapsed_time": "0:03:04", "remaining_time": "1:29:31", "throughput": 4485.97, "total_tokens": 829632} {"current_steps": 1275, "total_steps": 38160, "loss": 0.4729, "lr": 0.0003338574423480084, "epoch": 0.6682389937106918, "percentage": 3.34, "elapsed_time": "0:03:05", "remaining_time": "1:29:30", "throughput": 4485.49, "total_tokens": 832672} {"current_steps": 1280, "total_steps": 38160, "loss": 0.4756, "lr": 0.0003351677148846961, "epoch": 0.6708595387840671, "percentage": 3.35, "elapsed_time": "0:03:06", "remaining_time": "1:29:29", "throughput": 4485.38, "total_tokens": 835840} {"current_steps": 1285, "total_steps": 38160, "loss": 0.4865, "lr": 0.00033647798742138366, "epoch": 0.6734800838574424, "percentage": 3.37, "elapsed_time": "0:03:07", "remaining_time": "1:29:31", "throughput": 4488.16, "total_tokens": 840160} {"current_steps": 1290, "total_steps": 38160, "loss": 0.5699, "lr": 0.0003377882599580713, "epoch": 0.6761006289308176, "percentage": 3.38, "elapsed_time": "0:03:07", "remaining_time": "1:29:31", "throughput": 4487.98, "total_tokens": 843392} {"current_steps": 1295, "total_steps": 38160, "loss": 0.4094, "lr": 0.0003390985324947589, "epoch": 0.6787211740041929, "percentage": 3.39, "elapsed_time": "0:03:08", "remaining_time": "1:29:34", "throughput": 4489.74, "total_tokens": 847616} {"current_steps": 1300, "total_steps": 38160, "loss": 0.5101, "lr": 0.00034040880503144656, "epoch": 0.6813417190775681, "percentage": 3.41, "elapsed_time": "0:03:09", "remaining_time": "1:29:35", "throughput": 4491.0, "total_tokens": 851392} {"current_steps": 1305, "total_steps": 38160, "loss": 0.543, "lr": 0.0003417190775681342, "epoch": 0.6839622641509434, "percentage": 3.42, "elapsed_time": "0:03:10", "remaining_time": "1:29:33", "throughput": 4490.44, "total_tokens": 854336} {"current_steps": 1310, "total_steps": 38160, "loss": 0.4848, "lr": 0.00034302935010482183, "epoch": 0.6865828092243187, "percentage": 3.43, "elapsed_time": "0:03:10", "remaining_time": "1:29:31", "throughput": 4489.99, "total_tokens": 857312} {"current_steps": 1315, "total_steps": 38160, "loss": 0.5321, "lr": 0.0003443396226415094, "epoch": 0.689203354297694, "percentage": 3.45, "elapsed_time": "0:03:11", "remaining_time": "1:29:32", "throughput": 4491.52, "total_tokens": 861152} {"current_steps": 1320, "total_steps": 38160, "loss": 0.6204, "lr": 0.00034564989517819704, "epoch": 0.6918238993710691, "percentage": 3.46, "elapsed_time": "0:03:12", "remaining_time": "1:29:32", "throughput": 4492.22, "total_tokens": 864704} {"current_steps": 1325, "total_steps": 38160, "loss": 0.554, "lr": 0.0003469601677148847, "epoch": 0.6944444444444444, "percentage": 3.47, "elapsed_time": "0:03:13", "remaining_time": "1:29:29", "throughput": 4491.0, "total_tokens": 867360} {"current_steps": 1330, "total_steps": 38160, "loss": 0.598, "lr": 0.00034827044025157236, "epoch": 0.6970649895178197, "percentage": 3.49, "elapsed_time": "0:03:13", "remaining_time": "1:29:27", "throughput": 4490.8, "total_tokens": 870464} {"current_steps": 1335, "total_steps": 38160, "loss": 0.3874, "lr": 0.00034958071278826, "epoch": 0.699685534591195, "percentage": 3.5, "elapsed_time": "0:03:14", "remaining_time": "1:29:27", "throughput": 4490.69, "total_tokens": 873792} {"current_steps": 1340, "total_steps": 38160, "loss": 0.6038, "lr": 0.00035089098532494763, "epoch": 0.7023060796645703, "percentage": 3.51, "elapsed_time": "0:03:15", "remaining_time": "1:29:30", "throughput": 4493.51, "total_tokens": 878336} {"current_steps": 1345, "total_steps": 38160, "loss": 0.667, "lr": 0.0003522012578616352, "epoch": 0.7049266247379455, "percentage": 3.52, "elapsed_time": "0:03:16", "remaining_time": "1:29:31", "throughput": 4494.39, "total_tokens": 881984} {"current_steps": 1350, "total_steps": 38160, "loss": 0.4298, "lr": 0.00035351153039832285, "epoch": 0.7075471698113207, "percentage": 3.54, "elapsed_time": "0:03:17", "remaining_time": "1:29:32", "throughput": 4494.99, "total_tokens": 885632} {"current_steps": 1355, "total_steps": 38160, "loss": 0.4324, "lr": 0.0003548218029350105, "epoch": 0.710167714884696, "percentage": 3.55, "elapsed_time": "0:03:17", "remaining_time": "1:29:30", "throughput": 4494.39, "total_tokens": 888544} {"current_steps": 1360, "total_steps": 38160, "loss": 0.4871, "lr": 0.0003561320754716981, "epoch": 0.7127882599580713, "percentage": 3.56, "elapsed_time": "0:03:18", "remaining_time": "1:29:27", "throughput": 4493.36, "total_tokens": 891328} {"current_steps": 1365, "total_steps": 38160, "loss": 0.6039, "lr": 0.00035744234800838575, "epoch": 0.7154088050314465, "percentage": 3.58, "elapsed_time": "0:03:19", "remaining_time": "1:29:25", "throughput": 4493.15, "total_tokens": 894400} {"current_steps": 1370, "total_steps": 38160, "loss": 0.462, "lr": 0.0003587526205450734, "epoch": 0.7180293501048218, "percentage": 3.59, "elapsed_time": "0:03:19", "remaining_time": "1:29:21", "throughput": 4491.08, "total_tokens": 896704} {"current_steps": 1375, "total_steps": 38160, "loss": 0.4818, "lr": 0.00036006289308176097, "epoch": 0.7206498951781971, "percentage": 3.6, "elapsed_time": "0:03:20", "remaining_time": "1:29:19", "throughput": 4490.03, "total_tokens": 899520} {"current_steps": 1380, "total_steps": 38160, "loss": 0.53, "lr": 0.00036137316561844865, "epoch": 0.7232704402515723, "percentage": 3.62, "elapsed_time": "0:03:21", "remaining_time": "1:29:17", "throughput": 4489.01, "total_tokens": 902304} {"current_steps": 1385, "total_steps": 38160, "loss": 0.5635, "lr": 0.0003626834381551363, "epoch": 0.7258909853249476, "percentage": 3.63, "elapsed_time": "0:03:21", "remaining_time": "1:29:16", "throughput": 4489.55, "total_tokens": 905760} {"current_steps": 1390, "total_steps": 38160, "loss": 0.5573, "lr": 0.0003639937106918239, "epoch": 0.7285115303983228, "percentage": 3.64, "elapsed_time": "0:03:22", "remaining_time": "1:29:14", "throughput": 4488.43, "total_tokens": 908512} {"current_steps": 1395, "total_steps": 38160, "loss": 0.4697, "lr": 0.00036530398322851156, "epoch": 0.7311320754716981, "percentage": 3.66, "elapsed_time": "0:03:23", "remaining_time": "1:29:16", "throughput": 4490.57, "total_tokens": 912736} {"current_steps": 1400, "total_steps": 38160, "loss": 0.8091, "lr": 0.0003666142557651992, "epoch": 0.7337526205450734, "percentage": 3.67, "elapsed_time": "0:03:24", "remaining_time": "1:29:16", "throughput": 4491.58, "total_tokens": 916352} {"current_steps": 1405, "total_steps": 38160, "loss": 0.5876, "lr": 0.00036792452830188677, "epoch": 0.7363731656184487, "percentage": 3.68, "elapsed_time": "0:03:24", "remaining_time": "1:29:14", "throughput": 4490.58, "total_tokens": 919136} {"current_steps": 1410, "total_steps": 38160, "loss": 0.6209, "lr": 0.0003692348008385744, "epoch": 0.7389937106918238, "percentage": 3.69, "elapsed_time": "0:03:25", "remaining_time": "1:29:11", "throughput": 4489.13, "total_tokens": 921760} {"current_steps": 1415, "total_steps": 38160, "loss": 0.4471, "lr": 0.00037054507337526204, "epoch": 0.7416142557651991, "percentage": 3.71, "elapsed_time": "0:03:25", "remaining_time": "1:29:07", "throughput": 4487.29, "total_tokens": 924096} {"current_steps": 1420, "total_steps": 38160, "loss": 0.5425, "lr": 0.0003718553459119497, "epoch": 0.7442348008385744, "percentage": 3.72, "elapsed_time": "0:03:26", "remaining_time": "1:29:03", "throughput": 4484.95, "total_tokens": 926240} {"current_steps": 1425, "total_steps": 38160, "loss": 0.4887, "lr": 0.0003731656184486373, "epoch": 0.7468553459119497, "percentage": 3.73, "elapsed_time": "0:03:27", "remaining_time": "1:29:00", "throughput": 4483.99, "total_tokens": 928928} {"current_steps": 1430, "total_steps": 38160, "loss": 0.6563, "lr": 0.000374475890985325, "epoch": 0.749475890985325, "percentage": 3.75, "elapsed_time": "0:03:27", "remaining_time": "1:28:57", "throughput": 4482.75, "total_tokens": 931552} {"current_steps": 1435, "total_steps": 38160, "loss": 0.4741, "lr": 0.00037578616352201263, "epoch": 0.7520964360587002, "percentage": 3.76, "elapsed_time": "0:03:28", "remaining_time": "1:28:59", "throughput": 4484.75, "total_tokens": 935648} {"current_steps": 1440, "total_steps": 38160, "loss": 0.4865, "lr": 0.0003770964360587002, "epoch": 0.7547169811320755, "percentage": 3.77, "elapsed_time": "0:03:29", "remaining_time": "1:28:56", "throughput": 4483.66, "total_tokens": 938336} {"current_steps": 1445, "total_steps": 38160, "loss": 0.514, "lr": 0.00037840670859538785, "epoch": 0.7573375262054507, "percentage": 3.79, "elapsed_time": "0:03:30", "remaining_time": "1:28:56", "throughput": 4484.48, "total_tokens": 941952} {"current_steps": 1450, "total_steps": 38160, "loss": 0.4452, "lr": 0.0003797169811320755, "epoch": 0.759958071278826, "percentage": 3.8, "elapsed_time": "0:03:30", "remaining_time": "1:28:56", "throughput": 4484.79, "total_tokens": 945248} {"current_steps": 1455, "total_steps": 38160, "loss": 0.5142, "lr": 0.0003810272536687631, "epoch": 0.7625786163522013, "percentage": 3.81, "elapsed_time": "0:03:31", "remaining_time": "1:28:55", "throughput": 4484.7, "total_tokens": 948512} {"current_steps": 1460, "total_steps": 38160, "loss": 0.468, "lr": 0.00038233752620545075, "epoch": 0.7651991614255765, "percentage": 3.83, "elapsed_time": "0:03:32", "remaining_time": "1:28:54", "throughput": 4484.66, "total_tokens": 951744} {"current_steps": 1465, "total_steps": 38160, "loss": 0.5076, "lr": 0.0003836477987421384, "epoch": 0.7678197064989518, "percentage": 3.84, "elapsed_time": "0:03:32", "remaining_time": "1:28:50", "throughput": 4482.44, "total_tokens": 953920} {"current_steps": 1470, "total_steps": 38160, "loss": 0.4649, "lr": 0.00038495807127882596, "epoch": 0.7704402515723271, "percentage": 3.85, "elapsed_time": "0:03:33", "remaining_time": "1:28:50", "throughput": 4482.78, "total_tokens": 957376} {"current_steps": 1475, "total_steps": 38160, "loss": 0.5104, "lr": 0.0003862683438155136, "epoch": 0.7730607966457023, "percentage": 3.87, "elapsed_time": "0:03:34", "remaining_time": "1:28:48", "throughput": 4482.08, "total_tokens": 960288} {"current_steps": 1480, "total_steps": 38160, "loss": 0.4789, "lr": 0.0003875786163522013, "epoch": 0.7756813417190775, "percentage": 3.88, "elapsed_time": "0:03:35", "remaining_time": "1:28:49", "throughput": 4482.65, "total_tokens": 963872} {"current_steps": 1485, "total_steps": 38160, "loss": 0.5305, "lr": 0.0003888888888888889, "epoch": 0.7783018867924528, "percentage": 3.89, "elapsed_time": "0:03:35", "remaining_time": "1:28:46", "throughput": 4481.03, "total_tokens": 966368} {"current_steps": 1490, "total_steps": 38160, "loss": 0.4744, "lr": 0.00039019916142557656, "epoch": 0.7809224318658281, "percentage": 3.9, "elapsed_time": "0:03:36", "remaining_time": "1:28:44", "throughput": 4480.54, "total_tokens": 969344} {"current_steps": 1495, "total_steps": 38160, "loss": 0.5631, "lr": 0.0003915094339622642, "epoch": 0.7835429769392034, "percentage": 3.92, "elapsed_time": "0:03:37", "remaining_time": "1:28:42", "throughput": 4480.02, "total_tokens": 972320} {"current_steps": 1500, "total_steps": 38160, "loss": 0.5202, "lr": 0.00039281970649895177, "epoch": 0.7861635220125787, "percentage": 3.93, "elapsed_time": "0:03:37", "remaining_time": "1:28:45", "throughput": 4481.47, "total_tokens": 976448} {"current_steps": 1505, "total_steps": 38160, "loss": 0.4556, "lr": 0.0003941299790356394, "epoch": 0.7887840670859538, "percentage": 3.94, "elapsed_time": "0:03:38", "remaining_time": "1:28:44", "throughput": 4481.51, "total_tokens": 979648} {"current_steps": 1510, "total_steps": 38160, "loss": 0.3888, "lr": 0.00039544025157232704, "epoch": 0.7914046121593291, "percentage": 3.96, "elapsed_time": "0:03:39", "remaining_time": "1:28:44", "throughput": 4481.55, "total_tokens": 983040} {"current_steps": 1515, "total_steps": 38160, "loss": 0.3768, "lr": 0.0003967505241090147, "epoch": 0.7940251572327044, "percentage": 3.97, "elapsed_time": "0:03:40", "remaining_time": "1:28:41", "throughput": 4480.71, "total_tokens": 985824} {"current_steps": 1520, "total_steps": 38160, "loss": 0.6914, "lr": 0.0003980607966457023, "epoch": 0.7966457023060797, "percentage": 3.98, "elapsed_time": "0:03:40", "remaining_time": "1:28:44", "throughput": 4483.28, "total_tokens": 990368} {"current_steps": 1525, "total_steps": 38160, "loss": 0.5481, "lr": 0.00039937106918238994, "epoch": 0.799266247379455, "percentage": 4.0, "elapsed_time": "0:03:41", "remaining_time": "1:28:44", "throughput": 4483.94, "total_tokens": 993920} {"current_steps": 1530, "total_steps": 38160, "loss": 0.54, "lr": 0.0004006813417190776, "epoch": 0.8018867924528302, "percentage": 4.01, "elapsed_time": "0:03:42", "remaining_time": "1:28:44", "throughput": 4484.15, "total_tokens": 997280} {"current_steps": 1535, "total_steps": 38160, "loss": 0.6919, "lr": 0.0004019916142557652, "epoch": 0.8045073375262054, "percentage": 4.02, "elapsed_time": "0:03:43", "remaining_time": "1:28:42", "throughput": 4483.44, "total_tokens": 1000096} {"current_steps": 1540, "total_steps": 38160, "loss": 0.3974, "lr": 0.00040330188679245284, "epoch": 0.8071278825995807, "percentage": 4.04, "elapsed_time": "0:03:43", "remaining_time": "1:28:39", "throughput": 4482.18, "total_tokens": 1002624} {"current_steps": 1545, "total_steps": 38160, "loss": 0.5033, "lr": 0.0004046121593291405, "epoch": 0.809748427672956, "percentage": 4.05, "elapsed_time": "0:03:44", "remaining_time": "1:28:37", "throughput": 4481.32, "total_tokens": 1005440} {"current_steps": 1550, "total_steps": 38160, "loss": 0.6111, "lr": 0.0004059224318658281, "epoch": 0.8123689727463312, "percentage": 4.06, "elapsed_time": "0:03:45", "remaining_time": "1:28:38", "throughput": 4482.34, "total_tokens": 1009248} {"current_steps": 1555, "total_steps": 38160, "loss": 0.5193, "lr": 0.00040723270440251575, "epoch": 0.8149895178197065, "percentage": 4.07, "elapsed_time": "0:03:45", "remaining_time": "1:28:35", "throughput": 4480.88, "total_tokens": 1011744} {"current_steps": 1560, "total_steps": 38160, "loss": 0.4926, "lr": 0.00040854297693920333, "epoch": 0.8176100628930818, "percentage": 4.09, "elapsed_time": "0:03:46", "remaining_time": "1:28:32", "throughput": 4479.98, "total_tokens": 1014432} {"current_steps": 1565, "total_steps": 38160, "loss": 0.5703, "lr": 0.00040985324947589096, "epoch": 0.820230607966457, "percentage": 4.1, "elapsed_time": "0:03:47", "remaining_time": "1:28:31", "throughput": 4479.59, "total_tokens": 1017472} {"current_steps": 1570, "total_steps": 38160, "loss": 0.6236, "lr": 0.0004111635220125786, "epoch": 0.8228511530398323, "percentage": 4.11, "elapsed_time": "0:03:47", "remaining_time": "1:28:28", "throughput": 4478.46, "total_tokens": 1020128} {"current_steps": 1575, "total_steps": 38160, "loss": 0.4076, "lr": 0.00041247379454926623, "epoch": 0.8254716981132075, "percentage": 4.13, "elapsed_time": "0:03:48", "remaining_time": "1:28:27", "throughput": 4478.44, "total_tokens": 1023200} {"current_steps": 1580, "total_steps": 38160, "loss": 0.648, "lr": 0.0004137840670859539, "epoch": 0.8280922431865828, "percentage": 4.14, "elapsed_time": "0:03:49", "remaining_time": "1:28:26", "throughput": 4478.76, "total_tokens": 1026592} {"current_steps": 1585, "total_steps": 38160, "loss": 0.4616, "lr": 0.00041509433962264155, "epoch": 0.8307127882599581, "percentage": 4.15, "elapsed_time": "0:03:49", "remaining_time": "1:28:24", "throughput": 4477.5, "total_tokens": 1029216} {"current_steps": 1590, "total_steps": 38160, "loss": 0.6045, "lr": 0.00041640461215932913, "epoch": 0.8333333333333334, "percentage": 4.17, "elapsed_time": "0:03:50", "remaining_time": "1:28:25", "throughput": 4478.32, "total_tokens": 1032960} {"current_steps": 1595, "total_steps": 38160, "loss": 0.5001, "lr": 0.00041771488469601677, "epoch": 0.8359538784067087, "percentage": 4.18, "elapsed_time": "0:03:51", "remaining_time": "1:28:24", "throughput": 4478.38, "total_tokens": 1036224} {"current_steps": 1600, "total_steps": 38160, "loss": 0.4573, "lr": 0.0004190251572327044, "epoch": 0.8385744234800838, "percentage": 4.19, "elapsed_time": "0:03:52", "remaining_time": "1:28:26", "throughput": 4480.65, "total_tokens": 1040608} {"current_steps": 1605, "total_steps": 38160, "loss": 0.4586, "lr": 0.00042033542976939204, "epoch": 0.8411949685534591, "percentage": 4.21, "elapsed_time": "0:03:52", "remaining_time": "1:28:25", "throughput": 4480.29, "total_tokens": 1043648} {"current_steps": 1610, "total_steps": 38160, "loss": 0.4629, "lr": 0.00042164570230607967, "epoch": 0.8438155136268344, "percentage": 4.22, "elapsed_time": "0:03:53", "remaining_time": "1:28:23", "throughput": 4479.35, "total_tokens": 1046400} {"current_steps": 1615, "total_steps": 38160, "loss": 0.4952, "lr": 0.0004229559748427673, "epoch": 0.8464360587002097, "percentage": 4.23, "elapsed_time": "0:03:54", "remaining_time": "1:28:22", "throughput": 4479.04, "total_tokens": 1049568} {"current_steps": 1620, "total_steps": 38160, "loss": 0.5862, "lr": 0.00042426624737945494, "epoch": 0.8490566037735849, "percentage": 4.25, "elapsed_time": "0:03:54", "remaining_time": "1:28:20", "throughput": 4478.02, "total_tokens": 1052288} {"current_steps": 1625, "total_steps": 38160, "loss": 0.6671, "lr": 0.0004255765199161425, "epoch": 0.8516771488469602, "percentage": 4.26, "elapsed_time": "0:03:55", "remaining_time": "1:28:21", "throughput": 4479.04, "total_tokens": 1056096} {"current_steps": 1630, "total_steps": 38160, "loss": 0.4759, "lr": 0.0004268867924528302, "epoch": 0.8542976939203354, "percentage": 4.27, "elapsed_time": "0:03:56", "remaining_time": "1:28:22", "throughput": 4480.2, "total_tokens": 1059968} {"current_steps": 1635, "total_steps": 38160, "loss": 0.452, "lr": 0.00042819706498951784, "epoch": 0.8569182389937107, "percentage": 4.28, "elapsed_time": "0:03:57", "remaining_time": "1:28:21", "throughput": 4480.1, "total_tokens": 1063136} {"current_steps": 1640, "total_steps": 38160, "loss": 0.5213, "lr": 0.0004295073375262055, "epoch": 0.859538784067086, "percentage": 4.3, "elapsed_time": "0:03:58", "remaining_time": "1:28:24", "throughput": 4482.11, "total_tokens": 1067616} {"current_steps": 1645, "total_steps": 38160, "loss": 0.5748, "lr": 0.0004308176100628931, "epoch": 0.8621593291404612, "percentage": 4.31, "elapsed_time": "0:03:58", "remaining_time": "1:28:24", "throughput": 4482.78, "total_tokens": 1071168} {"current_steps": 1650, "total_steps": 38160, "loss": 0.3935, "lr": 0.00043212788259958075, "epoch": 0.8647798742138365, "percentage": 4.32, "elapsed_time": "0:03:59", "remaining_time": "1:28:27", "throughput": 4485.14, "total_tokens": 1075808} {"current_steps": 1655, "total_steps": 38160, "loss": 0.5966, "lr": 0.0004334381551362683, "epoch": 0.8674004192872118, "percentage": 4.34, "elapsed_time": "0:04:00", "remaining_time": "1:28:30", "throughput": 4486.84, "total_tokens": 1080224} {"current_steps": 1660, "total_steps": 38160, "loss": 0.6491, "lr": 0.00043474842767295596, "epoch": 0.870020964360587, "percentage": 4.35, "elapsed_time": "0:04:01", "remaining_time": "1:28:30", "throughput": 4487.6, "total_tokens": 1083808} {"current_steps": 1665, "total_steps": 38160, "loss": 0.6254, "lr": 0.0004360587002096436, "epoch": 0.8726415094339622, "percentage": 4.36, "elapsed_time": "0:04:02", "remaining_time": "1:28:27", "throughput": 4486.22, "total_tokens": 1086304} {"current_steps": 1670, "total_steps": 38160, "loss": 0.6262, "lr": 0.00043736897274633123, "epoch": 0.8752620545073375, "percentage": 4.38, "elapsed_time": "0:04:02", "remaining_time": "1:28:27", "throughput": 4486.75, "total_tokens": 1089856} {"current_steps": 1675, "total_steps": 38160, "loss": 0.4421, "lr": 0.00043867924528301886, "epoch": 0.8778825995807128, "percentage": 4.39, "elapsed_time": "0:04:03", "remaining_time": "1:28:25", "throughput": 4486.05, "total_tokens": 1092576} {"current_steps": 1680, "total_steps": 38160, "loss": 0.453, "lr": 0.00043998951781970655, "epoch": 0.8805031446540881, "percentage": 4.4, "elapsed_time": "0:04:04", "remaining_time": "1:28:25", "throughput": 4487.37, "total_tokens": 1096448} {"current_steps": 1685, "total_steps": 38160, "loss": 0.4301, "lr": 0.00044129979035639413, "epoch": 0.8831236897274634, "percentage": 4.42, "elapsed_time": "0:04:05", "remaining_time": "1:28:27", "throughput": 4488.59, "total_tokens": 1100448} {"current_steps": 1690, "total_steps": 38160, "loss": 0.5105, "lr": 0.00044261006289308177, "epoch": 0.8857442348008385, "percentage": 4.43, "elapsed_time": "0:04:05", "remaining_time": "1:28:25", "throughput": 4488.14, "total_tokens": 1103520} {"current_steps": 1695, "total_steps": 38160, "loss": 0.3949, "lr": 0.0004439203354297694, "epoch": 0.8883647798742138, "percentage": 4.44, "elapsed_time": "0:04:06", "remaining_time": "1:28:23", "throughput": 4487.37, "total_tokens": 1106304} {"current_steps": 1700, "total_steps": 38160, "loss": 0.5114, "lr": 0.00044523060796645704, "epoch": 0.8909853249475891, "percentage": 4.45, "elapsed_time": "0:04:07", "remaining_time": "1:28:24", "throughput": 4488.52, "total_tokens": 1110176} {"current_steps": 1705, "total_steps": 38160, "loss": 0.4924, "lr": 0.00044654088050314467, "epoch": 0.8936058700209644, "percentage": 4.47, "elapsed_time": "0:04:07", "remaining_time": "1:28:21", "throughput": 4487.02, "total_tokens": 1112640} {"current_steps": 1710, "total_steps": 38160, "loss": 0.516, "lr": 0.0004478511530398323, "epoch": 0.8962264150943396, "percentage": 4.48, "elapsed_time": "0:04:08", "remaining_time": "1:28:23", "throughput": 4488.6, "total_tokens": 1116736} {"current_steps": 1715, "total_steps": 38160, "loss": 0.4428, "lr": 0.0004491614255765199, "epoch": 0.8988469601677149, "percentage": 4.49, "elapsed_time": "0:04:09", "remaining_time": "1:28:22", "throughput": 4488.68, "total_tokens": 1120000} {"current_steps": 1720, "total_steps": 38160, "loss": 0.4131, "lr": 0.0004504716981132075, "epoch": 0.9014675052410901, "percentage": 4.51, "elapsed_time": "0:04:10", "remaining_time": "1:28:20", "throughput": 4487.51, "total_tokens": 1122656} {"current_steps": 1725, "total_steps": 38160, "loss": 0.4884, "lr": 0.00045178197064989515, "epoch": 0.9040880503144654, "percentage": 4.52, "elapsed_time": "0:04:10", "remaining_time": "1:28:19", "throughput": 4487.38, "total_tokens": 1125856} {"current_steps": 1730, "total_steps": 38160, "loss": 0.4906, "lr": 0.00045309224318658284, "epoch": 0.9067085953878407, "percentage": 4.53, "elapsed_time": "0:04:11", "remaining_time": "1:28:16", "throughput": 4486.02, "total_tokens": 1128288} {"current_steps": 1735, "total_steps": 38160, "loss": 0.5725, "lr": 0.0004544025157232705, "epoch": 0.9093291404612159, "percentage": 4.55, "elapsed_time": "0:04:12", "remaining_time": "1:28:15", "throughput": 4486.18, "total_tokens": 1131680} {"current_steps": 1740, "total_steps": 38160, "loss": 0.4744, "lr": 0.0004557127882599581, "epoch": 0.9119496855345912, "percentage": 4.56, "elapsed_time": "0:04:12", "remaining_time": "1:28:14", "throughput": 4485.45, "total_tokens": 1134496} {"current_steps": 1745, "total_steps": 38160, "loss": 0.4571, "lr": 0.0004570230607966457, "epoch": 0.9145702306079665, "percentage": 4.57, "elapsed_time": "0:04:13", "remaining_time": "1:28:14", "throughput": 4485.85, "total_tokens": 1138176} {"current_steps": 1750, "total_steps": 38160, "loss": 0.3959, "lr": 0.0004583333333333333, "epoch": 0.9171907756813418, "percentage": 4.59, "elapsed_time": "0:04:14", "remaining_time": "1:28:12", "throughput": 4485.28, "total_tokens": 1141056} {"current_steps": 1755, "total_steps": 38160, "loss": 0.4691, "lr": 0.00045964360587002096, "epoch": 0.9198113207547169, "percentage": 4.6, "elapsed_time": "0:04:15", "remaining_time": "1:28:12", "throughput": 4485.0, "total_tokens": 1144224} {"current_steps": 1760, "total_steps": 38160, "loss": 0.5113, "lr": 0.0004609538784067086, "epoch": 0.9224318658280922, "percentage": 4.61, "elapsed_time": "0:04:15", "remaining_time": "1:28:09", "throughput": 4483.75, "total_tokens": 1146720} {"current_steps": 1765, "total_steps": 38160, "loss": 0.6513, "lr": 0.00046226415094339623, "epoch": 0.9250524109014675, "percentage": 4.63, "elapsed_time": "0:04:16", "remaining_time": "1:28:06", "throughput": 4482.64, "total_tokens": 1149312} {"current_steps": 1770, "total_steps": 38160, "loss": 0.5014, "lr": 0.00046357442348008386, "epoch": 0.9276729559748428, "percentage": 4.64, "elapsed_time": "0:04:17", "remaining_time": "1:28:05", "throughput": 4482.0, "total_tokens": 1152224} {"current_steps": 1775, "total_steps": 38160, "loss": 0.4911, "lr": 0.00046488469601677155, "epoch": 0.9302935010482181, "percentage": 4.65, "elapsed_time": "0:04:17", "remaining_time": "1:28:04", "throughput": 4481.97, "total_tokens": 1155456} {"current_steps": 1780, "total_steps": 38160, "loss": 0.4912, "lr": 0.00046619496855345913, "epoch": 0.9329140461215933, "percentage": 4.66, "elapsed_time": "0:04:18", "remaining_time": "1:28:04", "throughput": 4481.95, "total_tokens": 1158752} {"current_steps": 1785, "total_steps": 38160, "loss": 0.5525, "lr": 0.00046750524109014677, "epoch": 0.9355345911949685, "percentage": 4.68, "elapsed_time": "0:04:19", "remaining_time": "1:28:02", "throughput": 4481.25, "total_tokens": 1161632} {"current_steps": 1790, "total_steps": 38160, "loss": 0.4952, "lr": 0.0004688155136268344, "epoch": 0.9381551362683438, "percentage": 4.69, "elapsed_time": "0:04:20", "remaining_time": "1:28:03", "throughput": 4482.42, "total_tokens": 1165536} {"current_steps": 1795, "total_steps": 38160, "loss": 0.6191, "lr": 0.00047012578616352203, "epoch": 0.9407756813417191, "percentage": 4.7, "elapsed_time": "0:04:20", "remaining_time": "1:28:02", "throughput": 4482.97, "total_tokens": 1168992} {"current_steps": 1800, "total_steps": 38160, "loss": 0.444, "lr": 0.00047143605870020967, "epoch": 0.9433962264150944, "percentage": 4.72, "elapsed_time": "0:04:21", "remaining_time": "1:28:00", "throughput": 4482.13, "total_tokens": 1171648} {"current_steps": 1805, "total_steps": 38160, "loss": 0.6414, "lr": 0.0004727463312368973, "epoch": 0.9460167714884696, "percentage": 4.73, "elapsed_time": "0:04:22", "remaining_time": "1:27:59", "throughput": 4482.13, "total_tokens": 1174912} {"current_steps": 1810, "total_steps": 38160, "loss": 0.4039, "lr": 0.0004740566037735849, "epoch": 0.9486373165618449, "percentage": 4.74, "elapsed_time": "0:04:22", "remaining_time": "1:27:58", "throughput": 4482.28, "total_tokens": 1178144} {"current_steps": 1815, "total_steps": 38160, "loss": 0.403, "lr": 0.0004753668763102725, "epoch": 0.9512578616352201, "percentage": 4.76, "elapsed_time": "0:04:23", "remaining_time": "1:27:59", "throughput": 4482.96, "total_tokens": 1181856} {"current_steps": 1820, "total_steps": 38160, "loss": 0.6034, "lr": 0.00047667714884696015, "epoch": 0.9538784067085954, "percentage": 4.77, "elapsed_time": "0:04:24", "remaining_time": "1:27:58", "throughput": 4482.54, "total_tokens": 1184896} {"current_steps": 1825, "total_steps": 38160, "loss": 0.7188, "lr": 0.00047798742138364784, "epoch": 0.9564989517819706, "percentage": 4.78, "elapsed_time": "0:04:24", "remaining_time": "1:27:54", "throughput": 4481.14, "total_tokens": 1187264} {"current_steps": 1830, "total_steps": 38160, "loss": 0.4858, "lr": 0.0004792976939203355, "epoch": 0.9591194968553459, "percentage": 4.8, "elapsed_time": "0:04:25", "remaining_time": "1:27:55", "throughput": 4482.36, "total_tokens": 1191168} {"current_steps": 1835, "total_steps": 38160, "loss": 0.4371, "lr": 0.0004806079664570231, "epoch": 0.9617400419287212, "percentage": 4.81, "elapsed_time": "0:04:26", "remaining_time": "1:27:52", "throughput": 4481.2, "total_tokens": 1193664} {"current_steps": 1840, "total_steps": 38160, "loss": 0.4543, "lr": 0.0004819182389937107, "epoch": 0.9643605870020965, "percentage": 4.82, "elapsed_time": "0:04:27", "remaining_time": "1:28:03", "throughput": 4486.68, "total_tokens": 1200864} {"current_steps": 1845, "total_steps": 38160, "loss": 0.4646, "lr": 0.0004832285115303983, "epoch": 0.9669811320754716, "percentage": 4.83, "elapsed_time": "0:04:28", "remaining_time": "1:28:01", "throughput": 4485.97, "total_tokens": 1203680} {"current_steps": 1850, "total_steps": 38160, "loss": 0.5537, "lr": 0.00048453878406708596, "epoch": 0.9696016771488469, "percentage": 4.85, "elapsed_time": "0:04:29", "remaining_time": "1:28:02", "throughput": 4487.04, "total_tokens": 1207648} {"current_steps": 1855, "total_steps": 38160, "loss": 0.4967, "lr": 0.0004858490566037736, "epoch": 0.9722222222222222, "percentage": 4.86, "elapsed_time": "0:04:29", "remaining_time": "1:28:02", "throughput": 4487.47, "total_tokens": 1211232} {"current_steps": 1860, "total_steps": 38160, "loss": 0.4525, "lr": 0.0004871593291404612, "epoch": 0.9748427672955975, "percentage": 4.87, "elapsed_time": "0:04:30", "remaining_time": "1:28:01", "throughput": 4487.2, "total_tokens": 1214304} {"current_steps": 1865, "total_steps": 38160, "loss": 0.3894, "lr": 0.0004884696016771489, "epoch": 0.9774633123689728, "percentage": 4.89, "elapsed_time": "0:04:31", "remaining_time": "1:28:00", "throughput": 4487.44, "total_tokens": 1217664} {"current_steps": 1870, "total_steps": 38160, "loss": 0.3924, "lr": 0.0004897798742138365, "epoch": 0.980083857442348, "percentage": 4.9, "elapsed_time": "0:04:32", "remaining_time": "1:28:00", "throughput": 4487.74, "total_tokens": 1221184} {"current_steps": 1875, "total_steps": 38160, "loss": 0.4821, "lr": 0.0004910901467505241, "epoch": 0.9827044025157232, "percentage": 4.91, "elapsed_time": "0:04:32", "remaining_time": "1:28:00", "throughput": 4488.13, "total_tokens": 1224736} {"current_steps": 1880, "total_steps": 38160, "loss": 0.4982, "lr": 0.0004924004192872118, "epoch": 0.9853249475890985, "percentage": 4.93, "elapsed_time": "0:04:33", "remaining_time": "1:28:00", "throughput": 4488.74, "total_tokens": 1228256} {"current_steps": 1885, "total_steps": 38160, "loss": 0.7353, "lr": 0.0004937106918238993, "epoch": 0.9879454926624738, "percentage": 4.94, "elapsed_time": "0:04:34", "remaining_time": "1:27:58", "throughput": 4488.08, "total_tokens": 1231104} {"current_steps": 1890, "total_steps": 38160, "loss": 0.4709, "lr": 0.000495020964360587, "epoch": 0.9905660377358491, "percentage": 4.95, "elapsed_time": "0:04:35", "remaining_time": "1:27:57", "throughput": 4487.81, "total_tokens": 1234176} {"current_steps": 1895, "total_steps": 38160, "loss": 0.4626, "lr": 0.0004963312368972746, "epoch": 0.9931865828092243, "percentage": 4.97, "elapsed_time": "0:04:35", "remaining_time": "1:27:57", "throughput": 4487.97, "total_tokens": 1237568} {"current_steps": 1900, "total_steps": 38160, "loss": 0.6021, "lr": 0.0004976415094339623, "epoch": 0.9958071278825996, "percentage": 4.98, "elapsed_time": "0:04:36", "remaining_time": "1:27:56", "throughput": 4488.16, "total_tokens": 1240896} {"current_steps": 1905, "total_steps": 38160, "loss": 0.6502, "lr": 0.0004989517819706499, "epoch": 0.9984276729559748, "percentage": 4.99, "elapsed_time": "0:04:37", "remaining_time": "1:27:55", "throughput": 4488.58, "total_tokens": 1244288} {"current_steps": 1908, "total_steps": 38160, "eval_loss": 0.5047244429588318, "epoch": 1.0, "percentage": 5.0, "elapsed_time": "0:04:51", "remaining_time": "1:32:15", "throughput": 4274.59, "total_tokens": 1245424} {"current_steps": 1910, "total_steps": 38160, "loss": 0.4655, "lr": 0.0005002620545073376, "epoch": 1.00104821802935, "percentage": 5.01, "elapsed_time": "0:04:53", "remaining_time": "1:32:47", "throughput": 4250.11, "total_tokens": 1246832} {"current_steps": 1915, "total_steps": 38160, "loss": 0.45, "lr": 0.0005015723270440253, "epoch": 1.0036687631027255, "percentage": 5.02, "elapsed_time": "0:04:54", "remaining_time": "1:32:45", "throughput": 4250.58, "total_tokens": 1250000} {"current_steps": 1920, "total_steps": 38160, "loss": 0.5823, "lr": 0.0005028825995807128, "epoch": 1.0062893081761006, "percentage": 5.03, "elapsed_time": "0:04:54", "remaining_time": "1:32:44", "throughput": 4251.57, "total_tokens": 1253488} {"current_steps": 1925, "total_steps": 38160, "loss": 0.527, "lr": 0.0005041928721174004, "epoch": 1.0089098532494758, "percentage": 5.04, "elapsed_time": "0:04:55", "remaining_time": "1:32:45", "throughput": 4253.79, "total_tokens": 1257744} {"current_steps": 1930, "total_steps": 38160, "loss": 0.3572, "lr": 0.0005055031446540881, "epoch": 1.0115303983228512, "percentage": 5.06, "elapsed_time": "0:04:56", "remaining_time": "1:32:43", "throughput": 4253.9, "total_tokens": 1260688} {"current_steps": 1935, "total_steps": 38160, "loss": 0.394, "lr": 0.0005068134171907757, "epoch": 1.0141509433962264, "percentage": 5.07, "elapsed_time": "0:04:57", "remaining_time": "1:32:41", "throughput": 4254.39, "total_tokens": 1263920} {"current_steps": 1940, "total_steps": 38160, "loss": 0.6, "lr": 0.0005081236897274634, "epoch": 1.0167714884696017, "percentage": 5.08, "elapsed_time": "0:04:57", "remaining_time": "1:32:39", "throughput": 4254.5, "total_tokens": 1266992} {"current_steps": 1945, "total_steps": 38160, "loss": 0.4211, "lr": 0.000509433962264151, "epoch": 1.019392033542977, "percentage": 5.1, "elapsed_time": "0:04:58", "remaining_time": "1:32:39", "throughput": 4255.51, "total_tokens": 1270544} {"current_steps": 1950, "total_steps": 38160, "loss": 0.4144, "lr": 0.0005107442348008385, "epoch": 1.0220125786163523, "percentage": 5.11, "elapsed_time": "0:04:59", "remaining_time": "1:32:37", "throughput": 4256.07, "total_tokens": 1273840} {"current_steps": 1955, "total_steps": 38160, "loss": 0.389, "lr": 0.0005120545073375262, "epoch": 1.0246331236897275, "percentage": 5.12, "elapsed_time": "0:04:59", "remaining_time": "1:32:34", "throughput": 4255.68, "total_tokens": 1276464} {"current_steps": 1960, "total_steps": 38160, "loss": 0.4894, "lr": 0.0005133647798742138, "epoch": 1.0272536687631026, "percentage": 5.14, "elapsed_time": "0:05:00", "remaining_time": "1:32:33", "throughput": 4257.05, "total_tokens": 1280144} {"current_steps": 1965, "total_steps": 38160, "loss": 0.4626, "lr": 0.0005146750524109015, "epoch": 1.029874213836478, "percentage": 5.15, "elapsed_time": "0:05:01", "remaining_time": "1:32:31", "throughput": 4257.05, "total_tokens": 1283088} {"current_steps": 1970, "total_steps": 38160, "loss": 0.5955, "lr": 0.0005159853249475891, "epoch": 1.0324947589098532, "percentage": 5.16, "elapsed_time": "0:05:02", "remaining_time": "1:32:32", "throughput": 4258.66, "total_tokens": 1287088} {"current_steps": 1975, "total_steps": 38160, "loss": 0.4859, "lr": 0.0005172955974842768, "epoch": 1.0351153039832286, "percentage": 5.18, "elapsed_time": "0:05:02", "remaining_time": "1:32:30", "throughput": 4259.09, "total_tokens": 1290224} {"current_steps": 1980, "total_steps": 38160, "loss": 0.5623, "lr": 0.0005186058700209643, "epoch": 1.0377358490566038, "percentage": 5.19, "elapsed_time": "0:05:03", "remaining_time": "1:32:28", "throughput": 4259.19, "total_tokens": 1293296} {"current_steps": 1985, "total_steps": 38160, "loss": 0.4466, "lr": 0.0005199161425576519, "epoch": 1.040356394129979, "percentage": 5.2, "elapsed_time": "0:05:04", "remaining_time": "1:32:25", "throughput": 4258.93, "total_tokens": 1296048} {"current_steps": 1990, "total_steps": 38160, "loss": 0.5763, "lr": 0.0005212264150943396, "epoch": 1.0429769392033543, "percentage": 5.21, "elapsed_time": "0:05:05", "remaining_time": "1:32:24", "throughput": 4259.59, "total_tokens": 1299312} {"current_steps": 1995, "total_steps": 38160, "loss": 0.5812, "lr": 0.0005225366876310272, "epoch": 1.0455974842767295, "percentage": 5.23, "elapsed_time": "0:05:05", "remaining_time": "1:32:23", "throughput": 4260.84, "total_tokens": 1303056} {"current_steps": 2000, "total_steps": 38160, "loss": 0.4543, "lr": 0.000523846960167715, "epoch": 1.0482180293501049, "percentage": 5.24, "elapsed_time": "0:05:06", "remaining_time": "1:32:22", "throughput": 4261.32, "total_tokens": 1306288} {"current_steps": 2005, "total_steps": 38160, "loss": 0.55, "lr": 0.0005251572327044026, "epoch": 1.05083857442348, "percentage": 5.25, "elapsed_time": "0:05:07", "remaining_time": "1:32:21", "throughput": 4262.81, "total_tokens": 1310064} {"current_steps": 2010, "total_steps": 38160, "loss": 0.402, "lr": 0.0005264675052410901, "epoch": 1.0534591194968554, "percentage": 5.27, "elapsed_time": "0:05:08", "remaining_time": "1:32:21", "throughput": 4264.17, "total_tokens": 1313936} {"current_steps": 2015, "total_steps": 38160, "loss": 0.4875, "lr": 0.0005277777777777778, "epoch": 1.0560796645702306, "percentage": 5.28, "elapsed_time": "0:05:08", "remaining_time": "1:32:21", "throughput": 4265.69, "total_tokens": 1317840} {"current_steps": 2020, "total_steps": 38160, "loss": 0.5265, "lr": 0.0005290880503144654, "epoch": 1.0587002096436058, "percentage": 5.29, "elapsed_time": "0:05:09", "remaining_time": "1:32:19", "throughput": 4266.03, "total_tokens": 1320880} {"current_steps": 2025, "total_steps": 38160, "loss": 0.4682, "lr": 0.0005303983228511531, "epoch": 1.0613207547169812, "percentage": 5.31, "elapsed_time": "0:05:10", "remaining_time": "1:32:18", "throughput": 4266.87, "total_tokens": 1324400} {"current_steps": 2030, "total_steps": 38160, "loss": 0.5347, "lr": 0.0005317085953878407, "epoch": 1.0639412997903563, "percentage": 5.32, "elapsed_time": "0:05:11", "remaining_time": "1:32:16", "throughput": 4266.81, "total_tokens": 1327216} {"current_steps": 2035, "total_steps": 38160, "loss": 0.5075, "lr": 0.0005330188679245284, "epoch": 1.0665618448637317, "percentage": 5.33, "elapsed_time": "0:05:11", "remaining_time": "1:32:13", "throughput": 4266.17, "total_tokens": 1329712} {"current_steps": 2040, "total_steps": 38160, "loss": 0.6189, "lr": 0.000534329140461216, "epoch": 1.069182389937107, "percentage": 5.35, "elapsed_time": "0:05:12", "remaining_time": "1:32:11", "throughput": 4266.42, "total_tokens": 1332784} {"current_steps": 2045, "total_steps": 38160, "loss": 0.482, "lr": 0.0005356394129979035, "epoch": 1.0718029350104823, "percentage": 5.36, "elapsed_time": "0:05:13", "remaining_time": "1:32:09", "throughput": 4266.87, "total_tokens": 1335984} {"current_steps": 2050, "total_steps": 38160, "loss": 0.5289, "lr": 0.0005369496855345912, "epoch": 1.0744234800838575, "percentage": 5.37, "elapsed_time": "0:05:13", "remaining_time": "1:32:07", "throughput": 4266.98, "total_tokens": 1338960} {"current_steps": 2055, "total_steps": 38160, "loss": 0.4886, "lr": 0.0005382599580712788, "epoch": 1.0770440251572326, "percentage": 5.39, "elapsed_time": "0:05:14", "remaining_time": "1:32:05", "throughput": 4267.21, "total_tokens": 1342000} {"current_steps": 2060, "total_steps": 38160, "loss": 0.5154, "lr": 0.0005395702306079665, "epoch": 1.079664570230608, "percentage": 5.4, "elapsed_time": "0:05:15", "remaining_time": "1:32:02", "throughput": 4266.43, "total_tokens": 1344400} {"current_steps": 2065, "total_steps": 38160, "loss": 0.4868, "lr": 0.0005408805031446541, "epoch": 1.0822851153039832, "percentage": 5.41, "elapsed_time": "0:05:15", "remaining_time": "1:32:00", "throughput": 4266.59, "total_tokens": 1347440} {"current_steps": 2070, "total_steps": 38160, "loss": 0.5274, "lr": 0.0005421907756813418, "epoch": 1.0849056603773586, "percentage": 5.42, "elapsed_time": "0:05:16", "remaining_time": "1:32:01", "throughput": 4269.09, "total_tokens": 1352048} {"current_steps": 2075, "total_steps": 38160, "loss": 0.5403, "lr": 0.0005435010482180293, "epoch": 1.0875262054507338, "percentage": 5.44, "elapsed_time": "0:05:17", "remaining_time": "1:31:59", "throughput": 4269.13, "total_tokens": 1354928} {"current_steps": 2080, "total_steps": 38160, "loss": 0.5154, "lr": 0.0005448113207547169, "epoch": 1.090146750524109, "percentage": 5.45, "elapsed_time": "0:05:18", "remaining_time": "1:31:57", "throughput": 4269.35, "total_tokens": 1357968} {"current_steps": 2085, "total_steps": 38160, "loss": 0.4298, "lr": 0.0005461215932914046, "epoch": 1.0927672955974843, "percentage": 5.46, "elapsed_time": "0:05:18", "remaining_time": "1:31:55", "throughput": 4269.88, "total_tokens": 1361168} {"current_steps": 2090, "total_steps": 38160, "loss": 0.5769, "lr": 0.0005474318658280922, "epoch": 1.0953878406708595, "percentage": 5.48, "elapsed_time": "0:05:19", "remaining_time": "1:31:56", "throughput": 4272.14, "total_tokens": 1365584} {"current_steps": 2095, "total_steps": 38160, "loss": 0.5615, "lr": 0.0005487421383647799, "epoch": 1.0980083857442349, "percentage": 5.49, "elapsed_time": "0:05:20", "remaining_time": "1:31:56", "throughput": 4273.45, "total_tokens": 1369424} {"current_steps": 2100, "total_steps": 38160, "loss": 0.5237, "lr": 0.0005500524109014676, "epoch": 1.10062893081761, "percentage": 5.5, "elapsed_time": "0:05:21", "remaining_time": "1:31:53", "throughput": 4272.84, "total_tokens": 1371952} {"current_steps": 2105, "total_steps": 38160, "loss": 0.4379, "lr": 0.0005513626834381551, "epoch": 1.1032494758909852, "percentage": 5.52, "elapsed_time": "0:05:21", "remaining_time": "1:31:50", "throughput": 4272.19, "total_tokens": 1374352} {"current_steps": 2110, "total_steps": 38160, "loss": 0.3714, "lr": 0.0005526729559748428, "epoch": 1.1058700209643606, "percentage": 5.53, "elapsed_time": "0:05:22", "remaining_time": "1:31:47", "throughput": 4271.52, "total_tokens": 1376848} {"current_steps": 2115, "total_steps": 38160, "loss": 0.5226, "lr": 0.0005539832285115304, "epoch": 1.1084905660377358, "percentage": 5.54, "elapsed_time": "0:05:23", "remaining_time": "1:31:45", "throughput": 4272.32, "total_tokens": 1380240} {"current_steps": 2120, "total_steps": 38160, "loss": 0.4383, "lr": 0.0005552935010482181, "epoch": 1.1111111111111112, "percentage": 5.56, "elapsed_time": "0:05:23", "remaining_time": "1:31:45", "throughput": 4273.59, "total_tokens": 1384048} {"current_steps": 2125, "total_steps": 38160, "loss": 0.4217, "lr": 0.0005566037735849057, "epoch": 1.1137316561844863, "percentage": 5.57, "elapsed_time": "0:05:24", "remaining_time": "1:31:44", "throughput": 4274.4, "total_tokens": 1387504} {"current_steps": 2130, "total_steps": 38160, "loss": 0.4801, "lr": 0.0005579140461215934, "epoch": 1.1163522012578617, "percentage": 5.58, "elapsed_time": "0:05:25", "remaining_time": "1:31:43", "throughput": 4275.11, "total_tokens": 1390960} {"current_steps": 2135, "total_steps": 38160, "loss": 0.4325, "lr": 0.000559224318658281, "epoch": 1.118972746331237, "percentage": 5.59, "elapsed_time": "0:05:26", "remaining_time": "1:31:41", "throughput": 4275.04, "total_tokens": 1393744} {"current_steps": 2140, "total_steps": 38160, "loss": 0.5661, "lr": 0.0005605345911949685, "epoch": 1.121593291404612, "percentage": 5.61, "elapsed_time": "0:05:26", "remaining_time": "1:31:39", "throughput": 4275.68, "total_tokens": 1397040} {"current_steps": 2145, "total_steps": 38160, "loss": 0.4695, "lr": 0.0005618448637316562, "epoch": 1.1242138364779874, "percentage": 5.62, "elapsed_time": "0:05:27", "remaining_time": "1:31:37", "throughput": 4275.84, "total_tokens": 1400080} {"current_steps": 2150, "total_steps": 38160, "loss": 0.5518, "lr": 0.0005631551362683438, "epoch": 1.1268343815513626, "percentage": 5.63, "elapsed_time": "0:05:28", "remaining_time": "1:31:35", "throughput": 4275.58, "total_tokens": 1402864} {"current_steps": 2155, "total_steps": 38160, "loss": 0.588, "lr": 0.0005644654088050315, "epoch": 1.129454926624738, "percentage": 5.65, "elapsed_time": "0:05:28", "remaining_time": "1:31:33", "throughput": 4275.8, "total_tokens": 1405904} {"current_steps": 2160, "total_steps": 38160, "loss": 0.4603, "lr": 0.0005657756813417191, "epoch": 1.1320754716981132, "percentage": 5.66, "elapsed_time": "0:05:29", "remaining_time": "1:31:31", "throughput": 4275.81, "total_tokens": 1408848} {"current_steps": 2165, "total_steps": 38160, "loss": 0.4366, "lr": 0.0005670859538784067, "epoch": 1.1346960167714886, "percentage": 5.67, "elapsed_time": "0:05:30", "remaining_time": "1:31:30", "throughput": 4276.46, "total_tokens": 1412208} {"current_steps": 2170, "total_steps": 38160, "loss": 0.5176, "lr": 0.0005683962264150943, "epoch": 1.1373165618448637, "percentage": 5.69, "elapsed_time": "0:05:30", "remaining_time": "1:31:29", "throughput": 4277.15, "total_tokens": 1415664} {"current_steps": 2175, "total_steps": 38160, "loss": 0.4427, "lr": 0.0005697064989517819, "epoch": 1.139937106918239, "percentage": 5.7, "elapsed_time": "0:05:31", "remaining_time": "1:31:29", "throughput": 4278.69, "total_tokens": 1419696} {"current_steps": 2180, "total_steps": 38160, "loss": 0.5203, "lr": 0.0005710167714884696, "epoch": 1.1425576519916143, "percentage": 5.71, "elapsed_time": "0:05:32", "remaining_time": "1:31:27", "throughput": 4278.73, "total_tokens": 1422672} {"current_steps": 2185, "total_steps": 38160, "loss": 0.5894, "lr": 0.0005723270440251572, "epoch": 1.1451781970649895, "percentage": 5.73, "elapsed_time": "0:05:33", "remaining_time": "1:31:25", "throughput": 4278.57, "total_tokens": 1425520} {"current_steps": 2190, "total_steps": 38160, "loss": 0.6136, "lr": 0.0005736373165618449, "epoch": 1.1477987421383649, "percentage": 5.74, "elapsed_time": "0:05:33", "remaining_time": "1:31:22", "throughput": 4278.05, "total_tokens": 1428016} {"current_steps": 2195, "total_steps": 38160, "loss": 0.4489, "lr": 0.0005749475890985325, "epoch": 1.15041928721174, "percentage": 5.75, "elapsed_time": "0:05:34", "remaining_time": "1:31:19", "throughput": 4277.43, "total_tokens": 1430480} {"current_steps": 2200, "total_steps": 38160, "loss": 0.4657, "lr": 0.0005762578616352201, "epoch": 1.1530398322851152, "percentage": 5.77, "elapsed_time": "0:05:35", "remaining_time": "1:31:16", "throughput": 4276.7, "total_tokens": 1432848} {"current_steps": 2205, "total_steps": 38160, "loss": 0.5685, "lr": 0.0005775681341719078, "epoch": 1.1556603773584906, "percentage": 5.78, "elapsed_time": "0:05:35", "remaining_time": "1:31:14", "throughput": 4276.66, "total_tokens": 1435728} {"current_steps": 2210, "total_steps": 38160, "loss": 0.5196, "lr": 0.0005788784067085954, "epoch": 1.1582809224318658, "percentage": 5.79, "elapsed_time": "0:05:36", "remaining_time": "1:31:11", "throughput": 4276.03, "total_tokens": 1438160} {"current_steps": 2215, "total_steps": 38160, "loss": 0.462, "lr": 0.0005801886792452831, "epoch": 1.1609014675052411, "percentage": 5.8, "elapsed_time": "0:05:36", "remaining_time": "1:31:08", "throughput": 4275.8, "total_tokens": 1440848} {"current_steps": 2220, "total_steps": 38160, "loss": 0.5442, "lr": 0.0005814989517819707, "epoch": 1.1635220125786163, "percentage": 5.82, "elapsed_time": "0:05:37", "remaining_time": "1:31:06", "throughput": 4275.79, "total_tokens": 1443728} {"current_steps": 2225, "total_steps": 38160, "loss": 0.4609, "lr": 0.0005828092243186583, "epoch": 1.1661425576519917, "percentage": 5.83, "elapsed_time": "0:05:38", "remaining_time": "1:31:03", "throughput": 4275.52, "total_tokens": 1446448} {"current_steps": 2230, "total_steps": 38160, "loss": 0.465, "lr": 0.000584119496855346, "epoch": 1.1687631027253669, "percentage": 5.84, "elapsed_time": "0:05:39", "remaining_time": "1:31:03", "throughput": 4276.23, "total_tokens": 1449936} {"current_steps": 2235, "total_steps": 38160, "loss": 0.4845, "lr": 0.0005854297693920335, "epoch": 1.171383647798742, "percentage": 5.86, "elapsed_time": "0:05:39", "remaining_time": "1:31:01", "throughput": 4276.4, "total_tokens": 1452976} {"current_steps": 2240, "total_steps": 38160, "loss": 0.3964, "lr": 0.0005867400419287212, "epoch": 1.1740041928721174, "percentage": 5.87, "elapsed_time": "0:05:40", "remaining_time": "1:30:59", "throughput": 4276.67, "total_tokens": 1456080} {"current_steps": 2245, "total_steps": 38160, "loss": 0.492, "lr": 0.0005880503144654088, "epoch": 1.1766247379454926, "percentage": 5.88, "elapsed_time": "0:05:41", "remaining_time": "1:30:58", "throughput": 4277.19, "total_tokens": 1459344} {"current_steps": 2250, "total_steps": 38160, "loss": 0.5026, "lr": 0.0005893605870020965, "epoch": 1.179245283018868, "percentage": 5.9, "elapsed_time": "0:05:41", "remaining_time": "1:30:56", "throughput": 4277.22, "total_tokens": 1462288} {"current_steps": 2255, "total_steps": 38160, "loss": 0.4884, "lr": 0.0005906708595387841, "epoch": 1.1818658280922432, "percentage": 5.91, "elapsed_time": "0:05:42", "remaining_time": "1:30:54", "throughput": 4277.01, "total_tokens": 1465072} {"current_steps": 2260, "total_steps": 38160, "loss": 0.4727, "lr": 0.0005919811320754716, "epoch": 1.1844863731656186, "percentage": 5.92, "elapsed_time": "0:05:43", "remaining_time": "1:30:52", "throughput": 4277.55, "total_tokens": 1468304} {"current_steps": 2265, "total_steps": 38160, "loss": 0.5812, "lr": 0.0005932914046121593, "epoch": 1.1871069182389937, "percentage": 5.94, "elapsed_time": "0:05:43", "remaining_time": "1:30:50", "throughput": 4277.32, "total_tokens": 1471152} {"current_steps": 2270, "total_steps": 38160, "loss": 0.5111, "lr": 0.0005946016771488469, "epoch": 1.189727463312369, "percentage": 5.95, "elapsed_time": "0:05:44", "remaining_time": "1:30:48", "throughput": 4276.85, "total_tokens": 1473744} {"current_steps": 2275, "total_steps": 38160, "loss": 0.6416, "lr": 0.0005959119496855346, "epoch": 1.1923480083857443, "percentage": 5.96, "elapsed_time": "0:05:45", "remaining_time": "1:30:47", "throughput": 4277.57, "total_tokens": 1477264} {"current_steps": 2280, "total_steps": 38160, "loss": 0.4179, "lr": 0.0005972222222222222, "epoch": 1.1949685534591195, "percentage": 5.97, "elapsed_time": "0:05:46", "remaining_time": "1:30:47", "throughput": 4279.46, "total_tokens": 1481456} {"current_steps": 2285, "total_steps": 38160, "loss": 0.4789, "lr": 0.0005985324947589099, "epoch": 1.1975890985324948, "percentage": 5.99, "elapsed_time": "0:05:46", "remaining_time": "1:30:47", "throughput": 4280.69, "total_tokens": 1485200} {"current_steps": 2290, "total_steps": 38160, "loss": 0.5873, "lr": 0.0005998427672955975, "epoch": 1.20020964360587, "percentage": 6.0, "elapsed_time": "0:05:47", "remaining_time": "1:30:46", "throughput": 4281.33, "total_tokens": 1488656} {"current_steps": 2295, "total_steps": 38160, "loss": 0.7214, "lr": 0.000601153039832285, "epoch": 1.2028301886792452, "percentage": 6.01, "elapsed_time": "0:05:48", "remaining_time": "1:30:45", "throughput": 4281.92, "total_tokens": 1492016} {"current_steps": 2300, "total_steps": 38160, "loss": 0.5006, "lr": 0.0006024633123689728, "epoch": 1.2054507337526206, "percentage": 6.03, "elapsed_time": "0:05:49", "remaining_time": "1:30:45", "throughput": 4283.46, "total_tokens": 1496144} {"current_steps": 2305, "total_steps": 38160, "loss": 0.527, "lr": 0.0006037735849056604, "epoch": 1.2080712788259957, "percentage": 6.04, "elapsed_time": "0:05:49", "remaining_time": "1:30:42", "throughput": 4282.56, "total_tokens": 1498416} {"current_steps": 2310, "total_steps": 38160, "loss": 0.425, "lr": 0.0006050838574423481, "epoch": 1.2106918238993711, "percentage": 6.05, "elapsed_time": "0:05:50", "remaining_time": "1:30:40", "throughput": 4282.42, "total_tokens": 1501264} {"current_steps": 2315, "total_steps": 38160, "loss": 0.5233, "lr": 0.0006063941299790357, "epoch": 1.2133123689727463, "percentage": 6.07, "elapsed_time": "0:05:51", "remaining_time": "1:30:40", "throughput": 4283.66, "total_tokens": 1505040} {"current_steps": 2320, "total_steps": 38160, "loss": 0.5753, "lr": 0.0006077044025157233, "epoch": 1.2159329140461215, "percentage": 6.08, "elapsed_time": "0:05:52", "remaining_time": "1:30:37", "throughput": 4283.4, "total_tokens": 1507760} {"current_steps": 2325, "total_steps": 38160, "loss": 0.5118, "lr": 0.000609014675052411, "epoch": 1.2185534591194969, "percentage": 6.09, "elapsed_time": "0:05:52", "remaining_time": "1:30:37", "throughput": 4284.01, "total_tokens": 1511216} {"current_steps": 2330, "total_steps": 38160, "loss": 0.4259, "lr": 0.0006103249475890985, "epoch": 1.221174004192872, "percentage": 6.11, "elapsed_time": "0:05:53", "remaining_time": "1:30:35", "throughput": 4284.31, "total_tokens": 1514384} {"current_steps": 2335, "total_steps": 38160, "loss": 0.3829, "lr": 0.0006116352201257862, "epoch": 1.2237945492662474, "percentage": 6.12, "elapsed_time": "0:05:54", "remaining_time": "1:30:36", "throughput": 4285.82, "total_tokens": 1518544} {"current_steps": 2340, "total_steps": 38160, "loss": 0.4227, "lr": 0.0006129454926624738, "epoch": 1.2264150943396226, "percentage": 6.13, "elapsed_time": "0:05:55", "remaining_time": "1:30:35", "throughput": 4286.33, "total_tokens": 1521936} {"current_steps": 2345, "total_steps": 38160, "loss": 0.4629, "lr": 0.0006142557651991615, "epoch": 1.229035639412998, "percentage": 6.15, "elapsed_time": "0:05:55", "remaining_time": "1:30:33", "throughput": 4286.71, "total_tokens": 1525072} {"current_steps": 2350, "total_steps": 38160, "loss": 0.5717, "lr": 0.0006155660377358491, "epoch": 1.2316561844863732, "percentage": 6.16, "elapsed_time": "0:05:56", "remaining_time": "1:30:33", "throughput": 4288.21, "total_tokens": 1529168} {"current_steps": 2355, "total_steps": 38160, "loss": 0.4993, "lr": 0.0006168763102725366, "epoch": 1.2342767295597485, "percentage": 6.17, "elapsed_time": "0:05:57", "remaining_time": "1:30:31", "throughput": 4288.15, "total_tokens": 1531984} {"current_steps": 2360, "total_steps": 38160, "loss": 0.6606, "lr": 0.0006181865828092243, "epoch": 1.2368972746331237, "percentage": 6.18, "elapsed_time": "0:05:57", "remaining_time": "1:30:30", "throughput": 4288.48, "total_tokens": 1535216} {"current_steps": 2365, "total_steps": 38160, "loss": 0.3638, "lr": 0.0006194968553459119, "epoch": 1.2395178197064989, "percentage": 6.2, "elapsed_time": "0:05:58", "remaining_time": "1:30:29", "throughput": 4289.13, "total_tokens": 1538672} {"current_steps": 2370, "total_steps": 38160, "loss": 0.3774, "lr": 0.0006208071278825996, "epoch": 1.2421383647798743, "percentage": 6.21, "elapsed_time": "0:05:59", "remaining_time": "1:30:29", "throughput": 4290.14, "total_tokens": 1542352} {"current_steps": 2375, "total_steps": 38160, "loss": 0.5614, "lr": 0.0006221174004192872, "epoch": 1.2447589098532494, "percentage": 6.22, "elapsed_time": "0:06:00", "remaining_time": "1:30:27", "throughput": 4290.48, "total_tokens": 1545616} {"current_steps": 2380, "total_steps": 38160, "loss": 0.5404, "lr": 0.0006234276729559748, "epoch": 1.2473794549266248, "percentage": 6.24, "elapsed_time": "0:06:00", "remaining_time": "1:30:25", "throughput": 4290.21, "total_tokens": 1548304} {"current_steps": 2385, "total_steps": 38160, "loss": 0.4123, "lr": 0.0006247379454926625, "epoch": 1.25, "percentage": 6.25, "elapsed_time": "0:06:01", "remaining_time": "1:30:26", "throughput": 4291.66, "total_tokens": 1552528} {"current_steps": 2390, "total_steps": 38160, "loss": 0.3355, "lr": 0.00062604821802935, "epoch": 1.2526205450733752, "percentage": 6.26, "elapsed_time": "0:06:02", "remaining_time": "1:30:24", "throughput": 4291.3, "total_tokens": 1555216} {"current_steps": 2395, "total_steps": 38160, "loss": 0.5353, "lr": 0.0006273584905660377, "epoch": 1.2552410901467506, "percentage": 6.28, "elapsed_time": "0:06:03", "remaining_time": "1:30:23", "throughput": 4292.28, "total_tokens": 1558928} {"current_steps": 2400, "total_steps": 38160, "loss": 0.3545, "lr": 0.0006286687631027254, "epoch": 1.2578616352201257, "percentage": 6.29, "elapsed_time": "0:06:03", "remaining_time": "1:30:21", "throughput": 4292.01, "total_tokens": 1561648} {"current_steps": 2405, "total_steps": 38160, "loss": 0.5324, "lr": 0.0006299790356394131, "epoch": 1.2604821802935011, "percentage": 6.3, "elapsed_time": "0:06:04", "remaining_time": "1:30:23", "throughput": 4294.48, "total_tokens": 1566640} {"current_steps": 2410, "total_steps": 38160, "loss": 0.5646, "lr": 0.0006312893081761007, "epoch": 1.2631027253668763, "percentage": 6.32, "elapsed_time": "0:06:05", "remaining_time": "1:30:22", "throughput": 4294.93, "total_tokens": 1569904} {"current_steps": 2415, "total_steps": 38160, "loss": 0.6761, "lr": 0.0006325995807127883, "epoch": 1.2657232704402515, "percentage": 6.33, "elapsed_time": "0:06:06", "remaining_time": "1:30:20", "throughput": 4294.75, "total_tokens": 1572720} {"current_steps": 2420, "total_steps": 38160, "loss": 0.5592, "lr": 0.000633909853249476, "epoch": 1.2683438155136268, "percentage": 6.34, "elapsed_time": "0:06:06", "remaining_time": "1:30:18", "throughput": 4294.85, "total_tokens": 1575728} {"current_steps": 2425, "total_steps": 38160, "loss": 0.5293, "lr": 0.0006352201257861635, "epoch": 1.270964360587002, "percentage": 6.35, "elapsed_time": "0:06:07", "remaining_time": "1:30:16", "throughput": 4294.66, "total_tokens": 1578512} {"current_steps": 2430, "total_steps": 38160, "loss": 0.645, "lr": 0.0006365303983228512, "epoch": 1.2735849056603774, "percentage": 6.37, "elapsed_time": "0:06:08", "remaining_time": "1:30:13", "throughput": 4293.98, "total_tokens": 1580912} {"current_steps": 2435, "total_steps": 38160, "loss": 0.4112, "lr": 0.0006378406708595388, "epoch": 1.2762054507337526, "percentage": 6.38, "elapsed_time": "0:06:08", "remaining_time": "1:30:12", "throughput": 4294.51, "total_tokens": 1584304} {"current_steps": 2440, "total_steps": 38160, "loss": 0.5042, "lr": 0.0006391509433962265, "epoch": 1.2788259958071277, "percentage": 6.39, "elapsed_time": "0:06:09", "remaining_time": "1:30:11", "throughput": 4294.86, "total_tokens": 1587536} {"current_steps": 2445, "total_steps": 38160, "loss": 0.5149, "lr": 0.0006404612159329141, "epoch": 1.2814465408805031, "percentage": 6.41, "elapsed_time": "0:06:10", "remaining_time": "1:30:09", "throughput": 4294.92, "total_tokens": 1590544} {"current_steps": 2450, "total_steps": 38160, "loss": 0.5026, "lr": 0.0006417714884696016, "epoch": 1.2840670859538785, "percentage": 6.42, "elapsed_time": "0:06:10", "remaining_time": "1:30:07", "throughput": 4294.63, "total_tokens": 1593200} {"current_steps": 2455, "total_steps": 38160, "loss": 0.43, "lr": 0.0006430817610062893, "epoch": 1.2866876310272537, "percentage": 6.43, "elapsed_time": "0:06:11", "remaining_time": "1:30:05", "throughput": 4294.33, "total_tokens": 1595952} {"current_steps": 2460, "total_steps": 38160, "loss": 0.547, "lr": 0.0006443920335429769, "epoch": 1.2893081761006289, "percentage": 6.45, "elapsed_time": "0:06:12", "remaining_time": "1:30:03", "throughput": 4294.43, "total_tokens": 1598928} {"current_steps": 2465, "total_steps": 38160, "loss": 0.5242, "lr": 0.0006457023060796646, "epoch": 1.2919287211740043, "percentage": 6.46, "elapsed_time": "0:06:13", "remaining_time": "1:30:01", "throughput": 4294.51, "total_tokens": 1601936} {"current_steps": 2470, "total_steps": 38160, "loss": 0.4372, "lr": 0.0006470125786163522, "epoch": 1.2945492662473794, "percentage": 6.47, "elapsed_time": "0:06:13", "remaining_time": "1:29:59", "throughput": 4294.25, "total_tokens": 1604688} {"current_steps": 2475, "total_steps": 38160, "loss": 0.5817, "lr": 0.0006483228511530398, "epoch": 1.2971698113207548, "percentage": 6.49, "elapsed_time": "0:06:14", "remaining_time": "1:29:58", "throughput": 4294.89, "total_tokens": 1608176} {"current_steps": 2480, "total_steps": 38160, "loss": 0.5468, "lr": 0.0006496331236897275, "epoch": 1.29979035639413, "percentage": 6.5, "elapsed_time": "0:06:15", "remaining_time": "1:29:56", "throughput": 4294.97, "total_tokens": 1611152} {"current_steps": 2485, "total_steps": 38160, "loss": 0.3929, "lr": 0.000650943396226415, "epoch": 1.3024109014675052, "percentage": 6.51, "elapsed_time": "0:06:15", "remaining_time": "1:29:55", "throughput": 4294.96, "total_tokens": 1614096} {"current_steps": 2490, "total_steps": 38160, "loss": 0.4275, "lr": 0.0006522536687631027, "epoch": 1.3050314465408805, "percentage": 6.53, "elapsed_time": "0:06:16", "remaining_time": "1:29:52", "throughput": 4294.4, "total_tokens": 1616560} {"current_steps": 2495, "total_steps": 38160, "loss": 0.4832, "lr": 0.0006535639412997903, "epoch": 1.3076519916142557, "percentage": 6.54, "elapsed_time": "0:06:17", "remaining_time": "1:29:50", "throughput": 4294.26, "total_tokens": 1619408} {"current_steps": 2500, "total_steps": 38160, "loss": 0.6137, "lr": 0.0006548742138364781, "epoch": 1.310272536687631, "percentage": 6.55, "elapsed_time": "0:06:17", "remaining_time": "1:29:48", "throughput": 4294.26, "total_tokens": 1622384} {"current_steps": 2505, "total_steps": 38160, "loss": 0.5275, "lr": 0.0006561844863731657, "epoch": 1.3128930817610063, "percentage": 6.56, "elapsed_time": "0:06:18", "remaining_time": "1:29:47", "throughput": 4294.07, "total_tokens": 1625232} {"current_steps": 2510, "total_steps": 38160, "loss": 0.3448, "lr": 0.0006574947589098533, "epoch": 1.3155136268343814, "percentage": 6.58, "elapsed_time": "0:06:19", "remaining_time": "1:29:43", "throughput": 4293.11, "total_tokens": 1627376} {"current_steps": 2515, "total_steps": 38160, "loss": 0.4751, "lr": 0.000658805031446541, "epoch": 1.3181341719077568, "percentage": 6.59, "elapsed_time": "0:06:19", "remaining_time": "1:29:42", "throughput": 4293.26, "total_tokens": 1630384} {"current_steps": 2520, "total_steps": 38160, "loss": 0.5075, "lr": 0.0006601153039832285, "epoch": 1.320754716981132, "percentage": 6.6, "elapsed_time": "0:06:20", "remaining_time": "1:29:41", "throughput": 4294.38, "total_tokens": 1634192} {"current_steps": 2525, "total_steps": 38160, "loss": 0.5823, "lr": 0.0006614255765199162, "epoch": 1.3233752620545074, "percentage": 6.62, "elapsed_time": "0:06:21", "remaining_time": "1:29:39", "throughput": 4294.12, "total_tokens": 1636848} {"current_steps": 2530, "total_steps": 38160, "loss": 0.4161, "lr": 0.0006627358490566038, "epoch": 1.3259958071278826, "percentage": 6.63, "elapsed_time": "0:06:21", "remaining_time": "1:29:38", "throughput": 4294.31, "total_tokens": 1639952} {"current_steps": 2535, "total_steps": 38160, "loss": 0.6436, "lr": 0.0006640461215932914, "epoch": 1.3286163522012577, "percentage": 6.64, "elapsed_time": "0:06:22", "remaining_time": "1:29:35", "throughput": 4293.83, "total_tokens": 1642512} {"current_steps": 2540, "total_steps": 38160, "loss": 0.412, "lr": 0.0006653563941299791, "epoch": 1.3312368972746331, "percentage": 6.66, "elapsed_time": "0:06:23", "remaining_time": "1:29:35", "throughput": 4294.73, "total_tokens": 1646160} {"current_steps": 2545, "total_steps": 38160, "loss": 0.539, "lr": 0.0006666666666666666, "epoch": 1.3338574423480085, "percentage": 6.67, "elapsed_time": "0:06:24", "remaining_time": "1:29:34", "throughput": 4295.58, "total_tokens": 1649840} {"current_steps": 2550, "total_steps": 38160, "loss": 0.5725, "lr": 0.0006679769392033543, "epoch": 1.3364779874213837, "percentage": 6.68, "elapsed_time": "0:06:24", "remaining_time": "1:29:33", "throughput": 4295.91, "total_tokens": 1653104} {"current_steps": 2555, "total_steps": 38160, "loss": 0.4875, "lr": 0.0006692872117400419, "epoch": 1.3390985324947589, "percentage": 6.7, "elapsed_time": "0:06:25", "remaining_time": "1:29:32", "throughput": 4296.19, "total_tokens": 1656336} {"current_steps": 2560, "total_steps": 38160, "loss": 0.6059, "lr": 0.0006705974842767296, "epoch": 1.3417190775681342, "percentage": 6.71, "elapsed_time": "0:06:26", "remaining_time": "1:29:31", "throughput": 4296.84, "total_tokens": 1659824} {"current_steps": 2565, "total_steps": 38160, "loss": 0.5737, "lr": 0.0006719077568134172, "epoch": 1.3443396226415094, "percentage": 6.72, "elapsed_time": "0:06:27", "remaining_time": "1:29:30", "throughput": 4297.05, "total_tokens": 1662992} {"current_steps": 2570, "total_steps": 38160, "loss": 0.4648, "lr": 0.0006732180293501048, "epoch": 1.3469601677148848, "percentage": 6.73, "elapsed_time": "0:06:27", "remaining_time": "1:29:29", "throughput": 4297.55, "total_tokens": 1666320} {"current_steps": 2575, "total_steps": 38160, "loss": 0.4105, "lr": 0.0006745283018867925, "epoch": 1.34958071278826, "percentage": 6.75, "elapsed_time": "0:06:28", "remaining_time": "1:29:27", "throughput": 4297.47, "total_tokens": 1669264} {"current_steps": 2580, "total_steps": 38160, "loss": 0.6386, "lr": 0.00067583857442348, "epoch": 1.3522012578616351, "percentage": 6.76, "elapsed_time": "0:06:29", "remaining_time": "1:29:26", "throughput": 4297.32, "total_tokens": 1672112} {"current_steps": 2585, "total_steps": 38160, "loss": 0.4909, "lr": 0.0006771488469601677, "epoch": 1.3548218029350105, "percentage": 6.77, "elapsed_time": "0:06:29", "remaining_time": "1:29:23", "throughput": 4296.95, "total_tokens": 1674768} {"current_steps": 2590, "total_steps": 38160, "loss": 0.6396, "lr": 0.0006784591194968553, "epoch": 1.3574423480083857, "percentage": 6.79, "elapsed_time": "0:06:30", "remaining_time": "1:29:23", "throughput": 4298.0, "total_tokens": 1678480} {"current_steps": 2595, "total_steps": 38160, "loss": 0.5222, "lr": 0.0006797693920335431, "epoch": 1.360062893081761, "percentage": 6.8, "elapsed_time": "0:06:31", "remaining_time": "1:29:22", "throughput": 4298.45, "total_tokens": 1681744} {"current_steps": 2600, "total_steps": 38160, "loss": 0.5221, "lr": 0.0006810796645702307, "epoch": 1.3626834381551363, "percentage": 6.81, "elapsed_time": "0:06:31", "remaining_time": "1:29:19", "throughput": 4297.75, "total_tokens": 1684080} {"current_steps": 2605, "total_steps": 38160, "loss": 0.5392, "lr": 0.0006823899371069183, "epoch": 1.3653039832285114, "percentage": 6.83, "elapsed_time": "0:06:32", "remaining_time": "1:29:20", "throughput": 4299.4, "total_tokens": 1688432} {"current_steps": 2610, "total_steps": 38160, "loss": 0.6304, "lr": 0.0006837002096436059, "epoch": 1.3679245283018868, "percentage": 6.84, "elapsed_time": "0:06:33", "remaining_time": "1:29:19", "throughput": 4300.17, "total_tokens": 1692144} {"current_steps": 2615, "total_steps": 38160, "loss": 0.4579, "lr": 0.0006850104821802935, "epoch": 1.370545073375262, "percentage": 6.85, "elapsed_time": "0:06:34", "remaining_time": "1:29:19", "throughput": 4300.75, "total_tokens": 1695600} {"current_steps": 2620, "total_steps": 38160, "loss": 0.4402, "lr": 0.0006863207547169812, "epoch": 1.3731656184486374, "percentage": 6.87, "elapsed_time": "0:06:35", "remaining_time": "1:29:18", "throughput": 4301.51, "total_tokens": 1699216} {"current_steps": 2625, "total_steps": 38160, "loss": 0.5409, "lr": 0.0006876310272536688, "epoch": 1.3757861635220126, "percentage": 6.88, "elapsed_time": "0:06:35", "remaining_time": "1:29:16", "throughput": 4301.35, "total_tokens": 1702128} {"current_steps": 2630, "total_steps": 38160, "loss": 0.4763, "lr": 0.0006889412997903564, "epoch": 1.3784067085953877, "percentage": 6.89, "elapsed_time": "0:06:36", "remaining_time": "1:29:15", "throughput": 4301.81, "total_tokens": 1705392} {"current_steps": 2635, "total_steps": 38160, "loss": 0.6215, "lr": 0.0006902515723270441, "epoch": 1.381027253668763, "percentage": 6.91, "elapsed_time": "0:06:37", "remaining_time": "1:29:13", "throughput": 4301.68, "total_tokens": 1708272} {"current_steps": 2640, "total_steps": 38160, "loss": 0.4733, "lr": 0.0006915618448637316, "epoch": 1.3836477987421385, "percentage": 6.92, "elapsed_time": "0:06:37", "remaining_time": "1:29:11", "throughput": 4301.16, "total_tokens": 1710736} {"current_steps": 2645, "total_steps": 38160, "loss": 0.546, "lr": 0.0006928721174004193, "epoch": 1.3862683438155137, "percentage": 6.93, "elapsed_time": "0:06:38", "remaining_time": "1:29:09", "throughput": 4300.85, "total_tokens": 1713424} {"current_steps": 2650, "total_steps": 38160, "loss": 0.4833, "lr": 0.0006941823899371069, "epoch": 1.3888888888888888, "percentage": 6.94, "elapsed_time": "0:06:39", "remaining_time": "1:29:07", "throughput": 4300.82, "total_tokens": 1716336} {"current_steps": 2655, "total_steps": 38160, "loss": 0.3836, "lr": 0.0006954926624737946, "epoch": 1.3915094339622642, "percentage": 6.96, "elapsed_time": "0:06:39", "remaining_time": "1:29:05", "throughput": 4300.4, "total_tokens": 1718960} {"current_steps": 2660, "total_steps": 38160, "loss": 0.516, "lr": 0.0006968029350104822, "epoch": 1.3941299790356394, "percentage": 6.97, "elapsed_time": "0:06:40", "remaining_time": "1:29:03", "throughput": 4300.54, "total_tokens": 1721904} {"current_steps": 2665, "total_steps": 38160, "loss": 0.3457, "lr": 0.0006981132075471698, "epoch": 1.3967505241090148, "percentage": 6.98, "elapsed_time": "0:06:41", "remaining_time": "1:29:02", "throughput": 4301.43, "total_tokens": 1725552} {"current_steps": 2670, "total_steps": 38160, "loss": 0.5589, "lr": 0.0006994234800838574, "epoch": 1.39937106918239, "percentage": 7.0, "elapsed_time": "0:06:41", "remaining_time": "1:29:01", "throughput": 4301.69, "total_tokens": 1728720} {"current_steps": 2675, "total_steps": 38160, "loss": 0.458, "lr": 0.000700733752620545, "epoch": 1.4019916142557651, "percentage": 7.01, "elapsed_time": "0:06:42", "remaining_time": "1:29:00", "throughput": 4301.65, "total_tokens": 1731664} {"current_steps": 2680, "total_steps": 38160, "loss": 0.4907, "lr": 0.0007020440251572327, "epoch": 1.4046121593291405, "percentage": 7.02, "elapsed_time": "0:06:43", "remaining_time": "1:28:58", "throughput": 4301.54, "total_tokens": 1734576} {"current_steps": 2685, "total_steps": 38160, "loss": 0.3672, "lr": 0.0007033542976939203, "epoch": 1.4072327044025157, "percentage": 7.04, "elapsed_time": "0:06:43", "remaining_time": "1:28:55", "throughput": 4300.68, "total_tokens": 1736784} {"current_steps": 2690, "total_steps": 38160, "loss": 0.4759, "lr": 0.0007046645702306079, "epoch": 1.409853249475891, "percentage": 7.05, "elapsed_time": "0:06:44", "remaining_time": "1:28:53", "throughput": 4300.43, "total_tokens": 1739472} {"current_steps": 2695, "total_steps": 38160, "loss": 0.4555, "lr": 0.0007059748427672957, "epoch": 1.4124737945492662, "percentage": 7.06, "elapsed_time": "0:06:45", "remaining_time": "1:28:52", "throughput": 4300.64, "total_tokens": 1742544} {"current_steps": 2700, "total_steps": 38160, "loss": 0.6462, "lr": 0.0007072851153039833, "epoch": 1.4150943396226414, "percentage": 7.08, "elapsed_time": "0:06:45", "remaining_time": "1:28:50", "throughput": 4300.56, "total_tokens": 1745456} {"current_steps": 2705, "total_steps": 38160, "loss": 0.4638, "lr": 0.0007085953878406709, "epoch": 1.4177148846960168, "percentage": 7.09, "elapsed_time": "0:06:46", "remaining_time": "1:28:50", "throughput": 4301.59, "total_tokens": 1749360} {"current_steps": 2710, "total_steps": 38160, "loss": 0.4714, "lr": 0.0007099056603773585, "epoch": 1.420335429769392, "percentage": 7.1, "elapsed_time": "0:06:47", "remaining_time": "1:28:48", "throughput": 4301.3, "total_tokens": 1752048} {"current_steps": 2715, "total_steps": 38160, "loss": 0.4382, "lr": 0.0007112159329140462, "epoch": 1.4229559748427674, "percentage": 7.11, "elapsed_time": "0:06:48", "remaining_time": "1:28:46", "throughput": 4301.42, "total_tokens": 1755088} {"current_steps": 2720, "total_steps": 38160, "loss": 0.5219, "lr": 0.0007125262054507338, "epoch": 1.4255765199161425, "percentage": 7.13, "elapsed_time": "0:06:48", "remaining_time": "1:28:45", "throughput": 4301.83, "total_tokens": 1758416} {"current_steps": 2725, "total_steps": 38160, "loss": 0.5258, "lr": 0.0007138364779874214, "epoch": 1.4281970649895177, "percentage": 7.14, "elapsed_time": "0:06:49", "remaining_time": "1:28:43", "throughput": 4301.25, "total_tokens": 1760848} {"current_steps": 2730, "total_steps": 38160, "loss": 0.4896, "lr": 0.0007151467505241091, "epoch": 1.430817610062893, "percentage": 7.15, "elapsed_time": "0:06:49", "remaining_time": "1:28:40", "throughput": 4300.35, "total_tokens": 1763024} {"current_steps": 2735, "total_steps": 38160, "loss": 0.4547, "lr": 0.0007164570230607966, "epoch": 1.4334381551362683, "percentage": 7.17, "elapsed_time": "0:06:50", "remaining_time": "1:28:39", "throughput": 4300.46, "total_tokens": 1766160} {"current_steps": 2740, "total_steps": 38160, "loss": 0.4177, "lr": 0.0007177672955974843, "epoch": 1.4360587002096437, "percentage": 7.18, "elapsed_time": "0:06:51", "remaining_time": "1:28:37", "throughput": 4300.19, "total_tokens": 1768912} {"current_steps": 2745, "total_steps": 38160, "loss": 0.5176, "lr": 0.0007190775681341719, "epoch": 1.4386792452830188, "percentage": 7.19, "elapsed_time": "0:06:52", "remaining_time": "1:28:35", "throughput": 4300.17, "total_tokens": 1771792} {"current_steps": 2750, "total_steps": 38160, "loss": 0.4662, "lr": 0.0007203878406708596, "epoch": 1.441299790356394, "percentage": 7.21, "elapsed_time": "0:06:52", "remaining_time": "1:28:34", "throughput": 4300.44, "total_tokens": 1775088} {"current_steps": 2755, "total_steps": 38160, "loss": 0.4709, "lr": 0.0007216981132075472, "epoch": 1.4439203354297694, "percentage": 7.22, "elapsed_time": "0:06:53", "remaining_time": "1:28:34", "throughput": 4301.28, "total_tokens": 1778736} {"current_steps": 2760, "total_steps": 38160, "loss": 0.4023, "lr": 0.0007230083857442348, "epoch": 1.4465408805031448, "percentage": 7.23, "elapsed_time": "0:06:54", "remaining_time": "1:28:33", "throughput": 4301.62, "total_tokens": 1782000} {"current_steps": 2765, "total_steps": 38160, "loss": 0.7024, "lr": 0.0007243186582809224, "epoch": 1.44916142557652, "percentage": 7.25, "elapsed_time": "0:06:54", "remaining_time": "1:28:32", "throughput": 4301.93, "total_tokens": 1785168} {"current_steps": 2770, "total_steps": 38160, "loss": 0.5612, "lr": 0.00072562893081761, "epoch": 1.4517819706498951, "percentage": 7.26, "elapsed_time": "0:06:55", "remaining_time": "1:28:32", "throughput": 4303.33, "total_tokens": 1789264} {"current_steps": 2775, "total_steps": 38160, "loss": 0.5072, "lr": 0.0007269392033542977, "epoch": 1.4544025157232705, "percentage": 7.27, "elapsed_time": "0:06:56", "remaining_time": "1:28:30", "throughput": 4303.27, "total_tokens": 1792144} {"current_steps": 2780, "total_steps": 38160, "loss": 0.4751, "lr": 0.0007282494758909853, "epoch": 1.4570230607966457, "percentage": 7.29, "elapsed_time": "0:06:57", "remaining_time": "1:28:30", "throughput": 4304.18, "total_tokens": 1795952} {"current_steps": 2785, "total_steps": 38160, "loss": 0.439, "lr": 0.0007295597484276729, "epoch": 1.459643605870021, "percentage": 7.3, "elapsed_time": "0:06:58", "remaining_time": "1:28:29", "throughput": 4304.98, "total_tokens": 1799632} {"current_steps": 2790, "total_steps": 38160, "loss": 0.4248, "lr": 0.0007308700209643606, "epoch": 1.4622641509433962, "percentage": 7.31, "elapsed_time": "0:06:58", "remaining_time": "1:28:29", "throughput": 4305.6, "total_tokens": 1803088} {"current_steps": 2795, "total_steps": 38160, "loss": 0.4891, "lr": 0.0007321802935010483, "epoch": 1.4648846960167714, "percentage": 7.32, "elapsed_time": "0:06:59", "remaining_time": "1:28:28", "throughput": 4306.19, "total_tokens": 1806576} {"current_steps": 2800, "total_steps": 38160, "loss": 0.4808, "lr": 0.0007334905660377359, "epoch": 1.4675052410901468, "percentage": 7.34, "elapsed_time": "0:07:00", "remaining_time": "1:28:26", "throughput": 4306.09, "total_tokens": 1809360} {"current_steps": 2805, "total_steps": 38160, "loss": 0.4297, "lr": 0.0007348008385744235, "epoch": 1.470125786163522, "percentage": 7.35, "elapsed_time": "0:07:00", "remaining_time": "1:28:25", "throughput": 4306.6, "total_tokens": 1812752} {"current_steps": 2810, "total_steps": 38160, "loss": 0.4955, "lr": 0.0007361111111111112, "epoch": 1.4727463312368974, "percentage": 7.36, "elapsed_time": "0:07:01", "remaining_time": "1:28:24", "throughput": 4306.81, "total_tokens": 1815952} {"current_steps": 2815, "total_steps": 38160, "loss": 0.4365, "lr": 0.0007374213836477988, "epoch": 1.4753668763102725, "percentage": 7.38, "elapsed_time": "0:07:02", "remaining_time": "1:28:22", "throughput": 4306.86, "total_tokens": 1818992} {"current_steps": 2820, "total_steps": 38160, "loss": 0.703, "lr": 0.0007387316561844864, "epoch": 1.4779874213836477, "percentage": 7.39, "elapsed_time": "0:07:03", "remaining_time": "1:28:22", "throughput": 4307.26, "total_tokens": 1822320} {"current_steps": 2825, "total_steps": 38160, "loss": 0.5379, "lr": 0.0007400419287211741, "epoch": 1.480607966457023, "percentage": 7.4, "elapsed_time": "0:07:03", "remaining_time": "1:28:19", "throughput": 4306.42, "total_tokens": 1824560} {"current_steps": 2830, "total_steps": 38160, "loss": 0.3867, "lr": 0.0007413522012578616, "epoch": 1.4832285115303983, "percentage": 7.42, "elapsed_time": "0:07:04", "remaining_time": "1:28:18", "throughput": 4306.71, "total_tokens": 1827728} {"current_steps": 2835, "total_steps": 38160, "loss": 0.5337, "lr": 0.0007426624737945493, "epoch": 1.4858490566037736, "percentage": 7.43, "elapsed_time": "0:07:05", "remaining_time": "1:28:16", "throughput": 4306.67, "total_tokens": 1830672} {"current_steps": 2840, "total_steps": 38160, "loss": 0.537, "lr": 0.0007439727463312369, "epoch": 1.4884696016771488, "percentage": 7.44, "elapsed_time": "0:07:05", "remaining_time": "1:28:14", "throughput": 4306.02, "total_tokens": 1833040} {"current_steps": 2845, "total_steps": 38160, "loss": 0.4736, "lr": 0.0007452830188679245, "epoch": 1.491090146750524, "percentage": 7.46, "elapsed_time": "0:07:06", "remaining_time": "1:28:15", "throughput": 4307.67, "total_tokens": 1837648} {"current_steps": 2850, "total_steps": 38160, "loss": 0.4548, "lr": 0.0007465932914046122, "epoch": 1.4937106918238994, "percentage": 7.47, "elapsed_time": "0:07:07", "remaining_time": "1:28:14", "throughput": 4307.63, "total_tokens": 1840688} {"current_steps": 2855, "total_steps": 38160, "loss": 0.5259, "lr": 0.0007479035639412998, "epoch": 1.4963312368972748, "percentage": 7.48, "elapsed_time": "0:07:07", "remaining_time": "1:28:12", "throughput": 4307.51, "total_tokens": 1843536} {"current_steps": 2860, "total_steps": 38160, "loss": 0.4096, "lr": 0.0007492138364779874, "epoch": 1.49895178197065, "percentage": 7.49, "elapsed_time": "0:07:08", "remaining_time": "1:28:09", "throughput": 4306.64, "total_tokens": 1845712} {"current_steps": 2865, "total_steps": 38160, "loss": 0.4846, "lr": 0.000750524109014675, "epoch": 1.501572327044025, "percentage": 7.51, "elapsed_time": "0:07:09", "remaining_time": "1:28:08", "throughput": 4306.68, "total_tokens": 1848656} {"current_steps": 2870, "total_steps": 38160, "loss": 0.5029, "lr": 0.0007518343815513627, "epoch": 1.5041928721174003, "percentage": 7.52, "elapsed_time": "0:07:10", "remaining_time": "1:28:07", "throughput": 4307.37, "total_tokens": 1852304} {"current_steps": 2875, "total_steps": 38160, "loss": 0.4893, "lr": 0.0007531446540880503, "epoch": 1.5068134171907757, "percentage": 7.53, "elapsed_time": "0:07:10", "remaining_time": "1:28:06", "throughput": 4307.82, "total_tokens": 1855728} {"current_steps": 2880, "total_steps": 38160, "loss": 0.5272, "lr": 0.0007544549266247379, "epoch": 1.509433962264151, "percentage": 7.55, "elapsed_time": "0:07:11", "remaining_time": "1:28:06", "throughput": 4308.46, "total_tokens": 1859344} {"current_steps": 2885, "total_steps": 38160, "loss": 0.5976, "lr": 0.0007557651991614256, "epoch": 1.5120545073375262, "percentage": 7.56, "elapsed_time": "0:07:12", "remaining_time": "1:28:05", "throughput": 4308.62, "total_tokens": 1862384} {"current_steps": 2890, "total_steps": 38160, "loss": 0.5666, "lr": 0.0007570754716981131, "epoch": 1.5146750524109014, "percentage": 7.57, "elapsed_time": "0:07:12", "remaining_time": "1:28:03", "throughput": 4308.69, "total_tokens": 1865360} {"current_steps": 2895, "total_steps": 38160, "loss": 0.4735, "lr": 0.0007583857442348009, "epoch": 1.5172955974842768, "percentage": 7.59, "elapsed_time": "0:07:13", "remaining_time": "1:28:01", "throughput": 4308.64, "total_tokens": 1868272} {"current_steps": 2900, "total_steps": 38160, "loss": 0.5228, "lr": 0.0007596960167714885, "epoch": 1.519916142557652, "percentage": 7.6, "elapsed_time": "0:07:14", "remaining_time": "1:28:01", "throughput": 4309.49, "total_tokens": 1871984} {"current_steps": 2905, "total_steps": 38160, "loss": 0.5279, "lr": 0.0007610062893081762, "epoch": 1.5225366876310273, "percentage": 7.61, "elapsed_time": "0:07:15", "remaining_time": "1:28:01", "throughput": 4310.79, "total_tokens": 1876176} {"current_steps": 2910, "total_steps": 38160, "loss": 0.5516, "lr": 0.0007623165618448638, "epoch": 1.5251572327044025, "percentage": 7.63, "elapsed_time": "0:07:15", "remaining_time": "1:28:00", "throughput": 4310.65, "total_tokens": 1878992} {"current_steps": 2915, "total_steps": 38160, "loss": 0.4287, "lr": 0.0007636268343815514, "epoch": 1.5277777777777777, "percentage": 7.64, "elapsed_time": "0:07:16", "remaining_time": "1:27:59", "throughput": 4311.38, "total_tokens": 1882736} {"current_steps": 2920, "total_steps": 38160, "loss": 0.6979, "lr": 0.0007649371069182391, "epoch": 1.530398322851153, "percentage": 7.65, "elapsed_time": "0:07:17", "remaining_time": "1:27:58", "throughput": 4311.33, "total_tokens": 1885616} {"current_steps": 2925, "total_steps": 38160, "loss": 0.4155, "lr": 0.0007662473794549266, "epoch": 1.5330188679245285, "percentage": 7.67, "elapsed_time": "0:07:18", "remaining_time": "1:27:57", "throughput": 4311.59, "total_tokens": 1888848} {"current_steps": 2930, "total_steps": 38160, "loss": 0.5459, "lr": 0.0007675576519916143, "epoch": 1.5356394129979036, "percentage": 7.68, "elapsed_time": "0:07:18", "remaining_time": "1:27:55", "throughput": 4311.58, "total_tokens": 1891792} {"current_steps": 2935, "total_steps": 38160, "loss": 0.6448, "lr": 0.0007688679245283019, "epoch": 1.5382599580712788, "percentage": 7.69, "elapsed_time": "0:07:19", "remaining_time": "1:27:53", "throughput": 4311.42, "total_tokens": 1894544} {"current_steps": 2940, "total_steps": 38160, "loss": 0.4471, "lr": 0.0007701781970649895, "epoch": 1.540880503144654, "percentage": 7.7, "elapsed_time": "0:07:20", "remaining_time": "1:27:52", "throughput": 4311.14, "total_tokens": 1897264} {"current_steps": 2945, "total_steps": 38160, "loss": 0.3126, "lr": 0.0007714884696016772, "epoch": 1.5435010482180294, "percentage": 7.72, "elapsed_time": "0:07:21", "remaining_time": "1:27:53", "throughput": 4312.71, "total_tokens": 1901904} {"current_steps": 2950, "total_steps": 38160, "loss": 0.5495, "lr": 0.0007727987421383648, "epoch": 1.5461215932914047, "percentage": 7.73, "elapsed_time": "0:07:21", "remaining_time": "1:27:51", "throughput": 4312.62, "total_tokens": 1904848} {"current_steps": 2955, "total_steps": 38160, "loss": 0.5259, "lr": 0.0007741090146750524, "epoch": 1.54874213836478, "percentage": 7.74, "elapsed_time": "0:07:22", "remaining_time": "1:27:50", "throughput": 4312.48, "total_tokens": 1907696} {"current_steps": 2960, "total_steps": 38160, "loss": 0.4677, "lr": 0.00077541928721174, "epoch": 1.551362683438155, "percentage": 7.76, "elapsed_time": "0:07:22", "remaining_time": "1:27:47", "throughput": 4311.96, "total_tokens": 1910128} {"current_steps": 2965, "total_steps": 38160, "loss": 0.4919, "lr": 0.0007767295597484277, "epoch": 1.5539832285115303, "percentage": 7.77, "elapsed_time": "0:07:23", "remaining_time": "1:27:46", "throughput": 4312.0, "total_tokens": 1913136} {"current_steps": 2970, "total_steps": 38160, "loss": 0.5161, "lr": 0.0007780398322851153, "epoch": 1.5566037735849056, "percentage": 7.78, "elapsed_time": "0:07:24", "remaining_time": "1:27:47", "throughput": 4313.6, "total_tokens": 1917776} {"current_steps": 2975, "total_steps": 38160, "loss": 0.5325, "lr": 0.0007793501048218029, "epoch": 1.559224318658281, "percentage": 7.8, "elapsed_time": "0:07:25", "remaining_time": "1:27:45", "throughput": 4313.23, "total_tokens": 1920368} {"current_steps": 2980, "total_steps": 38160, "loss": 0.6414, "lr": 0.0007806603773584906, "epoch": 1.5618448637316562, "percentage": 7.81, "elapsed_time": "0:07:25", "remaining_time": "1:27:43", "throughput": 4312.86, "total_tokens": 1922960} {"current_steps": 2985, "total_steps": 38160, "loss": 0.4745, "lr": 0.0007819706498951781, "epoch": 1.5644654088050314, "percentage": 7.82, "elapsed_time": "0:07:26", "remaining_time": "1:27:42", "throughput": 4312.92, "total_tokens": 1925904} {"current_steps": 2990, "total_steps": 38160, "loss": 0.6032, "lr": 0.0007832809224318658, "epoch": 1.5670859538784065, "percentage": 7.84, "elapsed_time": "0:07:27", "remaining_time": "1:27:48", "throughput": 4317.43, "total_tokens": 1933904} {"current_steps": 2995, "total_steps": 38160, "loss": 0.3317, "lr": 0.0007845911949685535, "epoch": 1.569706498951782, "percentage": 7.85, "elapsed_time": "0:07:28", "remaining_time": "1:27:46", "throughput": 4317.25, "total_tokens": 1936656} {"current_steps": 3000, "total_steps": 38160, "loss": 0.5478, "lr": 0.0007859014675052411, "epoch": 1.5723270440251573, "percentage": 7.86, "elapsed_time": "0:07:29", "remaining_time": "1:27:45", "throughput": 4316.98, "total_tokens": 1939440} {"current_steps": 3005, "total_steps": 38160, "loss": 0.5434, "lr": 0.0007872117400419288, "epoch": 1.5749475890985325, "percentage": 7.87, "elapsed_time": "0:07:29", "remaining_time": "1:27:43", "throughput": 4317.03, "total_tokens": 1942416} {"current_steps": 3010, "total_steps": 38160, "loss": 0.588, "lr": 0.0007885220125786164, "epoch": 1.5775681341719077, "percentage": 7.89, "elapsed_time": "0:07:30", "remaining_time": "1:27:43", "throughput": 4317.82, "total_tokens": 1946288} {"current_steps": 3015, "total_steps": 38160, "loss": 0.4643, "lr": 0.0007898322851153041, "epoch": 1.580188679245283, "percentage": 7.9, "elapsed_time": "0:07:31", "remaining_time": "1:27:46", "throughput": 4320.13, "total_tokens": 1951792} {"current_steps": 3020, "total_steps": 38160, "loss": 0.4532, "lr": 0.0007911425576519916, "epoch": 1.5828092243186582, "percentage": 7.91, "elapsed_time": "0:07:32", "remaining_time": "1:27:46", "throughput": 4320.86, "total_tokens": 1955504} {"current_steps": 3025, "total_steps": 38160, "loss": 0.5254, "lr": 0.0007924528301886793, "epoch": 1.5854297693920336, "percentage": 7.93, "elapsed_time": "0:07:33", "remaining_time": "1:27:44", "throughput": 4320.58, "total_tokens": 1958224} {"current_steps": 3030, "total_steps": 38160, "loss": 0.3934, "lr": 0.0007937631027253669, "epoch": 1.5880503144654088, "percentage": 7.94, "elapsed_time": "0:07:34", "remaining_time": "1:27:44", "throughput": 4321.64, "total_tokens": 1962320} {"current_steps": 3035, "total_steps": 38160, "loss": 0.396, "lr": 0.0007950733752620545, "epoch": 1.590670859538784, "percentage": 7.95, "elapsed_time": "0:07:34", "remaining_time": "1:27:43", "throughput": 4321.87, "total_tokens": 1965616} {"current_steps": 3040, "total_steps": 38160, "loss": 0.5609, "lr": 0.0007963836477987422, "epoch": 1.5932914046121593, "percentage": 7.97, "elapsed_time": "0:07:35", "remaining_time": "1:27:41", "throughput": 4321.47, "total_tokens": 1968272} {"current_steps": 3045, "total_steps": 38160, "loss": 0.4636, "lr": 0.0007976939203354298, "epoch": 1.5959119496855347, "percentage": 7.98, "elapsed_time": "0:07:36", "remaining_time": "1:27:40", "throughput": 4321.81, "total_tokens": 1971504} {"current_steps": 3050, "total_steps": 38160, "loss": 0.5369, "lr": 0.0007990041928721174, "epoch": 1.59853249475891, "percentage": 7.99, "elapsed_time": "0:07:36", "remaining_time": "1:27:40", "throughput": 4322.68, "total_tokens": 1975312} {"current_steps": 3055, "total_steps": 38160, "loss": 0.5006, "lr": 0.000800314465408805, "epoch": 1.601153039832285, "percentage": 8.01, "elapsed_time": "0:07:37", "remaining_time": "1:27:37", "throughput": 4321.91, "total_tokens": 1977552} {"current_steps": 3060, "total_steps": 38160, "loss": 0.5248, "lr": 0.0008016247379454927, "epoch": 1.6037735849056602, "percentage": 8.02, "elapsed_time": "0:07:38", "remaining_time": "1:27:36", "throughput": 4322.32, "total_tokens": 1980912} {"current_steps": 3065, "total_steps": 38160, "loss": 0.5173, "lr": 0.0008029350104821803, "epoch": 1.6063941299790356, "percentage": 8.03, "elapsed_time": "0:07:38", "remaining_time": "1:27:35", "throughput": 4322.34, "total_tokens": 1983920} {"current_steps": 3070, "total_steps": 38160, "loss": 0.4386, "lr": 0.0008042452830188679, "epoch": 1.609014675052411, "percentage": 8.05, "elapsed_time": "0:07:39", "remaining_time": "1:27:34", "throughput": 4322.78, "total_tokens": 1987408} {"current_steps": 3075, "total_steps": 38160, "loss": 0.4703, "lr": 0.0008055555555555556, "epoch": 1.6116352201257862, "percentage": 8.06, "elapsed_time": "0:07:40", "remaining_time": "1:27:35", "throughput": 4323.92, "total_tokens": 1991568} {"current_steps": 3080, "total_steps": 38160, "loss": 0.4625, "lr": 0.0008068658280922431, "epoch": 1.6142557651991614, "percentage": 8.07, "elapsed_time": "0:07:41", "remaining_time": "1:27:35", "throughput": 4324.85, "total_tokens": 1995440} {"current_steps": 3085, "total_steps": 38160, "loss": 0.6685, "lr": 0.0008081761006289308, "epoch": 1.6168763102725365, "percentage": 8.08, "elapsed_time": "0:07:42", "remaining_time": "1:27:34", "throughput": 4325.56, "total_tokens": 1999184} {"current_steps": 3090, "total_steps": 38160, "loss": 0.5055, "lr": 0.0008094863731656184, "epoch": 1.619496855345912, "percentage": 8.1, "elapsed_time": "0:07:42", "remaining_time": "1:27:34", "throughput": 4326.17, "total_tokens": 2002768} {"current_steps": 3095, "total_steps": 38160, "loss": 0.4295, "lr": 0.0008107966457023061, "epoch": 1.6221174004192873, "percentage": 8.11, "elapsed_time": "0:07:43", "remaining_time": "1:27:32", "throughput": 4325.99, "total_tokens": 2005552} {"current_steps": 3100, "total_steps": 38160, "loss": 0.5125, "lr": 0.0008121069182389938, "epoch": 1.6247379454926625, "percentage": 8.12, "elapsed_time": "0:07:44", "remaining_time": "1:27:31", "throughput": 4326.0, "total_tokens": 2008592} {"current_steps": 3105, "total_steps": 38160, "loss": 0.4978, "lr": 0.0008134171907756814, "epoch": 1.6273584905660377, "percentage": 8.14, "elapsed_time": "0:07:45", "remaining_time": "1:27:30", "throughput": 4326.53, "total_tokens": 2012048} {"current_steps": 3110, "total_steps": 38160, "loss": 0.4535, "lr": 0.0008147274633123691, "epoch": 1.629979035639413, "percentage": 8.15, "elapsed_time": "0:07:45", "remaining_time": "1:27:29", "throughput": 4326.73, "total_tokens": 2015312} {"current_steps": 3115, "total_steps": 38160, "loss": 0.2887, "lr": 0.0008160377358490566, "epoch": 1.6325995807127882, "percentage": 8.16, "elapsed_time": "0:07:46", "remaining_time": "1:27:33", "throughput": 4329.23, "total_tokens": 2021424} {"current_steps": 3120, "total_steps": 38160, "loss": 0.4864, "lr": 0.0008173480083857443, "epoch": 1.6352201257861636, "percentage": 8.18, "elapsed_time": "0:07:47", "remaining_time": "1:27:31", "throughput": 4329.28, "total_tokens": 2024464} {"current_steps": 3125, "total_steps": 38160, "loss": 0.5786, "lr": 0.0008186582809224319, "epoch": 1.6378406708595388, "percentage": 8.19, "elapsed_time": "0:07:48", "remaining_time": "1:27:30", "throughput": 4329.49, "total_tokens": 2027728} {"current_steps": 3130, "total_steps": 38160, "loss": 0.4544, "lr": 0.0008199685534591195, "epoch": 1.640461215932914, "percentage": 8.2, "elapsed_time": "0:07:49", "remaining_time": "1:27:29", "throughput": 4329.92, "total_tokens": 2031088} {"current_steps": 3135, "total_steps": 38160, "loss": 0.4611, "lr": 0.0008212788259958072, "epoch": 1.6430817610062893, "percentage": 8.22, "elapsed_time": "0:07:49", "remaining_time": "1:27:29", "throughput": 4330.38, "total_tokens": 2034576} {"current_steps": 3140, "total_steps": 38160, "loss": 0.4867, "lr": 0.0008225890985324948, "epoch": 1.6457023060796647, "percentage": 8.23, "elapsed_time": "0:07:50", "remaining_time": "1:27:30", "throughput": 4332.15, "total_tokens": 2039408} {"current_steps": 3145, "total_steps": 38160, "loss": 0.4243, "lr": 0.0008238993710691824, "epoch": 1.64832285115304, "percentage": 8.24, "elapsed_time": "0:07:51", "remaining_time": "1:27:28", "throughput": 4332.18, "total_tokens": 2042384} {"current_steps": 3150, "total_steps": 38160, "loss": 0.5949, "lr": 0.00082520964360587, "epoch": 1.650943396226415, "percentage": 8.25, "elapsed_time": "0:07:52", "remaining_time": "1:27:27", "throughput": 4332.04, "total_tokens": 2045200} {"current_steps": 3155, "total_steps": 38160, "loss": 0.3712, "lr": 0.0008265199161425576, "epoch": 1.6535639412997902, "percentage": 8.27, "elapsed_time": "0:07:52", "remaining_time": "1:27:26", "throughput": 4332.44, "total_tokens": 2048720} {"current_steps": 3160, "total_steps": 38160, "loss": 0.4132, "lr": 0.0008278301886792453, "epoch": 1.6561844863731656, "percentage": 8.28, "elapsed_time": "0:07:53", "remaining_time": "1:27:25", "throughput": 4332.42, "total_tokens": 2051824} {"current_steps": 3165, "total_steps": 38160, "loss": 0.5982, "lr": 0.0008291404612159329, "epoch": 1.658805031446541, "percentage": 8.29, "elapsed_time": "0:07:54", "remaining_time": "1:27:25", "throughput": 4333.55, "total_tokens": 2055952} {"current_steps": 3170, "total_steps": 38160, "loss": 0.4403, "lr": 0.0008304507337526206, "epoch": 1.6614255765199162, "percentage": 8.31, "elapsed_time": "0:07:55", "remaining_time": "1:27:23", "throughput": 4333.12, "total_tokens": 2058512} {"current_steps": 3175, "total_steps": 38160, "loss": 0.3684, "lr": 0.0008317610062893081, "epoch": 1.6640461215932913, "percentage": 8.32, "elapsed_time": "0:07:55", "remaining_time": "1:27:21", "throughput": 4332.84, "total_tokens": 2061232} {"current_steps": 3180, "total_steps": 38160, "loss": 0.4995, "lr": 0.0008330712788259958, "epoch": 1.6666666666666665, "percentage": 8.33, "elapsed_time": "0:07:56", "remaining_time": "1:27:20", "throughput": 4332.88, "total_tokens": 2064336} {"current_steps": 3185, "total_steps": 38160, "loss": 0.6748, "lr": 0.0008343815513626834, "epoch": 1.669287211740042, "percentage": 8.35, "elapsed_time": "0:07:57", "remaining_time": "1:27:20", "throughput": 4333.45, "total_tokens": 2067984} {"current_steps": 3190, "total_steps": 38160, "loss": 0.4279, "lr": 0.000835691823899371, "epoch": 1.6719077568134173, "percentage": 8.36, "elapsed_time": "0:07:57", "remaining_time": "1:27:18", "throughput": 4333.14, "total_tokens": 2070704} {"current_steps": 3195, "total_steps": 38160, "loss": 0.4786, "lr": 0.0008370020964360588, "epoch": 1.6745283018867925, "percentage": 8.37, "elapsed_time": "0:07:58", "remaining_time": "1:27:18", "throughput": 4333.84, "total_tokens": 2074448} {"current_steps": 3200, "total_steps": 38160, "loss": 0.5169, "lr": 0.0008383123689727464, "epoch": 1.6771488469601676, "percentage": 8.39, "elapsed_time": "0:07:59", "remaining_time": "1:27:17", "throughput": 4334.11, "total_tokens": 2077712} {"current_steps": 3205, "total_steps": 38160, "loss": 0.4505, "lr": 0.000839622641509434, "epoch": 1.679769392033543, "percentage": 8.4, "elapsed_time": "0:08:00", "remaining_time": "1:27:17", "throughput": 4335.12, "total_tokens": 2081808} {"current_steps": 3210, "total_steps": 38160, "loss": 0.479, "lr": 0.0008409329140461216, "epoch": 1.6823899371069182, "percentage": 8.41, "elapsed_time": "0:08:01", "remaining_time": "1:27:18", "throughput": 4336.57, "total_tokens": 2086352} {"current_steps": 3215, "total_steps": 38160, "loss": 0.4856, "lr": 0.0008422431865828093, "epoch": 1.6850104821802936, "percentage": 8.43, "elapsed_time": "0:08:01", "remaining_time": "1:27:15", "throughput": 4335.82, "total_tokens": 2088528} {"current_steps": 3220, "total_steps": 38160, "loss": 0.3479, "lr": 0.0008435534591194969, "epoch": 1.6876310272536688, "percentage": 8.44, "elapsed_time": "0:08:02", "remaining_time": "1:27:15", "throughput": 4336.83, "total_tokens": 2092688} {"current_steps": 3225, "total_steps": 38160, "loss": 0.4925, "lr": 0.0008448637316561845, "epoch": 1.690251572327044, "percentage": 8.45, "elapsed_time": "0:08:03", "remaining_time": "1:27:16", "throughput": 4338.3, "total_tokens": 2097232} {"current_steps": 3230, "total_steps": 38160, "loss": 0.5505, "lr": 0.0008461740041928722, "epoch": 1.6928721174004193, "percentage": 8.46, "elapsed_time": "0:08:04", "remaining_time": "1:27:15", "throughput": 4338.07, "total_tokens": 2100016} {"current_steps": 3235, "total_steps": 38160, "loss": 0.4839, "lr": 0.0008474842767295598, "epoch": 1.6954926624737947, "percentage": 8.48, "elapsed_time": "0:08:04", "remaining_time": "1:27:14", "throughput": 4338.55, "total_tokens": 2103568} {"current_steps": 3240, "total_steps": 38160, "loss": 0.4973, "lr": 0.0008487945492662474, "epoch": 1.6981132075471699, "percentage": 8.49, "elapsed_time": "0:08:05", "remaining_time": "1:27:14", "throughput": 4339.69, "total_tokens": 2107792} {"current_steps": 3245, "total_steps": 38160, "loss": 0.5306, "lr": 0.000850104821802935, "epoch": 1.700733752620545, "percentage": 8.5, "elapsed_time": "0:08:06", "remaining_time": "1:27:13", "throughput": 4339.53, "total_tokens": 2110672} {"current_steps": 3250, "total_steps": 38160, "loss": 0.4757, "lr": 0.0008514150943396226, "epoch": 1.7033542976939202, "percentage": 8.52, "elapsed_time": "0:08:07", "remaining_time": "1:27:11", "throughput": 4339.26, "total_tokens": 2113424} {"current_steps": 3255, "total_steps": 38160, "loss": 0.4548, "lr": 0.0008527253668763103, "epoch": 1.7059748427672956, "percentage": 8.53, "elapsed_time": "0:08:07", "remaining_time": "1:27:11", "throughput": 4339.7, "total_tokens": 2116944} {"current_steps": 3260, "total_steps": 38160, "loss": 0.5558, "lr": 0.0008540356394129979, "epoch": 1.708595387840671, "percentage": 8.54, "elapsed_time": "0:08:08", "remaining_time": "1:27:10", "throughput": 4340.13, "total_tokens": 2120304} {"current_steps": 3265, "total_steps": 38160, "loss": 0.4992, "lr": 0.0008553459119496856, "epoch": 1.7112159329140462, "percentage": 8.56, "elapsed_time": "0:08:09", "remaining_time": "1:27:09", "throughput": 4340.98, "total_tokens": 2124208} {"current_steps": 3270, "total_steps": 38160, "loss": 0.473, "lr": 0.0008566561844863731, "epoch": 1.7138364779874213, "percentage": 8.57, "elapsed_time": "0:08:10", "remaining_time": "1:27:08", "throughput": 4341.32, "total_tokens": 2127536} {"current_steps": 3275, "total_steps": 38160, "loss": 0.3768, "lr": 0.0008579664570230608, "epoch": 1.7164570230607965, "percentage": 8.58, "elapsed_time": "0:08:10", "remaining_time": "1:27:07", "throughput": 4341.67, "total_tokens": 2130896} {"current_steps": 3280, "total_steps": 38160, "loss": 0.5606, "lr": 0.0008592767295597484, "epoch": 1.719077568134172, "percentage": 8.6, "elapsed_time": "0:08:11", "remaining_time": "1:27:06", "throughput": 4341.72, "total_tokens": 2133968} {"current_steps": 3285, "total_steps": 38160, "loss": 0.5378, "lr": 0.000860587002096436, "epoch": 1.7216981132075473, "percentage": 8.61, "elapsed_time": "0:08:12", "remaining_time": "1:27:06", "throughput": 4342.31, "total_tokens": 2137648} {"current_steps": 3290, "total_steps": 38160, "loss": 0.5685, "lr": 0.0008618972746331238, "epoch": 1.7243186582809225, "percentage": 8.62, "elapsed_time": "0:08:12", "remaining_time": "1:27:04", "throughput": 4342.07, "total_tokens": 2140368} {"current_steps": 3295, "total_steps": 38160, "loss": 0.4027, "lr": 0.0008632075471698114, "epoch": 1.7269392033542976, "percentage": 8.63, "elapsed_time": "0:08:13", "remaining_time": "1:27:02", "throughput": 4341.81, "total_tokens": 2143088} {"current_steps": 3300, "total_steps": 38160, "loss": 0.597, "lr": 0.000864517819706499, "epoch": 1.7295597484276728, "percentage": 8.65, "elapsed_time": "0:08:14", "remaining_time": "1:27:01", "throughput": 4342.04, "total_tokens": 2146352} {"current_steps": 3305, "total_steps": 38160, "loss": 0.4695, "lr": 0.0008658280922431866, "epoch": 1.7321802935010482, "percentage": 8.66, "elapsed_time": "0:08:15", "remaining_time": "1:27:01", "throughput": 4342.89, "total_tokens": 2150352} {"current_steps": 3310, "total_steps": 38160, "loss": 0.5415, "lr": 0.0008671383647798742, "epoch": 1.7348008385744236, "percentage": 8.67, "elapsed_time": "0:08:15", "remaining_time": "1:27:00", "throughput": 4343.09, "total_tokens": 2153584} {"current_steps": 3315, "total_steps": 38160, "loss": 0.5263, "lr": 0.0008684486373165619, "epoch": 1.7374213836477987, "percentage": 8.69, "elapsed_time": "0:08:16", "remaining_time": "1:27:00", "throughput": 4343.88, "total_tokens": 2157488} {"current_steps": 3320, "total_steps": 38160, "loss": 0.4566, "lr": 0.0008697589098532495, "epoch": 1.740041928721174, "percentage": 8.7, "elapsed_time": "0:08:17", "remaining_time": "1:26:58", "throughput": 4343.54, "total_tokens": 2160144} {"current_steps": 3325, "total_steps": 38160, "loss": 0.7099, "lr": 0.0008710691823899372, "epoch": 1.7426624737945493, "percentage": 8.71, "elapsed_time": "0:08:17", "remaining_time": "1:26:57", "throughput": 4343.17, "total_tokens": 2162768} {"current_steps": 3330, "total_steps": 38160, "loss": 0.669, "lr": 0.0008723794549266247, "epoch": 1.7452830188679245, "percentage": 8.73, "elapsed_time": "0:08:18", "remaining_time": "1:26:55", "throughput": 4343.09, "total_tokens": 2165616} {"current_steps": 3335, "total_steps": 38160, "loss": 0.4511, "lr": 0.0008736897274633124, "epoch": 1.7479035639412999, "percentage": 8.74, "elapsed_time": "0:08:19", "remaining_time": "1:26:54", "throughput": 4343.07, "total_tokens": 2168656} {"current_steps": 3340, "total_steps": 38160, "loss": 0.4306, "lr": 0.000875, "epoch": 1.750524109014675, "percentage": 8.75, "elapsed_time": "0:08:20", "remaining_time": "1:26:53", "throughput": 4343.38, "total_tokens": 2172048} {"current_steps": 3345, "total_steps": 38160, "loss": 0.3893, "lr": 0.0008763102725366876, "epoch": 1.7531446540880502, "percentage": 8.77, "elapsed_time": "0:08:20", "remaining_time": "1:26:52", "throughput": 4343.33, "total_tokens": 2175056} {"current_steps": 3350, "total_steps": 38160, "loss": 0.5543, "lr": 0.0008776205450733753, "epoch": 1.7557651991614256, "percentage": 8.78, "elapsed_time": "0:08:21", "remaining_time": "1:26:51", "throughput": 4343.8, "total_tokens": 2178512} {"current_steps": 3355, "total_steps": 38160, "loss": 0.4808, "lr": 0.0008789308176100629, "epoch": 1.758385744234801, "percentage": 8.79, "elapsed_time": "0:08:22", "remaining_time": "1:26:50", "throughput": 4344.41, "total_tokens": 2182096} {"current_steps": 3360, "total_steps": 38160, "loss": 0.4555, "lr": 0.0008802410901467506, "epoch": 1.7610062893081762, "percentage": 8.81, "elapsed_time": "0:08:23", "remaining_time": "1:26:50", "throughput": 4345.07, "total_tokens": 2185840} {"current_steps": 3365, "total_steps": 38160, "loss": 0.5172, "lr": 0.0008815513626834381, "epoch": 1.7636268343815513, "percentage": 8.82, "elapsed_time": "0:08:23", "remaining_time": "1:26:48", "throughput": 4344.92, "total_tokens": 2188720} {"current_steps": 3370, "total_steps": 38160, "loss": 0.5401, "lr": 0.0008828616352201258, "epoch": 1.7662473794549265, "percentage": 8.83, "elapsed_time": "0:08:24", "remaining_time": "1:26:48", "throughput": 4345.39, "total_tokens": 2192240} {"current_steps": 3375, "total_steps": 38160, "loss": 0.4379, "lr": 0.0008841719077568134, "epoch": 1.7688679245283019, "percentage": 8.84, "elapsed_time": "0:08:25", "remaining_time": "1:26:47", "throughput": 4346.16, "total_tokens": 2196112} {"current_steps": 3380, "total_steps": 38160, "loss": 0.5925, "lr": 0.000885482180293501, "epoch": 1.7714884696016773, "percentage": 8.86, "elapsed_time": "0:08:26", "remaining_time": "1:26:48", "throughput": 4347.16, "total_tokens": 2200272} {"current_steps": 3385, "total_steps": 38160, "loss": 0.5263, "lr": 0.0008867924528301887, "epoch": 1.7741090146750524, "percentage": 8.87, "elapsed_time": "0:08:26", "remaining_time": "1:26:46", "throughput": 4346.88, "total_tokens": 2203024} {"current_steps": 3390, "total_steps": 38160, "loss": 0.4141, "lr": 0.0008881027253668763, "epoch": 1.7767295597484276, "percentage": 8.88, "elapsed_time": "0:08:27", "remaining_time": "1:26:45", "throughput": 4346.93, "total_tokens": 2206000} {"current_steps": 3395, "total_steps": 38160, "loss": 0.7173, "lr": 0.000889412997903564, "epoch": 1.7793501048218028, "percentage": 8.9, "elapsed_time": "0:08:28", "remaining_time": "1:26:44", "throughput": 4347.26, "total_tokens": 2209392} {"current_steps": 3400, "total_steps": 38160, "loss": 0.4416, "lr": 0.0008907232704402516, "epoch": 1.7819706498951782, "percentage": 8.91, "elapsed_time": "0:08:29", "remaining_time": "1:26:45", "throughput": 4349.12, "total_tokens": 2214480} {"current_steps": 3405, "total_steps": 38160, "loss": 0.4896, "lr": 0.0008920335429769392, "epoch": 1.7845911949685536, "percentage": 8.92, "elapsed_time": "0:08:29", "remaining_time": "1:26:44", "throughput": 4349.48, "total_tokens": 2217904} {"current_steps": 3410, "total_steps": 38160, "loss": 0.4756, "lr": 0.0008933438155136269, "epoch": 1.7872117400419287, "percentage": 8.94, "elapsed_time": "0:08:30", "remaining_time": "1:26:43", "throughput": 4349.91, "total_tokens": 2221328} {"current_steps": 3415, "total_steps": 38160, "loss": 0.562, "lr": 0.0008946540880503145, "epoch": 1.789832285115304, "percentage": 8.95, "elapsed_time": "0:08:31", "remaining_time": "1:26:42", "throughput": 4349.87, "total_tokens": 2224304} {"current_steps": 3420, "total_steps": 38160, "loss": 0.3955, "lr": 0.0008959643605870022, "epoch": 1.7924528301886793, "percentage": 8.96, "elapsed_time": "0:08:31", "remaining_time": "1:26:40", "throughput": 4349.53, "total_tokens": 2226928} {"current_steps": 3425, "total_steps": 38160, "loss": 0.5797, "lr": 0.0008972746331236897, "epoch": 1.7950733752620545, "percentage": 8.98, "elapsed_time": "0:08:32", "remaining_time": "1:26:39", "throughput": 4349.62, "total_tokens": 2230032} {"current_steps": 3430, "total_steps": 38160, "loss": 0.6297, "lr": 0.0008985849056603774, "epoch": 1.7976939203354299, "percentage": 8.99, "elapsed_time": "0:08:33", "remaining_time": "1:26:38", "throughput": 4349.53, "total_tokens": 2232976} {"current_steps": 3435, "total_steps": 38160, "loss": 0.4695, "lr": 0.000899895178197065, "epoch": 1.800314465408805, "percentage": 9.0, "elapsed_time": "0:08:34", "remaining_time": "1:26:36", "throughput": 4349.28, "total_tokens": 2235664} {"current_steps": 3440, "total_steps": 38160, "loss": 0.4583, "lr": 0.0009012054507337526, "epoch": 1.8029350104821802, "percentage": 9.01, "elapsed_time": "0:08:34", "remaining_time": "1:26:34", "throughput": 4349.1, "total_tokens": 2238448} {"current_steps": 3445, "total_steps": 38160, "loss": 0.4612, "lr": 0.0009025157232704403, "epoch": 1.8055555555555556, "percentage": 9.03, "elapsed_time": "0:08:35", "remaining_time": "1:26:33", "throughput": 4349.08, "total_tokens": 2241456} {"current_steps": 3450, "total_steps": 38160, "loss": 0.5867, "lr": 0.0009038259958071279, "epoch": 1.808176100628931, "percentage": 9.04, "elapsed_time": "0:08:36", "remaining_time": "1:26:32", "throughput": 4349.42, "total_tokens": 2244848} {"current_steps": 3455, "total_steps": 38160, "loss": 0.387, "lr": 0.0009051362683438156, "epoch": 1.8107966457023061, "percentage": 9.05, "elapsed_time": "0:08:36", "remaining_time": "1:26:30", "throughput": 4348.86, "total_tokens": 2247216} {"current_steps": 3460, "total_steps": 38160, "loss": 0.6554, "lr": 0.0009064465408805031, "epoch": 1.8134171907756813, "percentage": 9.07, "elapsed_time": "0:08:37", "remaining_time": "1:26:29", "throughput": 4348.78, "total_tokens": 2250160} {"current_steps": 3465, "total_steps": 38160, "loss": 0.45, "lr": 0.0009077568134171907, "epoch": 1.8160377358490565, "percentage": 9.08, "elapsed_time": "0:08:38", "remaining_time": "1:26:27", "throughput": 4348.45, "total_tokens": 2252784} {"current_steps": 3470, "total_steps": 38160, "loss": 0.4851, "lr": 0.0009090670859538784, "epoch": 1.8186582809224319, "percentage": 9.09, "elapsed_time": "0:08:38", "remaining_time": "1:26:25", "throughput": 4348.16, "total_tokens": 2255504} {"current_steps": 3475, "total_steps": 38160, "loss": 0.4736, "lr": 0.000910377358490566, "epoch": 1.8212788259958073, "percentage": 9.11, "elapsed_time": "0:08:39", "remaining_time": "1:26:27", "throughput": 4350.46, "total_tokens": 2261040} {"current_steps": 3480, "total_steps": 38160, "loss": 0.4346, "lr": 0.0009116876310272537, "epoch": 1.8238993710691824, "percentage": 9.12, "elapsed_time": "0:08:40", "remaining_time": "1:26:26", "throughput": 4350.98, "total_tokens": 2264656} {"current_steps": 3485, "total_steps": 38160, "loss": 0.4021, "lr": 0.0009129979035639413, "epoch": 1.8265199161425576, "percentage": 9.13, "elapsed_time": "0:08:41", "remaining_time": "1:26:26", "throughput": 4351.61, "total_tokens": 2268368} {"current_steps": 3490, "total_steps": 38160, "loss": 0.5934, "lr": 0.000914308176100629, "epoch": 1.8291404612159328, "percentage": 9.15, "elapsed_time": "0:08:41", "remaining_time": "1:26:24", "throughput": 4351.38, "total_tokens": 2271056} {"current_steps": 3495, "total_steps": 38160, "loss": 0.8365, "lr": 0.0009156184486373166, "epoch": 1.8317610062893082, "percentage": 9.16, "elapsed_time": "0:08:42", "remaining_time": "1:26:24", "throughput": 4351.9, "total_tokens": 2274672} {"current_steps": 3500, "total_steps": 38160, "loss": 0.4064, "lr": 0.0009169287211740042, "epoch": 1.8343815513626835, "percentage": 9.17, "elapsed_time": "0:08:43", "remaining_time": "1:26:23", "throughput": 4352.25, "total_tokens": 2278064} {"current_steps": 3505, "total_steps": 38160, "loss": 0.5108, "lr": 0.0009182389937106919, "epoch": 1.8370020964360587, "percentage": 9.19, "elapsed_time": "0:08:44", "remaining_time": "1:26:21", "throughput": 4351.68, "total_tokens": 2280400} {"current_steps": 3510, "total_steps": 38160, "loss": 0.544, "lr": 0.0009195492662473795, "epoch": 1.8396226415094339, "percentage": 9.2, "elapsed_time": "0:08:44", "remaining_time": "1:26:20", "throughput": 4351.97, "total_tokens": 2283728} {"current_steps": 3515, "total_steps": 38160, "loss": 0.4519, "lr": 0.0009208595387840672, "epoch": 1.8422431865828093, "percentage": 9.21, "elapsed_time": "0:08:45", "remaining_time": "1:26:18", "throughput": 4351.74, "total_tokens": 2286448} {"current_steps": 3520, "total_steps": 38160, "loss": 0.548, "lr": 0.0009221698113207547, "epoch": 1.8448637316561844, "percentage": 9.22, "elapsed_time": "0:08:46", "remaining_time": "1:26:17", "throughput": 4351.94, "total_tokens": 2289648} {"current_steps": 3525, "total_steps": 38160, "loss": 0.4397, "lr": 0.0009234800838574424, "epoch": 1.8474842767295598, "percentage": 9.24, "elapsed_time": "0:08:46", "remaining_time": "1:26:16", "throughput": 4351.81, "total_tokens": 2292528} {"current_steps": 3530, "total_steps": 38160, "loss": 0.4383, "lr": 0.00092479035639413, "epoch": 1.850104821802935, "percentage": 9.25, "elapsed_time": "0:08:47", "remaining_time": "1:26:14", "throughput": 4351.77, "total_tokens": 2295472} {"current_steps": 3535, "total_steps": 38160, "loss": 0.4506, "lr": 0.0009261006289308176, "epoch": 1.8527253668763102, "percentage": 9.26, "elapsed_time": "0:08:48", "remaining_time": "1:26:13", "throughput": 4351.99, "total_tokens": 2298800} {"current_steps": 3540, "total_steps": 38160, "loss": 0.5774, "lr": 0.0009274109014675053, "epoch": 1.8553459119496856, "percentage": 9.28, "elapsed_time": "0:08:48", "remaining_time": "1:26:12", "throughput": 4351.75, "total_tokens": 2301520} {"current_steps": 3545, "total_steps": 38160, "loss": 0.4118, "lr": 0.0009287211740041929, "epoch": 1.857966457023061, "percentage": 9.29, "elapsed_time": "0:08:49", "remaining_time": "1:26:11", "throughput": 4351.92, "total_tokens": 2304784} {"current_steps": 3550, "total_steps": 38160, "loss": 0.521, "lr": 0.0009300314465408806, "epoch": 1.8605870020964361, "percentage": 9.3, "elapsed_time": "0:08:50", "remaining_time": "1:26:09", "throughput": 4351.9, "total_tokens": 2307728} {"current_steps": 3555, "total_steps": 38160, "loss": 0.481, "lr": 0.0009313417190775681, "epoch": 1.8632075471698113, "percentage": 9.32, "elapsed_time": "0:08:51", "remaining_time": "1:26:09", "throughput": 4352.94, "total_tokens": 2311888} {"current_steps": 3560, "total_steps": 38160, "loss": 0.4526, "lr": 0.0009326519916142557, "epoch": 1.8658280922431865, "percentage": 9.33, "elapsed_time": "0:08:51", "remaining_time": "1:26:09", "throughput": 4353.44, "total_tokens": 2315536} {"current_steps": 3565, "total_steps": 38160, "loss": 0.5515, "lr": 0.0009339622641509434, "epoch": 1.8684486373165619, "percentage": 9.34, "elapsed_time": "0:08:52", "remaining_time": "1:26:07", "throughput": 4353.0, "total_tokens": 2318096} {"current_steps": 3570, "total_steps": 38160, "loss": 0.4313, "lr": 0.000935272536687631, "epoch": 1.8710691823899372, "percentage": 9.36, "elapsed_time": "0:08:53", "remaining_time": "1:26:06", "throughput": 4353.13, "total_tokens": 2321168} {"current_steps": 3575, "total_steps": 38160, "loss": 0.4951, "lr": 0.0009365828092243187, "epoch": 1.8736897274633124, "percentage": 9.37, "elapsed_time": "0:08:53", "remaining_time": "1:26:04", "throughput": 4352.79, "total_tokens": 2323824} {"current_steps": 3580, "total_steps": 38160, "loss": 0.5668, "lr": 0.0009378930817610063, "epoch": 1.8763102725366876, "percentage": 9.38, "elapsed_time": "0:08:54", "remaining_time": "1:26:03", "throughput": 4352.69, "total_tokens": 2326672} {"current_steps": 3585, "total_steps": 38160, "loss": 0.4095, "lr": 0.0009392033542976939, "epoch": 1.8789308176100628, "percentage": 9.39, "elapsed_time": "0:08:55", "remaining_time": "1:26:03", "throughput": 4353.46, "total_tokens": 2330640} {"current_steps": 3590, "total_steps": 38160, "loss": 0.4044, "lr": 0.0009405136268343816, "epoch": 1.8815513626834381, "percentage": 9.41, "elapsed_time": "0:08:55", "remaining_time": "1:26:01", "throughput": 4353.09, "total_tokens": 2333232} {"current_steps": 3595, "total_steps": 38160, "loss": 0.4982, "lr": 0.0009418238993710692, "epoch": 1.8841719077568135, "percentage": 9.42, "elapsed_time": "0:08:56", "remaining_time": "1:26:00", "throughput": 4353.42, "total_tokens": 2336560} {"current_steps": 3600, "total_steps": 38160, "loss": 0.5898, "lr": 0.0009431341719077569, "epoch": 1.8867924528301887, "percentage": 9.43, "elapsed_time": "0:08:57", "remaining_time": "1:25:59", "throughput": 4353.53, "total_tokens": 2339632} {"current_steps": 3605, "total_steps": 38160, "loss": 0.509, "lr": 0.0009444444444444445, "epoch": 1.8894129979035639, "percentage": 9.45, "elapsed_time": "0:08:58", "remaining_time": "1:26:04", "throughput": 4357.0, "total_tokens": 2347440} {"current_steps": 3610, "total_steps": 38160, "loss": 0.4609, "lr": 0.0009457547169811322, "epoch": 1.892033542976939, "percentage": 9.46, "elapsed_time": "0:08:59", "remaining_time": "1:26:03", "throughput": 4357.49, "total_tokens": 2350992} {"current_steps": 3615, "total_steps": 38160, "loss": 0.4771, "lr": 0.0009470649895178197, "epoch": 1.8946540880503144, "percentage": 9.47, "elapsed_time": "0:09:00", "remaining_time": "1:26:02", "throughput": 4357.78, "total_tokens": 2354384} {"current_steps": 3620, "total_steps": 38160, "loss": 0.6047, "lr": 0.0009483752620545073, "epoch": 1.8972746331236898, "percentage": 9.49, "elapsed_time": "0:09:00", "remaining_time": "1:26:00", "throughput": 4357.23, "total_tokens": 2356752} {"current_steps": 3625, "total_steps": 38160, "loss": 0.4002, "lr": 0.000949685534591195, "epoch": 1.899895178197065, "percentage": 9.5, "elapsed_time": "0:09:01", "remaining_time": "1:25:59", "throughput": 4357.27, "total_tokens": 2359728} {"current_steps": 3630, "total_steps": 38160, "loss": 0.4928, "lr": 0.0009509958071278826, "epoch": 1.9025157232704402, "percentage": 9.51, "elapsed_time": "0:09:02", "remaining_time": "1:25:59", "throughput": 4358.07, "total_tokens": 2363728} {"current_steps": 3635, "total_steps": 38160, "loss": 0.5778, "lr": 0.0009523060796645703, "epoch": 1.9051362683438156, "percentage": 9.53, "elapsed_time": "0:09:03", "remaining_time": "1:25:57", "throughput": 4357.8, "total_tokens": 2366480} {"current_steps": 3640, "total_steps": 38160, "loss": 0.4329, "lr": 0.0009536163522012579, "epoch": 1.9077568134171907, "percentage": 9.54, "elapsed_time": "0:09:03", "remaining_time": "1:25:56", "throughput": 4357.59, "total_tokens": 2369232} {"current_steps": 3645, "total_steps": 38160, "loss": 0.6186, "lr": 0.0009549266247379456, "epoch": 1.9103773584905661, "percentage": 9.55, "elapsed_time": "0:09:04", "remaining_time": "1:25:55", "throughput": 4357.9, "total_tokens": 2372688} {"current_steps": 3650, "total_steps": 38160, "loss": 0.5194, "lr": 0.0009562368972746331, "epoch": 1.9129979035639413, "percentage": 9.56, "elapsed_time": "0:09:05", "remaining_time": "1:25:55", "throughput": 4358.83, "total_tokens": 2376976} {"current_steps": 3655, "total_steps": 38160, "loss": 0.4431, "lr": 0.0009575471698113207, "epoch": 1.9156184486373165, "percentage": 9.58, "elapsed_time": "0:09:06", "remaining_time": "1:25:54", "throughput": 4358.89, "total_tokens": 2380112} {"current_steps": 3660, "total_steps": 38160, "loss": 0.4795, "lr": 0.0009588574423480084, "epoch": 1.9182389937106918, "percentage": 9.59, "elapsed_time": "0:09:06", "remaining_time": "1:25:52", "throughput": 4358.44, "total_tokens": 2382608} {"current_steps": 3665, "total_steps": 38160, "loss": 0.567, "lr": 0.000960167714884696, "epoch": 1.9208595387840672, "percentage": 9.6, "elapsed_time": "0:09:07", "remaining_time": "1:25:51", "throughput": 4358.27, "total_tokens": 2385424} {"current_steps": 3670, "total_steps": 38160, "loss": 0.5339, "lr": 0.0009614779874213837, "epoch": 1.9234800838574424, "percentage": 9.62, "elapsed_time": "0:09:08", "remaining_time": "1:25:52", "throughput": 4359.57, "total_tokens": 2390032} {"current_steps": 3675, "total_steps": 38160, "loss": 0.4209, "lr": 0.0009627882599580712, "epoch": 1.9261006289308176, "percentage": 9.63, "elapsed_time": "0:09:08", "remaining_time": "1:25:51", "throughput": 4359.79, "total_tokens": 2393328} {"current_steps": 3680, "total_steps": 38160, "loss": 0.3794, "lr": 0.0009640985324947589, "epoch": 1.9287211740041927, "percentage": 9.64, "elapsed_time": "0:09:09", "remaining_time": "1:25:50", "throughput": 4359.85, "total_tokens": 2396432} {"current_steps": 3685, "total_steps": 38160, "loss": 0.5121, "lr": 0.0009654088050314465, "epoch": 1.9313417190775681, "percentage": 9.66, "elapsed_time": "0:09:10", "remaining_time": "1:25:49", "throughput": 4360.26, "total_tokens": 2399952} {"current_steps": 3690, "total_steps": 38160, "loss": 0.4302, "lr": 0.0009667190775681342, "epoch": 1.9339622641509435, "percentage": 9.67, "elapsed_time": "0:09:11", "remaining_time": "1:25:49", "throughput": 4361.36, "total_tokens": 2404240} {"current_steps": 3695, "total_steps": 38160, "loss": 0.3524, "lr": 0.0009680293501048219, "epoch": 1.9365828092243187, "percentage": 9.68, "elapsed_time": "0:09:12", "remaining_time": "1:25:49", "throughput": 4362.02, "total_tokens": 2408080} {"current_steps": 3700, "total_steps": 38160, "loss": 0.4824, "lr": 0.0009693396226415095, "epoch": 1.9392033542976939, "percentage": 9.7, "elapsed_time": "0:09:12", "remaining_time": "1:25:49", "throughput": 4362.81, "total_tokens": 2412080} {"current_steps": 3705, "total_steps": 38160, "loss": 0.3581, "lr": 0.0009706498951781972, "epoch": 1.941823899371069, "percentage": 9.71, "elapsed_time": "0:09:13", "remaining_time": "1:25:50", "throughput": 4364.39, "total_tokens": 2417136} {"current_steps": 3710, "total_steps": 38160, "loss": 0.4409, "lr": 0.0009719601677148847, "epoch": 1.9444444444444444, "percentage": 9.72, "elapsed_time": "0:09:14", "remaining_time": "1:25:49", "throughput": 4364.92, "total_tokens": 2420720} {"current_steps": 3715, "total_steps": 38160, "loss": 0.4507, "lr": 0.0009732704402515723, "epoch": 1.9470649895178198, "percentage": 9.74, "elapsed_time": "0:09:15", "remaining_time": "1:25:48", "throughput": 4364.78, "total_tokens": 2423632} {"current_steps": 3720, "total_steps": 38160, "loss": 0.5608, "lr": 0.00097458071278826, "epoch": 1.949685534591195, "percentage": 9.75, "elapsed_time": "0:09:15", "remaining_time": "1:25:47", "throughput": 4364.75, "total_tokens": 2426704} {"current_steps": 3725, "total_steps": 38160, "loss": 0.476, "lr": 0.0009758909853249476, "epoch": 1.9523060796645701, "percentage": 9.76, "elapsed_time": "0:09:16", "remaining_time": "1:25:47", "throughput": 4365.76, "total_tokens": 2431056} {"current_steps": 3730, "total_steps": 38160, "loss": 0.35, "lr": 0.0009772012578616353, "epoch": 1.9549266247379455, "percentage": 9.77, "elapsed_time": "0:09:17", "remaining_time": "1:25:46", "throughput": 4365.46, "total_tokens": 2433808} {"current_steps": 3735, "total_steps": 38160, "loss": 0.4395, "lr": 0.0009785115303983228, "epoch": 1.9575471698113207, "percentage": 9.79, "elapsed_time": "0:09:18", "remaining_time": "1:25:45", "throughput": 4365.56, "total_tokens": 2437008} {"current_steps": 3740, "total_steps": 38160, "loss": 0.6408, "lr": 0.0009798218029350107, "epoch": 1.960167714884696, "percentage": 9.8, "elapsed_time": "0:09:19", "remaining_time": "1:25:45", "throughput": 4366.65, "total_tokens": 2441520} {"current_steps": 3745, "total_steps": 38160, "loss": 0.3493, "lr": 0.0009811320754716981, "epoch": 1.9627882599580713, "percentage": 9.81, "elapsed_time": "0:09:19", "remaining_time": "1:25:44", "throughput": 4366.47, "total_tokens": 2444400} {"current_steps": 3750, "total_steps": 38160, "loss": 0.4838, "lr": 0.0009824423480083858, "epoch": 1.9654088050314464, "percentage": 9.83, "elapsed_time": "0:09:20", "remaining_time": "1:25:42", "throughput": 4366.34, "total_tokens": 2447248} {"current_steps": 3755, "total_steps": 38160, "loss": 0.4921, "lr": 0.0009837526205450735, "epoch": 1.9680293501048218, "percentage": 9.84, "elapsed_time": "0:09:21", "remaining_time": "1:25:41", "throughput": 4366.34, "total_tokens": 2450352} {"current_steps": 3760, "total_steps": 38160, "loss": 0.5671, "lr": 0.000985062893081761, "epoch": 1.9706498951781972, "percentage": 9.85, "elapsed_time": "0:09:21", "remaining_time": "1:25:40", "throughput": 4366.07, "total_tokens": 2453072} {"current_steps": 3765, "total_steps": 38160, "loss": 0.4291, "lr": 0.0009863731656184487, "epoch": 1.9732704402515724, "percentage": 9.87, "elapsed_time": "0:09:22", "remaining_time": "1:25:39", "throughput": 4366.12, "total_tokens": 2456112} {"current_steps": 3770, "total_steps": 38160, "loss": 0.4326, "lr": 0.0009876834381551364, "epoch": 1.9758909853249476, "percentage": 9.88, "elapsed_time": "0:09:23", "remaining_time": "1:25:38", "throughput": 4366.15, "total_tokens": 2459280} {"current_steps": 3775, "total_steps": 38160, "loss": 0.4166, "lr": 0.0009889937106918238, "epoch": 1.9785115303983227, "percentage": 9.89, "elapsed_time": "0:09:23", "remaining_time": "1:25:36", "throughput": 4365.77, "total_tokens": 2462000} {"current_steps": 3780, "total_steps": 38160, "loss": 0.4925, "lr": 0.0009903039832285115, "epoch": 1.9811320754716981, "percentage": 9.91, "elapsed_time": "0:09:24", "remaining_time": "1:25:34", "throughput": 4365.39, "total_tokens": 2464592} {"current_steps": 3785, "total_steps": 38160, "loss": 0.5555, "lr": 0.0009916142557651992, "epoch": 1.9837526205450735, "percentage": 9.92, "elapsed_time": "0:09:25", "remaining_time": "1:25:35", "throughput": 4366.27, "total_tokens": 2468784} {"current_steps": 3790, "total_steps": 38160, "loss": 0.3722, "lr": 0.000992924528301887, "epoch": 1.9863731656184487, "percentage": 9.93, "elapsed_time": "0:09:26", "remaining_time": "1:25:33", "throughput": 4366.31, "total_tokens": 2471824} {"current_steps": 3795, "total_steps": 38160, "loss": 0.7072, "lr": 0.0009942348008385744, "epoch": 1.9889937106918238, "percentage": 9.94, "elapsed_time": "0:09:26", "remaining_time": "1:25:32", "throughput": 4366.2, "total_tokens": 2474704} {"current_steps": 3800, "total_steps": 38160, "loss": 0.567, "lr": 0.000995545073375262, "epoch": 1.991614255765199, "percentage": 9.96, "elapsed_time": "0:09:27", "remaining_time": "1:25:30", "throughput": 4366.03, "total_tokens": 2477520} {"current_steps": 3805, "total_steps": 38160, "loss": 0.3641, "lr": 0.0009968553459119497, "epoch": 1.9942348008385744, "percentage": 9.97, "elapsed_time": "0:09:28", "remaining_time": "1:25:29", "throughput": 4365.9, "total_tokens": 2480528} {"current_steps": 3810, "total_steps": 38160, "loss": 0.5017, "lr": 0.0009981656184486372, "epoch": 1.9968553459119498, "percentage": 9.98, "elapsed_time": "0:09:28", "remaining_time": "1:25:29", "throughput": 4366.7, "total_tokens": 2484560} {"current_steps": 3815, "total_steps": 38160, "loss": 0.5121, "lr": 0.000999475890985325, "epoch": 1.999475890985325, "percentage": 10.0, "elapsed_time": "0:09:29", "remaining_time": "1:25:30", "throughput": 4368.35, "total_tokens": 2489712} {"current_steps": 3816, "total_steps": 38160, "eval_loss": 0.496399462223053, "epoch": 2.0, "percentage": 10.0, "elapsed_time": "0:09:43", "remaining_time": "1:27:35", "throughput": 4263.83, "total_tokens": 2489840} {"current_steps": 3820, "total_steps": 38160, "loss": 0.4879, "lr": 0.0009999999811730266, "epoch": 2.0020964360587, "percentage": 10.01, "elapsed_time": "0:09:46", "remaining_time": "1:27:50", "throughput": 4252.3, "total_tokens": 2493040} {"current_steps": 3825, "total_steps": 38160, "loss": 0.5338, "lr": 0.000999999866119305, "epoch": 2.0047169811320753, "percentage": 10.02, "elapsed_time": "0:09:46", "remaining_time": "1:27:49", "throughput": 4252.54, "total_tokens": 2496240} {"current_steps": 3830, "total_steps": 38160, "loss": 0.5256, "lr": 0.000999999646471316, "epoch": 2.007337526205451, "percentage": 10.04, "elapsed_time": "0:09:47", "remaining_time": "1:27:47", "throughput": 4252.62, "total_tokens": 2499216} {"current_steps": 3835, "total_steps": 38160, "loss": 0.5319, "lr": 0.0009999993222291053, "epoch": 2.009958071278826, "percentage": 10.05, "elapsed_time": "0:09:48", "remaining_time": "1:27:46", "throughput": 4252.81, "total_tokens": 2502352} {"current_steps": 3840, "total_steps": 38160, "loss": 0.5403, "lr": 0.0009999988933927404, "epoch": 2.0125786163522013, "percentage": 10.06, "elapsed_time": "0:09:49", "remaining_time": "1:27:45", "throughput": 4253.05, "total_tokens": 2505584} {"current_steps": 3845, "total_steps": 38160, "loss": 0.4196, "lr": 0.0009999983599623115, "epoch": 2.0151991614255764, "percentage": 10.08, "elapsed_time": "0:09:49", "remaining_time": "1:27:44", "throughput": 4253.67, "total_tokens": 2509296} {"current_steps": 3850, "total_steps": 38160, "loss": 0.4609, "lr": 0.0009999977219379299, "epoch": 2.0178197064989516, "percentage": 10.09, "elapsed_time": "0:09:50", "remaining_time": "1:27:43", "throughput": 4253.72, "total_tokens": 2512240} {"current_steps": 3855, "total_steps": 38160, "loss": 0.4393, "lr": 0.000999996979319729, "epoch": 2.020440251572327, "percentage": 10.1, "elapsed_time": "0:09:51", "remaining_time": "1:27:42", "throughput": 4254.16, "total_tokens": 2515728} {"current_steps": 3860, "total_steps": 38160, "loss": 0.3968, "lr": 0.0009999961321078645, "epoch": 2.0230607966457024, "percentage": 10.12, "elapsed_time": "0:09:52", "remaining_time": "1:27:41", "throughput": 4254.58, "total_tokens": 2519184} {"current_steps": 3865, "total_steps": 38160, "loss": 0.4077, "lr": 0.0009999951803025134, "epoch": 2.0256813417190775, "percentage": 10.13, "elapsed_time": "0:09:52", "remaining_time": "1:27:40", "throughput": 4254.71, "total_tokens": 2522224} {"current_steps": 3870, "total_steps": 38160, "loss": 0.3915, "lr": 0.0009999941239038747, "epoch": 2.0283018867924527, "percentage": 10.14, "elapsed_time": "0:09:53", "remaining_time": "1:27:39", "throughput": 4255.12, "total_tokens": 2525744} {"current_steps": 3875, "total_steps": 38160, "loss": 0.4206, "lr": 0.0009999929629121696, "epoch": 2.030922431865828, "percentage": 10.15, "elapsed_time": "0:09:54", "remaining_time": "1:27:37", "throughput": 4255.24, "total_tokens": 2528784} {"current_steps": 3880, "total_steps": 38160, "loss": 0.5271, "lr": 0.000999991697327641, "epoch": 2.0335429769392035, "percentage": 10.17, "elapsed_time": "0:09:55", "remaining_time": "1:27:38", "throughput": 4256.21, "total_tokens": 2533040} {"current_steps": 3885, "total_steps": 38160, "loss": 0.4283, "lr": 0.0009999903271505535, "epoch": 2.0361635220125787, "percentage": 10.18, "elapsed_time": "0:09:55", "remaining_time": "1:27:37", "throughput": 4257.0, "total_tokens": 2536848} {"current_steps": 3890, "total_steps": 38160, "loss": 0.4104, "lr": 0.0009999888523811935, "epoch": 2.038784067085954, "percentage": 10.19, "elapsed_time": "0:09:56", "remaining_time": "1:27:36", "throughput": 4257.24, "total_tokens": 2540112} {"current_steps": 3895, "total_steps": 38160, "loss": 0.4591, "lr": 0.00099998727301987, "epoch": 2.041404612159329, "percentage": 10.21, "elapsed_time": "0:09:57", "remaining_time": "1:27:35", "throughput": 4257.3, "total_tokens": 2543184} {"current_steps": 3900, "total_steps": 38160, "loss": 0.4169, "lr": 0.000999985589066913, "epoch": 2.0440251572327046, "percentage": 10.22, "elapsed_time": "0:09:58", "remaining_time": "1:27:33", "throughput": 4257.01, "total_tokens": 2545808} {"current_steps": 3905, "total_steps": 38160, "loss": 0.3426, "lr": 0.000999983800522675, "epoch": 2.04664570230608, "percentage": 10.23, "elapsed_time": "0:09:58", "remaining_time": "1:27:32", "throughput": 4257.09, "total_tokens": 2548816} {"current_steps": 3910, "total_steps": 38160, "loss": 0.5472, "lr": 0.00099998190738753, "epoch": 2.049266247379455, "percentage": 10.25, "elapsed_time": "0:09:59", "remaining_time": "1:27:30", "throughput": 4256.71, "total_tokens": 2551248} {"current_steps": 3915, "total_steps": 38160, "loss": 0.5771, "lr": 0.000999979909661874, "epoch": 2.05188679245283, "percentage": 10.26, "elapsed_time": "0:10:00", "remaining_time": "1:27:29", "throughput": 4257.54, "total_tokens": 2555152} {"current_steps": 3920, "total_steps": 38160, "loss": 0.3919, "lr": 0.000999977807346125, "epoch": 2.0545073375262053, "percentage": 10.27, "elapsed_time": "0:10:00", "remaining_time": "1:27:29", "throughput": 4258.11, "total_tokens": 2558864} {"current_steps": 3925, "total_steps": 38160, "loss": 0.5069, "lr": 0.000999975600440723, "epoch": 2.057127882599581, "percentage": 10.29, "elapsed_time": "0:10:01", "remaining_time": "1:27:28", "throughput": 4258.8, "total_tokens": 2562800} {"current_steps": 3930, "total_steps": 38160, "loss": 0.4634, "lr": 0.000999973288946129, "epoch": 2.059748427672956, "percentage": 10.3, "elapsed_time": "0:10:02", "remaining_time": "1:27:27", "throughput": 4258.92, "total_tokens": 2565904} {"current_steps": 3935, "total_steps": 38160, "loss": 0.4717, "lr": 0.0009999708728628271, "epoch": 2.0623689727463312, "percentage": 10.31, "elapsed_time": "0:10:03", "remaining_time": "1:27:26", "throughput": 4258.94, "total_tokens": 2569104} {"current_steps": 3940, "total_steps": 38160, "loss": 0.5233, "lr": 0.0009999683521913227, "epoch": 2.0649895178197064, "percentage": 10.32, "elapsed_time": "0:10:03", "remaining_time": "1:27:25", "throughput": 4258.67, "total_tokens": 2571888} {"current_steps": 3945, "total_steps": 38160, "loss": 0.4899, "lr": 0.000999965726932143, "epoch": 2.0676100628930816, "percentage": 10.34, "elapsed_time": "0:10:04", "remaining_time": "1:27:24", "throughput": 4258.93, "total_tokens": 2575184} {"current_steps": 3950, "total_steps": 38160, "loss": 0.5132, "lr": 0.0009999629970858371, "epoch": 2.070230607966457, "percentage": 10.35, "elapsed_time": "0:10:05", "remaining_time": "1:27:22", "throughput": 4258.89, "total_tokens": 2578064} {"current_steps": 3955, "total_steps": 38160, "loss": 0.3819, "lr": 0.000999960162652976, "epoch": 2.0728511530398324, "percentage": 10.36, "elapsed_time": "0:10:06", "remaining_time": "1:27:21", "throughput": 4258.69, "total_tokens": 2580848} {"current_steps": 3960, "total_steps": 38160, "loss": 0.4967, "lr": 0.0009999572236341527, "epoch": 2.0754716981132075, "percentage": 10.38, "elapsed_time": "0:10:06", "remaining_time": "1:27:19", "throughput": 4258.84, "total_tokens": 2583920} {"current_steps": 3965, "total_steps": 38160, "loss": 0.44, "lr": 0.000999954180029982, "epoch": 2.0780922431865827, "percentage": 10.39, "elapsed_time": "0:10:07", "remaining_time": "1:27:18", "throughput": 4258.94, "total_tokens": 2586992} {"current_steps": 3970, "total_steps": 38160, "loss": 0.4527, "lr": 0.0009999510318411007, "epoch": 2.080712788259958, "percentage": 10.4, "elapsed_time": "0:10:08", "remaining_time": "1:27:16", "throughput": 4258.29, "total_tokens": 2589136} {"current_steps": 3975, "total_steps": 38160, "loss": 0.5053, "lr": 0.0009999477790681673, "epoch": 2.0833333333333335, "percentage": 10.42, "elapsed_time": "0:10:08", "remaining_time": "1:27:14", "throughput": 4258.03, "total_tokens": 2591760} {"current_steps": 3980, "total_steps": 38160, "loss": 0.4892, "lr": 0.000999944421711862, "epoch": 2.0859538784067087, "percentage": 10.43, "elapsed_time": "0:10:09", "remaining_time": "1:27:13", "throughput": 4257.91, "total_tokens": 2594576} {"current_steps": 3985, "total_steps": 38160, "loss": 0.5983, "lr": 0.0009999409597728876, "epoch": 2.088574423480084, "percentage": 10.44, "elapsed_time": "0:10:10", "remaining_time": "1:27:12", "throughput": 4258.14, "total_tokens": 2597872} {"current_steps": 3990, "total_steps": 38160, "loss": 0.41, "lr": 0.0009999373932519679, "epoch": 2.091194968553459, "percentage": 10.46, "elapsed_time": "0:10:10", "remaining_time": "1:27:10", "throughput": 4258.1, "total_tokens": 2600752} {"current_steps": 3995, "total_steps": 38160, "loss": 0.55, "lr": 0.0009999337221498492, "epoch": 2.0938155136268346, "percentage": 10.47, "elapsed_time": "0:10:11", "remaining_time": "1:27:13", "throughput": 4260.34, "total_tokens": 2607248} {"current_steps": 4000, "total_steps": 38160, "loss": 0.3812, "lr": 0.0009999299464672996, "epoch": 2.0964360587002098, "percentage": 10.48, "elapsed_time": "0:10:12", "remaining_time": "1:27:12", "throughput": 4260.73, "total_tokens": 2610672} {"current_steps": 4005, "total_steps": 38160, "loss": 0.4076, "lr": 0.0009999260662051084, "epoch": 2.099056603773585, "percentage": 10.5, "elapsed_time": "0:10:13", "remaining_time": "1:27:12", "throughput": 4261.91, "total_tokens": 2615120} {"current_steps": 4010, "total_steps": 38160, "loss": 0.4056, "lr": 0.0009999220813640877, "epoch": 2.10167714884696, "percentage": 10.51, "elapsed_time": "0:10:14", "remaining_time": "1:27:11", "throughput": 4262.46, "total_tokens": 2618640} {"current_steps": 4015, "total_steps": 38160, "loss": 0.4263, "lr": 0.000999917991945071, "epoch": 2.1042976939203353, "percentage": 10.52, "elapsed_time": "0:10:15", "remaining_time": "1:27:10", "throughput": 4262.6, "total_tokens": 2621744} {"current_steps": 4020, "total_steps": 38160, "loss": 0.4951, "lr": 0.0009999137979489136, "epoch": 2.106918238993711, "percentage": 10.53, "elapsed_time": "0:10:15", "remaining_time": "1:27:08", "throughput": 4262.5, "total_tokens": 2624496} {"current_steps": 4025, "total_steps": 38160, "loss": 0.3394, "lr": 0.000999909499376493, "epoch": 2.109538784067086, "percentage": 10.55, "elapsed_time": "0:10:16", "remaining_time": "1:27:08", "throughput": 4262.93, "total_tokens": 2627984} {"current_steps": 4030, "total_steps": 38160, "loss": 0.5664, "lr": 0.0009999050962287085, "epoch": 2.1121593291404612, "percentage": 10.56, "elapsed_time": "0:10:17", "remaining_time": "1:27:06", "throughput": 4263.07, "total_tokens": 2631024} {"current_steps": 4035, "total_steps": 38160, "loss": 0.5265, "lr": 0.0009999005885064811, "epoch": 2.1147798742138364, "percentage": 10.57, "elapsed_time": "0:10:17", "remaining_time": "1:27:05", "throughput": 4263.09, "total_tokens": 2634000} {"current_steps": 4040, "total_steps": 38160, "loss": 0.4638, "lr": 0.0009998959762107537, "epoch": 2.1174004192872116, "percentage": 10.59, "elapsed_time": "0:10:18", "remaining_time": "1:27:04", "throughput": 4263.57, "total_tokens": 2637488} {"current_steps": 4045, "total_steps": 38160, "loss": 0.5, "lr": 0.0009998912593424914, "epoch": 2.120020964360587, "percentage": 10.6, "elapsed_time": "0:10:19", "remaining_time": "1:27:06", "throughput": 4265.55, "total_tokens": 2643376} {"current_steps": 4050, "total_steps": 38160, "loss": 0.4514, "lr": 0.0009998864379026804, "epoch": 2.1226415094339623, "percentage": 10.61, "elapsed_time": "0:10:20", "remaining_time": "1:27:04", "throughput": 4265.28, "total_tokens": 2646000} {"current_steps": 4055, "total_steps": 38160, "loss": 0.4615, "lr": 0.00099988151189233, "epoch": 2.1252620545073375, "percentage": 10.63, "elapsed_time": "0:10:21", "remaining_time": "1:27:03", "throughput": 4265.72, "total_tokens": 2649456} {"current_steps": 4060, "total_steps": 38160, "loss": 0.4202, "lr": 0.00099987648131247, "epoch": 2.1278825995807127, "percentage": 10.64, "elapsed_time": "0:10:21", "remaining_time": "1:27:02", "throughput": 4265.42, "total_tokens": 2652016} {"current_steps": 4065, "total_steps": 38160, "loss": 0.6427, "lr": 0.000999871346164153, "epoch": 2.130503144654088, "percentage": 10.65, "elapsed_time": "0:10:22", "remaining_time": "1:27:00", "throughput": 4265.51, "total_tokens": 2654992} {"current_steps": 4070, "total_steps": 38160, "loss": 0.5264, "lr": 0.0009998661064484532, "epoch": 2.1331236897274635, "percentage": 10.67, "elapsed_time": "0:10:23", "remaining_time": "1:26:58", "throughput": 4265.29, "total_tokens": 2657648} {"current_steps": 4075, "total_steps": 38160, "loss": 0.4308, "lr": 0.0009998607621664666, "epoch": 2.1357442348008386, "percentage": 10.68, "elapsed_time": "0:10:23", "remaining_time": "1:26:57", "throughput": 4265.31, "total_tokens": 2660560} {"current_steps": 4080, "total_steps": 38160, "loss": 0.4217, "lr": 0.0009998553133193113, "epoch": 2.138364779874214, "percentage": 10.69, "elapsed_time": "0:10:24", "remaining_time": "1:26:56", "throughput": 4265.25, "total_tokens": 2663440} {"current_steps": 4085, "total_steps": 38160, "loss": 0.6687, "lr": 0.0009998497599081272, "epoch": 2.140985324947589, "percentage": 10.7, "elapsed_time": "0:10:25", "remaining_time": "1:26:54", "throughput": 4265.47, "total_tokens": 2666544} {"current_steps": 4090, "total_steps": 38160, "loss": 0.4419, "lr": 0.0009998441019340761, "epoch": 2.1436058700209646, "percentage": 10.72, "elapsed_time": "0:10:25", "remaining_time": "1:26:53", "throughput": 4265.6, "total_tokens": 2669616} {"current_steps": 4095, "total_steps": 38160, "loss": 0.4817, "lr": 0.000999838339398341, "epoch": 2.1462264150943398, "percentage": 10.73, "elapsed_time": "0:10:26", "remaining_time": "1:26:52", "throughput": 4265.98, "total_tokens": 2673008} {"current_steps": 4100, "total_steps": 38160, "loss": 0.3966, "lr": 0.000999832472302128, "epoch": 2.148846960167715, "percentage": 10.74, "elapsed_time": "0:10:27", "remaining_time": "1:26:51", "throughput": 4266.0, "total_tokens": 2676016} {"current_steps": 4105, "total_steps": 38160, "loss": 0.5061, "lr": 0.0009998265006466642, "epoch": 2.15146750524109, "percentage": 10.76, "elapsed_time": "0:10:28", "remaining_time": "1:26:50", "throughput": 4266.68, "total_tokens": 2679920} {"current_steps": 4110, "total_steps": 38160, "loss": 0.5206, "lr": 0.0009998204244331987, "epoch": 2.1540880503144653, "percentage": 10.77, "elapsed_time": "0:10:28", "remaining_time": "1:26:50", "throughput": 4267.4, "total_tokens": 2683728} {"current_steps": 4115, "total_steps": 38160, "loss": 0.5651, "lr": 0.0009998142436630027, "epoch": 2.156708595387841, "percentage": 10.78, "elapsed_time": "0:10:29", "remaining_time": "1:26:49", "throughput": 4267.59, "total_tokens": 2686960} {"current_steps": 4120, "total_steps": 38160, "loss": 0.4205, "lr": 0.0009998079583373692, "epoch": 2.159329140461216, "percentage": 10.8, "elapsed_time": "0:10:30", "remaining_time": "1:26:48", "throughput": 4268.03, "total_tokens": 2690480} {"current_steps": 4125, "total_steps": 38160, "loss": 0.4428, "lr": 0.0009998015684576128, "epoch": 2.161949685534591, "percentage": 10.81, "elapsed_time": "0:10:31", "remaining_time": "1:26:47", "throughput": 4268.47, "total_tokens": 2694064} {"current_steps": 4130, "total_steps": 38160, "loss": 0.5007, "lr": 0.0009997950740250703, "epoch": 2.1645702306079664, "percentage": 10.82, "elapsed_time": "0:10:31", "remaining_time": "1:26:46", "throughput": 4268.41, "total_tokens": 2696880} {"current_steps": 4135, "total_steps": 38160, "loss": 0.529, "lr": 0.0009997884750411004, "epoch": 2.1671907756813416, "percentage": 10.84, "elapsed_time": "0:10:32", "remaining_time": "1:26:44", "throughput": 4268.48, "total_tokens": 2699856} {"current_steps": 4140, "total_steps": 38160, "loss": 0.4507, "lr": 0.0009997817715070832, "epoch": 2.169811320754717, "percentage": 10.85, "elapsed_time": "0:10:33", "remaining_time": "1:26:43", "throughput": 4268.94, "total_tokens": 2703344} {"current_steps": 4145, "total_steps": 38160, "loss": 0.5492, "lr": 0.0009997749634244213, "epoch": 2.1724318658280923, "percentage": 10.86, "elapsed_time": "0:10:34", "remaining_time": "1:26:42", "throughput": 4269.3, "total_tokens": 2706736} {"current_steps": 4150, "total_steps": 38160, "loss": 0.4897, "lr": 0.000999768050794539, "epoch": 2.1750524109014675, "percentage": 10.88, "elapsed_time": "0:10:34", "remaining_time": "1:26:41", "throughput": 4269.48, "total_tokens": 2709968} {"current_steps": 4155, "total_steps": 38160, "loss": 0.4477, "lr": 0.0009997610336188818, "epoch": 2.1776729559748427, "percentage": 10.89, "elapsed_time": "0:10:35", "remaining_time": "1:26:40", "throughput": 4269.94, "total_tokens": 2713456} {"current_steps": 4160, "total_steps": 38160, "loss": 0.3751, "lr": 0.0009997539118989183, "epoch": 2.180293501048218, "percentage": 10.9, "elapsed_time": "0:10:36", "remaining_time": "1:26:38", "throughput": 4269.61, "total_tokens": 2715952} {"current_steps": 4165, "total_steps": 38160, "loss": 0.5396, "lr": 0.0009997466856361376, "epoch": 2.1829140461215935, "percentage": 10.91, "elapsed_time": "0:10:36", "remaining_time": "1:26:37", "throughput": 4269.8, "total_tokens": 2719120} {"current_steps": 4170, "total_steps": 38160, "loss": 0.4284, "lr": 0.000999739354832052, "epoch": 2.1855345911949686, "percentage": 10.93, "elapsed_time": "0:10:37", "remaining_time": "1:26:36", "throughput": 4269.83, "total_tokens": 2722128} {"current_steps": 4175, "total_steps": 38160, "loss": 0.5778, "lr": 0.0009997319194881944, "epoch": 2.188155136268344, "percentage": 10.94, "elapsed_time": "0:10:38", "remaining_time": "1:26:35", "throughput": 4270.15, "total_tokens": 2725424} {"current_steps": 4180, "total_steps": 38160, "loss": 0.465, "lr": 0.0009997243796061204, "epoch": 2.190775681341719, "percentage": 10.95, "elapsed_time": "0:10:39", "remaining_time": "1:26:36", "throughput": 4271.86, "total_tokens": 2730640} {"current_steps": 4185, "total_steps": 38160, "loss": 0.6115, "lr": 0.0009997167351874076, "epoch": 2.1933962264150946, "percentage": 10.97, "elapsed_time": "0:10:39", "remaining_time": "1:26:34", "throughput": 4271.5, "total_tokens": 2733104} {"current_steps": 4190, "total_steps": 38160, "loss": 0.4015, "lr": 0.0009997089862336548, "epoch": 2.1960167714884697, "percentage": 10.98, "elapsed_time": "0:10:40", "remaining_time": "1:26:32", "throughput": 4271.42, "total_tokens": 2735856} {"current_steps": 4195, "total_steps": 38160, "loss": 0.6048, "lr": 0.000999701132746483, "epoch": 2.198637316561845, "percentage": 10.99, "elapsed_time": "0:10:41", "remaining_time": "1:26:31", "throughput": 4271.43, "total_tokens": 2738832} {"current_steps": 4200, "total_steps": 38160, "loss": 0.5141, "lr": 0.0009996931747275352, "epoch": 2.20125786163522, "percentage": 11.01, "elapsed_time": "0:10:41", "remaining_time": "1:26:30", "throughput": 4271.87, "total_tokens": 2742416} {"current_steps": 4205, "total_steps": 38160, "loss": 0.4521, "lr": 0.000999685112178476, "epoch": 2.2038784067085953, "percentage": 11.02, "elapsed_time": "0:10:42", "remaining_time": "1:26:30", "throughput": 4272.43, "total_tokens": 2746096} {"current_steps": 4210, "total_steps": 38160, "loss": 0.4118, "lr": 0.0009996769451009922, "epoch": 2.2064989517819704, "percentage": 11.03, "elapsed_time": "0:10:43", "remaining_time": "1:26:28", "throughput": 4272.08, "total_tokens": 2748560} {"current_steps": 4215, "total_steps": 38160, "loss": 0.4002, "lr": 0.000999668673496792, "epoch": 2.209119496855346, "percentage": 11.05, "elapsed_time": "0:10:43", "remaining_time": "1:26:26", "throughput": 4271.68, "total_tokens": 2750896} {"current_steps": 4220, "total_steps": 38160, "loss": 0.3923, "lr": 0.0009996602973676057, "epoch": 2.211740041928721, "percentage": 11.06, "elapsed_time": "0:10:44", "remaining_time": "1:26:24", "throughput": 4271.79, "total_tokens": 2753968} {"current_steps": 4225, "total_steps": 38160, "loss": 0.4837, "lr": 0.0009996518167151858, "epoch": 2.2143605870020964, "percentage": 11.07, "elapsed_time": "0:10:45", "remaining_time": "1:26:24", "throughput": 4272.47, "total_tokens": 2757840} {"current_steps": 4230, "total_steps": 38160, "loss": 0.5338, "lr": 0.000999643231541306, "epoch": 2.2169811320754715, "percentage": 11.08, "elapsed_time": "0:10:46", "remaining_time": "1:26:24", "throughput": 4273.35, "total_tokens": 2761936} {"current_steps": 4235, "total_steps": 38160, "loss": 0.565, "lr": 0.0009996345418477625, "epoch": 2.219601677148847, "percentage": 11.1, "elapsed_time": "0:10:46", "remaining_time": "1:26:22", "throughput": 4273.15, "total_tokens": 2764592} {"current_steps": 4240, "total_steps": 38160, "loss": 0.4012, "lr": 0.000999625747636373, "epoch": 2.2222222222222223, "percentage": 11.11, "elapsed_time": "0:10:47", "remaining_time": "1:26:21", "throughput": 4273.08, "total_tokens": 2767408} {"current_steps": 4245, "total_steps": 38160, "loss": 0.3973, "lr": 0.000999616848908977, "epoch": 2.2248427672955975, "percentage": 11.12, "elapsed_time": "0:10:48", "remaining_time": "1:26:19", "throughput": 4272.74, "total_tokens": 2769808} {"current_steps": 4250, "total_steps": 38160, "loss": 0.452, "lr": 0.0009996078456674363, "epoch": 2.2274633123689727, "percentage": 11.14, "elapsed_time": "0:10:48", "remaining_time": "1:26:17", "throughput": 4272.92, "total_tokens": 2772944} {"current_steps": 4255, "total_steps": 38160, "loss": 0.456, "lr": 0.000999598737913634, "epoch": 2.230083857442348, "percentage": 11.15, "elapsed_time": "0:10:49", "remaining_time": "1:26:16", "throughput": 4272.88, "total_tokens": 2775856} {"current_steps": 4260, "total_steps": 38160, "loss": 0.4896, "lr": 0.0009995895256494755, "epoch": 2.2327044025157234, "percentage": 11.16, "elapsed_time": "0:10:50", "remaining_time": "1:26:14", "throughput": 4272.95, "total_tokens": 2778736} {"current_steps": 4265, "total_steps": 38160, "loss": 0.4526, "lr": 0.000999580208876888, "epoch": 2.2353249475890986, "percentage": 11.18, "elapsed_time": "0:10:51", "remaining_time": "1:26:14", "throughput": 4273.63, "total_tokens": 2782608} {"current_steps": 4270, "total_steps": 38160, "loss": 0.5986, "lr": 0.0009995707875978198, "epoch": 2.237945492662474, "percentage": 11.19, "elapsed_time": "0:10:51", "remaining_time": "1:26:12", "throughput": 4273.27, "total_tokens": 2785040} {"current_steps": 4275, "total_steps": 38160, "loss": 0.5072, "lr": 0.0009995612618142428, "epoch": 2.240566037735849, "percentage": 11.2, "elapsed_time": "0:10:52", "remaining_time": "1:26:11", "throughput": 4273.51, "total_tokens": 2788304} {"current_steps": 4280, "total_steps": 38160, "loss": 0.5045, "lr": 0.000999551631528149, "epoch": 2.243186582809224, "percentage": 11.22, "elapsed_time": "0:10:53", "remaining_time": "1:26:10", "throughput": 4273.54, "total_tokens": 2791248} {"current_steps": 4285, "total_steps": 38160, "loss": 0.432, "lr": 0.000999541896741553, "epoch": 2.2458071278825997, "percentage": 11.23, "elapsed_time": "0:10:53", "remaining_time": "1:26:09", "throughput": 4273.91, "total_tokens": 2794736} {"current_steps": 4290, "total_steps": 38160, "loss": 0.4886, "lr": 0.0009995320574564912, "epoch": 2.248427672955975, "percentage": 11.24, "elapsed_time": "0:10:54", "remaining_time": "1:26:08", "throughput": 4274.16, "total_tokens": 2798000} {"current_steps": 4295, "total_steps": 38160, "loss": 0.4156, "lr": 0.000999522113675022, "epoch": 2.25104821802935, "percentage": 11.26, "elapsed_time": "0:10:55", "remaining_time": "1:26:06", "throughput": 4274.15, "total_tokens": 2800912} {"current_steps": 4300, "total_steps": 38160, "loss": 0.3996, "lr": 0.0009995120653992255, "epoch": 2.2536687631027252, "percentage": 11.27, "elapsed_time": "0:10:56", "remaining_time": "1:26:05", "throughput": 4274.24, "total_tokens": 2803984} {"current_steps": 4305, "total_steps": 38160, "loss": 0.4243, "lr": 0.0009995019126312035, "epoch": 2.2562893081761004, "percentage": 11.28, "elapsed_time": "0:10:56", "remaining_time": "1:26:04", "throughput": 4274.08, "total_tokens": 2806640} {"current_steps": 4310, "total_steps": 38160, "loss": 0.5321, "lr": 0.0009994916553730802, "epoch": 2.258909853249476, "percentage": 11.29, "elapsed_time": "0:10:57", "remaining_time": "1:26:02", "throughput": 4274.01, "total_tokens": 2809360} {"current_steps": 4315, "total_steps": 38160, "loss": 0.4649, "lr": 0.000999481293627001, "epoch": 2.261530398322851, "percentage": 11.31, "elapsed_time": "0:10:57", "remaining_time": "1:26:00", "throughput": 4273.82, "total_tokens": 2811984} {"current_steps": 4320, "total_steps": 38160, "loss": 0.6067, "lr": 0.0009994708273951337, "epoch": 2.2641509433962264, "percentage": 11.32, "elapsed_time": "0:10:58", "remaining_time": "1:25:59", "throughput": 4274.19, "total_tokens": 2815440} {"current_steps": 4325, "total_steps": 38160, "loss": 0.5596, "lr": 0.0009994602566796673, "epoch": 2.2667714884696015, "percentage": 11.33, "elapsed_time": "0:10:59", "remaining_time": "1:25:58", "throughput": 4274.14, "total_tokens": 2818192} {"current_steps": 4330, "total_steps": 38160, "loss": 0.3679, "lr": 0.0009994495814828136, "epoch": 2.269392033542977, "percentage": 11.35, "elapsed_time": "0:11:00", "remaining_time": "1:25:57", "throughput": 4274.61, "total_tokens": 2821744} {"current_steps": 4335, "total_steps": 38160, "loss": 0.6054, "lr": 0.0009994388018068055, "epoch": 2.2720125786163523, "percentage": 11.36, "elapsed_time": "0:11:00", "remaining_time": "1:25:56", "throughput": 4275.25, "total_tokens": 2825520} {"current_steps": 4340, "total_steps": 38160, "loss": 0.5158, "lr": 0.0009994279176538977, "epoch": 2.2746331236897275, "percentage": 11.37, "elapsed_time": "0:11:01", "remaining_time": "1:25:56", "throughput": 4276.2, "total_tokens": 2829776} {"current_steps": 4345, "total_steps": 38160, "loss": 0.4785, "lr": 0.0009994169290263675, "epoch": 2.2772536687631026, "percentage": 11.39, "elapsed_time": "0:11:02", "remaining_time": "1:25:55", "throughput": 4276.16, "total_tokens": 2832624} {"current_steps": 4350, "total_steps": 38160, "loss": 0.5661, "lr": 0.0009994058359265132, "epoch": 2.279874213836478, "percentage": 11.4, "elapsed_time": "0:11:03", "remaining_time": "1:25:53", "throughput": 4276.19, "total_tokens": 2835536} {"current_steps": 4355, "total_steps": 38160, "loss": 0.6126, "lr": 0.0009993946383566558, "epoch": 2.2824947589098534, "percentage": 11.41, "elapsed_time": "0:11:03", "remaining_time": "1:25:52", "throughput": 4276.13, "total_tokens": 2838384} {"current_steps": 4360, "total_steps": 38160, "loss": 0.49, "lr": 0.0009993833363191374, "epoch": 2.2851153039832286, "percentage": 11.43, "elapsed_time": "0:11:04", "remaining_time": "1:25:51", "throughput": 4276.62, "total_tokens": 2842032} {"current_steps": 4365, "total_steps": 38160, "loss": 0.4134, "lr": 0.0009993719298163222, "epoch": 2.2877358490566038, "percentage": 11.44, "elapsed_time": "0:11:05", "remaining_time": "1:25:50", "throughput": 4276.53, "total_tokens": 2844720} {"current_steps": 4370, "total_steps": 38160, "loss": 0.3871, "lr": 0.0009993604188505965, "epoch": 2.290356394129979, "percentage": 11.45, "elapsed_time": "0:11:05", "remaining_time": "1:25:49", "throughput": 4276.65, "total_tokens": 2847888} {"current_steps": 4375, "total_steps": 38160, "loss": 0.7515, "lr": 0.000999348803424368, "epoch": 2.2929769392033545, "percentage": 11.46, "elapsed_time": "0:11:06", "remaining_time": "1:25:47", "throughput": 4276.59, "total_tokens": 2850800} {"current_steps": 4380, "total_steps": 38160, "loss": 0.4686, "lr": 0.000999337083540067, "epoch": 2.2955974842767297, "percentage": 11.48, "elapsed_time": "0:11:07", "remaining_time": "1:25:46", "throughput": 4276.79, "total_tokens": 2853936} {"current_steps": 4385, "total_steps": 38160, "loss": 0.5414, "lr": 0.0009993252592001448, "epoch": 2.298218029350105, "percentage": 11.49, "elapsed_time": "0:11:08", "remaining_time": "1:25:45", "throughput": 4276.97, "total_tokens": 2857040} {"current_steps": 4390, "total_steps": 38160, "loss": 0.4615, "lr": 0.0009993133304070747, "epoch": 2.30083857442348, "percentage": 11.5, "elapsed_time": "0:11:08", "remaining_time": "1:25:45", "throughput": 4277.83, "total_tokens": 2861264} {"current_steps": 4395, "total_steps": 38160, "loss": 0.5137, "lr": 0.0009993012971633527, "epoch": 2.3034591194968552, "percentage": 11.52, "elapsed_time": "0:11:09", "remaining_time": "1:25:44", "throughput": 4278.34, "total_tokens": 2864848} {"current_steps": 4400, "total_steps": 38160, "loss": 0.4293, "lr": 0.0009992891594714952, "epoch": 2.3060796645702304, "percentage": 11.53, "elapsed_time": "0:11:10", "remaining_time": "1:25:42", "throughput": 4277.99, "total_tokens": 2867280} {"current_steps": 4405, "total_steps": 38160, "loss": 0.6236, "lr": 0.0009992769173340422, "epoch": 2.308700209643606, "percentage": 11.54, "elapsed_time": "0:11:10", "remaining_time": "1:25:41", "throughput": 4278.04, "total_tokens": 2870288} {"current_steps": 4410, "total_steps": 38160, "loss": 0.4785, "lr": 0.000999264570753554, "epoch": 2.311320754716981, "percentage": 11.56, "elapsed_time": "0:11:11", "remaining_time": "1:25:39", "throughput": 4277.82, "total_tokens": 2872912} {"current_steps": 4415, "total_steps": 38160, "loss": 0.5301, "lr": 0.0009992521197326135, "epoch": 2.3139412997903563, "percentage": 11.57, "elapsed_time": "0:11:12", "remaining_time": "1:25:39", "throughput": 4278.79, "total_tokens": 2877296} {"current_steps": 4420, "total_steps": 38160, "loss": 0.5492, "lr": 0.0009992395642738252, "epoch": 2.3165618448637315, "percentage": 11.58, "elapsed_time": "0:11:13", "remaining_time": "1:25:38", "throughput": 4279.0, "total_tokens": 2880464} {"current_steps": 4425, "total_steps": 38160, "loss": 0.4832, "lr": 0.0009992269043798158, "epoch": 2.319182389937107, "percentage": 11.6, "elapsed_time": "0:11:13", "remaining_time": "1:25:36", "throughput": 4278.69, "total_tokens": 2882896} {"current_steps": 4430, "total_steps": 38160, "loss": 0.417, "lr": 0.0009992141400532336, "epoch": 2.3218029350104823, "percentage": 11.61, "elapsed_time": "0:11:14", "remaining_time": "1:25:35", "throughput": 4279.07, "total_tokens": 2886384} {"current_steps": 4435, "total_steps": 38160, "loss": 0.5384, "lr": 0.0009992012712967484, "epoch": 2.3244234800838575, "percentage": 11.62, "elapsed_time": "0:11:15", "remaining_time": "1:25:35", "throughput": 4279.71, "total_tokens": 2890224} {"current_steps": 4440, "total_steps": 38160, "loss": 0.3691, "lr": 0.0009991882981130525, "epoch": 2.3270440251572326, "percentage": 11.64, "elapsed_time": "0:11:16", "remaining_time": "1:25:34", "throughput": 4279.83, "total_tokens": 2893392} {"current_steps": 4445, "total_steps": 38160, "loss": 0.4444, "lr": 0.0009991752205048597, "epoch": 2.329664570230608, "percentage": 11.65, "elapsed_time": "0:11:16", "remaining_time": "1:25:32", "throughput": 4279.82, "total_tokens": 2896240} {"current_steps": 4450, "total_steps": 38160, "loss": 0.4641, "lr": 0.0009991620384749058, "epoch": 2.3322851153039834, "percentage": 11.66, "elapsed_time": "0:11:17", "remaining_time": "1:25:33", "throughput": 4281.24, "total_tokens": 2901520} {"current_steps": 4455, "total_steps": 38160, "loss": 0.545, "lr": 0.0009991487520259479, "epoch": 2.3349056603773586, "percentage": 11.67, "elapsed_time": "0:11:18", "remaining_time": "1:25:32", "throughput": 4280.85, "total_tokens": 2903856} {"current_steps": 4460, "total_steps": 38160, "loss": 0.442, "lr": 0.000999135361160766, "epoch": 2.3375262054507338, "percentage": 11.69, "elapsed_time": "0:11:18", "remaining_time": "1:25:30", "throughput": 4280.4, "total_tokens": 2906128} {"current_steps": 4465, "total_steps": 38160, "loss": 0.5346, "lr": 0.0009991218658821608, "epoch": 2.340146750524109, "percentage": 11.7, "elapsed_time": "0:11:19", "remaining_time": "1:25:28", "throughput": 4280.25, "total_tokens": 2908848} {"current_steps": 4470, "total_steps": 38160, "loss": 0.4193, "lr": 0.0009991082661929556, "epoch": 2.342767295597484, "percentage": 11.71, "elapsed_time": "0:11:20", "remaining_time": "1:25:28", "throughput": 4281.0, "total_tokens": 2912976} {"current_steps": 4475, "total_steps": 38160, "loss": 0.4325, "lr": 0.000999094562095995, "epoch": 2.3453878406708597, "percentage": 11.73, "elapsed_time": "0:11:21", "remaining_time": "1:25:27", "throughput": 4280.99, "total_tokens": 2915888} {"current_steps": 4480, "total_steps": 38160, "loss": 0.4018, "lr": 0.0009990807535941461, "epoch": 2.348008385744235, "percentage": 11.74, "elapsed_time": "0:11:21", "remaining_time": "1:25:25", "throughput": 4281.06, "total_tokens": 2918928} {"current_steps": 4485, "total_steps": 38160, "loss": 0.5756, "lr": 0.0009990668406902976, "epoch": 2.35062893081761, "percentage": 11.75, "elapsed_time": "0:11:22", "remaining_time": "1:25:24", "throughput": 4280.72, "total_tokens": 2921392} {"current_steps": 4490, "total_steps": 38160, "loss": 0.4396, "lr": 0.0009990528233873594, "epoch": 2.353249475890985, "percentage": 11.77, "elapsed_time": "0:11:23", "remaining_time": "1:25:22", "throughput": 4280.57, "total_tokens": 2924112} {"current_steps": 4495, "total_steps": 38160, "loss": 0.512, "lr": 0.0009990387016882642, "epoch": 2.3558700209643604, "percentage": 11.78, "elapsed_time": "0:11:23", "remaining_time": "1:25:21", "throughput": 4281.1, "total_tokens": 2927792} {"current_steps": 4500, "total_steps": 38160, "loss": 0.6341, "lr": 0.000999024475595966, "epoch": 2.358490566037736, "percentage": 11.79, "elapsed_time": "0:11:24", "remaining_time": "1:25:21", "throughput": 4281.97, "total_tokens": 2931984} {"current_steps": 4505, "total_steps": 38160, "loss": 0.4606, "lr": 0.0009990101451134406, "epoch": 2.361111111111111, "percentage": 11.81, "elapsed_time": "0:11:25", "remaining_time": "1:25:21", "throughput": 4282.6, "total_tokens": 2935856} {"current_steps": 4510, "total_steps": 38160, "loss": 0.4489, "lr": 0.0009989957102436858, "epoch": 2.3637316561844863, "percentage": 11.82, "elapsed_time": "0:11:26", "remaining_time": "1:25:20", "throughput": 4283.31, "total_tokens": 2939760} {"current_steps": 4515, "total_steps": 38160, "loss": 0.5855, "lr": 0.0009989811709897212, "epoch": 2.3663522012578615, "percentage": 11.83, "elapsed_time": "0:11:27", "remaining_time": "1:25:20", "throughput": 4284.31, "total_tokens": 2944112} {"current_steps": 4520, "total_steps": 38160, "loss": 0.4066, "lr": 0.0009989665273545884, "epoch": 2.368972746331237, "percentage": 11.84, "elapsed_time": "0:11:27", "remaining_time": "1:25:19", "throughput": 4284.46, "total_tokens": 2947184} {"current_steps": 4525, "total_steps": 38160, "loss": 0.4287, "lr": 0.0009989517793413507, "epoch": 2.3715932914046123, "percentage": 11.86, "elapsed_time": "0:11:28", "remaining_time": "1:25:18", "throughput": 4284.78, "total_tokens": 2950672} {"current_steps": 4530, "total_steps": 38160, "loss": 0.5616, "lr": 0.000998936926953093, "epoch": 2.3742138364779874, "percentage": 11.87, "elapsed_time": "0:11:29", "remaining_time": "1:25:17", "throughput": 4284.93, "total_tokens": 2953872} {"current_steps": 4535, "total_steps": 38160, "loss": 0.4965, "lr": 0.0009989219701929224, "epoch": 2.3768343815513626, "percentage": 11.88, "elapsed_time": "0:11:30", "remaining_time": "1:25:16", "throughput": 4284.81, "total_tokens": 2956624} {"current_steps": 4540, "total_steps": 38160, "loss": 0.4106, "lr": 0.0009989069090639675, "epoch": 2.379454926624738, "percentage": 11.9, "elapsed_time": "0:11:30", "remaining_time": "1:25:15", "throughput": 4284.96, "total_tokens": 2959824} {"current_steps": 4545, "total_steps": 38160, "loss": 0.4483, "lr": 0.0009988917435693793, "epoch": 2.3820754716981134, "percentage": 11.91, "elapsed_time": "0:11:31", "remaining_time": "1:25:13", "throughput": 4284.97, "total_tokens": 2962736} {"current_steps": 4550, "total_steps": 38160, "loss": 0.5022, "lr": 0.0009988764737123297, "epoch": 2.3846960167714886, "percentage": 11.92, "elapsed_time": "0:11:32", "remaining_time": "1:25:12", "throughput": 4285.14, "total_tokens": 2965872} {"current_steps": 4555, "total_steps": 38160, "loss": 0.3298, "lr": 0.0009988610994960134, "epoch": 2.3873165618448637, "percentage": 11.94, "elapsed_time": "0:11:32", "remaining_time": "1:25:11", "throughput": 4285.29, "total_tokens": 2969104} {"current_steps": 4560, "total_steps": 38160, "loss": 0.5718, "lr": 0.0009988456209236464, "epoch": 2.389937106918239, "percentage": 11.95, "elapsed_time": "0:11:33", "remaining_time": "1:25:11", "throughput": 4286.31, "total_tokens": 2973616} {"current_steps": 4565, "total_steps": 38160, "loss": 0.5696, "lr": 0.0009988300379984668, "epoch": 2.392557651991614, "percentage": 11.96, "elapsed_time": "0:11:34", "remaining_time": "1:25:09", "throughput": 4285.82, "total_tokens": 2975888} {"current_steps": 4570, "total_steps": 38160, "loss": 0.5107, "lr": 0.0009988143507237341, "epoch": 2.3951781970649897, "percentage": 11.98, "elapsed_time": "0:11:35", "remaining_time": "1:25:08", "throughput": 4286.06, "total_tokens": 2979088} {"current_steps": 4575, "total_steps": 38160, "loss": 0.5222, "lr": 0.00099879855910273, "epoch": 2.397798742138365, "percentage": 11.99, "elapsed_time": "0:11:35", "remaining_time": "1:25:08", "throughput": 4286.4, "total_tokens": 2982576} {"current_steps": 4580, "total_steps": 38160, "loss": 0.4425, "lr": 0.0009987826631387578, "epoch": 2.40041928721174, "percentage": 12.0, "elapsed_time": "0:11:36", "remaining_time": "1:25:07", "throughput": 4287.02, "total_tokens": 2986480} {"current_steps": 4585, "total_steps": 38160, "loss": 0.6338, "lr": 0.000998766662835143, "epoch": 2.403039832285115, "percentage": 12.02, "elapsed_time": "0:11:37", "remaining_time": "1:25:06", "throughput": 4287.49, "total_tokens": 2990096} {"current_steps": 4590, "total_steps": 38160, "loss": 0.6223, "lr": 0.0009987505581952325, "epoch": 2.4056603773584904, "percentage": 12.03, "elapsed_time": "0:11:38", "remaining_time": "1:25:05", "throughput": 4287.48, "total_tokens": 2993040} {"current_steps": 4595, "total_steps": 38160, "loss": 0.5228, "lr": 0.0009987343492223954, "epoch": 2.408280922431866, "percentage": 12.04, "elapsed_time": "0:11:38", "remaining_time": "1:25:05", "throughput": 4288.16, "total_tokens": 2997008} {"current_steps": 4600, "total_steps": 38160, "loss": 0.4226, "lr": 0.0009987180359200222, "epoch": 2.410901467505241, "percentage": 12.05, "elapsed_time": "0:11:39", "remaining_time": "1:25:04", "throughput": 4288.42, "total_tokens": 3000432} {"current_steps": 4605, "total_steps": 38160, "loss": 0.4817, "lr": 0.0009987016182915257, "epoch": 2.4135220125786163, "percentage": 12.07, "elapsed_time": "0:11:40", "remaining_time": "1:25:03", "throughput": 4288.79, "total_tokens": 3003952} {"current_steps": 4610, "total_steps": 38160, "loss": 0.4419, "lr": 0.0009986850963403398, "epoch": 2.4161425576519915, "percentage": 12.08, "elapsed_time": "0:11:41", "remaining_time": "1:25:02", "throughput": 4288.49, "total_tokens": 3006448} {"current_steps": 4615, "total_steps": 38160, "loss": 0.4217, "lr": 0.0009986684700699214, "epoch": 2.418763102725367, "percentage": 12.09, "elapsed_time": "0:11:41", "remaining_time": "1:25:01", "throughput": 4288.78, "total_tokens": 3009808} {"current_steps": 4620, "total_steps": 38160, "loss": 0.3905, "lr": 0.000998651739483748, "epoch": 2.4213836477987423, "percentage": 12.11, "elapsed_time": "0:11:42", "remaining_time": "1:25:00", "throughput": 4289.27, "total_tokens": 3013392} {"current_steps": 4625, "total_steps": 38160, "loss": 0.6548, "lr": 0.0009986349045853196, "epoch": 2.4240041928721174, "percentage": 12.12, "elapsed_time": "0:11:43", "remaining_time": "1:24:58", "throughput": 4288.96, "total_tokens": 3015888} {"current_steps": 4630, "total_steps": 38160, "loss": 0.3772, "lr": 0.000998617965378158, "epoch": 2.4266247379454926, "percentage": 12.13, "elapsed_time": "0:11:43", "remaining_time": "1:24:57", "throughput": 4289.09, "total_tokens": 3019120} {"current_steps": 4635, "total_steps": 38160, "loss": 0.5878, "lr": 0.0009986009218658064, "epoch": 2.4292452830188678, "percentage": 12.15, "elapsed_time": "0:11:44", "remaining_time": "1:24:58", "throughput": 4290.26, "total_tokens": 3023920} {"current_steps": 4640, "total_steps": 38160, "loss": 0.5846, "lr": 0.0009985837740518306, "epoch": 2.431865828092243, "percentage": 12.16, "elapsed_time": "0:11:45", "remaining_time": "1:24:56", "throughput": 4290.42, "total_tokens": 3027088} {"current_steps": 4645, "total_steps": 38160, "loss": 0.463, "lr": 0.0009985665219398173, "epoch": 2.4344863731656186, "percentage": 12.17, "elapsed_time": "0:11:46", "remaining_time": "1:24:55", "throughput": 4290.08, "total_tokens": 3029456} {"current_steps": 4650, "total_steps": 38160, "loss": 0.3985, "lr": 0.0009985491655333755, "epoch": 2.4371069182389937, "percentage": 12.19, "elapsed_time": "0:11:46", "remaining_time": "1:24:54", "throughput": 4290.8, "total_tokens": 3033488} {"current_steps": 4655, "total_steps": 38160, "loss": 0.4048, "lr": 0.000998531704836136, "epoch": 2.439727463312369, "percentage": 12.2, "elapsed_time": "0:11:48", "remaining_time": "1:24:55", "throughput": 4292.4, "total_tokens": 3039024} {"current_steps": 4660, "total_steps": 38160, "loss": 0.3618, "lr": 0.0009985141398517513, "epoch": 2.442348008385744, "percentage": 12.21, "elapsed_time": "0:11:48", "remaining_time": "1:24:55", "throughput": 4293.26, "total_tokens": 3043248} {"current_steps": 4665, "total_steps": 38160, "loss": 0.463, "lr": 0.000998496470583896, "epoch": 2.4449685534591197, "percentage": 12.22, "elapsed_time": "0:11:49", "remaining_time": "1:24:54", "throughput": 4293.45, "total_tokens": 3046384} {"current_steps": 4670, "total_steps": 38160, "loss": 0.4275, "lr": 0.0009984786970362663, "epoch": 2.447589098532495, "percentage": 12.24, "elapsed_time": "0:11:50", "remaining_time": "1:24:53", "throughput": 4293.57, "total_tokens": 3049392} {"current_steps": 4675, "total_steps": 38160, "loss": 0.4328, "lr": 0.00099846081921258, "epoch": 2.45020964360587, "percentage": 12.25, "elapsed_time": "0:11:51", "remaining_time": "1:24:52", "throughput": 4294.26, "total_tokens": 3053392} {"current_steps": 4680, "total_steps": 38160, "loss": 0.4129, "lr": 0.000998442837116577, "epoch": 2.452830188679245, "percentage": 12.26, "elapsed_time": "0:11:51", "remaining_time": "1:24:52", "throughput": 4295.04, "total_tokens": 3057520} {"current_steps": 4685, "total_steps": 38160, "loss": 0.4497, "lr": 0.0009984247507520193, "epoch": 2.4554507337526204, "percentage": 12.28, "elapsed_time": "0:11:52", "remaining_time": "1:24:50", "throughput": 4294.63, "total_tokens": 3059824} {"current_steps": 4690, "total_steps": 38160, "loss": 0.5135, "lr": 0.0009984065601226896, "epoch": 2.458071278825996, "percentage": 12.29, "elapsed_time": "0:11:53", "remaining_time": "1:24:49", "throughput": 4294.85, "total_tokens": 3063120} {"current_steps": 4695, "total_steps": 38160, "loss": 0.4325, "lr": 0.0009983882652323942, "epoch": 2.460691823899371, "percentage": 12.3, "elapsed_time": "0:11:53", "remaining_time": "1:24:48", "throughput": 4295.14, "total_tokens": 3066544} {"current_steps": 4700, "total_steps": 38160, "loss": 0.381, "lr": 0.0009983698660849592, "epoch": 2.4633123689727463, "percentage": 12.32, "elapsed_time": "0:11:54", "remaining_time": "1:24:48", "throughput": 4295.59, "total_tokens": 3070224} {"current_steps": 4705, "total_steps": 38160, "loss": 0.4234, "lr": 0.0009983513626842342, "epoch": 2.4659329140461215, "percentage": 12.33, "elapsed_time": "0:11:55", "remaining_time": "1:24:47", "throughput": 4295.72, "total_tokens": 3073456} {"current_steps": 4710, "total_steps": 38160, "loss": 0.5259, "lr": 0.0009983327550340893, "epoch": 2.468553459119497, "percentage": 12.34, "elapsed_time": "0:11:56", "remaining_time": "1:24:46", "throughput": 4295.94, "total_tokens": 3076656} {"current_steps": 4715, "total_steps": 38160, "loss": 0.4537, "lr": 0.0009983140431384177, "epoch": 2.4711740041928723, "percentage": 12.36, "elapsed_time": "0:11:56", "remaining_time": "1:24:44", "throughput": 4295.5, "total_tokens": 3078928} {"current_steps": 4720, "total_steps": 38160, "loss": 0.4888, "lr": 0.0009982952270011331, "epoch": 2.4737945492662474, "percentage": 12.37, "elapsed_time": "0:11:57", "remaining_time": "1:24:42", "throughput": 4295.24, "total_tokens": 3081520} {"current_steps": 4725, "total_steps": 38160, "loss": 0.4702, "lr": 0.000998276306626172, "epoch": 2.4764150943396226, "percentage": 12.38, "elapsed_time": "0:11:58", "remaining_time": "1:24:41", "throughput": 4295.13, "total_tokens": 3084464} {"current_steps": 4730, "total_steps": 38160, "loss": 0.6283, "lr": 0.000998257282017492, "epoch": 2.4790356394129978, "percentage": 12.4, "elapsed_time": "0:11:58", "remaining_time": "1:24:40", "throughput": 4295.41, "total_tokens": 3087856} {"current_steps": 4735, "total_steps": 38160, "loss": 0.4824, "lr": 0.0009982381531790732, "epoch": 2.481656184486373, "percentage": 12.41, "elapsed_time": "0:11:59", "remaining_time": "1:24:40", "throughput": 4296.15, "total_tokens": 3091952} {"current_steps": 4740, "total_steps": 38160, "loss": 0.5683, "lr": 0.0009982189201149167, "epoch": 2.4842767295597485, "percentage": 12.42, "elapsed_time": "0:12:00", "remaining_time": "1:24:39", "throughput": 4296.5, "total_tokens": 3095504} {"current_steps": 4745, "total_steps": 38160, "loss": 0.5922, "lr": 0.0009981995828290465, "epoch": 2.4868972746331237, "percentage": 12.43, "elapsed_time": "0:12:01", "remaining_time": "1:24:41", "throughput": 4298.32, "total_tokens": 3101776} {"current_steps": 4750, "total_steps": 38160, "loss": 0.446, "lr": 0.0009981801413255068, "epoch": 2.489517819706499, "percentage": 12.45, "elapsed_time": "0:12:02", "remaining_time": "1:24:40", "throughput": 4298.58, "total_tokens": 3105200} {"current_steps": 4755, "total_steps": 38160, "loss": 0.5389, "lr": 0.0009981605956083657, "epoch": 2.492138364779874, "percentage": 12.46, "elapsed_time": "0:12:03", "remaining_time": "1:24:40", "throughput": 4298.76, "total_tokens": 3108496} {"current_steps": 4760, "total_steps": 38160, "loss": 0.4775, "lr": 0.000998140945681711, "epoch": 2.4947589098532497, "percentage": 12.47, "elapsed_time": "0:12:03", "remaining_time": "1:24:38", "throughput": 4298.57, "total_tokens": 3111184} {"current_steps": 4765, "total_steps": 38160, "loss": 0.5551, "lr": 0.0009981211915496536, "epoch": 2.497379454926625, "percentage": 12.49, "elapsed_time": "0:12:04", "remaining_time": "1:24:37", "throughput": 4298.68, "total_tokens": 3114320} {"current_steps": 4770, "total_steps": 38160, "loss": 0.4378, "lr": 0.0009981013332163256, "epoch": 2.5, "percentage": 12.5, "elapsed_time": "0:12:05", "remaining_time": "1:24:35", "throughput": 4298.44, "total_tokens": 3116880} {"current_steps": 4775, "total_steps": 38160, "loss": 0.3954, "lr": 0.0009980813706858816, "epoch": 2.502620545073375, "percentage": 12.51, "elapsed_time": "0:12:05", "remaining_time": "1:24:34", "throughput": 4298.71, "total_tokens": 3120240} {"current_steps": 4780, "total_steps": 38160, "loss": 0.4825, "lr": 0.000998061303962497, "epoch": 2.5052410901467503, "percentage": 12.53, "elapsed_time": "0:12:06", "remaining_time": "1:24:34", "throughput": 4299.58, "total_tokens": 3124528} {"current_steps": 4785, "total_steps": 38160, "loss": 0.4126, "lr": 0.00099804113305037, "epoch": 2.507861635220126, "percentage": 12.54, "elapsed_time": "0:12:07", "remaining_time": "1:24:33", "throughput": 4299.74, "total_tokens": 3127760} {"current_steps": 4790, "total_steps": 38160, "loss": 0.4361, "lr": 0.0009980208579537199, "epoch": 2.510482180293501, "percentage": 12.55, "elapsed_time": "0:12:08", "remaining_time": "1:24:33", "throughput": 4300.4, "total_tokens": 3131696} {"current_steps": 4795, "total_steps": 38160, "loss": 0.4384, "lr": 0.000998000478676788, "epoch": 2.5131027253668763, "percentage": 12.57, "elapsed_time": "0:12:09", "remaining_time": "1:24:32", "throughput": 4301.07, "total_tokens": 3135664} {"current_steps": 4800, "total_steps": 38160, "loss": 0.5036, "lr": 0.0009979799952238373, "epoch": 2.5157232704402515, "percentage": 12.58, "elapsed_time": "0:12:09", "remaining_time": "1:24:31", "throughput": 4300.98, "total_tokens": 3138480} {"current_steps": 4805, "total_steps": 38160, "loss": 0.4498, "lr": 0.000997959407599153, "epoch": 2.518343815513627, "percentage": 12.59, "elapsed_time": "0:12:10", "remaining_time": "1:24:30", "throughput": 4301.26, "total_tokens": 3141840} {"current_steps": 4810, "total_steps": 38160, "loss": 0.5871, "lr": 0.000997938715807042, "epoch": 2.5209643605870022, "percentage": 12.6, "elapsed_time": "0:12:11", "remaining_time": "1:24:29", "throughput": 4301.47, "total_tokens": 3145168} {"current_steps": 4815, "total_steps": 38160, "loss": 0.4954, "lr": 0.000997917919851832, "epoch": 2.5235849056603774, "percentage": 12.62, "elapsed_time": "0:12:11", "remaining_time": "1:24:29", "throughput": 4301.94, "total_tokens": 3148944} {"current_steps": 4820, "total_steps": 38160, "loss": 0.4993, "lr": 0.0009978970197378736, "epoch": 2.5262054507337526, "percentage": 12.63, "elapsed_time": "0:12:12", "remaining_time": "1:24:27", "throughput": 4301.94, "total_tokens": 3151888} {"current_steps": 4825, "total_steps": 38160, "loss": 0.5473, "lr": 0.0009978760154695392, "epoch": 2.5288259958071277, "percentage": 12.64, "elapsed_time": "0:12:13", "remaining_time": "1:24:26", "throughput": 4301.92, "total_tokens": 3154864} {"current_steps": 4830, "total_steps": 38160, "loss": 0.3109, "lr": 0.0009978549070512226, "epoch": 2.531446540880503, "percentage": 12.66, "elapsed_time": "0:12:14", "remaining_time": "1:24:25", "throughput": 4301.94, "total_tokens": 3157840} {"current_steps": 4835, "total_steps": 38160, "loss": 0.4566, "lr": 0.000997833694487339, "epoch": 2.5340670859538785, "percentage": 12.67, "elapsed_time": "0:12:14", "remaining_time": "1:24:24", "throughput": 4302.22, "total_tokens": 3161264} {"current_steps": 4840, "total_steps": 38160, "loss": 0.414, "lr": 0.0009978123777823263, "epoch": 2.5366876310272537, "percentage": 12.68, "elapsed_time": "0:12:15", "remaining_time": "1:24:23", "throughput": 4302.25, "total_tokens": 3164272} {"current_steps": 4845, "total_steps": 38160, "loss": 0.4997, "lr": 0.0009977909569406434, "epoch": 2.539308176100629, "percentage": 12.7, "elapsed_time": "0:12:16", "remaining_time": "1:24:21", "throughput": 4301.58, "total_tokens": 3166256} {"current_steps": 4850, "total_steps": 38160, "loss": 0.4189, "lr": 0.0009977694319667713, "epoch": 2.541928721174004, "percentage": 12.71, "elapsed_time": "0:12:16", "remaining_time": "1:24:21", "throughput": 4302.56, "total_tokens": 3170800} {"current_steps": 4855, "total_steps": 38160, "loss": 0.5106, "lr": 0.0009977478028652131, "epoch": 2.5445492662473796, "percentage": 12.72, "elapsed_time": "0:12:17", "remaining_time": "1:24:20", "throughput": 4302.98, "total_tokens": 3174544} {"current_steps": 4860, "total_steps": 38160, "loss": 0.4719, "lr": 0.000997726069640493, "epoch": 2.547169811320755, "percentage": 12.74, "elapsed_time": "0:12:18", "remaining_time": "1:24:19", "throughput": 4302.86, "total_tokens": 3177392} {"current_steps": 4865, "total_steps": 38160, "loss": 0.4364, "lr": 0.0009977042322971577, "epoch": 2.54979035639413, "percentage": 12.75, "elapsed_time": "0:12:19", "remaining_time": "1:24:18", "throughput": 4302.85, "total_tokens": 3180304} {"current_steps": 4870, "total_steps": 38160, "loss": 0.4991, "lr": 0.000997682290839775, "epoch": 2.552410901467505, "percentage": 12.76, "elapsed_time": "0:12:19", "remaining_time": "1:24:17", "throughput": 4302.81, "total_tokens": 3183216} {"current_steps": 4875, "total_steps": 38160, "loss": 0.4842, "lr": 0.0009976602452729348, "epoch": 2.5550314465408803, "percentage": 12.78, "elapsed_time": "0:12:20", "remaining_time": "1:24:15", "throughput": 4302.84, "total_tokens": 3186224} {"current_steps": 4880, "total_steps": 38160, "loss": 0.427, "lr": 0.000997638095601249, "epoch": 2.5576519916142555, "percentage": 12.79, "elapsed_time": "0:12:21", "remaining_time": "1:24:14", "throughput": 4302.64, "total_tokens": 3188848} {"current_steps": 4885, "total_steps": 38160, "loss": 0.4741, "lr": 0.000997615841829351, "epoch": 2.560272536687631, "percentage": 12.8, "elapsed_time": "0:12:21", "remaining_time": "1:24:13", "throughput": 4302.93, "total_tokens": 3192176} {"current_steps": 4890, "total_steps": 38160, "loss": 0.4923, "lr": 0.000997593483961896, "epoch": 2.5628930817610063, "percentage": 12.81, "elapsed_time": "0:12:22", "remaining_time": "1:24:13", "throughput": 4303.82, "total_tokens": 3196560} {"current_steps": 4895, "total_steps": 38160, "loss": 0.4698, "lr": 0.0009975710220035607, "epoch": 2.5655136268343814, "percentage": 12.83, "elapsed_time": "0:12:23", "remaining_time": "1:24:12", "throughput": 4303.88, "total_tokens": 3199600} {"current_steps": 4900, "total_steps": 38160, "loss": 0.4223, "lr": 0.0009975484559590444, "epoch": 2.568134171907757, "percentage": 12.84, "elapsed_time": "0:12:24", "remaining_time": "1:24:11", "throughput": 4304.57, "total_tokens": 3203600} {"current_steps": 4905, "total_steps": 38160, "loss": 0.5089, "lr": 0.0009975257858330674, "epoch": 2.5707547169811322, "percentage": 12.85, "elapsed_time": "0:12:25", "remaining_time": "1:24:11", "throughput": 4305.46, "total_tokens": 3207984} {"current_steps": 4910, "total_steps": 38160, "loss": 0.4094, "lr": 0.0009975030116303723, "epoch": 2.5733752620545074, "percentage": 12.87, "elapsed_time": "0:12:25", "remaining_time": "1:24:10", "throughput": 4305.84, "total_tokens": 3211504} {"current_steps": 4915, "total_steps": 38160, "loss": 0.4765, "lr": 0.0009974801333557228, "epoch": 2.5759958071278826, "percentage": 12.88, "elapsed_time": "0:12:26", "remaining_time": "1:24:09", "throughput": 4305.86, "total_tokens": 3214608} {"current_steps": 4920, "total_steps": 38160, "loss": 0.6418, "lr": 0.000997457151013905, "epoch": 2.5786163522012577, "percentage": 12.89, "elapsed_time": "0:12:27", "remaining_time": "1:24:08", "throughput": 4305.92, "total_tokens": 3217616} {"current_steps": 4925, "total_steps": 38160, "loss": 0.6092, "lr": 0.0009974340646097264, "epoch": 2.581236897274633, "percentage": 12.91, "elapsed_time": "0:12:28", "remaining_time": "1:24:08", "throughput": 4306.41, "total_tokens": 3221488} {"current_steps": 4930, "total_steps": 38160, "loss": 0.5225, "lr": 0.0009974108741480166, "epoch": 2.5838574423480085, "percentage": 12.92, "elapsed_time": "0:12:28", "remaining_time": "1:24:06", "throughput": 4306.41, "total_tokens": 3224400} {"current_steps": 4935, "total_steps": 38160, "loss": 0.5521, "lr": 0.0009973875796336267, "epoch": 2.5864779874213837, "percentage": 12.93, "elapsed_time": "0:12:29", "remaining_time": "1:24:05", "throughput": 4306.43, "total_tokens": 3227408} {"current_steps": 4940, "total_steps": 38160, "loss": 0.362, "lr": 0.0009973641810714295, "epoch": 2.589098532494759, "percentage": 12.95, "elapsed_time": "0:12:30", "remaining_time": "1:24:04", "throughput": 4306.63, "total_tokens": 3230704} {"current_steps": 4945, "total_steps": 38160, "loss": 0.4147, "lr": 0.00099734067846632, "epoch": 2.591719077568134, "percentage": 12.96, "elapsed_time": "0:12:30", "remaining_time": "1:24:03", "throughput": 4306.33, "total_tokens": 3233200} {"current_steps": 4950, "total_steps": 38160, "loss": 0.3913, "lr": 0.0009973170718232144, "epoch": 2.5943396226415096, "percentage": 12.97, "elapsed_time": "0:12:31", "remaining_time": "1:24:02", "throughput": 4306.48, "total_tokens": 3236400} {"current_steps": 4955, "total_steps": 38160, "loss": 0.3778, "lr": 0.000997293361147051, "epoch": 2.596960167714885, "percentage": 12.98, "elapsed_time": "0:12:32", "remaining_time": "1:24:00", "throughput": 4306.34, "total_tokens": 3239216} {"current_steps": 4960, "total_steps": 38160, "loss": 0.3569, "lr": 0.0009972695464427904, "epoch": 2.59958071278826, "percentage": 13.0, "elapsed_time": "0:12:32", "remaining_time": "1:23:59", "throughput": 4306.07, "total_tokens": 3241712} {"current_steps": 4965, "total_steps": 38160, "loss": 0.4503, "lr": 0.0009972456277154134, "epoch": 2.602201257861635, "percentage": 13.01, "elapsed_time": "0:12:33", "remaining_time": "1:23:57", "throughput": 4306.12, "total_tokens": 3244784} {"current_steps": 4970, "total_steps": 38160, "loss": 0.5215, "lr": 0.000997221604969924, "epoch": 2.6048218029350103, "percentage": 13.02, "elapsed_time": "0:12:34", "remaining_time": "1:23:56", "throughput": 4306.01, "total_tokens": 3247568} {"current_steps": 4975, "total_steps": 38160, "loss": 0.5244, "lr": 0.0009971974782113475, "epoch": 2.6074423480083855, "percentage": 13.04, "elapsed_time": "0:12:34", "remaining_time": "1:23:55", "throughput": 4306.41, "total_tokens": 3251248} {"current_steps": 4980, "total_steps": 38160, "loss": 0.5686, "lr": 0.0009971732474447308, "epoch": 2.610062893081761, "percentage": 13.05, "elapsed_time": "0:12:35", "remaining_time": "1:23:54", "throughput": 4306.43, "total_tokens": 3254224} {"current_steps": 4985, "total_steps": 38160, "loss": 0.4843, "lr": 0.0009971489126751427, "epoch": 2.6126834381551363, "percentage": 13.06, "elapsed_time": "0:12:36", "remaining_time": "1:23:53", "throughput": 4306.47, "total_tokens": 3257200} {"current_steps": 4990, "total_steps": 38160, "loss": 0.6243, "lr": 0.0009971244739076742, "epoch": 2.6153039832285114, "percentage": 13.08, "elapsed_time": "0:12:37", "remaining_time": "1:23:52", "throughput": 4306.34, "total_tokens": 3260080} {"current_steps": 4995, "total_steps": 38160, "loss": 0.6038, "lr": 0.000997099931147437, "epoch": 2.617924528301887, "percentage": 13.09, "elapsed_time": "0:12:37", "remaining_time": "1:23:51", "throughput": 4306.32, "total_tokens": 3262992} {"current_steps": 5000, "total_steps": 38160, "loss": 0.5652, "lr": 0.0009970752843995654, "epoch": 2.620545073375262, "percentage": 13.1, "elapsed_time": "0:12:38", "remaining_time": "1:23:49", "throughput": 4306.29, "total_tokens": 3265872} {"current_steps": 5005, "total_steps": 38160, "loss": 0.5951, "lr": 0.0009970505336692153, "epoch": 2.6231656184486374, "percentage": 13.12, "elapsed_time": "0:12:39", "remaining_time": "1:23:48", "throughput": 4306.43, "total_tokens": 3269040} {"current_steps": 5010, "total_steps": 38160, "loss": 0.4367, "lr": 0.0009970256789615642, "epoch": 2.6257861635220126, "percentage": 13.13, "elapsed_time": "0:12:39", "remaining_time": "1:23:47", "throughput": 4306.29, "total_tokens": 3271760} {"current_steps": 5015, "total_steps": 38160, "loss": 0.4973, "lr": 0.0009970007202818115, "epoch": 2.6284067085953877, "percentage": 13.14, "elapsed_time": "0:12:40", "remaining_time": "1:23:45", "throughput": 4305.99, "total_tokens": 3274224} {"current_steps": 5020, "total_steps": 38160, "loss": 0.6117, "lr": 0.000996975657635178, "epoch": 2.631027253668763, "percentage": 13.16, "elapsed_time": "0:12:41", "remaining_time": "1:23:44", "throughput": 4306.09, "total_tokens": 3277392} {"current_steps": 5025, "total_steps": 38160, "loss": 0.447, "lr": 0.000996950491026907, "epoch": 2.6336477987421385, "percentage": 13.17, "elapsed_time": "0:12:41", "remaining_time": "1:23:43", "throughput": 4306.06, "total_tokens": 3280240} {"current_steps": 5030, "total_steps": 38160, "loss": 0.4833, "lr": 0.0009969252204622624, "epoch": 2.6362683438155137, "percentage": 13.18, "elapsed_time": "0:12:42", "remaining_time": "1:23:41", "throughput": 4305.86, "total_tokens": 3282864} {"current_steps": 5035, "total_steps": 38160, "loss": 0.5112, "lr": 0.0009968998459465312, "epoch": 2.638888888888889, "percentage": 13.19, "elapsed_time": "0:12:43", "remaining_time": "1:23:40", "throughput": 4306.03, "total_tokens": 3286064} {"current_steps": 5040, "total_steps": 38160, "loss": 0.6345, "lr": 0.0009968743674850212, "epoch": 2.641509433962264, "percentage": 13.21, "elapsed_time": "0:12:43", "remaining_time": "1:23:39", "throughput": 4305.79, "total_tokens": 3288656} {"current_steps": 5045, "total_steps": 38160, "loss": 0.5671, "lr": 0.0009968487850830622, "epoch": 2.6441299790356396, "percentage": 13.22, "elapsed_time": "0:12:44", "remaining_time": "1:23:38", "throughput": 4306.19, "total_tokens": 3292304} {"current_steps": 5050, "total_steps": 38160, "loss": 0.5992, "lr": 0.0009968230987460055, "epoch": 2.646750524109015, "percentage": 13.23, "elapsed_time": "0:12:45", "remaining_time": "1:23:37", "throughput": 4306.37, "total_tokens": 3295632} {"current_steps": 5055, "total_steps": 38160, "loss": 0.5681, "lr": 0.0009967973084792246, "epoch": 2.64937106918239, "percentage": 13.25, "elapsed_time": "0:12:45", "remaining_time": "1:23:36", "throughput": 4306.31, "total_tokens": 3298608} {"current_steps": 5060, "total_steps": 38160, "loss": 0.5484, "lr": 0.0009967714142881145, "epoch": 2.651991614255765, "percentage": 13.26, "elapsed_time": "0:12:46", "remaining_time": "1:23:35", "throughput": 4306.37, "total_tokens": 3301712} {"current_steps": 5065, "total_steps": 38160, "loss": 0.448, "lr": 0.0009967454161780923, "epoch": 2.6546121593291403, "percentage": 13.27, "elapsed_time": "0:12:47", "remaining_time": "1:23:34", "throughput": 4306.15, "total_tokens": 3304400} {"current_steps": 5070, "total_steps": 38160, "loss": 0.4396, "lr": 0.000996719314154596, "epoch": 2.6572327044025155, "percentage": 13.29, "elapsed_time": "0:12:47", "remaining_time": "1:23:32", "throughput": 4305.75, "total_tokens": 3306704} {"current_steps": 5075, "total_steps": 38160, "loss": 0.4755, "lr": 0.0009966931082230862, "epoch": 2.659853249475891, "percentage": 13.3, "elapsed_time": "0:12:48", "remaining_time": "1:23:31", "throughput": 4306.45, "total_tokens": 3310800} {"current_steps": 5080, "total_steps": 38160, "loss": 0.6228, "lr": 0.0009966667983890445, "epoch": 2.6624737945492662, "percentage": 13.31, "elapsed_time": "0:12:49", "remaining_time": "1:23:31", "throughput": 4307.12, "total_tokens": 3314768} {"current_steps": 5085, "total_steps": 38160, "loss": 0.4577, "lr": 0.000996640384657975, "epoch": 2.6650943396226414, "percentage": 13.33, "elapsed_time": "0:12:50", "remaining_time": "1:23:31", "throughput": 4307.75, "total_tokens": 3318768} {"current_steps": 5090, "total_steps": 38160, "loss": 0.4976, "lr": 0.0009966138670354028, "epoch": 2.667714884696017, "percentage": 13.34, "elapsed_time": "0:12:51", "remaining_time": "1:23:29", "throughput": 4307.84, "total_tokens": 3321808} {"current_steps": 5095, "total_steps": 38160, "loss": 0.5636, "lr": 0.0009965872455268755, "epoch": 2.670335429769392, "percentage": 13.35, "elapsed_time": "0:12:51", "remaining_time": "1:23:29", "throughput": 4308.48, "total_tokens": 3325904} {"current_steps": 5100, "total_steps": 38160, "loss": 0.479, "lr": 0.0009965605201379616, "epoch": 2.6729559748427674, "percentage": 13.36, "elapsed_time": "0:12:52", "remaining_time": "1:23:28", "throughput": 4308.55, "total_tokens": 3329008} {"current_steps": 5105, "total_steps": 38160, "loss": 0.5476, "lr": 0.000996533690874252, "epoch": 2.6755765199161425, "percentage": 13.38, "elapsed_time": "0:12:53", "remaining_time": "1:23:28", "throughput": 4309.16, "total_tokens": 3333008} {"current_steps": 5110, "total_steps": 38160, "loss": 0.4662, "lr": 0.0009965067577413593, "epoch": 2.6781970649895177, "percentage": 13.39, "elapsed_time": "0:12:54", "remaining_time": "1:23:26", "throughput": 4309.06, "total_tokens": 3335760} {"current_steps": 5115, "total_steps": 38160, "loss": 0.5788, "lr": 0.0009964797207449173, "epoch": 2.680817610062893, "percentage": 13.4, "elapsed_time": "0:12:54", "remaining_time": "1:23:25", "throughput": 4309.27, "total_tokens": 3339056} {"current_steps": 5120, "total_steps": 38160, "loss": 0.4803, "lr": 0.0009964525798905816, "epoch": 2.6834381551362685, "percentage": 13.42, "elapsed_time": "0:12:55", "remaining_time": "1:23:24", "throughput": 4309.29, "total_tokens": 3342064} {"current_steps": 5125, "total_steps": 38160, "loss": 0.5676, "lr": 0.0009964253351840303, "epoch": 2.6860587002096437, "percentage": 13.43, "elapsed_time": "0:12:56", "remaining_time": "1:23:23", "throughput": 4309.19, "total_tokens": 3344880} {"current_steps": 5130, "total_steps": 38160, "loss": 0.481, "lr": 0.000996397986630962, "epoch": 2.688679245283019, "percentage": 13.44, "elapsed_time": "0:12:56", "remaining_time": "1:23:22", "throughput": 4309.23, "total_tokens": 3347984} {"current_steps": 5135, "total_steps": 38160, "loss": 0.4639, "lr": 0.0009963705342370982, "epoch": 2.691299790356394, "percentage": 13.46, "elapsed_time": "0:12:57", "remaining_time": "1:23:21", "throughput": 4309.56, "total_tokens": 3351536} {"current_steps": 5140, "total_steps": 38160, "loss": 0.3976, "lr": 0.000996342978008182, "epoch": 2.6939203354297696, "percentage": 13.47, "elapsed_time": "0:12:58", "remaining_time": "1:23:20", "throughput": 4309.37, "total_tokens": 3354160} {"current_steps": 5145, "total_steps": 38160, "loss": 0.5743, "lr": 0.000996315317949977, "epoch": 2.6965408805031448, "percentage": 13.48, "elapsed_time": "0:12:58", "remaining_time": "1:23:18", "throughput": 4309.27, "total_tokens": 3356912} {"current_steps": 5150, "total_steps": 38160, "loss": 0.5229, "lr": 0.0009962875540682696, "epoch": 2.69916142557652, "percentage": 13.5, "elapsed_time": "0:12:59", "remaining_time": "1:23:17", "throughput": 4309.28, "total_tokens": 3359984} {"current_steps": 5155, "total_steps": 38160, "loss": 0.4231, "lr": 0.0009962596863688682, "epoch": 2.701781970649895, "percentage": 13.51, "elapsed_time": "0:13:00", "remaining_time": "1:23:16", "throughput": 4309.3, "total_tokens": 3363024} {"current_steps": 5160, "total_steps": 38160, "loss": 0.3899, "lr": 0.000996231714857602, "epoch": 2.7044025157232703, "percentage": 13.52, "elapsed_time": "0:13:01", "remaining_time": "1:23:15", "throughput": 4309.49, "total_tokens": 3366288} {"current_steps": 5165, "total_steps": 38160, "loss": 0.4067, "lr": 0.000996203639540322, "epoch": 2.7070230607966455, "percentage": 13.54, "elapsed_time": "0:13:01", "remaining_time": "1:23:14", "throughput": 4309.4, "total_tokens": 3369104} {"current_steps": 5170, "total_steps": 38160, "loss": 0.4851, "lr": 0.0009961754604229018, "epoch": 2.709643605870021, "percentage": 13.55, "elapsed_time": "0:13:02", "remaining_time": "1:23:13", "throughput": 4309.52, "total_tokens": 3372304} {"current_steps": 5175, "total_steps": 38160, "loss": 0.4375, "lr": 0.0009961471775112361, "epoch": 2.7122641509433962, "percentage": 13.56, "elapsed_time": "0:13:03", "remaining_time": "1:23:12", "throughput": 4309.43, "total_tokens": 3375152} {"current_steps": 5180, "total_steps": 38160, "loss": 0.5582, "lr": 0.000996118790811241, "epoch": 2.7148846960167714, "percentage": 13.57, "elapsed_time": "0:13:03", "remaining_time": "1:23:10", "throughput": 4309.29, "total_tokens": 3377904} {"current_steps": 5185, "total_steps": 38160, "loss": 0.498, "lr": 0.0009960903003288551, "epoch": 2.717505241090147, "percentage": 13.59, "elapsed_time": "0:13:04", "remaining_time": "1:23:10", "throughput": 4309.71, "total_tokens": 3381552} {"current_steps": 5190, "total_steps": 38160, "loss": 0.5425, "lr": 0.0009960617060700378, "epoch": 2.720125786163522, "percentage": 13.6, "elapsed_time": "0:13:05", "remaining_time": "1:23:08", "throughput": 4309.58, "total_tokens": 3384368} {"current_steps": 5195, "total_steps": 38160, "loss": 0.2774, "lr": 0.000996033008040771, "epoch": 2.7227463312368974, "percentage": 13.61, "elapsed_time": "0:13:05", "remaining_time": "1:23:07", "throughput": 4309.36, "total_tokens": 3387024} {"current_steps": 5200, "total_steps": 38160, "loss": 0.5178, "lr": 0.0009960042062470583, "epoch": 2.7253668763102725, "percentage": 13.63, "elapsed_time": "0:13:06", "remaining_time": "1:23:06", "throughput": 4309.24, "total_tokens": 3389808} {"current_steps": 5205, "total_steps": 38160, "loss": 0.4899, "lr": 0.0009959753006949241, "epoch": 2.7279874213836477, "percentage": 13.64, "elapsed_time": "0:13:07", "remaining_time": "1:23:05", "throughput": 4310.05, "total_tokens": 3394160} {"current_steps": 5210, "total_steps": 38160, "loss": 0.6445, "lr": 0.0009959462913904154, "epoch": 2.730607966457023, "percentage": 13.65, "elapsed_time": "0:13:08", "remaining_time": "1:23:06", "throughput": 4311.57, "total_tokens": 3399664} {"current_steps": 5215, "total_steps": 38160, "loss": 0.5905, "lr": 0.0009959171783396007, "epoch": 2.7332285115303985, "percentage": 13.67, "elapsed_time": "0:13:09", "remaining_time": "1:23:06", "throughput": 4312.02, "total_tokens": 3403472} {"current_steps": 5220, "total_steps": 38160, "loss": 0.3945, "lr": 0.00099588796154857, "epoch": 2.7358490566037736, "percentage": 13.68, "elapsed_time": "0:13:09", "remaining_time": "1:23:05", "throughput": 4311.98, "total_tokens": 3406384} {"current_steps": 5225, "total_steps": 38160, "loss": 0.3777, "lr": 0.000995858641023435, "epoch": 2.738469601677149, "percentage": 13.69, "elapsed_time": "0:13:10", "remaining_time": "1:23:04", "throughput": 4312.09, "total_tokens": 3409584} {"current_steps": 5230, "total_steps": 38160, "loss": 0.4421, "lr": 0.0009958292167703293, "epoch": 2.741090146750524, "percentage": 13.71, "elapsed_time": "0:13:11", "remaining_time": "1:23:05", "throughput": 4313.48, "total_tokens": 3415152} {"current_steps": 5235, "total_steps": 38160, "loss": 0.3799, "lr": 0.0009957996887954082, "epoch": 2.7437106918238996, "percentage": 13.72, "elapsed_time": "0:13:12", "remaining_time": "1:23:04", "throughput": 4313.73, "total_tokens": 3418576} {"current_steps": 5240, "total_steps": 38160, "loss": 0.4556, "lr": 0.0009957700571048486, "epoch": 2.7463312368972748, "percentage": 13.73, "elapsed_time": "0:13:13", "remaining_time": "1:23:03", "throughput": 4313.97, "total_tokens": 3421904} {"current_steps": 5245, "total_steps": 38160, "loss": 0.5407, "lr": 0.0009957403217048493, "epoch": 2.74895178197065, "percentage": 13.74, "elapsed_time": "0:13:13", "remaining_time": "1:23:02", "throughput": 4314.36, "total_tokens": 3425584} {"current_steps": 5250, "total_steps": 38160, "loss": 0.4845, "lr": 0.0009957104826016302, "epoch": 2.751572327044025, "percentage": 13.76, "elapsed_time": "0:13:14", "remaining_time": "1:23:02", "throughput": 4314.88, "total_tokens": 3429488} {"current_steps": 5255, "total_steps": 38160, "loss": 0.5401, "lr": 0.0009956805398014337, "epoch": 2.7541928721174003, "percentage": 13.77, "elapsed_time": "0:13:15", "remaining_time": "1:23:01", "throughput": 4315.16, "total_tokens": 3433040} {"current_steps": 5260, "total_steps": 38160, "loss": 0.4936, "lr": 0.0009956504933105231, "epoch": 2.7568134171907754, "percentage": 13.78, "elapsed_time": "0:13:16", "remaining_time": "1:23:00", "throughput": 4315.45, "total_tokens": 3436464} {"current_steps": 5265, "total_steps": 38160, "loss": 0.3724, "lr": 0.000995620343135184, "epoch": 2.759433962264151, "percentage": 13.8, "elapsed_time": "0:13:16", "remaining_time": "1:22:59", "throughput": 4315.19, "total_tokens": 3438960} {"current_steps": 5270, "total_steps": 38160, "loss": 0.6373, "lr": 0.0009955900892817235, "epoch": 2.762054507337526, "percentage": 13.81, "elapsed_time": "0:13:17", "remaining_time": "1:22:58", "throughput": 4315.46, "total_tokens": 3442416} {"current_steps": 5275, "total_steps": 38160, "loss": 0.5784, "lr": 0.0009955597317564703, "epoch": 2.7646750524109014, "percentage": 13.82, "elapsed_time": "0:13:18", "remaining_time": "1:22:57", "throughput": 4315.83, "total_tokens": 3446128} {"current_steps": 5280, "total_steps": 38160, "loss": 0.5285, "lr": 0.0009955292705657749, "epoch": 2.767295597484277, "percentage": 13.84, "elapsed_time": "0:13:19", "remaining_time": "1:22:56", "throughput": 4315.85, "total_tokens": 3449168} {"current_steps": 5285, "total_steps": 38160, "loss": 0.6107, "lr": 0.0009954987057160093, "epoch": 2.769916142557652, "percentage": 13.85, "elapsed_time": "0:13:19", "remaining_time": "1:22:55", "throughput": 4316.06, "total_tokens": 3452592} {"current_steps": 5290, "total_steps": 38160, "loss": 0.5164, "lr": 0.0009954680372135675, "epoch": 2.7725366876310273, "percentage": 13.86, "elapsed_time": "0:13:20", "remaining_time": "1:22:54", "throughput": 4315.76, "total_tokens": 3455184} {"current_steps": 5295, "total_steps": 38160, "loss": 0.3225, "lr": 0.000995437265064865, "epoch": 2.7751572327044025, "percentage": 13.88, "elapsed_time": "0:13:21", "remaining_time": "1:22:53", "throughput": 4315.64, "total_tokens": 3457968} {"current_steps": 5300, "total_steps": 38160, "loss": 0.4692, "lr": 0.0009954063892763387, "epoch": 2.7777777777777777, "percentage": 13.89, "elapsed_time": "0:13:21", "remaining_time": "1:22:51", "throughput": 4315.3, "total_tokens": 3460400} {"current_steps": 5305, "total_steps": 38160, "loss": 0.5228, "lr": 0.0009953754098544479, "epoch": 2.780398322851153, "percentage": 13.9, "elapsed_time": "0:13:22", "remaining_time": "1:22:50", "throughput": 4315.34, "total_tokens": 3463376} {"current_steps": 5310, "total_steps": 38160, "loss": 0.7371, "lr": 0.0009953443268056726, "epoch": 2.7830188679245285, "percentage": 13.92, "elapsed_time": "0:13:23", "remaining_time": "1:22:48", "throughput": 4315.12, "total_tokens": 3465936} {"current_steps": 5315, "total_steps": 38160, "loss": 0.5647, "lr": 0.0009953131401365155, "epoch": 2.7856394129979036, "percentage": 13.93, "elapsed_time": "0:13:23", "remaining_time": "1:22:47", "throughput": 4315.12, "total_tokens": 3468912} {"current_steps": 5320, "total_steps": 38160, "loss": 0.4236, "lr": 0.0009952818498535003, "epoch": 2.788259958071279, "percentage": 13.94, "elapsed_time": "0:13:24", "remaining_time": "1:22:47", "throughput": 4315.91, "total_tokens": 3473200} {"current_steps": 5325, "total_steps": 38160, "loss": 0.6316, "lr": 0.0009952504559631726, "epoch": 2.790880503144654, "percentage": 13.95, "elapsed_time": "0:13:25", "remaining_time": "1:22:46", "throughput": 4315.82, "total_tokens": 3476048} {"current_steps": 5330, "total_steps": 38160, "loss": 0.4607, "lr": 0.0009952189584720996, "epoch": 2.7935010482180296, "percentage": 13.97, "elapsed_time": "0:13:26", "remaining_time": "1:22:45", "throughput": 4315.96, "total_tokens": 3479312} {"current_steps": 5335, "total_steps": 38160, "loss": 0.5973, "lr": 0.0009951873573868701, "epoch": 2.7961215932914047, "percentage": 13.98, "elapsed_time": "0:13:27", "remaining_time": "1:22:45", "throughput": 4316.76, "total_tokens": 3483792} {"current_steps": 5340, "total_steps": 38160, "loss": 0.4523, "lr": 0.000995155652714095, "epoch": 2.79874213836478, "percentage": 13.99, "elapsed_time": "0:13:27", "remaining_time": "1:22:44", "throughput": 4317.05, "total_tokens": 3487408} {"current_steps": 5345, "total_steps": 38160, "loss": 0.3841, "lr": 0.0009951238444604064, "epoch": 2.801362683438155, "percentage": 14.01, "elapsed_time": "0:13:28", "remaining_time": "1:22:44", "throughput": 4317.18, "total_tokens": 3490672} {"current_steps": 5350, "total_steps": 38160, "loss": 0.4535, "lr": 0.000995091932632458, "epoch": 2.8039832285115303, "percentage": 14.02, "elapsed_time": "0:13:29", "remaining_time": "1:22:43", "throughput": 4317.59, "total_tokens": 3494320} {"current_steps": 5355, "total_steps": 38160, "loss": 0.4158, "lr": 0.000995059917236926, "epoch": 2.8066037735849054, "percentage": 14.03, "elapsed_time": "0:13:30", "remaining_time": "1:22:42", "throughput": 4318.09, "total_tokens": 3498256} {"current_steps": 5360, "total_steps": 38160, "loss": 0.5655, "lr": 0.000995027798280507, "epoch": 2.809224318658281, "percentage": 14.05, "elapsed_time": "0:13:30", "remaining_time": "1:22:41", "throughput": 4317.93, "total_tokens": 3500944} {"current_steps": 5365, "total_steps": 38160, "loss": 0.4895, "lr": 0.00099499557576992, "epoch": 2.811844863731656, "percentage": 14.06, "elapsed_time": "0:13:31", "remaining_time": "1:22:40", "throughput": 4318.45, "total_tokens": 3504752} {"current_steps": 5370, "total_steps": 38160, "loss": 0.4509, "lr": 0.000994963249711906, "epoch": 2.8144654088050314, "percentage": 14.07, "elapsed_time": "0:13:32", "remaining_time": "1:22:39", "throughput": 4318.49, "total_tokens": 3507824} {"current_steps": 5375, "total_steps": 38160, "loss": 0.4701, "lr": 0.000994930820113227, "epoch": 2.8170859538784065, "percentage": 14.09, "elapsed_time": "0:13:32", "remaining_time": "1:22:38", "throughput": 4318.49, "total_tokens": 3510800} {"current_steps": 5380, "total_steps": 38160, "loss": 0.3768, "lr": 0.0009948982869806668, "epoch": 2.819706498951782, "percentage": 14.1, "elapsed_time": "0:13:33", "remaining_time": "1:22:37", "throughput": 4318.45, "total_tokens": 3513808} {"current_steps": 5385, "total_steps": 38160, "loss": 0.5427, "lr": 0.0009948656503210311, "epoch": 2.8223270440251573, "percentage": 14.11, "elapsed_time": "0:13:34", "remaining_time": "1:22:36", "throughput": 4318.71, "total_tokens": 3517232} {"current_steps": 5390, "total_steps": 38160, "loss": 0.4081, "lr": 0.000994832910141147, "epoch": 2.8249475890985325, "percentage": 14.12, "elapsed_time": "0:13:35", "remaining_time": "1:22:35", "throughput": 4318.6, "total_tokens": 3520016} {"current_steps": 5395, "total_steps": 38160, "loss": 0.4302, "lr": 0.0009948000664478638, "epoch": 2.8275681341719077, "percentage": 14.14, "elapsed_time": "0:13:35", "remaining_time": "1:22:34", "throughput": 4318.51, "total_tokens": 3522992} {"current_steps": 5400, "total_steps": 38160, "loss": 0.3908, "lr": 0.0009947671192480515, "epoch": 2.830188679245283, "percentage": 14.15, "elapsed_time": "0:13:36", "remaining_time": "1:22:33", "throughput": 4318.77, "total_tokens": 3526384} {"current_steps": 5405, "total_steps": 38160, "loss": 0.5218, "lr": 0.0009947340685486023, "epoch": 2.832809224318658, "percentage": 14.16, "elapsed_time": "0:13:37", "remaining_time": "1:22:32", "throughput": 4319.04, "total_tokens": 3529840} {"current_steps": 5410, "total_steps": 38160, "loss": 0.4325, "lr": 0.0009947009143564303, "epoch": 2.8354297693920336, "percentage": 14.18, "elapsed_time": "0:13:37", "remaining_time": "1:22:31", "throughput": 4318.9, "total_tokens": 3532592} {"current_steps": 5415, "total_steps": 38160, "loss": 0.4117, "lr": 0.0009946676566784708, "epoch": 2.838050314465409, "percentage": 14.19, "elapsed_time": "0:13:38", "remaining_time": "1:22:30", "throughput": 4318.87, "total_tokens": 3535472} {"current_steps": 5420, "total_steps": 38160, "loss": 0.5141, "lr": 0.000994634295521681, "epoch": 2.840670859538784, "percentage": 14.2, "elapsed_time": "0:13:39", "remaining_time": "1:22:28", "throughput": 4318.57, "total_tokens": 3538000} {"current_steps": 5425, "total_steps": 38160, "loss": 0.439, "lr": 0.0009946008308930397, "epoch": 2.8432914046121596, "percentage": 14.22, "elapsed_time": "0:13:39", "remaining_time": "1:22:27", "throughput": 4318.74, "total_tokens": 3541296} {"current_steps": 5430, "total_steps": 38160, "loss": 0.6249, "lr": 0.0009945672627995473, "epoch": 2.8459119496855347, "percentage": 14.23, "elapsed_time": "0:13:40", "remaining_time": "1:22:26", "throughput": 4318.64, "total_tokens": 3544208} {"current_steps": 5435, "total_steps": 38160, "loss": 0.4491, "lr": 0.0009945335912482256, "epoch": 2.84853249475891, "percentage": 14.24, "elapsed_time": "0:13:41", "remaining_time": "1:22:25", "throughput": 4318.71, "total_tokens": 3547376} {"current_steps": 5440, "total_steps": 38160, "loss": 0.4757, "lr": 0.000994499816246119, "epoch": 2.851153039832285, "percentage": 14.26, "elapsed_time": "0:13:42", "remaining_time": "1:22:24", "throughput": 4318.84, "total_tokens": 3550608} {"current_steps": 5445, "total_steps": 38160, "loss": 0.5574, "lr": 0.000994465937800292, "epoch": 2.8537735849056602, "percentage": 14.27, "elapsed_time": "0:13:42", "remaining_time": "1:22:23", "throughput": 4318.93, "total_tokens": 3553744} {"current_steps": 5450, "total_steps": 38160, "loss": 0.3776, "lr": 0.0009944319559178321, "epoch": 2.8563941299790354, "percentage": 14.28, "elapsed_time": "0:13:43", "remaining_time": "1:22:22", "throughput": 4318.96, "total_tokens": 3556816} {"current_steps": 5455, "total_steps": 38160, "loss": 0.4782, "lr": 0.0009943978706058478, "epoch": 2.859014675052411, "percentage": 14.3, "elapsed_time": "0:13:44", "remaining_time": "1:22:21", "throughput": 4319.11, "total_tokens": 3560080} {"current_steps": 5460, "total_steps": 38160, "loss": 0.4583, "lr": 0.0009943636818714695, "epoch": 2.861635220125786, "percentage": 14.31, "elapsed_time": "0:13:44", "remaining_time": "1:22:20", "throughput": 4318.79, "total_tokens": 3562544} {"current_steps": 5465, "total_steps": 38160, "loss": 0.4669, "lr": 0.0009943293897218487, "epoch": 2.8642557651991614, "percentage": 14.32, "elapsed_time": "0:13:45", "remaining_time": "1:22:18", "throughput": 4318.61, "total_tokens": 3565264} {"current_steps": 5470, "total_steps": 38160, "loss": 0.6349, "lr": 0.0009942949941641594, "epoch": 2.8668763102725365, "percentage": 14.33, "elapsed_time": "0:13:46", "remaining_time": "1:22:17", "throughput": 4318.44, "total_tokens": 3567888} {"current_steps": 5475, "total_steps": 38160, "loss": 0.603, "lr": 0.0009942604952055964, "epoch": 2.869496855345912, "percentage": 14.35, "elapsed_time": "0:13:46", "remaining_time": "1:22:16", "throughput": 4318.67, "total_tokens": 3571440} {"current_steps": 5480, "total_steps": 38160, "loss": 0.5756, "lr": 0.0009942258928533768, "epoch": 2.8721174004192873, "percentage": 14.36, "elapsed_time": "0:13:47", "remaining_time": "1:22:15", "throughput": 4318.68, "total_tokens": 3574448} {"current_steps": 5485, "total_steps": 38160, "loss": 0.4981, "lr": 0.0009941911871147386, "epoch": 2.8747379454926625, "percentage": 14.37, "elapsed_time": "0:13:48", "remaining_time": "1:22:14", "throughput": 4318.68, "total_tokens": 3577488} {"current_steps": 5490, "total_steps": 38160, "loss": 0.3681, "lr": 0.000994156377996942, "epoch": 2.8773584905660377, "percentage": 14.39, "elapsed_time": "0:13:49", "remaining_time": "1:22:13", "throughput": 4318.63, "total_tokens": 3580432} {"current_steps": 5495, "total_steps": 38160, "loss": 0.5083, "lr": 0.0009941214655072692, "epoch": 2.879979035639413, "percentage": 14.4, "elapsed_time": "0:13:49", "remaining_time": "1:22:12", "throughput": 4318.66, "total_tokens": 3583504} {"current_steps": 5500, "total_steps": 38160, "loss": 0.531, "lr": 0.0009940864496530226, "epoch": 2.882599580712788, "percentage": 14.41, "elapsed_time": "0:13:50", "remaining_time": "1:22:11", "throughput": 4318.53, "total_tokens": 3586320} {"current_steps": 5505, "total_steps": 38160, "loss": 0.3922, "lr": 0.000994051330441528, "epoch": 2.8852201257861636, "percentage": 14.43, "elapsed_time": "0:13:51", "remaining_time": "1:22:10", "throughput": 4318.4, "total_tokens": 3589072} {"current_steps": 5510, "total_steps": 38160, "loss": 0.6579, "lr": 0.0009940161078801312, "epoch": 2.8878406708595388, "percentage": 14.44, "elapsed_time": "0:13:52", "remaining_time": "1:22:12", "throughput": 4320.77, "total_tokens": 3596944} {"current_steps": 5515, "total_steps": 38160, "loss": 0.5067, "lr": 0.0009939807819762008, "epoch": 2.890461215932914, "percentage": 14.45, "elapsed_time": "0:13:53", "remaining_time": "1:22:11", "throughput": 4320.84, "total_tokens": 3600080} {"current_steps": 5520, "total_steps": 38160, "loss": 0.4533, "lr": 0.0009939453527371262, "epoch": 2.8930817610062896, "percentage": 14.47, "elapsed_time": "0:13:53", "remaining_time": "1:22:11", "throughput": 4321.18, "total_tokens": 3603632} {"current_steps": 5525, "total_steps": 38160, "loss": 0.4969, "lr": 0.0009939098201703193, "epoch": 2.8957023060796647, "percentage": 14.48, "elapsed_time": "0:13:54", "remaining_time": "1:22:09", "throughput": 4320.76, "total_tokens": 3605936} {"current_steps": 5530, "total_steps": 38160, "loss": 0.4996, "lr": 0.0009938741842832129, "epoch": 2.89832285115304, "percentage": 14.49, "elapsed_time": "0:13:55", "remaining_time": "1:22:08", "throughput": 4321.09, "total_tokens": 3609488} {"current_steps": 5535, "total_steps": 38160, "loss": 0.4007, "lr": 0.0009938384450832614, "epoch": 2.900943396226415, "percentage": 14.5, "elapsed_time": "0:13:56", "remaining_time": "1:22:07", "throughput": 4321.07, "total_tokens": 3612464} {"current_steps": 5540, "total_steps": 38160, "loss": 0.6035, "lr": 0.0009938026025779411, "epoch": 2.9035639412997902, "percentage": 14.52, "elapsed_time": "0:13:56", "remaining_time": "1:22:06", "throughput": 4321.0, "total_tokens": 3615440} {"current_steps": 5545, "total_steps": 38160, "loss": 0.488, "lr": 0.0009937666567747501, "epoch": 2.9061844863731654, "percentage": 14.53, "elapsed_time": "0:13:57", "remaining_time": "1:22:06", "throughput": 4321.84, "total_tokens": 3619952} {"current_steps": 5550, "total_steps": 38160, "loss": 0.4611, "lr": 0.0009937306076812076, "epoch": 2.908805031446541, "percentage": 14.54, "elapsed_time": "0:13:58", "remaining_time": "1:22:06", "throughput": 4322.28, "total_tokens": 3623760} {"current_steps": 5555, "total_steps": 38160, "loss": 0.4114, "lr": 0.0009936944553048548, "epoch": 2.911425576519916, "percentage": 14.56, "elapsed_time": "0:13:59", "remaining_time": "1:22:05", "throughput": 4322.46, "total_tokens": 3627088} {"current_steps": 5560, "total_steps": 38160, "loss": 0.4281, "lr": 0.0009936581996532543, "epoch": 2.9140461215932913, "percentage": 14.57, "elapsed_time": "0:13:59", "remaining_time": "1:22:03", "throughput": 4322.19, "total_tokens": 3629520} {"current_steps": 5565, "total_steps": 38160, "loss": 0.3872, "lr": 0.0009936218407339905, "epoch": 2.9166666666666665, "percentage": 14.58, "elapsed_time": "0:14:00", "remaining_time": "1:22:03", "throughput": 4322.94, "total_tokens": 3634064} {"current_steps": 5570, "total_steps": 38160, "loss": 0.5239, "lr": 0.0009935853785546691, "epoch": 2.919287211740042, "percentage": 14.6, "elapsed_time": "0:14:01", "remaining_time": "1:22:02", "throughput": 4323.05, "total_tokens": 3637296} {"current_steps": 5575, "total_steps": 38160, "loss": 0.4583, "lr": 0.0009935488131229177, "epoch": 2.9219077568134173, "percentage": 14.61, "elapsed_time": "0:14:02", "remaining_time": "1:22:01", "throughput": 4323.09, "total_tokens": 3640400} {"current_steps": 5580, "total_steps": 38160, "loss": 0.565, "lr": 0.000993512144446385, "epoch": 2.9245283018867925, "percentage": 14.62, "elapsed_time": "0:14:02", "remaining_time": "1:22:00", "throughput": 4323.31, "total_tokens": 3643760} {"current_steps": 5585, "total_steps": 38160, "loss": 0.6571, "lr": 0.000993475372532742, "epoch": 2.9271488469601676, "percentage": 14.64, "elapsed_time": "0:14:03", "remaining_time": "1:21:59", "throughput": 4323.09, "total_tokens": 3646352} {"current_steps": 5590, "total_steps": 38160, "loss": 0.5216, "lr": 0.0009934384973896812, "epoch": 2.929769392033543, "percentage": 14.65, "elapsed_time": "0:14:04", "remaining_time": "1:21:58", "throughput": 4323.38, "total_tokens": 3649904} {"current_steps": 5595, "total_steps": 38160, "loss": 0.4579, "lr": 0.0009934015190249162, "epoch": 2.932389937106918, "percentage": 14.66, "elapsed_time": "0:14:04", "remaining_time": "1:21:57", "throughput": 4323.17, "total_tokens": 3652560} {"current_steps": 5600, "total_steps": 38160, "loss": 0.4959, "lr": 0.0009933644374461822, "epoch": 2.9350104821802936, "percentage": 14.68, "elapsed_time": "0:14:05", "remaining_time": "1:21:57", "throughput": 4323.58, "total_tokens": 3656400} {"current_steps": 5605, "total_steps": 38160, "loss": 0.4054, "lr": 0.0009933272526612366, "epoch": 2.9376310272536688, "percentage": 14.69, "elapsed_time": "0:14:06", "remaining_time": "1:21:56", "throughput": 4323.85, "total_tokens": 3659984} {"current_steps": 5610, "total_steps": 38160, "loss": 0.4256, "lr": 0.0009932899646778578, "epoch": 2.940251572327044, "percentage": 14.7, "elapsed_time": "0:14:07", "remaining_time": "1:21:55", "throughput": 4323.95, "total_tokens": 3663152} {"current_steps": 5615, "total_steps": 38160, "loss": 0.3975, "lr": 0.0009932525735038464, "epoch": 2.9428721174004195, "percentage": 14.71, "elapsed_time": "0:14:08", "remaining_time": "1:21:55", "throughput": 4324.66, "total_tokens": 3667472} {"current_steps": 5620, "total_steps": 38160, "loss": 0.5037, "lr": 0.0009932150791470238, "epoch": 2.9454926624737947, "percentage": 14.73, "elapsed_time": "0:14:08", "remaining_time": "1:21:54", "throughput": 4324.7, "total_tokens": 3670608} {"current_steps": 5625, "total_steps": 38160, "loss": 0.5797, "lr": 0.0009931774816152334, "epoch": 2.94811320754717, "percentage": 14.74, "elapsed_time": "0:14:09", "remaining_time": "1:21:53", "throughput": 4325.08, "total_tokens": 3674320} {"current_steps": 5630, "total_steps": 38160, "loss": 0.4136, "lr": 0.0009931397809163406, "epoch": 2.950733752620545, "percentage": 14.75, "elapsed_time": "0:14:10", "remaining_time": "1:21:52", "throughput": 4325.05, "total_tokens": 3677328} {"current_steps": 5635, "total_steps": 38160, "loss": 0.544, "lr": 0.0009931019770582316, "epoch": 2.95335429769392, "percentage": 14.77, "elapsed_time": "0:14:10", "remaining_time": "1:21:51", "throughput": 4324.66, "total_tokens": 3679664} {"current_steps": 5640, "total_steps": 38160, "loss": 0.5449, "lr": 0.0009930640700488143, "epoch": 2.9559748427672954, "percentage": 14.78, "elapsed_time": "0:14:11", "remaining_time": "1:21:50", "throughput": 4324.67, "total_tokens": 3682704} {"current_steps": 5645, "total_steps": 38160, "loss": 0.6005, "lr": 0.000993026059896019, "epoch": 2.958595387840671, "percentage": 14.79, "elapsed_time": "0:14:12", "remaining_time": "1:21:48", "throughput": 4324.23, "total_tokens": 3685008} {"current_steps": 5650, "total_steps": 38160, "loss": 0.7366, "lr": 0.0009929879466077968, "epoch": 2.961215932914046, "percentage": 14.81, "elapsed_time": "0:14:12", "remaining_time": "1:21:47", "throughput": 4324.36, "total_tokens": 3688240} {"current_steps": 5655, "total_steps": 38160, "loss": 0.4888, "lr": 0.0009929497301921202, "epoch": 2.9638364779874213, "percentage": 14.82, "elapsed_time": "0:14:13", "remaining_time": "1:21:46", "throughput": 4324.48, "total_tokens": 3691472} {"current_steps": 5660, "total_steps": 38160, "loss": 0.4314, "lr": 0.000992911410656984, "epoch": 2.9664570230607965, "percentage": 14.83, "elapsed_time": "0:14:14", "remaining_time": "1:21:45", "throughput": 4324.53, "total_tokens": 3694544} {"current_steps": 5665, "total_steps": 38160, "loss": 0.4824, "lr": 0.000992872988010404, "epoch": 2.969077568134172, "percentage": 14.85, "elapsed_time": "0:14:15", "remaining_time": "1:21:44", "throughput": 4324.75, "total_tokens": 3697968} {"current_steps": 5670, "total_steps": 38160, "loss": 0.4274, "lr": 0.0009928344622604183, "epoch": 2.9716981132075473, "percentage": 14.86, "elapsed_time": "0:14:15", "remaining_time": "1:21:43", "throughput": 4324.74, "total_tokens": 3700944} {"current_steps": 5675, "total_steps": 38160, "loss": 0.5182, "lr": 0.0009927958334150853, "epoch": 2.9743186582809225, "percentage": 14.87, "elapsed_time": "0:14:16", "remaining_time": "1:21:42", "throughput": 4324.87, "total_tokens": 3704176} {"current_steps": 5680, "total_steps": 38160, "loss": 0.5283, "lr": 0.0009927571014824862, "epoch": 2.9769392033542976, "percentage": 14.88, "elapsed_time": "0:14:17", "remaining_time": "1:21:42", "throughput": 4325.33, "total_tokens": 3708016} {"current_steps": 5685, "total_steps": 38160, "loss": 0.4161, "lr": 0.000992718266470723, "epoch": 2.979559748427673, "percentage": 14.9, "elapsed_time": "0:14:18", "remaining_time": "1:21:41", "throughput": 4325.41, "total_tokens": 3711216} {"current_steps": 5690, "total_steps": 38160, "loss": 0.467, "lr": 0.00099267932838792, "epoch": 2.982180293501048, "percentage": 14.91, "elapsed_time": "0:14:18", "remaining_time": "1:21:39", "throughput": 4325.3, "total_tokens": 3713968} {"current_steps": 5695, "total_steps": 38160, "loss": 0.4784, "lr": 0.000992640287242222, "epoch": 2.9848008385744236, "percentage": 14.92, "elapsed_time": "0:14:19", "remaining_time": "1:21:39", "throughput": 4325.58, "total_tokens": 3717520} {"current_steps": 5700, "total_steps": 38160, "loss": 0.4651, "lr": 0.0009926011430417961, "epoch": 2.9874213836477987, "percentage": 14.94, "elapsed_time": "0:14:20", "remaining_time": "1:21:38", "throughput": 4325.58, "total_tokens": 3720528} {"current_steps": 5705, "total_steps": 38160, "loss": 0.5212, "lr": 0.0009925618957948312, "epoch": 2.990041928721174, "percentage": 14.95, "elapsed_time": "0:14:20", "remaining_time": "1:21:36", "throughput": 4325.5, "total_tokens": 3723408} {"current_steps": 5710, "total_steps": 38160, "loss": 0.4938, "lr": 0.0009925225455095373, "epoch": 2.9926624737945495, "percentage": 14.96, "elapsed_time": "0:14:21", "remaining_time": "1:21:36", "throughput": 4325.96, "total_tokens": 3727152} {"current_steps": 5715, "total_steps": 38160, "loss": 0.4634, "lr": 0.0009924830921941455, "epoch": 2.9952830188679247, "percentage": 14.98, "elapsed_time": "0:14:22", "remaining_time": "1:21:35", "throughput": 4326.2, "total_tokens": 3730640} {"current_steps": 5720, "total_steps": 38160, "loss": 0.4514, "lr": 0.0009924435358569096, "epoch": 2.9979035639413, "percentage": 14.99, "elapsed_time": "0:14:23", "remaining_time": "1:21:34", "throughput": 4326.08, "total_tokens": 3733488} {"current_steps": 5724, "total_steps": 38160, "eval_loss": 0.4886251986026764, "epoch": 3.0, "percentage": 15.0, "elapsed_time": "0:14:37", "remaining_time": "1:22:53", "throughput": 4257.67, "total_tokens": 3736568} {"current_steps": 5725, "total_steps": 38160, "loss": 0.4706, "lr": 0.000992403876506104, "epoch": 3.000524109014675, "percentage": 15.0, "elapsed_time": "0:14:39", "remaining_time": "1:23:01", "throughput": 4250.16, "total_tokens": 3737048} {"current_steps": 5730, "total_steps": 38160, "loss": 0.4932, "lr": 0.000992364114150025, "epoch": 3.00314465408805, "percentage": 15.02, "elapsed_time": "0:14:39", "remaining_time": "1:23:00", "throughput": 4250.07, "total_tokens": 3739768} {"current_steps": 5735, "total_steps": 38160, "loss": 0.4214, "lr": 0.0009923242487969908, "epoch": 3.0057651991614254, "percentage": 15.03, "elapsed_time": "0:14:40", "remaining_time": "1:22:59", "throughput": 4250.29, "total_tokens": 3743032} {"current_steps": 5740, "total_steps": 38160, "loss": 0.5284, "lr": 0.0009922842804553403, "epoch": 3.008385744234801, "percentage": 15.04, "elapsed_time": "0:14:41", "remaining_time": "1:22:58", "throughput": 4250.67, "total_tokens": 3746744} {"current_steps": 5745, "total_steps": 38160, "loss": 0.4158, "lr": 0.0009922442091334345, "epoch": 3.011006289308176, "percentage": 15.06, "elapsed_time": "0:14:42", "remaining_time": "1:22:57", "throughput": 4250.44, "total_tokens": 3749272} {"current_steps": 5750, "total_steps": 38160, "loss": 0.5853, "lr": 0.0009922040348396561, "epoch": 3.0136268343815513, "percentage": 15.07, "elapsed_time": "0:14:42", "remaining_time": "1:22:56", "throughput": 4250.93, "total_tokens": 3753048} {"current_steps": 5755, "total_steps": 38160, "loss": 0.3777, "lr": 0.000992163757582409, "epoch": 3.0162473794549265, "percentage": 15.08, "elapsed_time": "0:14:43", "remaining_time": "1:22:54", "throughput": 4250.66, "total_tokens": 3755448} {"current_steps": 5760, "total_steps": 38160, "loss": 0.4742, "lr": 0.0009921233773701188, "epoch": 3.018867924528302, "percentage": 15.09, "elapsed_time": "0:14:44", "remaining_time": "1:22:53", "throughput": 4250.72, "total_tokens": 3758424} {"current_steps": 5765, "total_steps": 38160, "loss": 0.4369, "lr": 0.0009920828942112322, "epoch": 3.0214884696016773, "percentage": 15.11, "elapsed_time": "0:14:45", "remaining_time": "1:22:53", "throughput": 4251.39, "total_tokens": 3762552} {"current_steps": 5770, "total_steps": 38160, "loss": 0.4658, "lr": 0.0009920423081142184, "epoch": 3.0241090146750524, "percentage": 15.12, "elapsed_time": "0:14:45", "remaining_time": "1:22:51", "throughput": 4251.11, "total_tokens": 3764920} {"current_steps": 5775, "total_steps": 38160, "loss": 0.4831, "lr": 0.0009920016190875672, "epoch": 3.0267295597484276, "percentage": 15.13, "elapsed_time": "0:14:46", "remaining_time": "1:22:50", "throughput": 4251.28, "total_tokens": 3768056} {"current_steps": 5780, "total_steps": 38160, "loss": 0.5044, "lr": 0.00099196082713979, "epoch": 3.029350104821803, "percentage": 15.15, "elapsed_time": "0:14:47", "remaining_time": "1:22:49", "throughput": 4251.7, "total_tokens": 3771800} {"current_steps": 5785, "total_steps": 38160, "loss": 0.4606, "lr": 0.0009919199322794207, "epoch": 3.0319706498951784, "percentage": 15.16, "elapsed_time": "0:14:47", "remaining_time": "1:22:48", "throughput": 4251.37, "total_tokens": 3774104} {"current_steps": 5790, "total_steps": 38160, "loss": 0.4318, "lr": 0.0009918789345150136, "epoch": 3.0345911949685536, "percentage": 15.17, "elapsed_time": "0:14:48", "remaining_time": "1:22:47", "throughput": 4251.37, "total_tokens": 3777144} {"current_steps": 5795, "total_steps": 38160, "loss": 0.3684, "lr": 0.000991837833855145, "epoch": 3.0372117400419287, "percentage": 15.19, "elapsed_time": "0:14:49", "remaining_time": "1:22:45", "throughput": 4251.46, "total_tokens": 3780248} {"current_steps": 5800, "total_steps": 38160, "loss": 0.429, "lr": 0.000991796630308413, "epoch": 3.039832285115304, "percentage": 15.2, "elapsed_time": "0:14:49", "remaining_time": "1:22:45", "throughput": 4251.75, "total_tokens": 3783672} {"current_steps": 5805, "total_steps": 38160, "loss": 0.4645, "lr": 0.0009917553238834363, "epoch": 3.042452830188679, "percentage": 15.21, "elapsed_time": "0:14:50", "remaining_time": "1:22:44", "throughput": 4251.98, "total_tokens": 3787032} {"current_steps": 5810, "total_steps": 38160, "loss": 0.4391, "lr": 0.0009917139145888562, "epoch": 3.0450733752620547, "percentage": 15.23, "elapsed_time": "0:14:51", "remaining_time": "1:22:42", "throughput": 4251.76, "total_tokens": 3789528} {"current_steps": 5815, "total_steps": 38160, "loss": 0.502, "lr": 0.000991672402433335, "epoch": 3.04769392033543, "percentage": 15.24, "elapsed_time": "0:14:52", "remaining_time": "1:22:41", "throughput": 4252.02, "total_tokens": 3792984} {"current_steps": 5820, "total_steps": 38160, "loss": 0.4268, "lr": 0.0009916307874255565, "epoch": 3.050314465408805, "percentage": 15.25, "elapsed_time": "0:14:52", "remaining_time": "1:22:40", "throughput": 4252.06, "total_tokens": 3795928} {"current_steps": 5825, "total_steps": 38160, "loss": 0.4181, "lr": 0.000991589069574226, "epoch": 3.05293501048218, "percentage": 15.26, "elapsed_time": "0:14:53", "remaining_time": "1:22:39", "throughput": 4252.07, "total_tokens": 3798840} {"current_steps": 5830, "total_steps": 38160, "loss": 0.4726, "lr": 0.0009915472488880705, "epoch": 3.0555555555555554, "percentage": 15.28, "elapsed_time": "0:14:54", "remaining_time": "1:22:38", "throughput": 4251.93, "total_tokens": 3801528} {"current_steps": 5835, "total_steps": 38160, "loss": 0.5612, "lr": 0.0009915053253758386, "epoch": 3.058176100628931, "percentage": 15.29, "elapsed_time": "0:14:54", "remaining_time": "1:22:36", "throughput": 4252.0, "total_tokens": 3804504} {"current_steps": 5840, "total_steps": 38160, "loss": 0.5452, "lr": 0.0009914632990462998, "epoch": 3.060796645702306, "percentage": 15.3, "elapsed_time": "0:14:55", "remaining_time": "1:22:36", "throughput": 4252.69, "total_tokens": 3808728} {"current_steps": 5845, "total_steps": 38160, "loss": 0.5687, "lr": 0.0009914211699082458, "epoch": 3.0634171907756813, "percentage": 15.32, "elapsed_time": "0:14:56", "remaining_time": "1:22:35", "throughput": 4252.5, "total_tokens": 3811256} {"current_steps": 5850, "total_steps": 38160, "loss": 0.6337, "lr": 0.0009913789379704897, "epoch": 3.0660377358490565, "percentage": 15.33, "elapsed_time": "0:14:56", "remaining_time": "1:22:33", "throughput": 4252.6, "total_tokens": 3814360} {"current_steps": 5855, "total_steps": 38160, "loss": 0.3332, "lr": 0.0009913366032418653, "epoch": 3.068658280922432, "percentage": 15.34, "elapsed_time": "0:14:57", "remaining_time": "1:22:32", "throughput": 4252.47, "total_tokens": 3817016} {"current_steps": 5860, "total_steps": 38160, "loss": 0.5184, "lr": 0.0009912941657312293, "epoch": 3.0712788259958073, "percentage": 15.36, "elapsed_time": "0:14:58", "remaining_time": "1:22:31", "throughput": 4252.74, "total_tokens": 3820440} {"current_steps": 5865, "total_steps": 38160, "loss": 0.4217, "lr": 0.0009912516254474586, "epoch": 3.0738993710691824, "percentage": 15.37, "elapsed_time": "0:14:59", "remaining_time": "1:22:30", "throughput": 4252.74, "total_tokens": 3823288} {"current_steps": 5870, "total_steps": 38160, "loss": 0.4486, "lr": 0.0009912089823994525, "epoch": 3.0765199161425576, "percentage": 15.38, "elapsed_time": "0:14:59", "remaining_time": "1:22:30", "throughput": 4253.43, "total_tokens": 3827672} {"current_steps": 5875, "total_steps": 38160, "loss": 0.4169, "lr": 0.0009911662365961313, "epoch": 3.0791404612159328, "percentage": 15.4, "elapsed_time": "0:15:00", "remaining_time": "1:22:29", "throughput": 4253.55, "total_tokens": 3830808} {"current_steps": 5880, "total_steps": 38160, "loss": 0.4616, "lr": 0.000991123388046437, "epoch": 3.0817610062893084, "percentage": 15.41, "elapsed_time": "0:15:01", "remaining_time": "1:22:28", "throughput": 4254.01, "total_tokens": 3834616} {"current_steps": 5885, "total_steps": 38160, "loss": 0.3838, "lr": 0.0009910804367593328, "epoch": 3.0843815513626835, "percentage": 15.42, "elapsed_time": "0:15:02", "remaining_time": "1:22:27", "throughput": 4254.34, "total_tokens": 3838232} {"current_steps": 5890, "total_steps": 38160, "loss": 0.5428, "lr": 0.0009910373827438038, "epoch": 3.0870020964360587, "percentage": 15.44, "elapsed_time": "0:15:02", "remaining_time": "1:22:26", "throughput": 4254.32, "total_tokens": 3841144} {"current_steps": 5895, "total_steps": 38160, "loss": 0.4708, "lr": 0.0009909942260088562, "epoch": 3.089622641509434, "percentage": 15.45, "elapsed_time": "0:15:03", "remaining_time": "1:22:25", "throughput": 4254.49, "total_tokens": 3844440} {"current_steps": 5900, "total_steps": 38160, "loss": 0.5562, "lr": 0.0009909509665635184, "epoch": 3.092243186582809, "percentage": 15.46, "elapsed_time": "0:15:04", "remaining_time": "1:22:24", "throughput": 4254.59, "total_tokens": 3847512} {"current_steps": 5905, "total_steps": 38160, "loss": 0.6975, "lr": 0.0009909076044168394, "epoch": 3.0948637316561847, "percentage": 15.47, "elapsed_time": "0:15:04", "remaining_time": "1:22:23", "throughput": 4254.37, "total_tokens": 3850040} {"current_steps": 5910, "total_steps": 38160, "loss": 0.5019, "lr": 0.00099086413957789, "epoch": 3.09748427672956, "percentage": 15.49, "elapsed_time": "0:15:05", "remaining_time": "1:22:22", "throughput": 4254.98, "total_tokens": 3854232} {"current_steps": 5915, "total_steps": 38160, "loss": 0.6112, "lr": 0.0009908205720557627, "epoch": 3.100104821802935, "percentage": 15.5, "elapsed_time": "0:15:06", "remaining_time": "1:22:22", "throughput": 4255.26, "total_tokens": 3857656} {"current_steps": 5920, "total_steps": 38160, "loss": 0.594, "lr": 0.0009907769018595713, "epoch": 3.10272536687631, "percentage": 15.51, "elapsed_time": "0:15:07", "remaining_time": "1:22:21", "throughput": 4255.4, "total_tokens": 3860888} {"current_steps": 5925, "total_steps": 38160, "loss": 0.6268, "lr": 0.0009907331289984512, "epoch": 3.1053459119496853, "percentage": 15.53, "elapsed_time": "0:15:07", "remaining_time": "1:22:19", "throughput": 4255.43, "total_tokens": 3863896} {"current_steps": 5930, "total_steps": 38160, "loss": 0.4248, "lr": 0.000990689253481559, "epoch": 3.107966457023061, "percentage": 15.54, "elapsed_time": "0:15:08", "remaining_time": "1:22:18", "throughput": 4255.57, "total_tokens": 3867000} {"current_steps": 5935, "total_steps": 38160, "loss": 0.5014, "lr": 0.000990645275318073, "epoch": 3.110587002096436, "percentage": 15.55, "elapsed_time": "0:15:09", "remaining_time": "1:22:18", "throughput": 4255.86, "total_tokens": 3870520} {"current_steps": 5940, "total_steps": 38160, "loss": 0.4418, "lr": 0.000990601194517193, "epoch": 3.1132075471698113, "percentage": 15.57, "elapsed_time": "0:15:10", "remaining_time": "1:22:16", "throughput": 4255.56, "total_tokens": 3872856} {"current_steps": 5945, "total_steps": 38160, "loss": 0.4978, "lr": 0.0009905570110881402, "epoch": 3.1158280922431865, "percentage": 15.58, "elapsed_time": "0:15:10", "remaining_time": "1:22:16", "throughput": 4256.52, "total_tokens": 3877624} {"current_steps": 5950, "total_steps": 38160, "loss": 0.5957, "lr": 0.0009905127250401573, "epoch": 3.1184486373165616, "percentage": 15.59, "elapsed_time": "0:15:11", "remaining_time": "1:22:16", "throughput": 4257.16, "total_tokens": 3881752} {"current_steps": 5955, "total_steps": 38160, "loss": 0.4874, "lr": 0.0009904683363825084, "epoch": 3.1210691823899372, "percentage": 15.61, "elapsed_time": "0:15:12", "remaining_time": "1:22:14", "throughput": 4257.01, "total_tokens": 3884408} {"current_steps": 5960, "total_steps": 38160, "loss": 0.4138, "lr": 0.0009904238451244791, "epoch": 3.1236897274633124, "percentage": 15.62, "elapsed_time": "0:15:13", "remaining_time": "1:22:13", "throughput": 4257.3, "total_tokens": 3887832} {"current_steps": 5965, "total_steps": 38160, "loss": 0.4068, "lr": 0.0009903792512753764, "epoch": 3.1263102725366876, "percentage": 15.63, "elapsed_time": "0:15:13", "remaining_time": "1:22:13", "throughput": 4257.72, "total_tokens": 3891544} {"current_steps": 5970, "total_steps": 38160, "loss": 0.4022, "lr": 0.0009903345548445289, "epoch": 3.1289308176100628, "percentage": 15.64, "elapsed_time": "0:15:14", "remaining_time": "1:22:11", "throughput": 4257.58, "total_tokens": 3894104} {"current_steps": 5975, "total_steps": 38160, "loss": 0.5006, "lr": 0.0009902897558412864, "epoch": 3.131551362683438, "percentage": 15.66, "elapsed_time": "0:15:15", "remaining_time": "1:22:10", "throughput": 4257.67, "total_tokens": 3897208} {"current_steps": 5980, "total_steps": 38160, "loss": 0.4191, "lr": 0.0009902448542750207, "epoch": 3.1341719077568135, "percentage": 15.67, "elapsed_time": "0:15:15", "remaining_time": "1:22:09", "throughput": 4257.6, "total_tokens": 3899960} {"current_steps": 5985, "total_steps": 38160, "loss": 0.4407, "lr": 0.0009901998501551245, "epoch": 3.1367924528301887, "percentage": 15.68, "elapsed_time": "0:15:16", "remaining_time": "1:22:07", "throughput": 4257.58, "total_tokens": 3902808} {"current_steps": 5990, "total_steps": 38160, "loss": 0.4612, "lr": 0.000990154743491012, "epoch": 3.139412997903564, "percentage": 15.7, "elapsed_time": "0:15:17", "remaining_time": "1:22:06", "throughput": 4257.42, "total_tokens": 3905336} {"current_steps": 5995, "total_steps": 38160, "loss": 0.5155, "lr": 0.0009901095342921193, "epoch": 3.142033542976939, "percentage": 15.71, "elapsed_time": "0:15:18", "remaining_time": "1:22:05", "throughput": 4257.45, "total_tokens": 3908376} {"current_steps": 6000, "total_steps": 38160, "loss": 0.6044, "lr": 0.0009900642225679035, "epoch": 3.1446540880503147, "percentage": 15.72, "elapsed_time": "0:15:18", "remaining_time": "1:22:04", "throughput": 4257.43, "total_tokens": 3911256} {"current_steps": 6005, "total_steps": 38160, "loss": 0.4703, "lr": 0.000990018808327843, "epoch": 3.14727463312369, "percentage": 15.74, "elapsed_time": "0:15:19", "remaining_time": "1:22:03", "throughput": 4257.58, "total_tokens": 3914424} {"current_steps": 6010, "total_steps": 38160, "loss": 0.4087, "lr": 0.0009899732915814386, "epoch": 3.149895178197065, "percentage": 15.75, "elapsed_time": "0:15:20", "remaining_time": "1:22:01", "throughput": 4257.45, "total_tokens": 3917080} {"current_steps": 6015, "total_steps": 38160, "loss": 0.5227, "lr": 0.0009899276723382112, "epoch": 3.15251572327044, "percentage": 15.76, "elapsed_time": "0:15:20", "remaining_time": "1:22:00", "throughput": 4257.37, "total_tokens": 3919800} {"current_steps": 6020, "total_steps": 38160, "loss": 0.412, "lr": 0.0009898819506077043, "epoch": 3.1551362683438153, "percentage": 15.78, "elapsed_time": "0:15:21", "remaining_time": "1:21:58", "throughput": 4257.16, "total_tokens": 3922328} {"current_steps": 6025, "total_steps": 38160, "loss": 0.4972, "lr": 0.0009898361263994823, "epoch": 3.157756813417191, "percentage": 15.79, "elapsed_time": "0:15:22", "remaining_time": "1:21:58", "throughput": 4257.75, "total_tokens": 3926488} {"current_steps": 6030, "total_steps": 38160, "loss": 0.4517, "lr": 0.0009897901997231308, "epoch": 3.160377358490566, "percentage": 15.8, "elapsed_time": "0:15:22", "remaining_time": "1:21:57", "throughput": 4257.65, "total_tokens": 3929208} {"current_steps": 6035, "total_steps": 38160, "loss": 0.4906, "lr": 0.0009897441705882576, "epoch": 3.1629979035639413, "percentage": 15.81, "elapsed_time": "0:15:23", "remaining_time": "1:21:56", "throughput": 4257.83, "total_tokens": 3932536} {"current_steps": 6040, "total_steps": 38160, "loss": 0.4766, "lr": 0.0009896980390044908, "epoch": 3.1656184486373165, "percentage": 15.83, "elapsed_time": "0:15:24", "remaining_time": "1:21:55", "throughput": 4258.06, "total_tokens": 3935832} {"current_steps": 6045, "total_steps": 38160, "loss": 0.4715, "lr": 0.0009896518049814812, "epoch": 3.1682389937106916, "percentage": 15.84, "elapsed_time": "0:15:25", "remaining_time": "1:21:55", "throughput": 4258.96, "total_tokens": 3940600} {"current_steps": 6050, "total_steps": 38160, "loss": 0.6018, "lr": 0.0009896054685289005, "epoch": 3.1708595387840672, "percentage": 15.85, "elapsed_time": "0:15:25", "remaining_time": "1:21:54", "throughput": 4259.09, "total_tokens": 3943736} {"current_steps": 6055, "total_steps": 38160, "loss": 0.3439, "lr": 0.0009895590296564412, "epoch": 3.1734800838574424, "percentage": 15.87, "elapsed_time": "0:15:26", "remaining_time": "1:21:53", "throughput": 4259.36, "total_tokens": 3947160} {"current_steps": 6060, "total_steps": 38160, "loss": 0.3706, "lr": 0.000989512488373818, "epoch": 3.1761006289308176, "percentage": 15.88, "elapsed_time": "0:15:27", "remaining_time": "1:21:52", "throughput": 4259.41, "total_tokens": 3950360} {"current_steps": 6065, "total_steps": 38160, "loss": 0.4337, "lr": 0.0009894658446907671, "epoch": 3.1787211740041927, "percentage": 15.89, "elapsed_time": "0:15:28", "remaining_time": "1:21:51", "throughput": 4259.38, "total_tokens": 3953240} {"current_steps": 6070, "total_steps": 38160, "loss": 0.5335, "lr": 0.0009894190986170458, "epoch": 3.181341719077568, "percentage": 15.91, "elapsed_time": "0:15:28", "remaining_time": "1:21:50", "throughput": 4259.7, "total_tokens": 3956792} {"current_steps": 6075, "total_steps": 38160, "loss": 0.6136, "lr": 0.0009893722501624323, "epoch": 3.1839622641509435, "percentage": 15.92, "elapsed_time": "0:15:29", "remaining_time": "1:21:49", "throughput": 4259.83, "total_tokens": 3959896} {"current_steps": 6080, "total_steps": 38160, "loss": 0.4773, "lr": 0.0009893252993367272, "epoch": 3.1865828092243187, "percentage": 15.93, "elapsed_time": "0:15:30", "remaining_time": "1:21:48", "throughput": 4260.15, "total_tokens": 3963480} {"current_steps": 6085, "total_steps": 38160, "loss": 0.5534, "lr": 0.000989278246149752, "epoch": 3.189203354297694, "percentage": 15.95, "elapsed_time": "0:15:31", "remaining_time": "1:21:47", "throughput": 4260.28, "total_tokens": 3966648} {"current_steps": 6090, "total_steps": 38160, "loss": 0.3977, "lr": 0.0009892310906113497, "epoch": 3.191823899371069, "percentage": 15.96, "elapsed_time": "0:15:31", "remaining_time": "1:21:46", "throughput": 4260.39, "total_tokens": 3969784} {"current_steps": 6095, "total_steps": 38160, "loss": 0.3914, "lr": 0.0009891838327313847, "epoch": 3.1944444444444446, "percentage": 15.97, "elapsed_time": "0:15:32", "remaining_time": "1:21:46", "throughput": 4260.8, "total_tokens": 3973624} {"current_steps": 6100, "total_steps": 38160, "loss": 0.3956, "lr": 0.000989136472519743, "epoch": 3.19706498951782, "percentage": 15.99, "elapsed_time": "0:15:33", "remaining_time": "1:21:46", "throughput": 4261.77, "total_tokens": 3978648} {"current_steps": 6105, "total_steps": 38160, "loss": 0.5473, "lr": 0.0009890890099863313, "epoch": 3.199685534591195, "percentage": 16.0, "elapsed_time": "0:15:34", "remaining_time": "1:21:45", "throughput": 4262.11, "total_tokens": 3982296} {"current_steps": 6110, "total_steps": 38160, "loss": 0.4532, "lr": 0.0009890414451410787, "epoch": 3.20230607966457, "percentage": 16.01, "elapsed_time": "0:15:35", "remaining_time": "1:21:45", "throughput": 4262.43, "total_tokens": 3985944} {"current_steps": 6115, "total_steps": 38160, "loss": 0.4981, "lr": 0.0009889937779939348, "epoch": 3.2049266247379453, "percentage": 16.02, "elapsed_time": "0:15:35", "remaining_time": "1:21:44", "throughput": 4262.6, "total_tokens": 3989240} {"current_steps": 6120, "total_steps": 38160, "loss": 0.4437, "lr": 0.0009889460085548715, "epoch": 3.207547169811321, "percentage": 16.04, "elapsed_time": "0:15:36", "remaining_time": "1:21:44", "throughput": 4263.28, "total_tokens": 3993688} {"current_steps": 6125, "total_steps": 38160, "loss": 0.3611, "lr": 0.0009888981368338815, "epoch": 3.210167714884696, "percentage": 16.05, "elapsed_time": "0:15:37", "remaining_time": "1:21:43", "throughput": 4263.63, "total_tokens": 3997432} {"current_steps": 6130, "total_steps": 38160, "loss": 0.4311, "lr": 0.0009888501628409789, "epoch": 3.2127882599580713, "percentage": 16.06, "elapsed_time": "0:15:38", "remaining_time": "1:21:42", "throughput": 4263.5, "total_tokens": 4000120} {"current_steps": 6135, "total_steps": 38160, "loss": 0.4158, "lr": 0.0009888020865861991, "epoch": 3.2154088050314464, "percentage": 16.08, "elapsed_time": "0:15:38", "remaining_time": "1:21:41", "throughput": 4263.73, "total_tokens": 4003480} {"current_steps": 6140, "total_steps": 38160, "loss": 0.4792, "lr": 0.0009887539080795996, "epoch": 3.2180293501048216, "percentage": 16.09, "elapsed_time": "0:15:39", "remaining_time": "1:21:40", "throughput": 4263.7, "total_tokens": 4006456} {"current_steps": 6145, "total_steps": 38160, "loss": 0.4347, "lr": 0.0009887056273312584, "epoch": 3.220649895178197, "percentage": 16.1, "elapsed_time": "0:15:40", "remaining_time": "1:21:38", "throughput": 4263.54, "total_tokens": 4009048} {"current_steps": 6150, "total_steps": 38160, "loss": 0.4143, "lr": 0.0009886572443512753, "epoch": 3.2232704402515724, "percentage": 16.12, "elapsed_time": "0:15:41", "remaining_time": "1:21:38", "throughput": 4263.72, "total_tokens": 4012376} {"current_steps": 6155, "total_steps": 38160, "loss": 0.4258, "lr": 0.0009886087591497717, "epoch": 3.2258909853249476, "percentage": 16.13, "elapsed_time": "0:15:41", "remaining_time": "1:21:36", "throughput": 4263.75, "total_tokens": 4015416} {"current_steps": 6160, "total_steps": 38160, "loss": 0.5686, "lr": 0.00098856017173689, "epoch": 3.2285115303983227, "percentage": 16.14, "elapsed_time": "0:15:42", "remaining_time": "1:21:35", "throughput": 4263.7, "total_tokens": 4018200} {"current_steps": 6165, "total_steps": 38160, "loss": 0.4667, "lr": 0.0009885114821227942, "epoch": 3.231132075471698, "percentage": 16.16, "elapsed_time": "0:15:43", "remaining_time": "1:21:34", "throughput": 4263.52, "total_tokens": 4020792} {"current_steps": 6170, "total_steps": 38160, "loss": 0.5197, "lr": 0.0009884626903176696, "epoch": 3.2337526205450735, "percentage": 16.17, "elapsed_time": "0:15:43", "remaining_time": "1:21:33", "throughput": 4263.8, "total_tokens": 4024280} {"current_steps": 6175, "total_steps": 38160, "loss": 0.4306, "lr": 0.0009884137963317228, "epoch": 3.2363731656184487, "percentage": 16.18, "elapsed_time": "0:15:44", "remaining_time": "1:21:32", "throughput": 4263.7, "total_tokens": 4027000} {"current_steps": 6180, "total_steps": 38160, "loss": 0.6627, "lr": 0.000988364800175182, "epoch": 3.238993710691824, "percentage": 16.19, "elapsed_time": "0:15:45", "remaining_time": "1:21:31", "throughput": 4263.74, "total_tokens": 4030008} {"current_steps": 6185, "total_steps": 38160, "loss": 0.4787, "lr": 0.0009883157018582966, "epoch": 3.241614255765199, "percentage": 16.21, "elapsed_time": "0:15:45", "remaining_time": "1:21:30", "throughput": 4263.94, "total_tokens": 4033400} {"current_steps": 6190, "total_steps": 38160, "loss": 0.3559, "lr": 0.0009882665013913373, "epoch": 3.2442348008385746, "percentage": 16.22, "elapsed_time": "0:15:46", "remaining_time": "1:21:29", "throughput": 4263.88, "total_tokens": 4036216} {"current_steps": 6195, "total_steps": 38160, "loss": 0.4954, "lr": 0.0009882171987845962, "epoch": 3.24685534591195, "percentage": 16.23, "elapsed_time": "0:15:47", "remaining_time": "1:21:29", "throughput": 4264.63, "total_tokens": 4040920} {"current_steps": 6200, "total_steps": 38160, "loss": 0.4943, "lr": 0.000988167794048387, "epoch": 3.249475890985325, "percentage": 16.25, "elapsed_time": "0:15:48", "remaining_time": "1:21:28", "throughput": 4264.9, "total_tokens": 4044344} {"current_steps": 6205, "total_steps": 38160, "loss": 0.4982, "lr": 0.0009881182871930448, "epoch": 3.2520964360587, "percentage": 16.26, "elapsed_time": "0:15:49", "remaining_time": "1:21:27", "throughput": 4265.07, "total_tokens": 4047608} {"current_steps": 6210, "total_steps": 38160, "loss": 0.4963, "lr": 0.0009880686782289256, "epoch": 3.2547169811320753, "percentage": 16.27, "elapsed_time": "0:15:50", "remaining_time": "1:21:29", "throughput": 4267.08, "total_tokens": 4055288} {"current_steps": 6215, "total_steps": 38160, "loss": 0.4893, "lr": 0.000988018967166407, "epoch": 3.257337526205451, "percentage": 16.29, "elapsed_time": "0:15:51", "remaining_time": "1:21:28", "throughput": 4267.1, "total_tokens": 4058168} {"current_steps": 6220, "total_steps": 38160, "loss": 0.4199, "lr": 0.0009879691540158884, "epoch": 3.259958071278826, "percentage": 16.3, "elapsed_time": "0:15:51", "remaining_time": "1:21:27", "throughput": 4267.17, "total_tokens": 4061272} {"current_steps": 6225, "total_steps": 38160, "loss": 0.5016, "lr": 0.0009879192387877895, "epoch": 3.2625786163522013, "percentage": 16.31, "elapsed_time": "0:15:52", "remaining_time": "1:21:26", "throughput": 4267.36, "total_tokens": 4064536} {"current_steps": 6230, "total_steps": 38160, "loss": 0.4664, "lr": 0.0009878692214925523, "epoch": 3.2651991614255764, "percentage": 16.33, "elapsed_time": "0:15:53", "remaining_time": "1:21:25", "throughput": 4267.73, "total_tokens": 4068184} {"current_steps": 6235, "total_steps": 38160, "loss": 0.6335, "lr": 0.00098781910214064, "epoch": 3.2678197064989516, "percentage": 16.34, "elapsed_time": "0:15:53", "remaining_time": "1:21:24", "throughput": 4267.71, "total_tokens": 4071064} {"current_steps": 6240, "total_steps": 38160, "loss": 0.4385, "lr": 0.0009877688807425368, "epoch": 3.270440251572327, "percentage": 16.35, "elapsed_time": "0:15:54", "remaining_time": "1:21:22", "throughput": 4267.45, "total_tokens": 4073464} {"current_steps": 6245, "total_steps": 38160, "loss": 0.4201, "lr": 0.0009877185573087487, "epoch": 3.2730607966457024, "percentage": 16.37, "elapsed_time": "0:15:55", "remaining_time": "1:21:21", "throughput": 4267.61, "total_tokens": 4076696} {"current_steps": 6250, "total_steps": 38160, "loss": 0.6167, "lr": 0.0009876681318498025, "epoch": 3.2756813417190775, "percentage": 16.38, "elapsed_time": "0:15:55", "remaining_time": "1:21:20", "throughput": 4267.56, "total_tokens": 4079480} {"current_steps": 6255, "total_steps": 38160, "loss": 0.4711, "lr": 0.0009876176043762466, "epoch": 3.2783018867924527, "percentage": 16.39, "elapsed_time": "0:15:56", "remaining_time": "1:21:19", "throughput": 4267.46, "total_tokens": 4082264} {"current_steps": 6260, "total_steps": 38160, "loss": 0.3271, "lr": 0.000987566974898651, "epoch": 3.280922431865828, "percentage": 16.4, "elapsed_time": "0:15:57", "remaining_time": "1:21:18", "throughput": 4267.56, "total_tokens": 4085400} {"current_steps": 6265, "total_steps": 38160, "loss": 0.4445, "lr": 0.0009875162434276065, "epoch": 3.2835429769392035, "percentage": 16.42, "elapsed_time": "0:15:57", "remaining_time": "1:21:17", "throughput": 4267.51, "total_tokens": 4088184} {"current_steps": 6270, "total_steps": 38160, "loss": 0.4152, "lr": 0.000987465409973726, "epoch": 3.2861635220125787, "percentage": 16.43, "elapsed_time": "0:15:59", "remaining_time": "1:21:17", "throughput": 4268.77, "total_tokens": 4094072} {"current_steps": 6275, "total_steps": 38160, "loss": 0.4311, "lr": 0.0009874144745476432, "epoch": 3.288784067085954, "percentage": 16.44, "elapsed_time": "0:15:59", "remaining_time": "1:21:17", "throughput": 4269.21, "total_tokens": 4097912} {"current_steps": 6280, "total_steps": 38160, "loss": 0.4932, "lr": 0.0009873634371600126, "epoch": 3.291404612159329, "percentage": 16.46, "elapsed_time": "0:16:00", "remaining_time": "1:21:16", "throughput": 4269.33, "total_tokens": 4101048} {"current_steps": 6285, "total_steps": 38160, "loss": 0.6447, "lr": 0.0009873122978215115, "epoch": 3.2940251572327046, "percentage": 16.47, "elapsed_time": "0:16:01", "remaining_time": "1:21:14", "throughput": 4269.1, "total_tokens": 4103480} {"current_steps": 6290, "total_steps": 38160, "loss": 0.4467, "lr": 0.000987261056542837, "epoch": 3.29664570230608, "percentage": 16.48, "elapsed_time": "0:16:02", "remaining_time": "1:21:14", "throughput": 4269.9, "total_tokens": 4108120} {"current_steps": 6295, "total_steps": 38160, "loss": 0.5008, "lr": 0.0009872097133347085, "epoch": 3.299266247379455, "percentage": 16.5, "elapsed_time": "0:16:02", "remaining_time": "1:21:13", "throughput": 4269.8, "total_tokens": 4110872} {"current_steps": 6300, "total_steps": 38160, "loss": 0.4058, "lr": 0.0009871582682078664, "epoch": 3.30188679245283, "percentage": 16.51, "elapsed_time": "0:16:03", "remaining_time": "1:21:12", "throughput": 4269.99, "total_tokens": 4114232} {"current_steps": 6305, "total_steps": 38160, "loss": 0.4801, "lr": 0.0009871067211730722, "epoch": 3.3045073375262053, "percentage": 16.52, "elapsed_time": "0:16:04", "remaining_time": "1:21:11", "throughput": 4270.2, "total_tokens": 4117592} {"current_steps": 6310, "total_steps": 38160, "loss": 0.4612, "lr": 0.0009870550722411093, "epoch": 3.307127882599581, "percentage": 16.54, "elapsed_time": "0:16:05", "remaining_time": "1:21:11", "throughput": 4270.54, "total_tokens": 4121208} {"current_steps": 6315, "total_steps": 38160, "loss": 0.4585, "lr": 0.000987003321422782, "epoch": 3.309748427672956, "percentage": 16.55, "elapsed_time": "0:16:05", "remaining_time": "1:21:10", "throughput": 4270.77, "total_tokens": 4124568} {"current_steps": 6320, "total_steps": 38160, "loss": 0.5844, "lr": 0.0009869514687289155, "epoch": 3.3123689727463312, "percentage": 16.56, "elapsed_time": "0:16:06", "remaining_time": "1:21:09", "throughput": 4270.96, "total_tokens": 4127928} {"current_steps": 6325, "total_steps": 38160, "loss": 0.6313, "lr": 0.0009868995141703576, "epoch": 3.3149895178197064, "percentage": 16.57, "elapsed_time": "0:16:07", "remaining_time": "1:21:07", "throughput": 4270.8, "total_tokens": 4130552} {"current_steps": 6330, "total_steps": 38160, "loss": 0.4874, "lr": 0.000986847457757976, "epoch": 3.3176100628930816, "percentage": 16.59, "elapsed_time": "0:16:07", "remaining_time": "1:21:06", "throughput": 4270.8, "total_tokens": 4133592} {"current_steps": 6335, "total_steps": 38160, "loss": 0.5425, "lr": 0.0009867952995026605, "epoch": 3.320230607966457, "percentage": 16.6, "elapsed_time": "0:16:08", "remaining_time": "1:21:05", "throughput": 4270.88, "total_tokens": 4136728} {"current_steps": 6340, "total_steps": 38160, "loss": 0.4381, "lr": 0.0009867430394153221, "epoch": 3.3228511530398324, "percentage": 16.61, "elapsed_time": "0:16:09", "remaining_time": "1:21:04", "throughput": 4270.91, "total_tokens": 4139736} {"current_steps": 6345, "total_steps": 38160, "loss": 0.4182, "lr": 0.0009866906775068927, "epoch": 3.3254716981132075, "percentage": 16.63, "elapsed_time": "0:16:09", "remaining_time": "1:21:03", "throughput": 4270.8, "total_tokens": 4142488} {"current_steps": 6350, "total_steps": 38160, "loss": 0.549, "lr": 0.0009866382137883262, "epoch": 3.3280922431865827, "percentage": 16.64, "elapsed_time": "0:16:10", "remaining_time": "1:21:02", "throughput": 4270.79, "total_tokens": 4145400} {"current_steps": 6355, "total_steps": 38160, "loss": 0.631, "lr": 0.0009865856482705973, "epoch": 3.330712788259958, "percentage": 16.65, "elapsed_time": "0:16:11", "remaining_time": "1:21:01", "throughput": 4271.12, "total_tokens": 4149112} {"current_steps": 6360, "total_steps": 38160, "loss": 0.53, "lr": 0.0009865329809647019, "epoch": 3.3333333333333335, "percentage": 16.67, "elapsed_time": "0:16:12", "remaining_time": "1:21:00", "throughput": 4271.17, "total_tokens": 4152184} {"current_steps": 6365, "total_steps": 38160, "loss": 0.7337, "lr": 0.0009864802118816575, "epoch": 3.3359538784067087, "percentage": 16.68, "elapsed_time": "0:16:12", "remaining_time": "1:20:59", "throughput": 4271.21, "total_tokens": 4155288} {"current_steps": 6370, "total_steps": 38160, "loss": 0.4651, "lr": 0.0009864273410325028, "epoch": 3.338574423480084, "percentage": 16.69, "elapsed_time": "0:16:13", "remaining_time": "1:20:58", "throughput": 4271.36, "total_tokens": 4158488} {"current_steps": 6375, "total_steps": 38160, "loss": 0.4323, "lr": 0.000986374368428298, "epoch": 3.341194968553459, "percentage": 16.71, "elapsed_time": "0:16:14", "remaining_time": "1:20:58", "throughput": 4271.79, "total_tokens": 4162328} {"current_steps": 6380, "total_steps": 38160, "loss": 0.4571, "lr": 0.000986321294080124, "epoch": 3.3438155136268346, "percentage": 16.72, "elapsed_time": "0:16:15", "remaining_time": "1:20:57", "throughput": 4272.24, "total_tokens": 4166232} {"current_steps": 6385, "total_steps": 38160, "loss": 0.5694, "lr": 0.0009862681179990838, "epoch": 3.3464360587002098, "percentage": 16.73, "elapsed_time": "0:16:15", "remaining_time": "1:20:56", "throughput": 4272.25, "total_tokens": 4169240} {"current_steps": 6390, "total_steps": 38160, "loss": 0.5392, "lr": 0.0009862148401963008, "epoch": 3.349056603773585, "percentage": 16.75, "elapsed_time": "0:16:16", "remaining_time": "1:20:55", "throughput": 4272.18, "total_tokens": 4171992} {"current_steps": 6395, "total_steps": 38160, "loss": 0.506, "lr": 0.0009861614606829201, "epoch": 3.35167714884696, "percentage": 16.76, "elapsed_time": "0:16:17", "remaining_time": "1:20:53", "throughput": 4271.97, "total_tokens": 4174488} {"current_steps": 6400, "total_steps": 38160, "loss": 0.4659, "lr": 0.0009861079794701085, "epoch": 3.3542976939203353, "percentage": 16.77, "elapsed_time": "0:16:17", "remaining_time": "1:20:52", "throughput": 4272.2, "total_tokens": 4177880} {"current_steps": 6405, "total_steps": 38160, "loss": 0.551, "lr": 0.000986054396569053, "epoch": 3.3569182389937104, "percentage": 16.78, "elapsed_time": "0:16:18", "remaining_time": "1:20:52", "throughput": 4272.66, "total_tokens": 4181816} {"current_steps": 6410, "total_steps": 38160, "loss": 0.6165, "lr": 0.0009860007119909635, "epoch": 3.359538784067086, "percentage": 16.8, "elapsed_time": "0:16:19", "remaining_time": "1:20:51", "throughput": 4272.7, "total_tokens": 4184824} {"current_steps": 6415, "total_steps": 38160, "loss": 0.5705, "lr": 0.0009859469257470692, "epoch": 3.3621593291404612, "percentage": 16.81, "elapsed_time": "0:16:20", "remaining_time": "1:20:50", "throughput": 4272.62, "total_tokens": 4187608} {"current_steps": 6420, "total_steps": 38160, "loss": 0.5647, "lr": 0.0009858930378486223, "epoch": 3.3647798742138364, "percentage": 16.82, "elapsed_time": "0:16:20", "remaining_time": "1:20:49", "throughput": 4272.82, "total_tokens": 4190968} {"current_steps": 6425, "total_steps": 38160, "loss": 0.4945, "lr": 0.000985839048306895, "epoch": 3.3674004192872116, "percentage": 16.84, "elapsed_time": "0:16:21", "remaining_time": "1:20:48", "throughput": 4273.44, "total_tokens": 4195256} {"current_steps": 6430, "total_steps": 38160, "loss": 0.5022, "lr": 0.000985784957133182, "epoch": 3.370020964360587, "percentage": 16.85, "elapsed_time": "0:16:22", "remaining_time": "1:20:48", "throughput": 4273.82, "total_tokens": 4199000} {"current_steps": 6435, "total_steps": 38160, "loss": 0.4614, "lr": 0.0009857307643387975, "epoch": 3.3726415094339623, "percentage": 16.86, "elapsed_time": "0:16:23", "remaining_time": "1:20:47", "throughput": 4273.84, "total_tokens": 4202104} {"current_steps": 6440, "total_steps": 38160, "loss": 0.4546, "lr": 0.000985676469935079, "epoch": 3.3752620545073375, "percentage": 16.88, "elapsed_time": "0:16:23", "remaining_time": "1:20:45", "throughput": 4273.48, "total_tokens": 4204344} {"current_steps": 6445, "total_steps": 38160, "loss": 0.5122, "lr": 0.0009856220739333837, "epoch": 3.3778825995807127, "percentage": 16.89, "elapsed_time": "0:16:24", "remaining_time": "1:20:44", "throughput": 4273.6, "total_tokens": 4207544} {"current_steps": 6450, "total_steps": 38160, "loss": 0.5841, "lr": 0.000985567576345091, "epoch": 3.380503144654088, "percentage": 16.9, "elapsed_time": "0:16:25", "remaining_time": "1:20:43", "throughput": 4273.5, "total_tokens": 4210360} {"current_steps": 6455, "total_steps": 38160, "loss": 0.4957, "lr": 0.0009855129771816006, "epoch": 3.3831236897274635, "percentage": 16.92, "elapsed_time": "0:16:25", "remaining_time": "1:20:42", "throughput": 4273.47, "total_tokens": 4213272} {"current_steps": 6460, "total_steps": 38160, "loss": 0.4491, "lr": 0.0009854582764543347, "epoch": 3.3857442348008386, "percentage": 16.93, "elapsed_time": "0:16:26", "remaining_time": "1:20:41", "throughput": 4273.66, "total_tokens": 4216536} {"current_steps": 6465, "total_steps": 38160, "loss": 0.4611, "lr": 0.0009854034741747356, "epoch": 3.388364779874214, "percentage": 16.94, "elapsed_time": "0:16:27", "remaining_time": "1:20:40", "throughput": 4273.56, "total_tokens": 4219256} {"current_steps": 6470, "total_steps": 38160, "loss": 0.6098, "lr": 0.0009853485703542675, "epoch": 3.390985324947589, "percentage": 16.95, "elapsed_time": "0:16:28", "remaining_time": "1:20:39", "throughput": 4273.8, "total_tokens": 4222744} {"current_steps": 6475, "total_steps": 38160, "loss": 0.4397, "lr": 0.0009852935650044158, "epoch": 3.3936058700209646, "percentage": 16.97, "elapsed_time": "0:16:28", "remaining_time": "1:20:38", "throughput": 4274.01, "total_tokens": 4226168} {"current_steps": 6480, "total_steps": 38160, "loss": 0.3083, "lr": 0.0009852384581366866, "epoch": 3.3962264150943398, "percentage": 16.98, "elapsed_time": "0:16:29", "remaining_time": "1:20:37", "throughput": 4274.11, "total_tokens": 4229272} {"current_steps": 6485, "total_steps": 38160, "loss": 0.48, "lr": 0.000985183249762608, "epoch": 3.398846960167715, "percentage": 16.99, "elapsed_time": "0:16:30", "remaining_time": "1:20:36", "throughput": 4274.05, "total_tokens": 4232120} {"current_steps": 6490, "total_steps": 38160, "loss": 0.5249, "lr": 0.000985127939893729, "epoch": 3.40146750524109, "percentage": 17.01, "elapsed_time": "0:16:31", "remaining_time": "1:20:35", "throughput": 4274.57, "total_tokens": 4236184} {"current_steps": 6495, "total_steps": 38160, "loss": 0.537, "lr": 0.0009850725285416194, "epoch": 3.4040880503144653, "percentage": 17.02, "elapsed_time": "0:16:31", "remaining_time": "1:20:35", "throughput": 4274.98, "total_tokens": 4240056} {"current_steps": 6500, "total_steps": 38160, "loss": 0.5092, "lr": 0.0009850170157178707, "epoch": 3.4067085953878404, "percentage": 17.03, "elapsed_time": "0:16:32", "remaining_time": "1:20:34", "throughput": 4275.29, "total_tokens": 4243640} {"current_steps": 6505, "total_steps": 38160, "loss": 0.5805, "lr": 0.000984961401434096, "epoch": 3.409329140461216, "percentage": 17.05, "elapsed_time": "0:16:33", "remaining_time": "1:20:33", "throughput": 4275.22, "total_tokens": 4246424} {"current_steps": 6510, "total_steps": 38160, "loss": 0.4975, "lr": 0.0009849056857019285, "epoch": 3.411949685534591, "percentage": 17.06, "elapsed_time": "0:16:33", "remaining_time": "1:20:32", "throughput": 4275.11, "total_tokens": 4249144} {"current_steps": 6515, "total_steps": 38160, "loss": 0.5731, "lr": 0.0009848498685330238, "epoch": 3.4145702306079664, "percentage": 17.07, "elapsed_time": "0:16:34", "remaining_time": "1:20:31", "throughput": 4275.05, "total_tokens": 4251960} {"current_steps": 6520, "total_steps": 38160, "loss": 0.4297, "lr": 0.000984793949939058, "epoch": 3.4171907756813416, "percentage": 17.09, "elapsed_time": "0:16:35", "remaining_time": "1:20:29", "throughput": 4274.96, "total_tokens": 4254712} {"current_steps": 6525, "total_steps": 38160, "loss": 0.4609, "lr": 0.0009847379299317287, "epoch": 3.419811320754717, "percentage": 17.1, "elapsed_time": "0:16:35", "remaining_time": "1:20:28", "throughput": 4274.93, "total_tokens": 4257656} {"current_steps": 6530, "total_steps": 38160, "loss": 0.5252, "lr": 0.0009846818085227549, "epoch": 3.4224318658280923, "percentage": 17.11, "elapsed_time": "0:16:36", "remaining_time": "1:20:27", "throughput": 4274.97, "total_tokens": 4260696} {"current_steps": 6535, "total_steps": 38160, "loss": 0.464, "lr": 0.000984625585723876, "epoch": 3.4250524109014675, "percentage": 17.13, "elapsed_time": "0:16:37", "remaining_time": "1:20:26", "throughput": 4274.98, "total_tokens": 4263672} {"current_steps": 6540, "total_steps": 38160, "loss": 0.4609, "lr": 0.0009845692615468536, "epoch": 3.4276729559748427, "percentage": 17.14, "elapsed_time": "0:16:38", "remaining_time": "1:20:25", "throughput": 4274.89, "total_tokens": 4266488} {"current_steps": 6545, "total_steps": 38160, "loss": 0.38, "lr": 0.00098451283600347, "epoch": 3.430293501048218, "percentage": 17.15, "elapsed_time": "0:16:38", "remaining_time": "1:20:25", "throughput": 4275.7, "total_tokens": 4271224} {"current_steps": 6550, "total_steps": 38160, "loss": 0.5558, "lr": 0.0009844563091055286, "epoch": 3.4329140461215935, "percentage": 17.16, "elapsed_time": "0:16:39", "remaining_time": "1:20:24", "throughput": 4275.67, "total_tokens": 4274104} {"current_steps": 6555, "total_steps": 38160, "loss": 0.5113, "lr": 0.0009843996808648542, "epoch": 3.4355345911949686, "percentage": 17.18, "elapsed_time": "0:16:40", "remaining_time": "1:20:23", "throughput": 4275.97, "total_tokens": 4277752} {"current_steps": 6560, "total_steps": 38160, "loss": 0.4376, "lr": 0.000984342951293293, "epoch": 3.438155136268344, "percentage": 17.19, "elapsed_time": "0:16:41", "remaining_time": "1:20:22", "throughput": 4276.18, "total_tokens": 4281080} {"current_steps": 6565, "total_steps": 38160, "loss": 0.4138, "lr": 0.0009842861204027121, "epoch": 3.440775681341719, "percentage": 17.2, "elapsed_time": "0:16:41", "remaining_time": "1:20:22", "throughput": 4276.72, "total_tokens": 4285208} {"current_steps": 6570, "total_steps": 38160, "loss": 0.4799, "lr": 0.0009842291882049999, "epoch": 3.4433962264150946, "percentage": 17.22, "elapsed_time": "0:16:42", "remaining_time": "1:20:20", "throughput": 4276.49, "total_tokens": 4287608} {"current_steps": 6575, "total_steps": 38160, "loss": 0.491, "lr": 0.0009841721547120658, "epoch": 3.4460167714884697, "percentage": 17.23, "elapsed_time": "0:16:43", "remaining_time": "1:20:19", "throughput": 4276.64, "total_tokens": 4290872} {"current_steps": 6580, "total_steps": 38160, "loss": 0.4002, "lr": 0.0009841150199358408, "epoch": 3.448637316561845, "percentage": 17.24, "elapsed_time": "0:16:44", "remaining_time": "1:20:18", "throughput": 4276.67, "total_tokens": 4293912} {"current_steps": 6585, "total_steps": 38160, "loss": 0.474, "lr": 0.0009840577838882765, "epoch": 3.45125786163522, "percentage": 17.26, "elapsed_time": "0:16:44", "remaining_time": "1:20:17", "throughput": 4276.78, "total_tokens": 4297112} {"current_steps": 6590, "total_steps": 38160, "loss": 0.4679, "lr": 0.0009840004465813464, "epoch": 3.4538784067085953, "percentage": 17.27, "elapsed_time": "0:16:45", "remaining_time": "1:20:16", "throughput": 4276.88, "total_tokens": 4300248} {"current_steps": 6595, "total_steps": 38160, "loss": 0.5211, "lr": 0.0009839430080270445, "epoch": 3.4564989517819704, "percentage": 17.28, "elapsed_time": "0:16:46", "remaining_time": "1:20:15", "throughput": 4277.12, "total_tokens": 4303672} {"current_steps": 6600, "total_steps": 38160, "loss": 0.3768, "lr": 0.0009838854682373865, "epoch": 3.459119496855346, "percentage": 17.3, "elapsed_time": "0:16:47", "remaining_time": "1:20:17", "throughput": 4278.91, "total_tokens": 4311096} {"current_steps": 6605, "total_steps": 38160, "loss": 0.4883, "lr": 0.000983827827224409, "epoch": 3.461740041928721, "percentage": 17.31, "elapsed_time": "0:16:48", "remaining_time": "1:20:16", "throughput": 4278.91, "total_tokens": 4314072} {"current_steps": 6610, "total_steps": 38160, "loss": 0.5806, "lr": 0.0009837700850001698, "epoch": 3.4643605870020964, "percentage": 17.32, "elapsed_time": "0:16:48", "remaining_time": "1:20:15", "throughput": 4279.14, "total_tokens": 4317528} {"current_steps": 6615, "total_steps": 38160, "loss": 0.4436, "lr": 0.000983712241576748, "epoch": 3.4669811320754715, "percentage": 17.33, "elapsed_time": "0:16:49", "remaining_time": "1:20:14", "throughput": 4279.26, "total_tokens": 4320760} {"current_steps": 6620, "total_steps": 38160, "loss": 0.4844, "lr": 0.000983654296966244, "epoch": 3.469601677148847, "percentage": 17.35, "elapsed_time": "0:16:50", "remaining_time": "1:20:14", "throughput": 4279.6, "total_tokens": 4324440} {"current_steps": 6625, "total_steps": 38160, "loss": 0.6265, "lr": 0.0009835962511807786, "epoch": 3.4722222222222223, "percentage": 17.36, "elapsed_time": "0:16:51", "remaining_time": "1:20:13", "throughput": 4279.93, "total_tokens": 4328056} {"current_steps": 6630, "total_steps": 38160, "loss": 0.4043, "lr": 0.0009835381042324948, "epoch": 3.4748427672955975, "percentage": 17.37, "elapsed_time": "0:16:51", "remaining_time": "1:20:12", "throughput": 4279.88, "total_tokens": 4330936} {"current_steps": 6635, "total_steps": 38160, "loss": 0.443, "lr": 0.0009834798561335558, "epoch": 3.4774633123689727, "percentage": 17.39, "elapsed_time": "0:16:52", "remaining_time": "1:20:11", "throughput": 4280.07, "total_tokens": 4334328} {"current_steps": 6640, "total_steps": 38160, "loss": 0.4433, "lr": 0.000983421506896147, "epoch": 3.480083857442348, "percentage": 17.4, "elapsed_time": "0:16:53", "remaining_time": "1:20:10", "throughput": 4280.18, "total_tokens": 4337432} {"current_steps": 6645, "total_steps": 38160, "loss": 0.5004, "lr": 0.000983363056532474, "epoch": 3.4827044025157234, "percentage": 17.41, "elapsed_time": "0:16:54", "remaining_time": "1:20:09", "throughput": 4280.05, "total_tokens": 4340056} {"current_steps": 6650, "total_steps": 38160, "loss": 0.628, "lr": 0.000983304505054764, "epoch": 3.4853249475890986, "percentage": 17.43, "elapsed_time": "0:16:54", "remaining_time": "1:20:07", "throughput": 4279.79, "total_tokens": 4342520} {"current_steps": 6655, "total_steps": 38160, "loss": 0.3872, "lr": 0.0009832458524752655, "epoch": 3.487945492662474, "percentage": 17.44, "elapsed_time": "0:16:55", "remaining_time": "1:20:07", "throughput": 4280.38, "total_tokens": 4346776} {"current_steps": 6660, "total_steps": 38160, "loss": 0.5483, "lr": 0.0009831870988062476, "epoch": 3.490566037735849, "percentage": 17.45, "elapsed_time": "0:16:56", "remaining_time": "1:20:06", "throughput": 4280.54, "total_tokens": 4350104} {"current_steps": 6665, "total_steps": 38160, "loss": 0.5541, "lr": 0.0009831282440600014, "epoch": 3.4931865828092246, "percentage": 17.47, "elapsed_time": "0:16:56", "remaining_time": "1:20:05", "throughput": 4280.52, "total_tokens": 4352952} {"current_steps": 6670, "total_steps": 38160, "loss": 0.3978, "lr": 0.0009830692882488383, "epoch": 3.4958071278825997, "percentage": 17.48, "elapsed_time": "0:16:57", "remaining_time": "1:20:04", "throughput": 4280.47, "total_tokens": 4355896} {"current_steps": 6675, "total_steps": 38160, "loss": 0.5059, "lr": 0.000983010231385091, "epoch": 3.498427672955975, "percentage": 17.49, "elapsed_time": "0:16:58", "remaining_time": "1:20:03", "throughput": 4280.45, "total_tokens": 4358968} {"current_steps": 6680, "total_steps": 38160, "loss": 0.566, "lr": 0.000982951073481114, "epoch": 3.50104821802935, "percentage": 17.51, "elapsed_time": "0:16:59", "remaining_time": "1:20:02", "throughput": 4280.97, "total_tokens": 4363000} {"current_steps": 6685, "total_steps": 38160, "loss": 0.6933, "lr": 0.0009828918145492823, "epoch": 3.5036687631027252, "percentage": 17.52, "elapsed_time": "0:16:59", "remaining_time": "1:20:02", "throughput": 4281.14, "total_tokens": 4366360} {"current_steps": 6690, "total_steps": 38160, "loss": 0.5421, "lr": 0.000982832454601992, "epoch": 3.5062893081761004, "percentage": 17.53, "elapsed_time": "0:17:00", "remaining_time": "1:20:00", "throughput": 4281.23, "total_tokens": 4369432} {"current_steps": 6695, "total_steps": 38160, "loss": 0.4636, "lr": 0.0009827729936516605, "epoch": 3.508909853249476, "percentage": 17.54, "elapsed_time": "0:17:01", "remaining_time": "1:20:00", "throughput": 4281.64, "total_tokens": 4373432} {"current_steps": 6700, "total_steps": 38160, "loss": 0.3886, "lr": 0.0009827134317107267, "epoch": 3.511530398322851, "percentage": 17.56, "elapsed_time": "0:17:02", "remaining_time": "1:20:00", "throughput": 4282.16, "total_tokens": 4377528} {"current_steps": 6705, "total_steps": 38160, "loss": 0.5228, "lr": 0.0009826537687916501, "epoch": 3.5141509433962264, "percentage": 17.57, "elapsed_time": "0:17:02", "remaining_time": "1:19:59", "throughput": 4282.24, "total_tokens": 4380632} {"current_steps": 6710, "total_steps": 38160, "loss": 0.3914, "lr": 0.0009825940049069113, "epoch": 3.5167714884696015, "percentage": 17.58, "elapsed_time": "0:17:03", "remaining_time": "1:19:58", "throughput": 4282.68, "total_tokens": 4384504} {"current_steps": 6715, "total_steps": 38160, "loss": 0.4854, "lr": 0.0009825341400690126, "epoch": 3.519392033542977, "percentage": 17.6, "elapsed_time": "0:17:04", "remaining_time": "1:19:57", "throughput": 4282.96, "total_tokens": 4388024} {"current_steps": 6720, "total_steps": 38160, "loss": 0.4313, "lr": 0.0009824741742904767, "epoch": 3.5220125786163523, "percentage": 17.61, "elapsed_time": "0:17:05", "remaining_time": "1:19:56", "throughput": 4282.96, "total_tokens": 4390968} {"current_steps": 6725, "total_steps": 38160, "loss": 0.468, "lr": 0.000982414107583848, "epoch": 3.5246331236897275, "percentage": 17.62, "elapsed_time": "0:17:05", "remaining_time": "1:19:55", "throughput": 4283.16, "total_tokens": 4394328} {"current_steps": 6730, "total_steps": 38160, "loss": 0.5396, "lr": 0.0009823539399616914, "epoch": 3.5272536687631026, "percentage": 17.64, "elapsed_time": "0:17:06", "remaining_time": "1:19:54", "throughput": 4283.47, "total_tokens": 4397976} {"current_steps": 6735, "total_steps": 38160, "loss": 0.4736, "lr": 0.0009822936714365938, "epoch": 3.529874213836478, "percentage": 17.65, "elapsed_time": "0:17:07", "remaining_time": "1:19:54", "throughput": 4283.79, "total_tokens": 4401560} {"current_steps": 6740, "total_steps": 38160, "loss": 0.4682, "lr": 0.0009822333020211623, "epoch": 3.532494758909853, "percentage": 17.66, "elapsed_time": "0:17:08", "remaining_time": "1:19:53", "throughput": 4283.81, "total_tokens": 4404568} {"current_steps": 6745, "total_steps": 38160, "loss": 0.448, "lr": 0.0009821728317280256, "epoch": 3.5351153039832286, "percentage": 17.68, "elapsed_time": "0:17:08", "remaining_time": "1:19:52", "throughput": 4284.28, "total_tokens": 4408472} {"current_steps": 6750, "total_steps": 38160, "loss": 0.416, "lr": 0.0009821122605698336, "epoch": 3.5377358490566038, "percentage": 17.69, "elapsed_time": "0:17:10", "remaining_time": "1:19:53", "throughput": 4285.66, "total_tokens": 4415064} {"current_steps": 6755, "total_steps": 38160, "loss": 0.5441, "lr": 0.0009820515885592567, "epoch": 3.540356394129979, "percentage": 17.7, "elapsed_time": "0:17:10", "remaining_time": "1:19:52", "throughput": 4285.49, "total_tokens": 4417720} {"current_steps": 6760, "total_steps": 38160, "loss": 0.4456, "lr": 0.0009819908157089872, "epoch": 3.5429769392033545, "percentage": 17.71, "elapsed_time": "0:17:11", "remaining_time": "1:19:51", "throughput": 4285.42, "total_tokens": 4420536} {"current_steps": 6765, "total_steps": 38160, "loss": 0.4123, "lr": 0.0009819299420317379, "epoch": 3.5455974842767297, "percentage": 17.73, "elapsed_time": "0:17:12", "remaining_time": "1:19:50", "throughput": 4285.36, "total_tokens": 4423320} {"current_steps": 6770, "total_steps": 38160, "loss": 0.526, "lr": 0.0009818689675402427, "epoch": 3.548218029350105, "percentage": 17.74, "elapsed_time": "0:17:12", "remaining_time": "1:19:48", "throughput": 4285.16, "total_tokens": 4425816} {"current_steps": 6775, "total_steps": 38160, "loss": 0.4931, "lr": 0.000981807892247257, "epoch": 3.55083857442348, "percentage": 17.75, "elapsed_time": "0:17:13", "remaining_time": "1:19:48", "throughput": 4285.6, "total_tokens": 4429752} {"current_steps": 6780, "total_steps": 38160, "loss": 0.5378, "lr": 0.0009817467161655571, "epoch": 3.5534591194968552, "percentage": 17.77, "elapsed_time": "0:17:14", "remaining_time": "1:19:47", "throughput": 4285.7, "total_tokens": 4432888} {"current_steps": 6785, "total_steps": 38160, "loss": 0.5184, "lr": 0.0009816854393079402, "epoch": 3.5560796645702304, "percentage": 17.78, "elapsed_time": "0:17:15", "remaining_time": "1:19:46", "throughput": 4286.05, "total_tokens": 4436568} {"current_steps": 6790, "total_steps": 38160, "loss": 0.4095, "lr": 0.0009816240616872247, "epoch": 3.558700209643606, "percentage": 17.79, "elapsed_time": "0:17:15", "remaining_time": "1:19:45", "throughput": 4286.0, "total_tokens": 4439352} {"current_steps": 6795, "total_steps": 38160, "loss": 0.6442, "lr": 0.0009815625833162502, "epoch": 3.561320754716981, "percentage": 17.81, "elapsed_time": "0:17:16", "remaining_time": "1:19:44", "throughput": 4286.24, "total_tokens": 4442808} {"current_steps": 6800, "total_steps": 38160, "loss": 0.5686, "lr": 0.0009815010042078772, "epoch": 3.5639412997903563, "percentage": 17.82, "elapsed_time": "0:17:17", "remaining_time": "1:19:43", "throughput": 4286.3, "total_tokens": 4445816} {"current_steps": 6805, "total_steps": 38160, "loss": 0.5091, "lr": 0.0009814393243749873, "epoch": 3.5665618448637315, "percentage": 17.83, "elapsed_time": "0:17:17", "remaining_time": "1:19:42", "throughput": 4286.52, "total_tokens": 4449272} {"current_steps": 6810, "total_steps": 38160, "loss": 0.5304, "lr": 0.0009813775438304835, "epoch": 3.569182389937107, "percentage": 17.85, "elapsed_time": "0:17:18", "remaining_time": "1:19:41", "throughput": 4286.91, "total_tokens": 4453048} {"current_steps": 6815, "total_steps": 38160, "loss": 0.693, "lr": 0.0009813156625872893, "epoch": 3.5718029350104823, "percentage": 17.86, "elapsed_time": "0:17:19", "remaining_time": "1:19:40", "throughput": 4286.82, "total_tokens": 4455832} {"current_steps": 6820, "total_steps": 38160, "loss": 0.504, "lr": 0.0009812536806583494, "epoch": 3.5744234800838575, "percentage": 17.87, "elapsed_time": "0:17:20", "remaining_time": "1:19:39", "throughput": 4286.89, "total_tokens": 4458904} {"current_steps": 6825, "total_steps": 38160, "loss": 0.4343, "lr": 0.0009811915980566302, "epoch": 3.5770440251572326, "percentage": 17.89, "elapsed_time": "0:17:20", "remaining_time": "1:19:38", "throughput": 4287.0, "total_tokens": 4462168} {"current_steps": 6830, "total_steps": 38160, "loss": 0.4598, "lr": 0.0009811294147951182, "epoch": 3.579664570230608, "percentage": 17.9, "elapsed_time": "0:17:21", "remaining_time": "1:19:37", "throughput": 4287.03, "total_tokens": 4465208} {"current_steps": 6835, "total_steps": 38160, "loss": 0.4433, "lr": 0.000981067130886822, "epoch": 3.582285115303983, "percentage": 17.91, "elapsed_time": "0:17:22", "remaining_time": "1:19:36", "throughput": 4286.7, "total_tokens": 4467448} {"current_steps": 6840, "total_steps": 38160, "loss": 0.4103, "lr": 0.00098100474634477, "epoch": 3.5849056603773586, "percentage": 17.92, "elapsed_time": "0:17:22", "remaining_time": "1:19:35", "throughput": 4287.05, "total_tokens": 4471224} {"current_steps": 6845, "total_steps": 38160, "loss": 0.3452, "lr": 0.0009809422611820127, "epoch": 3.5875262054507338, "percentage": 17.94, "elapsed_time": "0:17:23", "remaining_time": "1:19:34", "throughput": 4286.9, "total_tokens": 4473848} {"current_steps": 6850, "total_steps": 38160, "loss": 0.4282, "lr": 0.0009808796754116212, "epoch": 3.590146750524109, "percentage": 17.95, "elapsed_time": "0:17:24", "remaining_time": "1:19:33", "throughput": 4287.23, "total_tokens": 4477528} {"current_steps": 6855, "total_steps": 38160, "loss": 0.5376, "lr": 0.0009808169890466879, "epoch": 3.5927672955974845, "percentage": 17.96, "elapsed_time": "0:17:25", "remaining_time": "1:19:33", "throughput": 4287.83, "total_tokens": 4481784} {"current_steps": 6860, "total_steps": 38160, "loss": 0.4545, "lr": 0.000980754202100326, "epoch": 3.5953878406708597, "percentage": 17.98, "elapsed_time": "0:17:26", "remaining_time": "1:19:32", "throughput": 4288.25, "total_tokens": 4485624} {"current_steps": 6865, "total_steps": 38160, "loss": 0.6279, "lr": 0.0009806913145856695, "epoch": 3.598008385744235, "percentage": 17.99, "elapsed_time": "0:17:26", "remaining_time": "1:19:31", "throughput": 4288.04, "total_tokens": 4488120} {"current_steps": 6870, "total_steps": 38160, "loss": 0.5598, "lr": 0.0009806283265158741, "epoch": 3.60062893081761, "percentage": 18.0, "elapsed_time": "0:17:27", "remaining_time": "1:19:30", "throughput": 4288.29, "total_tokens": 4491640} {"current_steps": 6875, "total_steps": 38160, "loss": 0.4795, "lr": 0.0009805652379041162, "epoch": 3.603249475890985, "percentage": 18.02, "elapsed_time": "0:17:28", "remaining_time": "1:19:29", "throughput": 4288.29, "total_tokens": 4494648} {"current_steps": 6880, "total_steps": 38160, "loss": 0.5399, "lr": 0.000980502048763593, "epoch": 3.6058700209643604, "percentage": 18.03, "elapsed_time": "0:17:28", "remaining_time": "1:19:28", "throughput": 4288.08, "total_tokens": 4497176} {"current_steps": 6885, "total_steps": 38160, "loss": 0.4333, "lr": 0.0009804387591075233, "epoch": 3.608490566037736, "percentage": 18.04, "elapsed_time": "0:17:29", "remaining_time": "1:19:27", "throughput": 4288.12, "total_tokens": 4500248} {"current_steps": 6890, "total_steps": 38160, "loss": 0.3394, "lr": 0.000980375368949146, "epoch": 3.611111111111111, "percentage": 18.06, "elapsed_time": "0:17:30", "remaining_time": "1:19:26", "throughput": 4288.22, "total_tokens": 4503416} {"current_steps": 6895, "total_steps": 38160, "loss": 0.4649, "lr": 0.0009803118783017221, "epoch": 3.6137316561844863, "percentage": 18.07, "elapsed_time": "0:17:30", "remaining_time": "1:19:25", "throughput": 4288.43, "total_tokens": 4506904} {"current_steps": 6900, "total_steps": 38160, "loss": 0.3446, "lr": 0.0009802482871785329, "epoch": 3.6163522012578615, "percentage": 18.08, "elapsed_time": "0:17:31", "remaining_time": "1:19:25", "throughput": 4289.08, "total_tokens": 4511352} {"current_steps": 6905, "total_steps": 38160, "loss": 0.4602, "lr": 0.000980184595592881, "epoch": 3.618972746331237, "percentage": 18.09, "elapsed_time": "0:17:32", "remaining_time": "1:19:24", "throughput": 4289.15, "total_tokens": 4514520} {"current_steps": 6910, "total_steps": 38160, "loss": 0.4243, "lr": 0.00098012080355809, "epoch": 3.6215932914046123, "percentage": 18.11, "elapsed_time": "0:17:33", "remaining_time": "1:19:23", "throughput": 4289.08, "total_tokens": 4517336} {"current_steps": 6915, "total_steps": 38160, "loss": 0.4115, "lr": 0.0009800569110875043, "epoch": 3.6242138364779874, "percentage": 18.12, "elapsed_time": "0:17:33", "remaining_time": "1:19:21", "throughput": 4289.09, "total_tokens": 4520280} {"current_steps": 6920, "total_steps": 38160, "loss": 0.4356, "lr": 0.0009799929181944895, "epoch": 3.6268343815513626, "percentage": 18.13, "elapsed_time": "0:17:34", "remaining_time": "1:19:21", "throughput": 4289.36, "total_tokens": 4523960} {"current_steps": 6925, "total_steps": 38160, "loss": 0.5717, "lr": 0.0009799288248924325, "epoch": 3.629454926624738, "percentage": 18.15, "elapsed_time": "0:17:35", "remaining_time": "1:19:20", "throughput": 4289.65, "total_tokens": 4527512} {"current_steps": 6930, "total_steps": 38160, "loss": 0.4149, "lr": 0.0009798646311947404, "epoch": 3.632075471698113, "percentage": 18.16, "elapsed_time": "0:17:36", "remaining_time": "1:19:20", "throughput": 4290.21, "total_tokens": 4531704} {"current_steps": 6935, "total_steps": 38160, "loss": 0.5068, "lr": 0.0009798003371148422, "epoch": 3.6346960167714886, "percentage": 18.17, "elapsed_time": "0:17:37", "remaining_time": "1:19:19", "throughput": 4290.47, "total_tokens": 4535192} {"current_steps": 6940, "total_steps": 38160, "loss": 0.3476, "lr": 0.0009797359426661873, "epoch": 3.6373165618448637, "percentage": 18.19, "elapsed_time": "0:17:37", "remaining_time": "1:19:18", "throughput": 4290.42, "total_tokens": 4538136} {"current_steps": 6945, "total_steps": 38160, "loss": 0.3782, "lr": 0.0009796714478622463, "epoch": 3.639937106918239, "percentage": 18.2, "elapsed_time": "0:17:38", "remaining_time": "1:19:17", "throughput": 4290.29, "total_tokens": 4540824} {"current_steps": 6950, "total_steps": 38160, "loss": 0.5333, "lr": 0.0009796068527165107, "epoch": 3.6425576519916145, "percentage": 18.21, "elapsed_time": "0:17:39", "remaining_time": "1:19:16", "throughput": 4290.33, "total_tokens": 4543896} {"current_steps": 6955, "total_steps": 38160, "loss": 0.4968, "lr": 0.0009795421572424935, "epoch": 3.6451781970649897, "percentage": 18.23, "elapsed_time": "0:17:39", "remaining_time": "1:19:15", "throughput": 4290.57, "total_tokens": 4547448} {"current_steps": 6960, "total_steps": 38160, "loss": 0.4728, "lr": 0.0009794773614537275, "epoch": 3.647798742138365, "percentage": 18.24, "elapsed_time": "0:17:40", "remaining_time": "1:19:13", "throughput": 4290.35, "total_tokens": 4549880} {"current_steps": 6965, "total_steps": 38160, "loss": 0.4631, "lr": 0.0009794124653637677, "epoch": 3.65041928721174, "percentage": 18.25, "elapsed_time": "0:17:41", "remaining_time": "1:19:12", "throughput": 4290.41, "total_tokens": 4552952} {"current_steps": 6970, "total_steps": 38160, "loss": 0.4545, "lr": 0.00097934746898619, "epoch": 3.653039832285115, "percentage": 18.27, "elapsed_time": "0:17:41", "remaining_time": "1:19:11", "throughput": 4290.19, "total_tokens": 4555384} {"current_steps": 6975, "total_steps": 38160, "loss": 0.4038, "lr": 0.00097928237233459, "epoch": 3.6556603773584904, "percentage": 18.28, "elapsed_time": "0:17:42", "remaining_time": "1:19:11", "throughput": 4290.98, "total_tokens": 4560248} {"current_steps": 6980, "total_steps": 38160, "loss": 0.3888, "lr": 0.0009792171754225859, "epoch": 3.658280922431866, "percentage": 18.29, "elapsed_time": "0:17:43", "remaining_time": "1:19:10", "throughput": 4290.63, "total_tokens": 4562424} {"current_steps": 6985, "total_steps": 38160, "loss": 0.613, "lr": 0.0009791518782638158, "epoch": 3.660901467505241, "percentage": 18.3, "elapsed_time": "0:17:44", "remaining_time": "1:19:09", "throughput": 4290.75, "total_tokens": 4565656} {"current_steps": 6990, "total_steps": 38160, "loss": 0.4874, "lr": 0.0009790864808719392, "epoch": 3.6635220125786163, "percentage": 18.32, "elapsed_time": "0:17:44", "remaining_time": "1:19:08", "throughput": 4290.83, "total_tokens": 4568760} {"current_steps": 6995, "total_steps": 38160, "loss": 0.6179, "lr": 0.0009790209832606365, "epoch": 3.6661425576519915, "percentage": 18.33, "elapsed_time": "0:17:45", "remaining_time": "1:19:07", "throughput": 4290.94, "total_tokens": 4571960} {"current_steps": 7000, "total_steps": 38160, "loss": 0.4832, "lr": 0.000978955385443609, "epoch": 3.668763102725367, "percentage": 18.34, "elapsed_time": "0:17:46", "remaining_time": "1:19:06", "throughput": 4291.09, "total_tokens": 4575288} {"current_steps": 7005, "total_steps": 38160, "loss": 0.4854, "lr": 0.0009788896874345792, "epoch": 3.6713836477987423, "percentage": 18.36, "elapsed_time": "0:17:46", "remaining_time": "1:19:04", "throughput": 4290.95, "total_tokens": 4577848} {"current_steps": 7010, "total_steps": 38160, "loss": 0.4775, "lr": 0.0009788238892472904, "epoch": 3.6740041928721174, "percentage": 18.37, "elapsed_time": "0:17:47", "remaining_time": "1:19:04", "throughput": 4291.21, "total_tokens": 4581400} {"current_steps": 7015, "total_steps": 38160, "loss": 0.4341, "lr": 0.0009787579908955063, "epoch": 3.6766247379454926, "percentage": 18.38, "elapsed_time": "0:17:48", "remaining_time": "1:19:03", "throughput": 4291.46, "total_tokens": 4584984} {"current_steps": 7020, "total_steps": 38160, "loss": 0.4147, "lr": 0.0009786919923930127, "epoch": 3.6792452830188678, "percentage": 18.4, "elapsed_time": "0:17:49", "remaining_time": "1:19:02", "throughput": 4291.32, "total_tokens": 4587544} {"current_steps": 7025, "total_steps": 38160, "loss": 0.4444, "lr": 0.0009786258937536155, "epoch": 3.681865828092243, "percentage": 18.41, "elapsed_time": "0:17:49", "remaining_time": "1:19:01", "throughput": 4291.39, "total_tokens": 4590680} {"current_steps": 7030, "total_steps": 38160, "loss": 0.4979, "lr": 0.0009785596949911418, "epoch": 3.6844863731656186, "percentage": 18.42, "elapsed_time": "0:17:50", "remaining_time": "1:19:00", "throughput": 4291.73, "total_tokens": 4594392} {"current_steps": 7035, "total_steps": 38160, "loss": 0.378, "lr": 0.0009784933961194395, "epoch": 3.6871069182389937, "percentage": 18.44, "elapsed_time": "0:17:51", "remaining_time": "1:18:59", "throughput": 4291.63, "total_tokens": 4597144} {"current_steps": 7040, "total_steps": 38160, "loss": 0.573, "lr": 0.0009784269971523777, "epoch": 3.689727463312369, "percentage": 18.45, "elapsed_time": "0:17:51", "remaining_time": "1:18:57", "throughput": 4291.5, "total_tokens": 4599736} {"current_steps": 7045, "total_steps": 38160, "loss": 0.3944, "lr": 0.0009783604981038463, "epoch": 3.6923480083857445, "percentage": 18.46, "elapsed_time": "0:17:52", "remaining_time": "1:18:56", "throughput": 4291.52, "total_tokens": 4602712} {"current_steps": 7050, "total_steps": 38160, "loss": 0.4257, "lr": 0.000978293898987756, "epoch": 3.6949685534591197, "percentage": 18.47, "elapsed_time": "0:17:53", "remaining_time": "1:18:55", "throughput": 4291.54, "total_tokens": 4605752} {"current_steps": 7055, "total_steps": 38160, "loss": 0.4524, "lr": 0.000978227199818039, "epoch": 3.697589098532495, "percentage": 18.49, "elapsed_time": "0:17:54", "remaining_time": "1:18:55", "throughput": 4291.94, "total_tokens": 4609560} {"current_steps": 7060, "total_steps": 38160, "loss": 0.494, "lr": 0.0009781604006086474, "epoch": 3.70020964360587, "percentage": 18.5, "elapsed_time": "0:17:54", "remaining_time": "1:18:54", "throughput": 4292.01, "total_tokens": 4612696} {"current_steps": 7065, "total_steps": 38160, "loss": 0.5166, "lr": 0.0009780935013735553, "epoch": 3.702830188679245, "percentage": 18.51, "elapsed_time": "0:17:55", "remaining_time": "1:18:53", "throughput": 4292.16, "total_tokens": 4615928} {"current_steps": 7070, "total_steps": 38160, "loss": 0.4888, "lr": 0.0009780265021267572, "epoch": 3.7054507337526204, "percentage": 18.53, "elapsed_time": "0:17:56", "remaining_time": "1:18:52", "throughput": 4292.26, "total_tokens": 4619160} {"current_steps": 7075, "total_steps": 38160, "loss": 0.5188, "lr": 0.0009779594028822682, "epoch": 3.708071278825996, "percentage": 18.54, "elapsed_time": "0:17:56", "remaining_time": "1:18:51", "throughput": 4292.23, "total_tokens": 4621944} {"current_steps": 7080, "total_steps": 38160, "loss": 0.487, "lr": 0.0009778922036541252, "epoch": 3.710691823899371, "percentage": 18.55, "elapsed_time": "0:17:57", "remaining_time": "1:18:50", "throughput": 4292.44, "total_tokens": 4625400} {"current_steps": 7085, "total_steps": 38160, "loss": 0.3966, "lr": 0.0009778249044563852, "epoch": 3.7133123689727463, "percentage": 18.57, "elapsed_time": "0:17:58", "remaining_time": "1:18:49", "throughput": 4292.52, "total_tokens": 4628600} {"current_steps": 7090, "total_steps": 38160, "loss": 0.4571, "lr": 0.0009777575053031263, "epoch": 3.7159329140461215, "percentage": 18.58, "elapsed_time": "0:17:58", "remaining_time": "1:18:48", "throughput": 4292.57, "total_tokens": 4631640} {"current_steps": 7095, "total_steps": 38160, "loss": 0.5708, "lr": 0.000977690006208448, "epoch": 3.718553459119497, "percentage": 18.59, "elapsed_time": "0:17:59", "remaining_time": "1:18:47", "throughput": 4292.93, "total_tokens": 4635480} {"current_steps": 7100, "total_steps": 38160, "loss": 0.524, "lr": 0.0009776224071864703, "epoch": 3.7211740041928723, "percentage": 18.61, "elapsed_time": "0:18:00", "remaining_time": "1:18:46", "throughput": 4292.8, "total_tokens": 4638136} {"current_steps": 7105, "total_steps": 38160, "loss": 0.3976, "lr": 0.000977554708251334, "epoch": 3.7237945492662474, "percentage": 18.62, "elapsed_time": "0:18:01", "remaining_time": "1:18:45", "throughput": 4292.82, "total_tokens": 4641176} {"current_steps": 7110, "total_steps": 38160, "loss": 0.4138, "lr": 0.0009774869094172007, "epoch": 3.7264150943396226, "percentage": 18.63, "elapsed_time": "0:18:01", "remaining_time": "1:18:45", "throughput": 4293.25, "total_tokens": 4645144} {"current_steps": 7115, "total_steps": 38160, "loss": 0.5349, "lr": 0.0009774190106982537, "epoch": 3.7290356394129978, "percentage": 18.65, "elapsed_time": "0:18:02", "remaining_time": "1:18:44", "throughput": 4293.41, "total_tokens": 4648408} {"current_steps": 7120, "total_steps": 38160, "loss": 0.5206, "lr": 0.0009773510121086962, "epoch": 3.731656184486373, "percentage": 18.66, "elapsed_time": "0:18:03", "remaining_time": "1:18:42", "throughput": 4293.32, "total_tokens": 4651096} {"current_steps": 7125, "total_steps": 38160, "loss": 0.4159, "lr": 0.0009772829136627528, "epoch": 3.7342767295597485, "percentage": 18.67, "elapsed_time": "0:18:04", "remaining_time": "1:18:42", "throughput": 4293.67, "total_tokens": 4654776} {"current_steps": 7130, "total_steps": 38160, "loss": 0.413, "lr": 0.0009772147153746691, "epoch": 3.7368972746331237, "percentage": 18.68, "elapsed_time": "0:18:04", "remaining_time": "1:18:41", "throughput": 4293.93, "total_tokens": 4658360} {"current_steps": 7135, "total_steps": 38160, "loss": 0.4699, "lr": 0.0009771464172587112, "epoch": 3.739517819706499, "percentage": 18.7, "elapsed_time": "0:18:05", "remaining_time": "1:18:40", "throughput": 4294.01, "total_tokens": 4661528} {"current_steps": 7140, "total_steps": 38160, "loss": 0.6372, "lr": 0.0009770780193291667, "epoch": 3.742138364779874, "percentage": 18.71, "elapsed_time": "0:18:06", "remaining_time": "1:18:39", "throughput": 4294.03, "total_tokens": 4664600} {"current_steps": 7145, "total_steps": 38160, "loss": 0.4802, "lr": 0.000977009521600343, "epoch": 3.7447589098532497, "percentage": 18.72, "elapsed_time": "0:18:06", "remaining_time": "1:18:38", "throughput": 4293.97, "total_tokens": 4667416} {"current_steps": 7150, "total_steps": 38160, "loss": 0.4343, "lr": 0.0009769409240865696, "epoch": 3.747379454926625, "percentage": 18.74, "elapsed_time": "0:18:07", "remaining_time": "1:18:37", "throughput": 4293.88, "total_tokens": 4670136} {"current_steps": 7155, "total_steps": 38160, "loss": 0.4907, "lr": 0.0009768722268021959, "epoch": 3.75, "percentage": 18.75, "elapsed_time": "0:18:08", "remaining_time": "1:18:36", "throughput": 4294.08, "total_tokens": 4673592} {"current_steps": 7160, "total_steps": 38160, "loss": 0.5063, "lr": 0.000976803429761593, "epoch": 3.752620545073375, "percentage": 18.76, "elapsed_time": "0:18:09", "remaining_time": "1:18:35", "throughput": 4294.4, "total_tokens": 4677272} {"current_steps": 7165, "total_steps": 38160, "loss": 0.4672, "lr": 0.000976734532979152, "epoch": 3.7552410901467503, "percentage": 18.78, "elapsed_time": "0:18:09", "remaining_time": "1:18:35", "throughput": 4294.94, "total_tokens": 4681464} {"current_steps": 7170, "total_steps": 38160, "loss": 0.4871, "lr": 0.000976665536469286, "epoch": 3.757861635220126, "percentage": 18.79, "elapsed_time": "0:18:10", "remaining_time": "1:18:34", "throughput": 4294.89, "total_tokens": 4684408} {"current_steps": 7175, "total_steps": 38160, "loss": 0.5426, "lr": 0.0009765964402464276, "epoch": 3.760482180293501, "percentage": 18.8, "elapsed_time": "0:18:11", "remaining_time": "1:18:33", "throughput": 4294.9, "total_tokens": 4687448} {"current_steps": 7180, "total_steps": 38160, "loss": 0.7222, "lr": 0.0009765272443250312, "epoch": 3.7631027253668763, "percentage": 18.82, "elapsed_time": "0:18:12", "remaining_time": "1:18:32", "throughput": 4295.12, "total_tokens": 4690904} {"current_steps": 7185, "total_steps": 38160, "loss": 0.5804, "lr": 0.0009764579487195717, "epoch": 3.7657232704402515, "percentage": 18.83, "elapsed_time": "0:18:12", "remaining_time": "1:18:31", "throughput": 4295.36, "total_tokens": 4694488} {"current_steps": 7190, "total_steps": 38160, "loss": 0.4609, "lr": 0.0009763885534445452, "epoch": 3.768343815513627, "percentage": 18.84, "elapsed_time": "0:18:13", "remaining_time": "1:18:30", "throughput": 4295.38, "total_tokens": 4697528} {"current_steps": 7195, "total_steps": 38160, "loss": 0.4498, "lr": 0.0009763190585144682, "epoch": 3.7709643605870022, "percentage": 18.85, "elapsed_time": "0:18:14", "remaining_time": "1:18:29", "throughput": 4295.69, "total_tokens": 4701208} {"current_steps": 7200, "total_steps": 38160, "loss": 0.5184, "lr": 0.0009762494639438783, "epoch": 3.7735849056603774, "percentage": 18.87, "elapsed_time": "0:18:15", "remaining_time": "1:18:29", "throughput": 4296.12, "total_tokens": 4705240} {"current_steps": 7205, "total_steps": 38160, "loss": 0.5224, "lr": 0.0009761797697473339, "epoch": 3.7762054507337526, "percentage": 18.88, "elapsed_time": "0:18:15", "remaining_time": "1:18:28", "throughput": 4296.12, "total_tokens": 4708216} {"current_steps": 7210, "total_steps": 38160, "loss": 0.724, "lr": 0.0009761099759394142, "epoch": 3.7788259958071277, "percentage": 18.89, "elapsed_time": "0:18:16", "remaining_time": "1:18:27", "throughput": 4295.92, "total_tokens": 4710712} {"current_steps": 7215, "total_steps": 38160, "loss": 0.5298, "lr": 0.0009760400825347194, "epoch": 3.781446540880503, "percentage": 18.91, "elapsed_time": "0:18:17", "remaining_time": "1:18:26", "throughput": 4296.03, "total_tokens": 4713912} {"current_steps": 7220, "total_steps": 38160, "loss": 0.4567, "lr": 0.00097597008954787, "epoch": 3.7840670859538785, "percentage": 18.92, "elapsed_time": "0:18:17", "remaining_time": "1:18:24", "throughput": 4295.84, "total_tokens": 4716440} {"current_steps": 7225, "total_steps": 38160, "loss": 0.5692, "lr": 0.0009758999969935083, "epoch": 3.7866876310272537, "percentage": 18.93, "elapsed_time": "0:18:18", "remaining_time": "1:18:24", "throughput": 4296.16, "total_tokens": 4720184} {"current_steps": 7230, "total_steps": 38160, "loss": 0.5186, "lr": 0.0009758298048862965, "epoch": 3.789308176100629, "percentage": 18.95, "elapsed_time": "0:18:19", "remaining_time": "1:18:24", "throughput": 4296.81, "total_tokens": 4724760} {"current_steps": 7235, "total_steps": 38160, "loss": 0.461, "lr": 0.0009757595132409181, "epoch": 3.791928721174004, "percentage": 18.96, "elapsed_time": "0:18:20", "remaining_time": "1:18:23", "throughput": 4296.85, "total_tokens": 4727832} {"current_steps": 7240, "total_steps": 38160, "loss": 0.3699, "lr": 0.0009756891220720771, "epoch": 3.7945492662473796, "percentage": 18.97, "elapsed_time": "0:18:20", "remaining_time": "1:18:21", "throughput": 4296.75, "total_tokens": 4730584} {"current_steps": 7245, "total_steps": 38160, "loss": 0.484, "lr": 0.0009756186313944988, "epoch": 3.797169811320755, "percentage": 18.99, "elapsed_time": "0:18:21", "remaining_time": "1:18:20", "throughput": 4296.6, "total_tokens": 4733208} {"current_steps": 7250, "total_steps": 38160, "loss": 0.4452, "lr": 0.0009755480412229291, "epoch": 3.79979035639413, "percentage": 19.0, "elapsed_time": "0:18:22", "remaining_time": "1:18:19", "throughput": 4296.52, "total_tokens": 4736088} {"current_steps": 7255, "total_steps": 38160, "loss": 0.5539, "lr": 0.0009754773515721343, "epoch": 3.802410901467505, "percentage": 19.01, "elapsed_time": "0:18:23", "remaining_time": "1:18:18", "throughput": 4296.53, "total_tokens": 4739096} {"current_steps": 7260, "total_steps": 38160, "loss": 0.3699, "lr": 0.0009754065624569022, "epoch": 3.8050314465408803, "percentage": 19.03, "elapsed_time": "0:18:23", "remaining_time": "1:18:17", "throughput": 4296.54, "total_tokens": 4742168} {"current_steps": 7265, "total_steps": 38160, "loss": 0.4718, "lr": 0.000975335673892041, "epoch": 3.8076519916142555, "percentage": 19.04, "elapsed_time": "0:18:24", "remaining_time": "1:18:16", "throughput": 4296.66, "total_tokens": 4745432} {"current_steps": 7270, "total_steps": 38160, "loss": 0.4363, "lr": 0.0009752646858923797, "epoch": 3.810272536687631, "percentage": 19.05, "elapsed_time": "0:18:25", "remaining_time": "1:18:15", "throughput": 4296.72, "total_tokens": 4748536} {"current_steps": 7275, "total_steps": 38160, "loss": 0.5378, "lr": 0.0009751935984727683, "epoch": 3.8128930817610063, "percentage": 19.06, "elapsed_time": "0:18:25", "remaining_time": "1:18:14", "throughput": 4296.85, "total_tokens": 4751800} {"current_steps": 7280, "total_steps": 38160, "loss": 0.3583, "lr": 0.0009751224116480772, "epoch": 3.8155136268343814, "percentage": 19.08, "elapsed_time": "0:18:26", "remaining_time": "1:18:14", "throughput": 4297.31, "total_tokens": 4755800} {"current_steps": 7285, "total_steps": 38160, "loss": 0.3994, "lr": 0.0009750511254331982, "epoch": 3.818134171907757, "percentage": 19.09, "elapsed_time": "0:18:27", "remaining_time": "1:18:13", "throughput": 4297.36, "total_tokens": 4758904} {"current_steps": 7290, "total_steps": 38160, "loss": 0.3836, "lr": 0.0009749797398430433, "epoch": 3.8207547169811322, "percentage": 19.1, "elapsed_time": "0:18:28", "remaining_time": "1:18:13", "throughput": 4297.99, "total_tokens": 4763352} {"current_steps": 7295, "total_steps": 38160, "loss": 0.4705, "lr": 0.0009749082548925459, "epoch": 3.8233752620545074, "percentage": 19.12, "elapsed_time": "0:18:28", "remaining_time": "1:18:11", "throughput": 4297.81, "total_tokens": 4765880} {"current_steps": 7300, "total_steps": 38160, "loss": 0.4204, "lr": 0.0009748366705966593, "epoch": 3.8259958071278826, "percentage": 19.13, "elapsed_time": "0:18:29", "remaining_time": "1:18:10", "throughput": 4297.96, "total_tokens": 4769112} {"current_steps": 7305, "total_steps": 38160, "loss": 0.4081, "lr": 0.0009747649869703588, "epoch": 3.8286163522012577, "percentage": 19.14, "elapsed_time": "0:18:30", "remaining_time": "1:18:09", "throughput": 4297.92, "total_tokens": 4772024} {"current_steps": 7310, "total_steps": 38160, "loss": 0.43, "lr": 0.0009746932040286391, "epoch": 3.831236897274633, "percentage": 19.16, "elapsed_time": "0:18:31", "remaining_time": "1:18:08", "throughput": 4298.06, "total_tokens": 4775320} {"current_steps": 7315, "total_steps": 38160, "loss": 0.4906, "lr": 0.000974621321786517, "epoch": 3.8338574423480085, "percentage": 19.17, "elapsed_time": "0:18:31", "remaining_time": "1:18:07", "throughput": 4298.04, "total_tokens": 4778232} {"current_steps": 7320, "total_steps": 38160, "loss": 0.4544, "lr": 0.000974549340259029, "epoch": 3.8364779874213837, "percentage": 19.18, "elapsed_time": "0:18:32", "remaining_time": "1:18:07", "throughput": 4298.43, "total_tokens": 4782200} {"current_steps": 7325, "total_steps": 38160, "loss": 0.4735, "lr": 0.000974477259461233, "epoch": 3.839098532494759, "percentage": 19.2, "elapsed_time": "0:18:33", "remaining_time": "1:18:06", "throughput": 4298.28, "total_tokens": 4784888} {"current_steps": 7330, "total_steps": 38160, "loss": 0.4692, "lr": 0.0009744050794082074, "epoch": 3.841719077568134, "percentage": 19.21, "elapsed_time": "0:18:33", "remaining_time": "1:18:05", "throughput": 4298.45, "total_tokens": 4788344} {"current_steps": 7335, "total_steps": 38160, "loss": 0.393, "lr": 0.0009743328001150515, "epoch": 3.8443396226415096, "percentage": 19.22, "elapsed_time": "0:18:34", "remaining_time": "1:18:04", "throughput": 4298.32, "total_tokens": 4791000} {"current_steps": 7340, "total_steps": 38160, "loss": 0.4272, "lr": 0.0009742604215968853, "epoch": 3.846960167714885, "percentage": 19.23, "elapsed_time": "0:18:35", "remaining_time": "1:18:03", "throughput": 4298.51, "total_tokens": 4794392} {"current_steps": 7345, "total_steps": 38160, "loss": 0.6075, "lr": 0.0009741879438688495, "epoch": 3.84958071278826, "percentage": 19.25, "elapsed_time": "0:18:35", "remaining_time": "1:18:02", "throughput": 4298.29, "total_tokens": 4796888} {"current_steps": 7350, "total_steps": 38160, "loss": 0.4747, "lr": 0.0009741153669461058, "epoch": 3.852201257861635, "percentage": 19.26, "elapsed_time": "0:18:36", "remaining_time": "1:18:01", "throughput": 4298.74, "total_tokens": 4800856} {"current_steps": 7355, "total_steps": 38160, "loss": 0.4809, "lr": 0.0009740426908438362, "epoch": 3.8548218029350103, "percentage": 19.27, "elapsed_time": "0:18:37", "remaining_time": "1:18:00", "throughput": 4299.02, "total_tokens": 4804568} {"current_steps": 7360, "total_steps": 38160, "loss": 0.3349, "lr": 0.0009739699155772439, "epoch": 3.8574423480083855, "percentage": 19.29, "elapsed_time": "0:18:38", "remaining_time": "1:17:59", "throughput": 4298.95, "total_tokens": 4807384} {"current_steps": 7365, "total_steps": 38160, "loss": 0.4955, "lr": 0.0009738970411615525, "epoch": 3.860062893081761, "percentage": 19.3, "elapsed_time": "0:18:39", "remaining_time": "1:17:58", "throughput": 4299.21, "total_tokens": 4810904} {"current_steps": 7370, "total_steps": 38160, "loss": 0.4384, "lr": 0.0009738240676120067, "epoch": 3.8626834381551363, "percentage": 19.31, "elapsed_time": "0:18:39", "remaining_time": "1:17:57", "throughput": 4299.28, "total_tokens": 4814008} {"current_steps": 7375, "total_steps": 38160, "loss": 0.5258, "lr": 0.0009737509949438717, "epoch": 3.8653039832285114, "percentage": 19.33, "elapsed_time": "0:18:40", "remaining_time": "1:17:57", "throughput": 4299.42, "total_tokens": 4817272} {"current_steps": 7380, "total_steps": 38160, "loss": 0.4068, "lr": 0.0009736778231724333, "epoch": 3.867924528301887, "percentage": 19.34, "elapsed_time": "0:18:41", "remaining_time": "1:17:55", "throughput": 4299.25, "total_tokens": 4819896} {"current_steps": 7385, "total_steps": 38160, "loss": 0.4145, "lr": 0.0009736045523129982, "epoch": 3.870545073375262, "percentage": 19.35, "elapsed_time": "0:18:41", "remaining_time": "1:17:54", "throughput": 4299.28, "total_tokens": 4822936} {"current_steps": 7390, "total_steps": 38160, "loss": 0.3612, "lr": 0.0009735311823808938, "epoch": 3.8731656184486374, "percentage": 19.37, "elapsed_time": "0:18:42", "remaining_time": "1:17:54", "throughput": 4299.64, "total_tokens": 4826776} {"current_steps": 7395, "total_steps": 38160, "loss": 0.413, "lr": 0.0009734577133914687, "epoch": 3.8757861635220126, "percentage": 19.38, "elapsed_time": "0:18:43", "remaining_time": "1:17:53", "throughput": 4300.25, "total_tokens": 4831288} {"current_steps": 7400, "total_steps": 38160, "loss": 0.5321, "lr": 0.0009733841453600914, "epoch": 3.8784067085953877, "percentage": 19.39, "elapsed_time": "0:18:44", "remaining_time": "1:17:52", "throughput": 4300.26, "total_tokens": 4834232} {"current_steps": 7405, "total_steps": 38160, "loss": 0.5185, "lr": 0.0009733104783021515, "epoch": 3.881027253668763, "percentage": 19.41, "elapsed_time": "0:18:44", "remaining_time": "1:17:52", "throughput": 4300.49, "total_tokens": 4837752} {"current_steps": 7410, "total_steps": 38160, "loss": 0.5748, "lr": 0.0009732367122330593, "epoch": 3.8836477987421385, "percentage": 19.42, "elapsed_time": "0:18:45", "remaining_time": "1:17:51", "throughput": 4300.68, "total_tokens": 4841304} {"current_steps": 7415, "total_steps": 38160, "loss": 0.4316, "lr": 0.0009731628471682459, "epoch": 3.8862683438155137, "percentage": 19.43, "elapsed_time": "0:18:46", "remaining_time": "1:17:50", "throughput": 4300.91, "total_tokens": 4844888} {"current_steps": 7420, "total_steps": 38160, "loss": 0.5517, "lr": 0.000973088883123163, "epoch": 3.888888888888889, "percentage": 19.44, "elapsed_time": "0:18:47", "remaining_time": "1:17:49", "throughput": 4301.02, "total_tokens": 4848088} {"current_steps": 7425, "total_steps": 38160, "loss": 0.437, "lr": 0.0009730148201132829, "epoch": 3.891509433962264, "percentage": 19.46, "elapsed_time": "0:18:48", "remaining_time": "1:17:49", "throughput": 4301.49, "total_tokens": 4852248} {"current_steps": 7430, "total_steps": 38160, "loss": 0.4426, "lr": 0.0009729406581540991, "epoch": 3.8941299790356396, "percentage": 19.47, "elapsed_time": "0:18:48", "remaining_time": "1:17:48", "throughput": 4301.49, "total_tokens": 4855192} {"current_steps": 7435, "total_steps": 38160, "loss": 0.4174, "lr": 0.0009728663972611251, "epoch": 3.896750524109015, "percentage": 19.48, "elapsed_time": "0:18:49", "remaining_time": "1:17:47", "throughput": 4301.65, "total_tokens": 4858584} {"current_steps": 7440, "total_steps": 38160, "loss": 0.433, "lr": 0.0009727920374498955, "epoch": 3.89937106918239, "percentage": 19.5, "elapsed_time": "0:18:50", "remaining_time": "1:17:46", "throughput": 4301.5, "total_tokens": 4861304} {"current_steps": 7445, "total_steps": 38160, "loss": 0.5735, "lr": 0.0009727175787359656, "epoch": 3.901991614255765, "percentage": 19.51, "elapsed_time": "0:18:50", "remaining_time": "1:17:45", "throughput": 4301.68, "total_tokens": 4864824} {"current_steps": 7450, "total_steps": 38160, "loss": 0.5276, "lr": 0.0009726430211349113, "epoch": 3.9046121593291403, "percentage": 19.52, "elapsed_time": "0:18:51", "remaining_time": "1:17:44", "throughput": 4301.62, "total_tokens": 4867736} {"current_steps": 7455, "total_steps": 38160, "loss": 0.4448, "lr": 0.0009725683646623291, "epoch": 3.9072327044025155, "percentage": 19.54, "elapsed_time": "0:18:52", "remaining_time": "1:17:43", "throughput": 4301.69, "total_tokens": 4870936} {"current_steps": 7460, "total_steps": 38160, "loss": 0.61, "lr": 0.0009724936093338365, "epoch": 3.909853249475891, "percentage": 19.55, "elapsed_time": "0:18:53", "remaining_time": "1:17:43", "throughput": 4302.18, "total_tokens": 4875160} {"current_steps": 7465, "total_steps": 38160, "loss": 0.3191, "lr": 0.0009724187551650712, "epoch": 3.9124737945492662, "percentage": 19.56, "elapsed_time": "0:18:53", "remaining_time": "1:17:42", "throughput": 4302.15, "total_tokens": 4878072} {"current_steps": 7470, "total_steps": 38160, "loss": 0.547, "lr": 0.0009723438021716919, "epoch": 3.9150943396226414, "percentage": 19.58, "elapsed_time": "0:18:54", "remaining_time": "1:17:41", "throughput": 4302.56, "total_tokens": 4882008} {"current_steps": 7475, "total_steps": 38160, "loss": 0.4354, "lr": 0.0009722687503693782, "epoch": 3.917714884696017, "percentage": 19.59, "elapsed_time": "0:18:55", "remaining_time": "1:17:40", "throughput": 4302.57, "total_tokens": 4884952} {"current_steps": 7480, "total_steps": 38160, "loss": 0.4682, "lr": 0.0009721935997738296, "epoch": 3.920335429769392, "percentage": 19.6, "elapsed_time": "0:18:56", "remaining_time": "1:17:39", "throughput": 4302.51, "total_tokens": 4887736} {"current_steps": 7485, "total_steps": 38160, "loss": 0.4294, "lr": 0.0009721183504007671, "epoch": 3.9229559748427674, "percentage": 19.61, "elapsed_time": "0:18:56", "remaining_time": "1:17:38", "throughput": 4302.81, "total_tokens": 4891384} {"current_steps": 7490, "total_steps": 38160, "loss": 0.3752, "lr": 0.0009720430022659319, "epoch": 3.9255765199161425, "percentage": 19.63, "elapsed_time": "0:18:57", "remaining_time": "1:17:38", "throughput": 4303.13, "total_tokens": 4895160} {"current_steps": 7495, "total_steps": 38160, "loss": 0.3202, "lr": 0.000971967555385086, "epoch": 3.9281970649895177, "percentage": 19.64, "elapsed_time": "0:18:58", "remaining_time": "1:17:37", "throughput": 4303.3, "total_tokens": 4898456} {"current_steps": 7500, "total_steps": 38160, "loss": 0.432, "lr": 0.000971892009774012, "epoch": 3.930817610062893, "percentage": 19.65, "elapsed_time": "0:18:58", "remaining_time": "1:17:36", "throughput": 4303.2, "total_tokens": 4901176} {"current_steps": 7505, "total_steps": 38160, "loss": 0.4315, "lr": 0.0009718163654485133, "epoch": 3.9334381551362685, "percentage": 19.67, "elapsed_time": "0:18:59", "remaining_time": "1:17:34", "throughput": 4302.98, "total_tokens": 4903608} {"current_steps": 7510, "total_steps": 38160, "loss": 0.4899, "lr": 0.0009717406224244136, "epoch": 3.9360587002096437, "percentage": 19.68, "elapsed_time": "0:19:00", "remaining_time": "1:17:33", "throughput": 4303.05, "total_tokens": 4906712} {"current_steps": 7515, "total_steps": 38160, "loss": 0.4478, "lr": 0.0009716647807175575, "epoch": 3.938679245283019, "percentage": 19.69, "elapsed_time": "0:19:01", "remaining_time": "1:17:33", "throughput": 4303.47, "total_tokens": 4910776} {"current_steps": 7520, "total_steps": 38160, "loss": 0.5187, "lr": 0.0009715888403438105, "epoch": 3.941299790356394, "percentage": 19.71, "elapsed_time": "0:19:01", "remaining_time": "1:17:32", "throughput": 4303.47, "total_tokens": 4913656} {"current_steps": 7525, "total_steps": 38160, "loss": 0.5821, "lr": 0.0009715128013190581, "epoch": 3.9439203354297696, "percentage": 19.72, "elapsed_time": "0:19:02", "remaining_time": "1:17:31", "throughput": 4303.57, "total_tokens": 4916856} {"current_steps": 7530, "total_steps": 38160, "loss": 0.5989, "lr": 0.0009714366636592069, "epoch": 3.9465408805031448, "percentage": 19.73, "elapsed_time": "0:19:03", "remaining_time": "1:17:30", "throughput": 4303.61, "total_tokens": 4919960} {"current_steps": 7535, "total_steps": 38160, "loss": 0.3951, "lr": 0.0009713604273801844, "epoch": 3.94916142557652, "percentage": 19.75, "elapsed_time": "0:19:03", "remaining_time": "1:17:29", "throughput": 4303.42, "total_tokens": 4922456} {"current_steps": 7540, "total_steps": 38160, "loss": 0.6275, "lr": 0.0009712840924979378, "epoch": 3.951781970649895, "percentage": 19.76, "elapsed_time": "0:19:04", "remaining_time": "1:17:27", "throughput": 4303.36, "total_tokens": 4925336} {"current_steps": 7545, "total_steps": 38160, "loss": 0.3384, "lr": 0.0009712076590284357, "epoch": 3.9544025157232703, "percentage": 19.77, "elapsed_time": "0:19:05", "remaining_time": "1:17:26", "throughput": 4303.2, "total_tokens": 4928056} {"current_steps": 7550, "total_steps": 38160, "loss": 0.4087, "lr": 0.0009711311269876674, "epoch": 3.9570230607966455, "percentage": 19.79, "elapsed_time": "0:19:05", "remaining_time": "1:17:25", "throughput": 4303.29, "total_tokens": 4931192} {"current_steps": 7555, "total_steps": 38160, "loss": 0.418, "lr": 0.0009710544963916421, "epoch": 3.959643605870021, "percentage": 19.8, "elapsed_time": "0:19:06", "remaining_time": "1:17:25", "throughput": 4303.62, "total_tokens": 4934872} {"current_steps": 7560, "total_steps": 38160, "loss": 0.6091, "lr": 0.0009709777672563903, "epoch": 3.9622641509433962, "percentage": 19.81, "elapsed_time": "0:19:07", "remaining_time": "1:17:24", "throughput": 4303.73, "total_tokens": 4938104} {"current_steps": 7565, "total_steps": 38160, "loss": 0.3019, "lr": 0.0009709009395979628, "epoch": 3.9648846960167714, "percentage": 19.82, "elapsed_time": "0:19:08", "remaining_time": "1:17:23", "throughput": 4304.28, "total_tokens": 4942456} {"current_steps": 7570, "total_steps": 38160, "loss": 0.541, "lr": 0.0009708240134324311, "epoch": 3.967505241090147, "percentage": 19.84, "elapsed_time": "0:19:09", "remaining_time": "1:17:23", "throughput": 4304.69, "total_tokens": 4946488} {"current_steps": 7575, "total_steps": 38160, "loss": 0.4216, "lr": 0.0009707469887758871, "epoch": 3.970125786163522, "percentage": 19.85, "elapsed_time": "0:19:09", "remaining_time": "1:17:22", "throughput": 4304.49, "total_tokens": 4948920} {"current_steps": 7580, "total_steps": 38160, "loss": 0.4723, "lr": 0.0009706698656444437, "epoch": 3.9727463312368974, "percentage": 19.86, "elapsed_time": "0:19:10", "remaining_time": "1:17:21", "throughput": 4304.63, "total_tokens": 4952152} {"current_steps": 7585, "total_steps": 38160, "loss": 0.3745, "lr": 0.000970592644054234, "epoch": 3.9753668763102725, "percentage": 19.88, "elapsed_time": "0:19:11", "remaining_time": "1:17:20", "throughput": 4304.71, "total_tokens": 4955288} {"current_steps": 7590, "total_steps": 38160, "loss": 0.4249, "lr": 0.000970515324021412, "epoch": 3.9779874213836477, "percentage": 19.89, "elapsed_time": "0:19:11", "remaining_time": "1:17:19", "throughput": 4304.79, "total_tokens": 4958520} {"current_steps": 7595, "total_steps": 38160, "loss": 0.4022, "lr": 0.0009704379055621523, "epoch": 3.980607966457023, "percentage": 19.9, "elapsed_time": "0:19:12", "remaining_time": "1:17:18", "throughput": 4304.71, "total_tokens": 4961336} {"current_steps": 7600, "total_steps": 38160, "loss": 0.6038, "lr": 0.0009703603886926497, "epoch": 3.9832285115303985, "percentage": 19.92, "elapsed_time": "0:19:13", "remaining_time": "1:17:18", "throughput": 4305.36, "total_tokens": 4965944} {"current_steps": 7605, "total_steps": 38160, "loss": 0.4496, "lr": 0.0009702827734291198, "epoch": 3.9858490566037736, "percentage": 19.93, "elapsed_time": "0:19:14", "remaining_time": "1:17:16", "throughput": 4305.3, "total_tokens": 4968824} {"current_steps": 7610, "total_steps": 38160, "loss": 0.3464, "lr": 0.0009702050597877992, "epoch": 3.988469601677149, "percentage": 19.94, "elapsed_time": "0:19:14", "remaining_time": "1:17:15", "throughput": 4305.21, "total_tokens": 4971608} {"current_steps": 7615, "total_steps": 38160, "loss": 0.4763, "lr": 0.0009701272477849444, "epoch": 3.991090146750524, "percentage": 19.96, "elapsed_time": "0:19:15", "remaining_time": "1:17:14", "throughput": 4304.92, "total_tokens": 4973912} {"current_steps": 7620, "total_steps": 38160, "loss": 0.5707, "lr": 0.0009700493374368327, "epoch": 3.9937106918238996, "percentage": 19.97, "elapsed_time": "0:19:16", "remaining_time": "1:17:13", "throughput": 4305.27, "total_tokens": 4977784} {"current_steps": 7625, "total_steps": 38160, "loss": 0.4347, "lr": 0.0009699713287597624, "epoch": 3.9963312368972748, "percentage": 19.98, "elapsed_time": "0:19:16", "remaining_time": "1:17:12", "throughput": 4305.1, "total_tokens": 4980344} {"current_steps": 7630, "total_steps": 38160, "loss": 0.4348, "lr": 0.0009698932217700518, "epoch": 3.99895178197065, "percentage": 19.99, "elapsed_time": "0:19:17", "remaining_time": "1:17:11", "throughput": 4305.16, "total_tokens": 4983384} {"current_steps": 7632, "total_steps": 38160, "eval_loss": 0.49002858996391296, "epoch": 4.0, "percentage": 20.0, "elapsed_time": "0:19:31", "remaining_time": "1:18:06", "throughput": 4253.98, "total_tokens": 4984176} {"current_steps": 7635, "total_steps": 38160, "loss": 0.374, "lr": 0.0009698150164840399, "epoch": 4.001572327044025, "percentage": 20.01, "elapsed_time": "0:19:33", "remaining_time": "1:18:11", "throughput": 4248.58, "total_tokens": 4985968} {"current_steps": 7640, "total_steps": 38160, "loss": 0.4376, "lr": 0.0009697367129180866, "epoch": 4.0041928721174, "percentage": 20.02, "elapsed_time": "0:19:34", "remaining_time": "1:18:11", "throughput": 4248.73, "total_tokens": 4989232} {"current_steps": 7645, "total_steps": 38160, "loss": 0.4629, "lr": 0.000969658311088572, "epoch": 4.006813417190775, "percentage": 20.03, "elapsed_time": "0:19:34", "remaining_time": "1:18:09", "throughput": 4248.72, "total_tokens": 4992176} {"current_steps": 7650, "total_steps": 38160, "loss": 0.5011, "lr": 0.0009695798110118969, "epoch": 4.009433962264151, "percentage": 20.05, "elapsed_time": "0:19:35", "remaining_time": "1:18:08", "throughput": 4248.72, "total_tokens": 4995024} {"current_steps": 7655, "total_steps": 38160, "loss": 0.5758, "lr": 0.0009695012127044824, "epoch": 4.012054507337526, "percentage": 20.06, "elapsed_time": "0:19:36", "remaining_time": "1:18:07", "throughput": 4248.75, "total_tokens": 4998224} {"current_steps": 7660, "total_steps": 38160, "loss": 0.4959, "lr": 0.0009694225161827707, "epoch": 4.014675052410902, "percentage": 20.07, "elapsed_time": "0:19:37", "remaining_time": "1:18:07", "throughput": 4249.12, "total_tokens": 5002032} {"current_steps": 7665, "total_steps": 38160, "loss": 0.4001, "lr": 0.0009693437214632241, "epoch": 4.017295597484277, "percentage": 20.09, "elapsed_time": "0:19:37", "remaining_time": "1:18:06", "throughput": 4249.36, "total_tokens": 5005520} {"current_steps": 7670, "total_steps": 38160, "loss": 0.5459, "lr": 0.0009692648285623256, "epoch": 4.019916142557652, "percentage": 20.1, "elapsed_time": "0:19:38", "remaining_time": "1:18:05", "throughput": 4249.38, "total_tokens": 5008624} {"current_steps": 7675, "total_steps": 38160, "loss": 0.4594, "lr": 0.0009691858374965784, "epoch": 4.022536687631027, "percentage": 20.11, "elapsed_time": "0:19:39", "remaining_time": "1:18:04", "throughput": 4249.01, "total_tokens": 5010704} {"current_steps": 7680, "total_steps": 38160, "loss": 0.4256, "lr": 0.0009691067482825069, "epoch": 4.0251572327044025, "percentage": 20.13, "elapsed_time": "0:19:40", "remaining_time": "1:18:03", "throughput": 4249.32, "total_tokens": 5014416} {"current_steps": 7685, "total_steps": 38160, "loss": 0.486, "lr": 0.0009690275609366554, "epoch": 4.027777777777778, "percentage": 20.14, "elapsed_time": "0:19:40", "remaining_time": "1:18:02", "throughput": 4249.89, "total_tokens": 5018704} {"current_steps": 7690, "total_steps": 38160, "loss": 0.4761, "lr": 0.0009689482754755891, "epoch": 4.030398322851153, "percentage": 20.15, "elapsed_time": "0:19:41", "remaining_time": "1:18:02", "throughput": 4250.32, "total_tokens": 5022768} {"current_steps": 7695, "total_steps": 38160, "loss": 0.5409, "lr": 0.0009688688919158938, "epoch": 4.033018867924528, "percentage": 20.17, "elapsed_time": "0:19:43", "remaining_time": "1:18:03", "throughput": 4251.86, "total_tokens": 5030096} {"current_steps": 7700, "total_steps": 38160, "loss": 0.512, "lr": 0.0009687894102741754, "epoch": 4.035639412997903, "percentage": 20.18, "elapsed_time": "0:19:43", "remaining_time": "1:18:02", "throughput": 4252.04, "total_tokens": 5033392} {"current_steps": 7705, "total_steps": 38160, "loss": 0.5776, "lr": 0.0009687098305670605, "epoch": 4.038259958071279, "percentage": 20.19, "elapsed_time": "0:19:44", "remaining_time": "1:18:01", "throughput": 4251.88, "total_tokens": 5035920} {"current_steps": 7710, "total_steps": 38160, "loss": 0.5119, "lr": 0.0009686301528111964, "epoch": 4.040880503144654, "percentage": 20.2, "elapsed_time": "0:19:45", "remaining_time": "1:18:00", "throughput": 4252.2, "total_tokens": 5039568} {"current_steps": 7715, "total_steps": 38160, "loss": 0.4057, "lr": 0.0009685503770232507, "epoch": 4.04350104821803, "percentage": 20.22, "elapsed_time": "0:19:45", "remaining_time": "1:17:59", "throughput": 4252.42, "total_tokens": 5042992} {"current_steps": 7720, "total_steps": 38160, "loss": 0.4615, "lr": 0.0009684705032199117, "epoch": 4.046121593291405, "percentage": 20.23, "elapsed_time": "0:19:46", "remaining_time": "1:17:59", "throughput": 4252.64, "total_tokens": 5046608} {"current_steps": 7725, "total_steps": 38160, "loss": 0.4387, "lr": 0.0009683905314178881, "epoch": 4.04874213836478, "percentage": 20.24, "elapsed_time": "0:19:47", "remaining_time": "1:17:58", "throughput": 4253.25, "total_tokens": 5051152} {"current_steps": 7730, "total_steps": 38160, "loss": 0.539, "lr": 0.000968310461633909, "epoch": 4.051362683438155, "percentage": 20.26, "elapsed_time": "0:19:48", "remaining_time": "1:17:57", "throughput": 4253.17, "total_tokens": 5053872} {"current_steps": 7735, "total_steps": 38160, "loss": 0.3981, "lr": 0.0009682302938847238, "epoch": 4.05398322851153, "percentage": 20.27, "elapsed_time": "0:19:48", "remaining_time": "1:17:56", "throughput": 4253.1, "total_tokens": 5056624} {"current_steps": 7740, "total_steps": 38160, "loss": 0.3864, "lr": 0.0009681500281871031, "epoch": 4.056603773584905, "percentage": 20.28, "elapsed_time": "0:19:49", "remaining_time": "1:17:55", "throughput": 4253.07, "total_tokens": 5059472} {"current_steps": 7745, "total_steps": 38160, "loss": 0.508, "lr": 0.0009680696645578377, "epoch": 4.059224318658281, "percentage": 20.3, "elapsed_time": "0:19:50", "remaining_time": "1:17:54", "throughput": 4253.31, "total_tokens": 5062928} {"current_steps": 7750, "total_steps": 38160, "loss": 0.4537, "lr": 0.0009679892030137382, "epoch": 4.061844863731656, "percentage": 20.31, "elapsed_time": "0:19:51", "remaining_time": "1:17:53", "throughput": 4253.38, "total_tokens": 5066128} {"current_steps": 7755, "total_steps": 38160, "loss": 0.501, "lr": 0.0009679086435716368, "epoch": 4.064465408805032, "percentage": 20.32, "elapsed_time": "0:19:51", "remaining_time": "1:17:52", "throughput": 4253.58, "total_tokens": 5069616} {"current_steps": 7760, "total_steps": 38160, "loss": 0.5741, "lr": 0.0009678279862483852, "epoch": 4.067085953878407, "percentage": 20.34, "elapsed_time": "0:19:52", "remaining_time": "1:17:52", "throughput": 4253.81, "total_tokens": 5073168} {"current_steps": 7765, "total_steps": 38160, "loss": 0.4663, "lr": 0.0009677472310608561, "epoch": 4.069706498951782, "percentage": 20.35, "elapsed_time": "0:19:53", "remaining_time": "1:17:51", "throughput": 4253.87, "total_tokens": 5076336} {"current_steps": 7770, "total_steps": 38160, "loss": 0.5797, "lr": 0.0009676663780259427, "epoch": 4.072327044025157, "percentage": 20.36, "elapsed_time": "0:19:54", "remaining_time": "1:17:50", "throughput": 4253.8, "total_tokens": 5079088} {"current_steps": 7775, "total_steps": 38160, "loss": 0.6626, "lr": 0.0009675854271605583, "epoch": 4.0749475890985325, "percentage": 20.37, "elapsed_time": "0:19:54", "remaining_time": "1:17:49", "throughput": 4254.01, "total_tokens": 5082480} {"current_steps": 7780, "total_steps": 38160, "loss": 0.4057, "lr": 0.0009675043784816371, "epoch": 4.077568134171908, "percentage": 20.39, "elapsed_time": "0:19:55", "remaining_time": "1:17:48", "throughput": 4254.08, "total_tokens": 5085552} {"current_steps": 7785, "total_steps": 38160, "loss": 0.4873, "lr": 0.0009674232320061336, "epoch": 4.080188679245283, "percentage": 20.4, "elapsed_time": "0:19:56", "remaining_time": "1:17:47", "throughput": 4254.41, "total_tokens": 5089232} {"current_steps": 7790, "total_steps": 38160, "loss": 0.3741, "lr": 0.0009673419877510226, "epoch": 4.082809224318658, "percentage": 20.41, "elapsed_time": "0:19:56", "remaining_time": "1:17:46", "throughput": 4254.39, "total_tokens": 5092080} {"current_steps": 7795, "total_steps": 38160, "loss": 0.6198, "lr": 0.0009672606457332994, "epoch": 4.085429769392033, "percentage": 20.43, "elapsed_time": "0:19:57", "remaining_time": "1:17:45", "throughput": 4254.43, "total_tokens": 5095152} {"current_steps": 7800, "total_steps": 38160, "loss": 0.5072, "lr": 0.0009671792059699798, "epoch": 4.088050314465409, "percentage": 20.44, "elapsed_time": "0:19:58", "remaining_time": "1:17:44", "throughput": 4254.34, "total_tokens": 5097872} {"current_steps": 7805, "total_steps": 38160, "loss": 0.4656, "lr": 0.0009670976684781003, "epoch": 4.090670859538784, "percentage": 20.45, "elapsed_time": "0:19:58", "remaining_time": "1:17:42", "throughput": 4254.27, "total_tokens": 5100592} {"current_steps": 7810, "total_steps": 38160, "loss": 0.546, "lr": 0.0009670160332747174, "epoch": 4.09329140461216, "percentage": 20.47, "elapsed_time": "0:19:59", "remaining_time": "1:17:41", "throughput": 4254.37, "total_tokens": 5103664} {"current_steps": 7815, "total_steps": 38160, "loss": 0.4428, "lr": 0.0009669343003769085, "epoch": 4.095911949685535, "percentage": 20.48, "elapsed_time": "0:20:00", "remaining_time": "1:17:41", "throughput": 4254.67, "total_tokens": 5107280} {"current_steps": 7820, "total_steps": 38160, "loss": 0.5491, "lr": 0.0009668524698017709, "epoch": 4.09853249475891, "percentage": 20.49, "elapsed_time": "0:20:01", "remaining_time": "1:17:39", "throughput": 4254.6, "total_tokens": 5109968} {"current_steps": 7825, "total_steps": 38160, "loss": 0.4279, "lr": 0.0009667705415664227, "epoch": 4.101153039832285, "percentage": 20.51, "elapsed_time": "0:20:01", "remaining_time": "1:17:38", "throughput": 4254.65, "total_tokens": 5113040} {"current_steps": 7830, "total_steps": 38160, "loss": 0.4436, "lr": 0.0009666885156880026, "epoch": 4.10377358490566, "percentage": 20.52, "elapsed_time": "0:20:02", "remaining_time": "1:17:38", "throughput": 4255.07, "total_tokens": 5117072} {"current_steps": 7835, "total_steps": 38160, "loss": 0.4522, "lr": 0.0009666063921836692, "epoch": 4.106394129979035, "percentage": 20.53, "elapsed_time": "0:20:03", "remaining_time": "1:17:37", "throughput": 4255.53, "total_tokens": 5121168} {"current_steps": 7840, "total_steps": 38160, "loss": 0.4493, "lr": 0.0009665241710706019, "epoch": 4.109014675052411, "percentage": 20.55, "elapsed_time": "0:20:04", "remaining_time": "1:17:36", "throughput": 4255.58, "total_tokens": 5124144} {"current_steps": 7845, "total_steps": 38160, "loss": 0.5441, "lr": 0.0009664418523660003, "epoch": 4.111635220125786, "percentage": 20.56, "elapsed_time": "0:20:04", "remaining_time": "1:17:35", "throughput": 4255.49, "total_tokens": 5126736} {"current_steps": 7850, "total_steps": 38160, "loss": 0.4411, "lr": 0.0009663594360870847, "epoch": 4.114255765199162, "percentage": 20.57, "elapsed_time": "0:20:05", "remaining_time": "1:17:34", "throughput": 4255.92, "total_tokens": 5130768} {"current_steps": 7855, "total_steps": 38160, "loss": 0.425, "lr": 0.0009662769222510955, "epoch": 4.116876310272537, "percentage": 20.58, "elapsed_time": "0:20:06", "remaining_time": "1:17:33", "throughput": 4255.82, "total_tokens": 5133424} {"current_steps": 7860, "total_steps": 38160, "loss": 0.4359, "lr": 0.0009661943108752939, "epoch": 4.119496855345912, "percentage": 20.6, "elapsed_time": "0:20:06", "remaining_time": "1:17:32", "throughput": 4255.81, "total_tokens": 5136304} {"current_steps": 7865, "total_steps": 38160, "loss": 0.4892, "lr": 0.0009661116019769609, "epoch": 4.122117400419287, "percentage": 20.61, "elapsed_time": "0:20:07", "remaining_time": "1:17:31", "throughput": 4255.88, "total_tokens": 5139472} {"current_steps": 7870, "total_steps": 38160, "loss": 0.3827, "lr": 0.0009660287955733986, "epoch": 4.1247379454926625, "percentage": 20.62, "elapsed_time": "0:20:08", "remaining_time": "1:17:31", "throughput": 4256.51, "total_tokens": 5144144} {"current_steps": 7875, "total_steps": 38160, "loss": 0.411, "lr": 0.0009659458916819289, "epoch": 4.127358490566038, "percentage": 20.64, "elapsed_time": "0:20:09", "remaining_time": "1:17:31", "throughput": 4257.05, "total_tokens": 5148496} {"current_steps": 7880, "total_steps": 38160, "loss": 0.4463, "lr": 0.0009658628903198945, "epoch": 4.129979035639413, "percentage": 20.65, "elapsed_time": "0:20:10", "remaining_time": "1:17:30", "throughput": 4257.17, "total_tokens": 5151760} {"current_steps": 7885, "total_steps": 38160, "loss": 0.3074, "lr": 0.0009657797915046583, "epoch": 4.132599580712788, "percentage": 20.66, "elapsed_time": "0:20:10", "remaining_time": "1:17:29", "throughput": 4257.65, "total_tokens": 5155920} {"current_steps": 7890, "total_steps": 38160, "loss": 0.7352, "lr": 0.0009656965952536036, "epoch": 4.135220125786163, "percentage": 20.68, "elapsed_time": "0:20:11", "remaining_time": "1:17:28", "throughput": 4257.57, "total_tokens": 5158576} {"current_steps": 7895, "total_steps": 38160, "loss": 0.4057, "lr": 0.0009656133015841342, "epoch": 4.137840670859539, "percentage": 20.69, "elapsed_time": "0:20:12", "remaining_time": "1:17:27", "throughput": 4257.67, "total_tokens": 5161712} {"current_steps": 7900, "total_steps": 38160, "loss": 0.478, "lr": 0.000965529910513674, "epoch": 4.140461215932914, "percentage": 20.7, "elapsed_time": "0:20:13", "remaining_time": "1:17:26", "throughput": 4257.98, "total_tokens": 5165456} {"current_steps": 7905, "total_steps": 38160, "loss": 0.4755, "lr": 0.0009654464220596676, "epoch": 4.1430817610062896, "percentage": 20.72, "elapsed_time": "0:20:13", "remaining_time": "1:17:25", "throughput": 4257.82, "total_tokens": 5168048} {"current_steps": 7910, "total_steps": 38160, "loss": 0.5161, "lr": 0.0009653628362395799, "epoch": 4.145702306079665, "percentage": 20.73, "elapsed_time": "0:20:14", "remaining_time": "1:17:24", "throughput": 4257.81, "total_tokens": 5170928} {"current_steps": 7915, "total_steps": 38160, "loss": 0.468, "lr": 0.0009652791530708958, "epoch": 4.14832285115304, "percentage": 20.74, "elapsed_time": "0:20:15", "remaining_time": "1:17:23", "throughput": 4257.68, "total_tokens": 5173520} {"current_steps": 7920, "total_steps": 38160, "loss": 0.5017, "lr": 0.0009651953725711212, "epoch": 4.150943396226415, "percentage": 20.75, "elapsed_time": "0:20:15", "remaining_time": "1:17:22", "throughput": 4257.7, "total_tokens": 5176496} {"current_steps": 7925, "total_steps": 38160, "loss": 0.5138, "lr": 0.0009651114947577818, "epoch": 4.15356394129979, "percentage": 20.77, "elapsed_time": "0:20:16", "remaining_time": "1:17:21", "throughput": 4257.93, "total_tokens": 5180112} {"current_steps": 7930, "total_steps": 38160, "loss": 0.3737, "lr": 0.0009650275196484239, "epoch": 4.156184486373165, "percentage": 20.78, "elapsed_time": "0:20:17", "remaining_time": "1:17:20", "throughput": 4258.31, "total_tokens": 5184048} {"current_steps": 7935, "total_steps": 38160, "loss": 0.3498, "lr": 0.0009649434472606144, "epoch": 4.158805031446541, "percentage": 20.79, "elapsed_time": "0:20:18", "remaining_time": "1:17:19", "throughput": 4258.3, "total_tokens": 5186960} {"current_steps": 7940, "total_steps": 38160, "loss": 0.3831, "lr": 0.00096485927761194, "epoch": 4.161425576519916, "percentage": 20.81, "elapsed_time": "0:20:18", "remaining_time": "1:17:18", "throughput": 4258.38, "total_tokens": 5190064} {"current_steps": 7945, "total_steps": 38160, "loss": 0.5912, "lr": 0.0009647750107200082, "epoch": 4.164046121593292, "percentage": 20.82, "elapsed_time": "0:20:19", "remaining_time": "1:17:17", "throughput": 4258.36, "total_tokens": 5192912} {"current_steps": 7950, "total_steps": 38160, "loss": 0.4169, "lr": 0.0009646906466024465, "epoch": 4.166666666666667, "percentage": 20.83, "elapsed_time": "0:20:20", "remaining_time": "1:17:16", "throughput": 4258.12, "total_tokens": 5195152} {"current_steps": 7955, "total_steps": 38160, "loss": 0.4632, "lr": 0.000964606185276903, "epoch": 4.169287211740042, "percentage": 20.85, "elapsed_time": "0:20:20", "remaining_time": "1:17:15", "throughput": 4258.17, "total_tokens": 5198192} {"current_steps": 7960, "total_steps": 38160, "loss": 0.3848, "lr": 0.0009645216267610461, "epoch": 4.171907756813417, "percentage": 20.86, "elapsed_time": "0:20:21", "remaining_time": "1:17:14", "throughput": 4258.26, "total_tokens": 5201296} {"current_steps": 7965, "total_steps": 38160, "loss": 0.4391, "lr": 0.0009644369710725644, "epoch": 4.1745283018867925, "percentage": 20.87, "elapsed_time": "0:20:22", "remaining_time": "1:17:13", "throughput": 4258.64, "total_tokens": 5205232} {"current_steps": 7970, "total_steps": 38160, "loss": 0.4036, "lr": 0.0009643522182291669, "epoch": 4.177148846960168, "percentage": 20.89, "elapsed_time": "0:20:23", "remaining_time": "1:17:12", "throughput": 4258.77, "total_tokens": 5208528} {"current_steps": 7975, "total_steps": 38160, "loss": 0.3796, "lr": 0.000964267368248583, "epoch": 4.179769392033543, "percentage": 20.9, "elapsed_time": "0:20:23", "remaining_time": "1:17:11", "throughput": 4258.95, "total_tokens": 5211824} {"current_steps": 7980, "total_steps": 38160, "loss": 0.5498, "lr": 0.0009641824211485623, "epoch": 4.182389937106918, "percentage": 20.91, "elapsed_time": "0:20:24", "remaining_time": "1:17:10", "throughput": 4259.02, "total_tokens": 5214928} {"current_steps": 7985, "total_steps": 38160, "loss": 0.4937, "lr": 0.0009640973769468747, "epoch": 4.185010482180293, "percentage": 20.93, "elapsed_time": "0:20:25", "remaining_time": "1:17:09", "throughput": 4259.18, "total_tokens": 5218224} {"current_steps": 7990, "total_steps": 38160, "loss": 0.3905, "lr": 0.0009640122356613105, "epoch": 4.187631027253669, "percentage": 20.94, "elapsed_time": "0:20:25", "remaining_time": "1:17:08", "throughput": 4259.22, "total_tokens": 5221200} {"current_steps": 7995, "total_steps": 38160, "loss": 0.5257, "lr": 0.0009639269973096805, "epoch": 4.190251572327044, "percentage": 20.95, "elapsed_time": "0:20:26", "remaining_time": "1:17:07", "throughput": 4259.29, "total_tokens": 5224368} {"current_steps": 8000, "total_steps": 38160, "loss": 0.5236, "lr": 0.0009638416619098154, "epoch": 4.1928721174004195, "percentage": 20.96, "elapsed_time": "0:20:27", "remaining_time": "1:17:07", "throughput": 4259.63, "total_tokens": 5228208} {"current_steps": 8005, "total_steps": 38160, "loss": 0.5807, "lr": 0.0009637562294795663, "epoch": 4.195492662473795, "percentage": 20.98, "elapsed_time": "0:20:28", "remaining_time": "1:17:06", "throughput": 4259.53, "total_tokens": 5230864} {"current_steps": 8010, "total_steps": 38160, "loss": 0.3743, "lr": 0.0009636707000368049, "epoch": 4.19811320754717, "percentage": 20.99, "elapsed_time": "0:20:28", "remaining_time": "1:17:04", "throughput": 4259.39, "total_tokens": 5233360} {"current_steps": 8015, "total_steps": 38160, "loss": 0.4628, "lr": 0.000963585073599423, "epoch": 4.200733752620545, "percentage": 21.0, "elapsed_time": "0:20:29", "remaining_time": "1:17:03", "throughput": 4259.53, "total_tokens": 5236624} {"current_steps": 8020, "total_steps": 38160, "loss": 0.4277, "lr": 0.0009634993501853323, "epoch": 4.20335429769392, "percentage": 21.02, "elapsed_time": "0:20:30", "remaining_time": "1:17:02", "throughput": 4259.59, "total_tokens": 5239696} {"current_steps": 8025, "total_steps": 38160, "loss": 0.4406, "lr": 0.0009634135298124656, "epoch": 4.205974842767295, "percentage": 21.03, "elapsed_time": "0:20:30", "remaining_time": "1:17:01", "throughput": 4259.63, "total_tokens": 5242736} {"current_steps": 8030, "total_steps": 38160, "loss": 0.5811, "lr": 0.0009633276124987752, "epoch": 4.2085953878406706, "percentage": 21.04, "elapsed_time": "0:20:31", "remaining_time": "1:17:01", "throughput": 4259.98, "total_tokens": 5246544} {"current_steps": 8035, "total_steps": 38160, "loss": 0.6741, "lr": 0.0009632415982622342, "epoch": 4.211215932914046, "percentage": 21.06, "elapsed_time": "0:20:32", "remaining_time": "1:17:00", "throughput": 4260.15, "total_tokens": 5249840} {"current_steps": 8040, "total_steps": 38160, "loss": 0.3097, "lr": 0.0009631554871208359, "epoch": 4.213836477987422, "percentage": 21.07, "elapsed_time": "0:20:33", "remaining_time": "1:16:59", "throughput": 4260.41, "total_tokens": 5253456} {"current_steps": 8045, "total_steps": 38160, "loss": 0.4271, "lr": 0.0009630692790925936, "epoch": 4.216457023060797, "percentage": 21.08, "elapsed_time": "0:20:33", "remaining_time": "1:16:58", "throughput": 4260.35, "total_tokens": 5256208} {"current_steps": 8050, "total_steps": 38160, "loss": 0.4765, "lr": 0.0009629829741955411, "epoch": 4.219077568134172, "percentage": 21.1, "elapsed_time": "0:20:34", "remaining_time": "1:16:56", "throughput": 4260.13, "total_tokens": 5258512} {"current_steps": 8055, "total_steps": 38160, "loss": 0.4045, "lr": 0.0009628965724477325, "epoch": 4.221698113207547, "percentage": 21.11, "elapsed_time": "0:20:35", "remaining_time": "1:16:55", "throughput": 4260.19, "total_tokens": 5261520} {"current_steps": 8060, "total_steps": 38160, "loss": 0.5729, "lr": 0.0009628100738672419, "epoch": 4.2243186582809225, "percentage": 21.12, "elapsed_time": "0:20:35", "remaining_time": "1:16:54", "throughput": 4260.17, "total_tokens": 5264400} {"current_steps": 8065, "total_steps": 38160, "loss": 0.3396, "lr": 0.0009627234784721637, "epoch": 4.226939203354298, "percentage": 21.13, "elapsed_time": "0:20:36", "remaining_time": "1:16:53", "throughput": 4260.24, "total_tokens": 5267472} {"current_steps": 8070, "total_steps": 38160, "loss": 0.4025, "lr": 0.0009626367862806129, "epoch": 4.229559748427673, "percentage": 21.15, "elapsed_time": "0:20:37", "remaining_time": "1:16:52", "throughput": 4260.38, "total_tokens": 5270736} {"current_steps": 8075, "total_steps": 38160, "loss": 0.4772, "lr": 0.0009625499973107246, "epoch": 4.232180293501048, "percentage": 21.16, "elapsed_time": "0:20:37", "remaining_time": "1:16:52", "throughput": 4260.64, "total_tokens": 5274384} {"current_steps": 8080, "total_steps": 38160, "loss": 0.5232, "lr": 0.0009624631115806537, "epoch": 4.234800838574423, "percentage": 21.17, "elapsed_time": "0:20:38", "remaining_time": "1:16:50", "throughput": 4260.47, "total_tokens": 5276912} {"current_steps": 8085, "total_steps": 38160, "loss": 0.5703, "lr": 0.0009623761291085761, "epoch": 4.237421383647799, "percentage": 21.19, "elapsed_time": "0:20:39", "remaining_time": "1:16:49", "throughput": 4260.47, "total_tokens": 5279792} {"current_steps": 8090, "total_steps": 38160, "loss": 0.5247, "lr": 0.0009622890499126873, "epoch": 4.240041928721174, "percentage": 21.2, "elapsed_time": "0:20:39", "remaining_time": "1:16:48", "throughput": 4260.58, "total_tokens": 5282992} {"current_steps": 8095, "total_steps": 38160, "loss": 0.4775, "lr": 0.0009622018740112032, "epoch": 4.2426624737945495, "percentage": 21.21, "elapsed_time": "0:20:40", "remaining_time": "1:16:47", "throughput": 4260.41, "total_tokens": 5285456} {"current_steps": 8100, "total_steps": 38160, "loss": 0.5832, "lr": 0.0009621146014223603, "epoch": 4.245283018867925, "percentage": 21.23, "elapsed_time": "0:20:41", "remaining_time": "1:16:46", "throughput": 4260.44, "total_tokens": 5288432} {"current_steps": 8105, "total_steps": 38160, "loss": 0.5962, "lr": 0.0009620272321644148, "epoch": 4.2479035639413, "percentage": 21.24, "elapsed_time": "0:20:41", "remaining_time": "1:16:45", "throughput": 4260.41, "total_tokens": 5291248} {"current_steps": 8110, "total_steps": 38160, "loss": 0.3941, "lr": 0.0009619397662556434, "epoch": 4.250524109014675, "percentage": 21.25, "elapsed_time": "0:20:42", "remaining_time": "1:16:44", "throughput": 4260.23, "total_tokens": 5293680} {"current_steps": 8115, "total_steps": 38160, "loss": 0.5531, "lr": 0.000961852203714343, "epoch": 4.25314465408805, "percentage": 21.27, "elapsed_time": "0:20:43", "remaining_time": "1:16:43", "throughput": 4260.39, "total_tokens": 5297040} {"current_steps": 8120, "total_steps": 38160, "loss": 0.4235, "lr": 0.0009617645445588307, "epoch": 4.255765199161425, "percentage": 21.28, "elapsed_time": "0:20:44", "remaining_time": "1:16:42", "throughput": 4260.6, "total_tokens": 5300592} {"current_steps": 8125, "total_steps": 38160, "loss": 0.6537, "lr": 0.0009616767888074438, "epoch": 4.2583857442348005, "percentage": 21.29, "elapsed_time": "0:20:44", "remaining_time": "1:16:41", "throughput": 4260.6, "total_tokens": 5303440} {"current_steps": 8130, "total_steps": 38160, "loss": 0.6519, "lr": 0.0009615889364785397, "epoch": 4.261006289308176, "percentage": 21.31, "elapsed_time": "0:20:45", "remaining_time": "1:16:40", "throughput": 4260.6, "total_tokens": 5306384} {"current_steps": 8135, "total_steps": 38160, "loss": 0.5354, "lr": 0.000961500987590496, "epoch": 4.263626834381552, "percentage": 21.32, "elapsed_time": "0:20:46", "remaining_time": "1:16:39", "throughput": 4260.85, "total_tokens": 5309936} {"current_steps": 8140, "total_steps": 38160, "loss": 0.4844, "lr": 0.0009614129421617111, "epoch": 4.266247379454927, "percentage": 21.33, "elapsed_time": "0:20:47", "remaining_time": "1:16:39", "throughput": 4261.53, "total_tokens": 5314576} {"current_steps": 8145, "total_steps": 38160, "loss": 0.4264, "lr": 0.0009613248002106027, "epoch": 4.268867924528302, "percentage": 21.34, "elapsed_time": "0:20:47", "remaining_time": "1:16:38", "throughput": 4261.8, "total_tokens": 5318128} {"current_steps": 8150, "total_steps": 38160, "loss": 0.5099, "lr": 0.000961236561755609, "epoch": 4.271488469601677, "percentage": 21.36, "elapsed_time": "0:20:48", "remaining_time": "1:16:37", "throughput": 4261.78, "total_tokens": 5320944} {"current_steps": 8155, "total_steps": 38160, "loss": 0.5042, "lr": 0.0009611482268151888, "epoch": 4.274109014675052, "percentage": 21.37, "elapsed_time": "0:20:49", "remaining_time": "1:16:36", "throughput": 4261.91, "total_tokens": 5324208} {"current_steps": 8160, "total_steps": 38160, "loss": 0.4842, "lr": 0.0009610597954078206, "epoch": 4.276729559748428, "percentage": 21.38, "elapsed_time": "0:20:49", "remaining_time": "1:16:35", "throughput": 4262.0, "total_tokens": 5327344} {"current_steps": 8165, "total_steps": 38160, "loss": 0.3827, "lr": 0.0009609712675520031, "epoch": 4.279350104821803, "percentage": 21.4, "elapsed_time": "0:20:50", "remaining_time": "1:16:34", "throughput": 4262.04, "total_tokens": 5330288} {"current_steps": 8170, "total_steps": 38160, "loss": 0.3853, "lr": 0.0009608826432662556, "epoch": 4.281970649895178, "percentage": 21.41, "elapsed_time": "0:20:51", "remaining_time": "1:16:33", "throughput": 4262.42, "total_tokens": 5334192} {"current_steps": 8175, "total_steps": 38160, "loss": 0.545, "lr": 0.0009607939225691172, "epoch": 4.284591194968553, "percentage": 21.42, "elapsed_time": "0:20:52", "remaining_time": "1:16:32", "throughput": 4262.55, "total_tokens": 5337360} {"current_steps": 8180, "total_steps": 38160, "loss": 0.4809, "lr": 0.0009607051054791472, "epoch": 4.287211740041929, "percentage": 21.44, "elapsed_time": "0:20:52", "remaining_time": "1:16:32", "throughput": 4262.81, "total_tokens": 5341072} {"current_steps": 8185, "total_steps": 38160, "loss": 0.5092, "lr": 0.000960616192014925, "epoch": 4.289832285115304, "percentage": 21.45, "elapsed_time": "0:20:53", "remaining_time": "1:16:31", "throughput": 4263.01, "total_tokens": 5344592} {"current_steps": 8190, "total_steps": 38160, "loss": 0.6188, "lr": 0.0009605271821950506, "epoch": 4.2924528301886795, "percentage": 21.46, "elapsed_time": "0:20:54", "remaining_time": "1:16:30", "throughput": 4262.81, "total_tokens": 5346992} {"current_steps": 8195, "total_steps": 38160, "loss": 0.5129, "lr": 0.0009604380760381434, "epoch": 4.295073375262055, "percentage": 21.48, "elapsed_time": "0:20:55", "remaining_time": "1:16:28", "throughput": 4262.76, "total_tokens": 5349776} {"current_steps": 8200, "total_steps": 38160, "loss": 0.5376, "lr": 0.0009603488735628439, "epoch": 4.29769392033543, "percentage": 21.49, "elapsed_time": "0:20:55", "remaining_time": "1:16:28", "throughput": 4263.25, "total_tokens": 5353968} {"current_steps": 8205, "total_steps": 38160, "loss": 0.5698, "lr": 0.0009602595747878118, "epoch": 4.300314465408805, "percentage": 21.5, "elapsed_time": "0:20:56", "remaining_time": "1:16:27", "throughput": 4263.14, "total_tokens": 5356560} {"current_steps": 8210, "total_steps": 38160, "loss": 0.3592, "lr": 0.0009601701797317278, "epoch": 4.30293501048218, "percentage": 21.51, "elapsed_time": "0:20:57", "remaining_time": "1:16:26", "throughput": 4263.27, "total_tokens": 5359824} {"current_steps": 8215, "total_steps": 38160, "loss": 0.5704, "lr": 0.0009600806884132917, "epoch": 4.305555555555555, "percentage": 21.53, "elapsed_time": "0:20:58", "remaining_time": "1:16:25", "throughput": 4263.77, "total_tokens": 5364144} {"current_steps": 8220, "total_steps": 38160, "loss": 0.5319, "lr": 0.0009599911008512248, "epoch": 4.3081761006289305, "percentage": 21.54, "elapsed_time": "0:20:58", "remaining_time": "1:16:25", "throughput": 4264.23, "total_tokens": 5368336} {"current_steps": 8225, "total_steps": 38160, "loss": 0.4015, "lr": 0.0009599014170642674, "epoch": 4.310796645702306, "percentage": 21.55, "elapsed_time": "0:20:59", "remaining_time": "1:16:24", "throughput": 4264.28, "total_tokens": 5371440} {"current_steps": 8230, "total_steps": 38160, "loss": 0.4096, "lr": 0.0009598116370711805, "epoch": 4.313417190775682, "percentage": 21.57, "elapsed_time": "0:21:00", "remaining_time": "1:16:23", "throughput": 4264.22, "total_tokens": 5374160} {"current_steps": 8235, "total_steps": 38160, "loss": 0.5534, "lr": 0.0009597217608907447, "epoch": 4.316037735849057, "percentage": 21.58, "elapsed_time": "0:21:01", "remaining_time": "1:16:22", "throughput": 4264.45, "total_tokens": 5377680} {"current_steps": 8240, "total_steps": 38160, "loss": 0.4084, "lr": 0.0009596317885417614, "epoch": 4.318658280922432, "percentage": 21.59, "elapsed_time": "0:21:01", "remaining_time": "1:16:21", "throughput": 4264.78, "total_tokens": 5381488} {"current_steps": 8245, "total_steps": 38160, "loss": 0.4241, "lr": 0.0009595417200430516, "epoch": 4.321278825995807, "percentage": 21.61, "elapsed_time": "0:21:02", "remaining_time": "1:16:21", "throughput": 4264.95, "total_tokens": 5384912} {"current_steps": 8250, "total_steps": 38160, "loss": 0.3824, "lr": 0.0009594515554134568, "epoch": 4.323899371069182, "percentage": 21.62, "elapsed_time": "0:21:03", "remaining_time": "1:16:19", "throughput": 4264.95, "total_tokens": 5387792} {"current_steps": 8255, "total_steps": 38160, "loss": 0.4995, "lr": 0.0009593612946718384, "epoch": 4.326519916142558, "percentage": 21.63, "elapsed_time": "0:21:03", "remaining_time": "1:16:18", "throughput": 4264.93, "total_tokens": 5390608} {"current_steps": 8260, "total_steps": 38160, "loss": 0.4864, "lr": 0.0009592709378370778, "epoch": 4.329140461215933, "percentage": 21.65, "elapsed_time": "0:21:04", "remaining_time": "1:16:17", "throughput": 4264.87, "total_tokens": 5393328} {"current_steps": 8265, "total_steps": 38160, "loss": 0.4857, "lr": 0.0009591804849280766, "epoch": 4.331761006289308, "percentage": 21.66, "elapsed_time": "0:21:05", "remaining_time": "1:16:16", "throughput": 4264.77, "total_tokens": 5395952} {"current_steps": 8270, "total_steps": 38160, "loss": 0.4535, "lr": 0.0009590899359637564, "epoch": 4.334381551362683, "percentage": 21.67, "elapsed_time": "0:21:05", "remaining_time": "1:16:15", "throughput": 4264.61, "total_tokens": 5398384} {"current_steps": 8275, "total_steps": 38160, "loss": 0.4287, "lr": 0.0009589992909630594, "epoch": 4.337002096436059, "percentage": 21.69, "elapsed_time": "0:21:06", "remaining_time": "1:16:14", "throughput": 4264.66, "total_tokens": 5401424} {"current_steps": 8280, "total_steps": 38160, "loss": 0.3516, "lr": 0.0009589085499449471, "epoch": 4.339622641509434, "percentage": 21.7, "elapsed_time": "0:21:07", "remaining_time": "1:16:13", "throughput": 4264.89, "total_tokens": 5404976} {"current_steps": 8285, "total_steps": 38160, "loss": 0.3618, "lr": 0.0009588177129284017, "epoch": 4.3422431865828095, "percentage": 21.71, "elapsed_time": "0:21:08", "remaining_time": "1:16:12", "throughput": 4265.11, "total_tokens": 5408464} {"current_steps": 8290, "total_steps": 38160, "loss": 0.4975, "lr": 0.0009587267799324253, "epoch": 4.344863731656185, "percentage": 21.72, "elapsed_time": "0:21:08", "remaining_time": "1:16:11", "throughput": 4265.08, "total_tokens": 5411280} {"current_steps": 8295, "total_steps": 38160, "loss": 0.4441, "lr": 0.0009586357509760399, "epoch": 4.34748427672956, "percentage": 21.74, "elapsed_time": "0:21:09", "remaining_time": "1:16:10", "throughput": 4265.4, "total_tokens": 5415184} {"current_steps": 8300, "total_steps": 38160, "loss": 0.3832, "lr": 0.0009585446260782878, "epoch": 4.350104821802935, "percentage": 21.75, "elapsed_time": "0:21:10", "remaining_time": "1:16:09", "throughput": 4265.16, "total_tokens": 5417456} {"current_steps": 8305, "total_steps": 38160, "loss": 0.4138, "lr": 0.0009584534052582313, "epoch": 4.35272536687631, "percentage": 21.76, "elapsed_time": "0:21:10", "remaining_time": "1:16:08", "throughput": 4265.01, "total_tokens": 5420016} {"current_steps": 8310, "total_steps": 38160, "loss": 0.5575, "lr": 0.0009583620885349527, "epoch": 4.355345911949685, "percentage": 21.78, "elapsed_time": "0:21:11", "remaining_time": "1:16:07", "throughput": 4265.15, "total_tokens": 5423344} {"current_steps": 8315, "total_steps": 38160, "loss": 0.3978, "lr": 0.0009582706759275546, "epoch": 4.3579664570230605, "percentage": 21.79, "elapsed_time": "0:21:12", "remaining_time": "1:16:06", "throughput": 4265.31, "total_tokens": 5426640} {"current_steps": 8320, "total_steps": 38160, "loss": 0.4499, "lr": 0.0009581791674551592, "epoch": 4.360587002096436, "percentage": 21.8, "elapsed_time": "0:21:13", "remaining_time": "1:16:05", "throughput": 4265.57, "total_tokens": 5430256} {"current_steps": 8325, "total_steps": 38160, "loss": 0.3036, "lr": 0.000958087563136909, "epoch": 4.363207547169811, "percentage": 21.82, "elapsed_time": "0:21:13", "remaining_time": "1:16:04", "throughput": 4265.72, "total_tokens": 5433520} {"current_steps": 8330, "total_steps": 38160, "loss": 0.4639, "lr": 0.000957995862991967, "epoch": 4.365828092243187, "percentage": 21.83, "elapsed_time": "0:21:14", "remaining_time": "1:16:03", "throughput": 4265.68, "total_tokens": 5436368} {"current_steps": 8335, "total_steps": 38160, "loss": 0.4489, "lr": 0.0009579040670395154, "epoch": 4.368448637316562, "percentage": 21.84, "elapsed_time": "0:21:15", "remaining_time": "1:16:02", "throughput": 4265.69, "total_tokens": 5439216} {"current_steps": 8340, "total_steps": 38160, "loss": 0.4627, "lr": 0.000957812175298757, "epoch": 4.371069182389937, "percentage": 21.86, "elapsed_time": "0:21:15", "remaining_time": "1:16:01", "throughput": 4265.59, "total_tokens": 5441776} {"current_steps": 8345, "total_steps": 38160, "loss": 0.5922, "lr": 0.0009577201877889145, "epoch": 4.373689727463312, "percentage": 21.87, "elapsed_time": "0:21:16", "remaining_time": "1:16:00", "throughput": 4265.79, "total_tokens": 5445168} {"current_steps": 8350, "total_steps": 38160, "loss": 0.4819, "lr": 0.0009576281045292308, "epoch": 4.376310272536688, "percentage": 21.88, "elapsed_time": "0:21:17", "remaining_time": "1:16:00", "throughput": 4266.55, "total_tokens": 5450192} {"current_steps": 8355, "total_steps": 38160, "loss": 0.4032, "lr": 0.0009575359255389686, "epoch": 4.378930817610063, "percentage": 21.89, "elapsed_time": "0:21:18", "remaining_time": "1:15:59", "throughput": 4266.56, "total_tokens": 5453200} {"current_steps": 8360, "total_steps": 38160, "loss": 0.4854, "lr": 0.0009574436508374104, "epoch": 4.381551362683438, "percentage": 21.91, "elapsed_time": "0:21:18", "remaining_time": "1:15:58", "throughput": 4266.57, "total_tokens": 5456144} {"current_steps": 8365, "total_steps": 38160, "loss": 0.6686, "lr": 0.0009573512804438594, "epoch": 4.384171907756813, "percentage": 21.92, "elapsed_time": "0:21:19", "remaining_time": "1:15:57", "throughput": 4266.87, "total_tokens": 5460016} {"current_steps": 8370, "total_steps": 38160, "loss": 0.42, "lr": 0.0009572588143776381, "epoch": 4.386792452830189, "percentage": 21.93, "elapsed_time": "0:21:20", "remaining_time": "1:15:56", "throughput": 4266.66, "total_tokens": 5462384} {"current_steps": 8375, "total_steps": 38160, "loss": 0.5937, "lr": 0.0009571662526580897, "epoch": 4.389412997903564, "percentage": 21.95, "elapsed_time": "0:21:21", "remaining_time": "1:15:55", "throughput": 4267.1, "total_tokens": 5466416} {"current_steps": 8380, "total_steps": 38160, "loss": 0.4089, "lr": 0.0009570735953045768, "epoch": 4.3920335429769395, "percentage": 21.96, "elapsed_time": "0:21:21", "remaining_time": "1:15:55", "throughput": 4267.61, "total_tokens": 5470736} {"current_steps": 8385, "total_steps": 38160, "loss": 0.5014, "lr": 0.0009569808423364823, "epoch": 4.394654088050315, "percentage": 21.97, "elapsed_time": "0:21:22", "remaining_time": "1:15:54", "throughput": 4267.63, "total_tokens": 5473648} {"current_steps": 8390, "total_steps": 38160, "loss": 0.4122, "lr": 0.0009568879937732091, "epoch": 4.39727463312369, "percentage": 21.99, "elapsed_time": "0:21:23", "remaining_time": "1:15:53", "throughput": 4268.09, "total_tokens": 5477776} {"current_steps": 8395, "total_steps": 38160, "loss": 0.3702, "lr": 0.0009567950496341802, "epoch": 4.399895178197065, "percentage": 22.0, "elapsed_time": "0:21:24", "remaining_time": "1:15:53", "throughput": 4268.4, "total_tokens": 5481552} {"current_steps": 8400, "total_steps": 38160, "loss": 0.5333, "lr": 0.0009567020099388382, "epoch": 4.40251572327044, "percentage": 22.01, "elapsed_time": "0:21:24", "remaining_time": "1:15:52", "throughput": 4268.49, "total_tokens": 5484656} {"current_steps": 8405, "total_steps": 38160, "loss": 0.5016, "lr": 0.0009566088747066459, "epoch": 4.405136268343815, "percentage": 22.03, "elapsed_time": "0:21:25", "remaining_time": "1:15:51", "throughput": 4268.48, "total_tokens": 5487568} {"current_steps": 8410, "total_steps": 38160, "loss": 0.5597, "lr": 0.0009565156439570866, "epoch": 4.4077568134171905, "percentage": 22.04, "elapsed_time": "0:21:26", "remaining_time": "1:15:50", "throughput": 4268.63, "total_tokens": 5490928} {"current_steps": 8415, "total_steps": 38160, "loss": 0.4665, "lr": 0.0009564223177096625, "epoch": 4.410377358490566, "percentage": 22.05, "elapsed_time": "0:21:27", "remaining_time": "1:15:50", "throughput": 4269.26, "total_tokens": 5495536} {"current_steps": 8420, "total_steps": 38160, "loss": 0.4789, "lr": 0.0009563288959838969, "epoch": 4.412997903563941, "percentage": 22.06, "elapsed_time": "0:21:28", "remaining_time": "1:15:49", "throughput": 4269.63, "total_tokens": 5499504} {"current_steps": 8425, "total_steps": 38160, "loss": 0.4256, "lr": 0.0009562353787993321, "epoch": 4.415618448637317, "percentage": 22.08, "elapsed_time": "0:21:28", "remaining_time": "1:15:48", "throughput": 4269.6, "total_tokens": 5502320} {"current_steps": 8430, "total_steps": 38160, "loss": 0.5301, "lr": 0.0009561417661755312, "epoch": 4.418238993710692, "percentage": 22.09, "elapsed_time": "0:21:29", "remaining_time": "1:15:47", "throughput": 4269.71, "total_tokens": 5505552} {"current_steps": 8435, "total_steps": 38160, "loss": 0.4624, "lr": 0.0009560480581320768, "epoch": 4.420859538784067, "percentage": 22.1, "elapsed_time": "0:21:30", "remaining_time": "1:15:46", "throughput": 4270.19, "total_tokens": 5509776} {"current_steps": 8440, "total_steps": 38160, "loss": 0.51, "lr": 0.0009559542546885714, "epoch": 4.423480083857442, "percentage": 22.12, "elapsed_time": "0:21:31", "remaining_time": "1:15:46", "throughput": 4270.87, "total_tokens": 5514640} {"current_steps": 8445, "total_steps": 38160, "loss": 0.4954, "lr": 0.0009558603558646378, "epoch": 4.426100628930818, "percentage": 22.13, "elapsed_time": "0:21:31", "remaining_time": "1:15:45", "throughput": 4270.79, "total_tokens": 5517360} {"current_steps": 8450, "total_steps": 38160, "loss": 0.419, "lr": 0.0009557663616799185, "epoch": 4.428721174004193, "percentage": 22.14, "elapsed_time": "0:21:32", "remaining_time": "1:15:44", "throughput": 4271.0, "total_tokens": 5520912} {"current_steps": 8455, "total_steps": 38160, "loss": 0.4592, "lr": 0.0009556722721540759, "epoch": 4.431341719077568, "percentage": 22.16, "elapsed_time": "0:21:33", "remaining_time": "1:15:44", "throughput": 4271.15, "total_tokens": 5524272} {"current_steps": 8460, "total_steps": 38160, "loss": 0.3968, "lr": 0.0009555780873067927, "epoch": 4.433962264150943, "percentage": 22.17, "elapsed_time": "0:21:34", "remaining_time": "1:15:43", "throughput": 4271.19, "total_tokens": 5527280} {"current_steps": 8465, "total_steps": 38160, "loss": 0.4137, "lr": 0.000955483807157771, "epoch": 4.436582809224318, "percentage": 22.18, "elapsed_time": "0:21:34", "remaining_time": "1:15:41", "throughput": 4271.1, "total_tokens": 5529872} {"current_steps": 8470, "total_steps": 38160, "loss": 0.585, "lr": 0.0009553894317267333, "epoch": 4.439203354297694, "percentage": 22.2, "elapsed_time": "0:21:35", "remaining_time": "1:15:40", "throughput": 4271.15, "total_tokens": 5532976} {"current_steps": 8475, "total_steps": 38160, "loss": 0.552, "lr": 0.0009552949610334219, "epoch": 4.4418238993710695, "percentage": 22.21, "elapsed_time": "0:21:36", "remaining_time": "1:15:40", "throughput": 4271.32, "total_tokens": 5536400} {"current_steps": 8480, "total_steps": 38160, "loss": 0.5595, "lr": 0.000955200395097599, "epoch": 4.444444444444445, "percentage": 22.22, "elapsed_time": "0:21:36", "remaining_time": "1:15:39", "throughput": 4271.68, "total_tokens": 5540304} {"current_steps": 8485, "total_steps": 38160, "loss": 0.4531, "lr": 0.0009551057339390464, "epoch": 4.44706498951782, "percentage": 22.24, "elapsed_time": "0:21:37", "remaining_time": "1:15:39", "throughput": 4272.15, "total_tokens": 5544592} {"current_steps": 8490, "total_steps": 38160, "loss": 0.4367, "lr": 0.0009550109775775666, "epoch": 4.449685534591195, "percentage": 22.25, "elapsed_time": "0:21:38", "remaining_time": "1:15:37", "throughput": 4272.07, "total_tokens": 5547248} {"current_steps": 8495, "total_steps": 38160, "loss": 0.4367, "lr": 0.0009549161260329811, "epoch": 4.45230607966457, "percentage": 22.26, "elapsed_time": "0:21:39", "remaining_time": "1:15:36", "throughput": 4272.05, "total_tokens": 5550096} {"current_steps": 8500, "total_steps": 38160, "loss": 0.456, "lr": 0.0009548211793251322, "epoch": 4.454926624737945, "percentage": 22.27, "elapsed_time": "0:21:39", "remaining_time": "1:15:35", "throughput": 4272.12, "total_tokens": 5553328} {"current_steps": 8505, "total_steps": 38160, "loss": 0.4783, "lr": 0.0009547261374738814, "epoch": 4.4575471698113205, "percentage": 22.29, "elapsed_time": "0:21:40", "remaining_time": "1:15:35", "throughput": 4272.5, "total_tokens": 5557264} {"current_steps": 8510, "total_steps": 38160, "loss": 0.449, "lr": 0.0009546310004991105, "epoch": 4.460167714884696, "percentage": 22.3, "elapsed_time": "0:21:41", "remaining_time": "1:15:34", "throughput": 4272.76, "total_tokens": 5560912} {"current_steps": 8515, "total_steps": 38160, "loss": 0.4266, "lr": 0.000954535768420721, "epoch": 4.462788259958071, "percentage": 22.31, "elapsed_time": "0:21:42", "remaining_time": "1:15:33", "throughput": 4273.18, "total_tokens": 5564976} {"current_steps": 8520, "total_steps": 38160, "loss": 0.4117, "lr": 0.0009544404412586343, "epoch": 4.465408805031447, "percentage": 22.33, "elapsed_time": "0:21:43", "remaining_time": "1:15:33", "throughput": 4273.29, "total_tokens": 5568208} {"current_steps": 8525, "total_steps": 38160, "loss": 0.4528, "lr": 0.0009543450190327917, "epoch": 4.468029350104822, "percentage": 22.34, "elapsed_time": "0:21:43", "remaining_time": "1:15:32", "throughput": 4273.53, "total_tokens": 5571696} {"current_steps": 8530, "total_steps": 38160, "loss": 0.4947, "lr": 0.0009542495017631547, "epoch": 4.470649895178197, "percentage": 22.35, "elapsed_time": "0:21:44", "remaining_time": "1:15:31", "throughput": 4273.9, "total_tokens": 5575760} {"current_steps": 8535, "total_steps": 38160, "loss": 0.4844, "lr": 0.0009541538894697043, "epoch": 4.473270440251572, "percentage": 22.37, "elapsed_time": "0:21:45", "remaining_time": "1:15:30", "throughput": 4274.02, "total_tokens": 5578992} {"current_steps": 8540, "total_steps": 38160, "loss": 0.5184, "lr": 0.0009540581821724414, "epoch": 4.475890985324948, "percentage": 22.38, "elapsed_time": "0:21:45", "remaining_time": "1:15:29", "throughput": 4273.95, "total_tokens": 5581712} {"current_steps": 8545, "total_steps": 38160, "loss": 0.3789, "lr": 0.000953962379891387, "epoch": 4.478511530398323, "percentage": 22.39, "elapsed_time": "0:21:46", "remaining_time": "1:15:28", "throughput": 4273.96, "total_tokens": 5584688} {"current_steps": 8550, "total_steps": 38160, "loss": 0.5305, "lr": 0.0009538664826465818, "epoch": 4.481132075471698, "percentage": 22.41, "elapsed_time": "0:21:47", "remaining_time": "1:15:28", "throughput": 4274.45, "total_tokens": 5589008} {"current_steps": 8555, "total_steps": 38160, "loss": 0.4038, "lr": 0.0009537704904580864, "epoch": 4.483752620545073, "percentage": 22.42, "elapsed_time": "0:21:48", "remaining_time": "1:15:26", "throughput": 4274.23, "total_tokens": 5591280} {"current_steps": 8560, "total_steps": 38160, "loss": 0.4154, "lr": 0.0009536744033459815, "epoch": 4.486373165618448, "percentage": 22.43, "elapsed_time": "0:21:49", "remaining_time": "1:15:26", "throughput": 4274.86, "total_tokens": 5596176} {"current_steps": 8565, "total_steps": 38160, "loss": 0.7805, "lr": 0.0009535782213303669, "epoch": 4.488993710691824, "percentage": 22.44, "elapsed_time": "0:21:49", "remaining_time": "1:15:25", "throughput": 4274.78, "total_tokens": 5598832} {"current_steps": 8570, "total_steps": 38160, "loss": 0.4679, "lr": 0.0009534819444313631, "epoch": 4.4916142557651995, "percentage": 22.46, "elapsed_time": "0:21:50", "remaining_time": "1:15:24", "throughput": 4274.95, "total_tokens": 5602288} {"current_steps": 8575, "total_steps": 38160, "loss": 0.5709, "lr": 0.0009533855726691103, "epoch": 4.494234800838575, "percentage": 22.47, "elapsed_time": "0:21:51", "remaining_time": "1:15:25", "throughput": 4276.07, "total_tokens": 5608976} {"current_steps": 8580, "total_steps": 38160, "loss": 0.391, "lr": 0.0009532891060637681, "epoch": 4.49685534591195, "percentage": 22.48, "elapsed_time": "0:21:52", "remaining_time": "1:15:24", "throughput": 4276.32, "total_tokens": 5612688} {"current_steps": 8585, "total_steps": 38160, "loss": 0.5708, "lr": 0.0009531925446355163, "epoch": 4.499475890985325, "percentage": 22.5, "elapsed_time": "0:21:53", "remaining_time": "1:15:24", "throughput": 4276.53, "total_tokens": 5616208} {"current_steps": 8590, "total_steps": 38160, "loss": 0.4941, "lr": 0.0009530958884045545, "epoch": 4.5020964360587, "percentage": 22.51, "elapsed_time": "0:21:54", "remaining_time": "1:15:23", "throughput": 4276.65, "total_tokens": 5619568} {"current_steps": 8595, "total_steps": 38160, "loss": 0.5403, "lr": 0.000952999137391102, "epoch": 4.504716981132075, "percentage": 22.52, "elapsed_time": "0:21:54", "remaining_time": "1:15:22", "throughput": 4276.76, "total_tokens": 5622864} {"current_steps": 8600, "total_steps": 38160, "loss": 0.5765, "lr": 0.0009529022916153982, "epoch": 4.5073375262054505, "percentage": 22.54, "elapsed_time": "0:21:55", "remaining_time": "1:15:21", "throughput": 4276.61, "total_tokens": 5625360} {"current_steps": 8605, "total_steps": 38160, "loss": 0.592, "lr": 0.0009528053510977017, "epoch": 4.509958071278826, "percentage": 22.55, "elapsed_time": "0:21:56", "remaining_time": "1:15:20", "throughput": 4276.63, "total_tokens": 5628400} {"current_steps": 8610, "total_steps": 38160, "loss": 0.5699, "lr": 0.0009527083158582919, "epoch": 4.512578616352201, "percentage": 22.56, "elapsed_time": "0:21:56", "remaining_time": "1:15:19", "throughput": 4276.58, "total_tokens": 5631152} {"current_steps": 8615, "total_steps": 38160, "loss": 0.4571, "lr": 0.0009526111859174671, "epoch": 4.515199161425577, "percentage": 22.58, "elapsed_time": "0:21:57", "remaining_time": "1:15:18", "throughput": 4276.86, "total_tokens": 5634800} {"current_steps": 8620, "total_steps": 38160, "loss": 0.3449, "lr": 0.0009525139612955458, "epoch": 4.517819706498952, "percentage": 22.59, "elapsed_time": "0:21:58", "remaining_time": "1:15:17", "throughput": 4277.01, "total_tokens": 5638096} {"current_steps": 8625, "total_steps": 38160, "loss": 0.5244, "lr": 0.0009524166420128664, "epoch": 4.520440251572327, "percentage": 22.6, "elapsed_time": "0:21:58", "remaining_time": "1:15:16", "throughput": 4277.03, "total_tokens": 5641072} {"current_steps": 8630, "total_steps": 38160, "loss": 0.4349, "lr": 0.0009523192280897867, "epoch": 4.523060796645702, "percentage": 22.62, "elapsed_time": "0:21:59", "remaining_time": "1:15:15", "throughput": 4277.34, "total_tokens": 5644944} {"current_steps": 8635, "total_steps": 38160, "loss": 0.473, "lr": 0.0009522217195466851, "epoch": 4.5256813417190775, "percentage": 22.63, "elapsed_time": "0:22:00", "remaining_time": "1:15:14", "throughput": 4277.39, "total_tokens": 5647984} {"current_steps": 8640, "total_steps": 38160, "loss": 0.4361, "lr": 0.0009521241164039589, "epoch": 4.528301886792453, "percentage": 22.64, "elapsed_time": "0:22:01", "remaining_time": "1:15:13", "throughput": 4277.52, "total_tokens": 5651312} {"current_steps": 8645, "total_steps": 38160, "loss": 0.5068, "lr": 0.0009520264186820258, "epoch": 4.530922431865828, "percentage": 22.65, "elapsed_time": "0:22:01", "remaining_time": "1:15:12", "throughput": 4277.38, "total_tokens": 5653904} {"current_steps": 8650, "total_steps": 38160, "loss": 0.4792, "lr": 0.0009519286264013227, "epoch": 4.533542976939203, "percentage": 22.67, "elapsed_time": "0:22:02", "remaining_time": "1:15:12", "throughput": 4277.65, "total_tokens": 5657552} {"current_steps": 8655, "total_steps": 38160, "loss": 0.4369, "lr": 0.0009518307395823069, "epoch": 4.536163522012579, "percentage": 22.68, "elapsed_time": "0:22:03", "remaining_time": "1:15:11", "throughput": 4277.75, "total_tokens": 5660720} {"current_steps": 8660, "total_steps": 38160, "loss": 0.4715, "lr": 0.0009517327582454551, "epoch": 4.538784067085954, "percentage": 22.69, "elapsed_time": "0:22:03", "remaining_time": "1:15:09", "throughput": 4277.62, "total_tokens": 5663280} {"current_steps": 8665, "total_steps": 38160, "loss": 0.5666, "lr": 0.000951634682411264, "epoch": 4.5414046121593294, "percentage": 22.71, "elapsed_time": "0:22:04", "remaining_time": "1:15:09", "throughput": 4278.16, "total_tokens": 5667984} {"current_steps": 8670, "total_steps": 38160, "loss": 0.5075, "lr": 0.0009515365121002498, "epoch": 4.544025157232705, "percentage": 22.72, "elapsed_time": "0:22:05", "remaining_time": "1:15:08", "throughput": 4278.04, "total_tokens": 5670608} {"current_steps": 8675, "total_steps": 38160, "loss": 0.4346, "lr": 0.0009514382473329487, "epoch": 4.54664570230608, "percentage": 22.73, "elapsed_time": "0:22:06", "remaining_time": "1:15:07", "throughput": 4278.19, "total_tokens": 5674000} {"current_steps": 8680, "total_steps": 38160, "loss": 0.4186, "lr": 0.0009513398881299164, "epoch": 4.549266247379455, "percentage": 22.75, "elapsed_time": "0:22:06", "remaining_time": "1:15:06", "throughput": 4277.88, "total_tokens": 5676080} {"current_steps": 8685, "total_steps": 38160, "loss": 0.4539, "lr": 0.0009512414345117289, "epoch": 4.55188679245283, "percentage": 22.76, "elapsed_time": "0:22:07", "remaining_time": "1:15:05", "throughput": 4278.21, "total_tokens": 5679888} {"current_steps": 8690, "total_steps": 38160, "loss": 0.6894, "lr": 0.0009511428864989813, "epoch": 4.554507337526205, "percentage": 22.77, "elapsed_time": "0:22:08", "remaining_time": "1:15:04", "throughput": 4278.4, "total_tokens": 5683344} {"current_steps": 8695, "total_steps": 38160, "loss": 0.4038, "lr": 0.0009510442441122886, "epoch": 4.5571278825995805, "percentage": 22.79, "elapsed_time": "0:22:09", "remaining_time": "1:15:04", "throughput": 4278.66, "total_tokens": 5687056} {"current_steps": 8700, "total_steps": 38160, "loss": 0.4349, "lr": 0.0009509455073722859, "epoch": 4.559748427672956, "percentage": 22.8, "elapsed_time": "0:22:09", "remaining_time": "1:15:03", "throughput": 4278.75, "total_tokens": 5690224} {"current_steps": 8705, "total_steps": 38160, "loss": 0.4225, "lr": 0.0009508466762996277, "epoch": 4.562368972746331, "percentage": 22.81, "elapsed_time": "0:22:10", "remaining_time": "1:15:02", "throughput": 4279.01, "total_tokens": 5693840} {"current_steps": 8710, "total_steps": 38160, "loss": 0.4577, "lr": 0.0009507477509149883, "epoch": 4.564989517819707, "percentage": 22.82, "elapsed_time": "0:22:11", "remaining_time": "1:15:02", "throughput": 4279.69, "total_tokens": 5698896} {"current_steps": 8715, "total_steps": 38160, "loss": 0.5438, "lr": 0.0009506487312390619, "epoch": 4.567610062893082, "percentage": 22.84, "elapsed_time": "0:22:12", "remaining_time": "1:15:01", "throughput": 4279.64, "total_tokens": 5701744} {"current_steps": 8720, "total_steps": 38160, "loss": 0.4703, "lr": 0.0009505496172925622, "epoch": 4.570230607966457, "percentage": 22.85, "elapsed_time": "0:22:12", "remaining_time": "1:15:00", "throughput": 4279.69, "total_tokens": 5704816} {"current_steps": 8725, "total_steps": 38160, "loss": 0.4464, "lr": 0.0009504504090962226, "epoch": 4.572851153039832, "percentage": 22.86, "elapsed_time": "0:22:13", "remaining_time": "1:14:59", "throughput": 4279.85, "total_tokens": 5708112} {"current_steps": 8730, "total_steps": 38160, "loss": 0.4888, "lr": 0.0009503511066707966, "epoch": 4.5754716981132075, "percentage": 22.88, "elapsed_time": "0:22:14", "remaining_time": "1:14:58", "throughput": 4279.95, "total_tokens": 5711280} {"current_steps": 8735, "total_steps": 38160, "loss": 0.5568, "lr": 0.0009502517100370568, "epoch": 4.578092243186583, "percentage": 22.89, "elapsed_time": "0:22:15", "remaining_time": "1:14:57", "throughput": 4280.09, "total_tokens": 5714576} {"current_steps": 8740, "total_steps": 38160, "loss": 0.4522, "lr": 0.0009501522192157961, "epoch": 4.580712788259958, "percentage": 22.9, "elapsed_time": "0:22:16", "remaining_time": "1:14:58", "throughput": 4281.11, "total_tokens": 5720944} {"current_steps": 8745, "total_steps": 38160, "loss": 0.3977, "lr": 0.0009500526342278266, "epoch": 4.583333333333333, "percentage": 22.92, "elapsed_time": "0:22:16", "remaining_time": "1:14:56", "throughput": 4280.93, "total_tokens": 5723344} {"current_steps": 8750, "total_steps": 38160, "loss": 0.4843, "lr": 0.0009499529550939807, "epoch": 4.585953878406709, "percentage": 22.93, "elapsed_time": "0:22:17", "remaining_time": "1:14:56", "throughput": 4281.1, "total_tokens": 5726864} {"current_steps": 8755, "total_steps": 38160, "loss": 0.4445, "lr": 0.0009498531818351098, "epoch": 4.588574423480084, "percentage": 22.94, "elapsed_time": "0:22:18", "remaining_time": "1:14:55", "throughput": 4281.25, "total_tokens": 5730288} {"current_steps": 8760, "total_steps": 38160, "loss": 0.4933, "lr": 0.0009497533144720854, "epoch": 4.591194968553459, "percentage": 22.96, "elapsed_time": "0:22:19", "remaining_time": "1:14:54", "throughput": 4281.56, "total_tokens": 5734160} {"current_steps": 8765, "total_steps": 38160, "loss": 0.6022, "lr": 0.0009496533530257988, "epoch": 4.593815513626835, "percentage": 22.97, "elapsed_time": "0:22:19", "remaining_time": "1:14:53", "throughput": 4281.46, "total_tokens": 5736752} {"current_steps": 8770, "total_steps": 38160, "loss": 0.4962, "lr": 0.0009495532975171605, "epoch": 4.59643605870021, "percentage": 22.98, "elapsed_time": "0:22:20", "remaining_time": "1:14:53", "throughput": 4281.91, "total_tokens": 5740976} {"current_steps": 8775, "total_steps": 38160, "loss": 0.5377, "lr": 0.0009494531479671014, "epoch": 4.599056603773585, "percentage": 23.0, "elapsed_time": "0:22:21", "remaining_time": "1:14:51", "throughput": 4281.73, "total_tokens": 5743376} {"current_steps": 8780, "total_steps": 38160, "loss": 0.4418, "lr": 0.0009493529043965712, "epoch": 4.60167714884696, "percentage": 23.01, "elapsed_time": "0:22:21", "remaining_time": "1:14:50", "throughput": 4281.54, "total_tokens": 5745776} {"current_steps": 8785, "total_steps": 38160, "loss": 0.4538, "lr": 0.00094925256682654, "epoch": 4.604297693920335, "percentage": 23.02, "elapsed_time": "0:22:22", "remaining_time": "1:14:49", "throughput": 4281.58, "total_tokens": 5748784} {"current_steps": 8790, "total_steps": 38160, "loss": 0.4697, "lr": 0.000949152135277997, "epoch": 4.6069182389937104, "percentage": 23.03, "elapsed_time": "0:22:23", "remaining_time": "1:14:48", "throughput": 4281.48, "total_tokens": 5751440} {"current_steps": 8795, "total_steps": 38160, "loss": 0.4795, "lr": 0.0009490516097719515, "epoch": 4.609538784067086, "percentage": 23.05, "elapsed_time": "0:22:23", "remaining_time": "1:14:47", "throughput": 4281.23, "total_tokens": 5753648} {"current_steps": 8800, "total_steps": 38160, "loss": 0.5038, "lr": 0.0009489509903294324, "epoch": 4.612159329140461, "percentage": 23.06, "elapsed_time": "0:22:24", "remaining_time": "1:14:45", "throughput": 4281.02, "total_tokens": 5756016} {"current_steps": 8805, "total_steps": 38160, "loss": 0.4454, "lr": 0.000948850276971488, "epoch": 4.614779874213837, "percentage": 23.07, "elapsed_time": "0:22:25", "remaining_time": "1:14:45", "throughput": 4281.15, "total_tokens": 5759312} {"current_steps": 8810, "total_steps": 38160, "loss": 0.3553, "lr": 0.0009487494697191864, "epoch": 4.617400419287212, "percentage": 23.09, "elapsed_time": "0:22:26", "remaining_time": "1:14:44", "throughput": 4281.3, "total_tokens": 5762640} {"current_steps": 8815, "total_steps": 38160, "loss": 0.5129, "lr": 0.0009486485685936154, "epoch": 4.620020964360587, "percentage": 23.1, "elapsed_time": "0:22:26", "remaining_time": "1:14:43", "throughput": 4281.39, "total_tokens": 5765840} {"current_steps": 8820, "total_steps": 38160, "loss": 0.391, "lr": 0.0009485475736158822, "epoch": 4.622641509433962, "percentage": 23.11, "elapsed_time": "0:22:27", "remaining_time": "1:14:41", "throughput": 4281.19, "total_tokens": 5768208} {"current_steps": 8825, "total_steps": 38160, "loss": 0.6517, "lr": 0.000948446484807114, "epoch": 4.6252620545073375, "percentage": 23.13, "elapsed_time": "0:22:27", "remaining_time": "1:14:40", "throughput": 4281.11, "total_tokens": 5770896} {"current_steps": 8830, "total_steps": 38160, "loss": 0.4255, "lr": 0.0009483453021884572, "epoch": 4.627882599580713, "percentage": 23.14, "elapsed_time": "0:22:28", "remaining_time": "1:14:39", "throughput": 4280.98, "total_tokens": 5773488} {"current_steps": 8835, "total_steps": 38160, "loss": 0.3714, "lr": 0.0009482440257810782, "epoch": 4.630503144654088, "percentage": 23.15, "elapsed_time": "0:22:29", "remaining_time": "1:14:38", "throughput": 4281.24, "total_tokens": 5777168} {"current_steps": 8840, "total_steps": 38160, "loss": 0.4872, "lr": 0.000948142655606163, "epoch": 4.633123689727463, "percentage": 23.17, "elapsed_time": "0:22:30", "remaining_time": "1:14:37", "throughput": 4281.04, "total_tokens": 5779536} {"current_steps": 8845, "total_steps": 38160, "loss": 0.3537, "lr": 0.0009480411916849168, "epoch": 4.635744234800838, "percentage": 23.18, "elapsed_time": "0:22:30", "remaining_time": "1:14:36", "throughput": 4281.25, "total_tokens": 5782992} {"current_steps": 8850, "total_steps": 38160, "loss": 0.5208, "lr": 0.0009479396340385649, "epoch": 4.638364779874214, "percentage": 23.19, "elapsed_time": "0:22:31", "remaining_time": "1:14:35", "throughput": 4281.18, "total_tokens": 5785776} {"current_steps": 8855, "total_steps": 38160, "loss": 0.3788, "lr": 0.0009478379826883519, "epoch": 4.640985324947589, "percentage": 23.2, "elapsed_time": "0:22:32", "remaining_time": "1:14:34", "throughput": 4281.05, "total_tokens": 5788272} {"current_steps": 8860, "total_steps": 38160, "loss": 0.5058, "lr": 0.0009477362376555421, "epoch": 4.643605870020965, "percentage": 23.22, "elapsed_time": "0:22:32", "remaining_time": "1:14:33", "throughput": 4281.08, "total_tokens": 5791248} {"current_steps": 8865, "total_steps": 38160, "loss": 0.3403, "lr": 0.0009476343989614194, "epoch": 4.64622641509434, "percentage": 23.23, "elapsed_time": "0:22:33", "remaining_time": "1:14:32", "throughput": 4281.24, "total_tokens": 5794640} {"current_steps": 8870, "total_steps": 38160, "loss": 0.4523, "lr": 0.0009475324666272873, "epoch": 4.648846960167715, "percentage": 23.24, "elapsed_time": "0:22:34", "remaining_time": "1:14:31", "throughput": 4281.15, "total_tokens": 5797328} {"current_steps": 8875, "total_steps": 38160, "loss": 0.4689, "lr": 0.0009474304406744689, "epoch": 4.65146750524109, "percentage": 23.26, "elapsed_time": "0:22:34", "remaining_time": "1:14:30", "throughput": 4281.09, "total_tokens": 5800144} {"current_steps": 8880, "total_steps": 38160, "loss": 0.5065, "lr": 0.0009473283211243069, "epoch": 4.654088050314465, "percentage": 23.27, "elapsed_time": "0:22:35", "remaining_time": "1:14:29", "throughput": 4281.36, "total_tokens": 5803920} {"current_steps": 8885, "total_steps": 38160, "loss": 0.3768, "lr": 0.0009472261079981637, "epoch": 4.65670859538784, "percentage": 23.28, "elapsed_time": "0:22:36", "remaining_time": "1:14:28", "throughput": 4281.34, "total_tokens": 5806736} {"current_steps": 8890, "total_steps": 38160, "loss": 0.4451, "lr": 0.0009471238013174206, "epoch": 4.659329140461216, "percentage": 23.3, "elapsed_time": "0:22:36", "remaining_time": "1:14:27", "throughput": 4281.35, "total_tokens": 5809744} {"current_steps": 8895, "total_steps": 38160, "loss": 0.4774, "lr": 0.0009470214011034795, "epoch": 4.661949685534591, "percentage": 23.31, "elapsed_time": "0:22:37", "remaining_time": "1:14:27", "throughput": 4281.7, "total_tokens": 5813712} {"current_steps": 8900, "total_steps": 38160, "loss": 0.4903, "lr": 0.0009469189073777612, "epoch": 4.664570230607967, "percentage": 23.32, "elapsed_time": "0:22:38", "remaining_time": "1:14:26", "throughput": 4281.75, "total_tokens": 5816880} {"current_steps": 8905, "total_steps": 38160, "loss": 0.5351, "lr": 0.0009468163201617061, "epoch": 4.667190775681342, "percentage": 23.34, "elapsed_time": "0:22:39", "remaining_time": "1:14:25", "throughput": 4281.73, "total_tokens": 5819792} {"current_steps": 8910, "total_steps": 38160, "loss": 0.5164, "lr": 0.0009467136394767744, "epoch": 4.669811320754717, "percentage": 23.35, "elapsed_time": "0:22:39", "remaining_time": "1:14:24", "throughput": 4281.75, "total_tokens": 5822768} {"current_steps": 8915, "total_steps": 38160, "loss": 0.3509, "lr": 0.0009466108653444458, "epoch": 4.672431865828092, "percentage": 23.36, "elapsed_time": "0:22:40", "remaining_time": "1:14:23", "throughput": 4281.86, "total_tokens": 5826032} {"current_steps": 8920, "total_steps": 38160, "loss": 0.4592, "lr": 0.0009465079977862193, "epoch": 4.6750524109014675, "percentage": 23.38, "elapsed_time": "0:22:41", "remaining_time": "1:14:22", "throughput": 4281.77, "total_tokens": 5828656} {"current_steps": 8925, "total_steps": 38160, "loss": 0.4033, "lr": 0.0009464050368236137, "epoch": 4.677672955974843, "percentage": 23.39, "elapsed_time": "0:22:42", "remaining_time": "1:14:21", "throughput": 4281.92, "total_tokens": 5832048} {"current_steps": 8930, "total_steps": 38160, "loss": 0.4104, "lr": 0.0009463019824781674, "epoch": 4.680293501048218, "percentage": 23.4, "elapsed_time": "0:22:42", "remaining_time": "1:14:20", "throughput": 4282.24, "total_tokens": 5836080} {"current_steps": 8935, "total_steps": 38160, "loss": 0.5352, "lr": 0.0009461988347714377, "epoch": 4.682914046121593, "percentage": 23.41, "elapsed_time": "0:22:43", "remaining_time": "1:14:19", "throughput": 4282.22, "total_tokens": 5838928} {"current_steps": 8940, "total_steps": 38160, "loss": 0.4513, "lr": 0.0009460955937250025, "epoch": 4.685534591194968, "percentage": 23.43, "elapsed_time": "0:22:44", "remaining_time": "1:14:19", "throughput": 4282.36, "total_tokens": 5842224} {"current_steps": 8945, "total_steps": 38160, "loss": 0.4406, "lr": 0.0009459922593604584, "epoch": 4.688155136268344, "percentage": 23.44, "elapsed_time": "0:22:44", "remaining_time": "1:14:18", "throughput": 4282.48, "total_tokens": 5845520} {"current_steps": 8950, "total_steps": 38160, "loss": 0.4207, "lr": 0.0009458888316994219, "epoch": 4.690775681341719, "percentage": 23.45, "elapsed_time": "0:22:45", "remaining_time": "1:14:17", "throughput": 4282.45, "total_tokens": 5848368} {"current_steps": 8955, "total_steps": 38160, "loss": 0.4491, "lr": 0.0009457853107635286, "epoch": 4.693396226415095, "percentage": 23.47, "elapsed_time": "0:22:46", "remaining_time": "1:14:16", "throughput": 4282.57, "total_tokens": 5851664} {"current_steps": 8960, "total_steps": 38160, "loss": 0.5211, "lr": 0.0009456816965744342, "epoch": 4.69601677148847, "percentage": 23.48, "elapsed_time": "0:22:47", "remaining_time": "1:14:15", "throughput": 4282.51, "total_tokens": 5854416} {"current_steps": 8965, "total_steps": 38160, "loss": 0.4555, "lr": 0.0009455779891538134, "epoch": 4.698637316561845, "percentage": 23.49, "elapsed_time": "0:22:47", "remaining_time": "1:14:14", "throughput": 4282.64, "total_tokens": 5857744} {"current_steps": 8970, "total_steps": 38160, "loss": 0.3965, "lr": 0.0009454741885233606, "epoch": 4.70125786163522, "percentage": 23.51, "elapsed_time": "0:22:48", "remaining_time": "1:14:13", "throughput": 4283.11, "total_tokens": 5862192} {"current_steps": 8975, "total_steps": 38160, "loss": 0.3798, "lr": 0.0009453702947047899, "epoch": 4.703878406708595, "percentage": 23.52, "elapsed_time": "0:22:49", "remaining_time": "1:14:12", "throughput": 4283.19, "total_tokens": 5865296} {"current_steps": 8980, "total_steps": 38160, "loss": 0.5521, "lr": 0.0009452663077198347, "epoch": 4.70649895178197, "percentage": 23.53, "elapsed_time": "0:22:50", "remaining_time": "1:14:11", "throughput": 4283.23, "total_tokens": 5868272} {"current_steps": 8985, "total_steps": 38160, "loss": 0.4658, "lr": 0.0009451622275902477, "epoch": 4.709119496855346, "percentage": 23.55, "elapsed_time": "0:22:50", "remaining_time": "1:14:11", "throughput": 4283.26, "total_tokens": 5871408} {"current_steps": 8990, "total_steps": 38160, "loss": 0.4163, "lr": 0.0009450580543378013, "epoch": 4.711740041928721, "percentage": 23.56, "elapsed_time": "0:22:51", "remaining_time": "1:14:10", "throughput": 4283.41, "total_tokens": 5874800} {"current_steps": 8995, "total_steps": 38160, "loss": 0.5108, "lr": 0.0009449537879842875, "epoch": 4.714360587002097, "percentage": 23.57, "elapsed_time": "0:22:52", "remaining_time": "1:14:09", "throughput": 4283.83, "total_tokens": 5879088} {"current_steps": 9000, "total_steps": 38160, "loss": 0.5161, "lr": 0.0009448494285515177, "epoch": 4.716981132075472, "percentage": 23.58, "elapsed_time": "0:22:53", "remaining_time": "1:14:08", "throughput": 4283.76, "total_tokens": 5881840} {"current_steps": 9005, "total_steps": 38160, "loss": 0.4415, "lr": 0.0009447449760613222, "epoch": 4.719601677148847, "percentage": 23.6, "elapsed_time": "0:22:53", "remaining_time": "1:14:08", "throughput": 4284.16, "total_tokens": 5885968} {"current_steps": 9010, "total_steps": 38160, "loss": 0.5667, "lr": 0.0009446404305355519, "epoch": 4.722222222222222, "percentage": 23.61, "elapsed_time": "0:22:54", "remaining_time": "1:14:07", "throughput": 4284.18, "total_tokens": 5888944} {"current_steps": 9015, "total_steps": 38160, "loss": 0.412, "lr": 0.0009445357919960762, "epoch": 4.7248427672955975, "percentage": 23.62, "elapsed_time": "0:22:55", "remaining_time": "1:14:06", "throughput": 4284.23, "total_tokens": 5891920} {"current_steps": 9020, "total_steps": 38160, "loss": 0.4828, "lr": 0.0009444310604647844, "epoch": 4.727463312368973, "percentage": 23.64, "elapsed_time": "0:22:55", "remaining_time": "1:14:05", "throughput": 4284.11, "total_tokens": 5894544} {"current_steps": 9025, "total_steps": 38160, "loss": 0.4642, "lr": 0.000944326235963585, "epoch": 4.730083857442348, "percentage": 23.65, "elapsed_time": "0:22:56", "remaining_time": "1:14:04", "throughput": 4284.19, "total_tokens": 5897648} {"current_steps": 9030, "total_steps": 38160, "loss": 0.3895, "lr": 0.0009442213185144062, "epoch": 4.732704402515723, "percentage": 23.66, "elapsed_time": "0:22:57", "remaining_time": "1:14:03", "throughput": 4284.27, "total_tokens": 5900848} {"current_steps": 9035, "total_steps": 38160, "loss": 0.388, "lr": 0.0009441163081391954, "epoch": 4.735324947589098, "percentage": 23.68, "elapsed_time": "0:22:57", "remaining_time": "1:14:01", "throughput": 4284.16, "total_tokens": 5903408} {"current_steps": 9040, "total_steps": 38160, "loss": 0.6181, "lr": 0.00094401120485992, "epoch": 4.737945492662474, "percentage": 23.69, "elapsed_time": "0:22:58", "remaining_time": "1:14:00", "throughput": 4283.98, "total_tokens": 5905840} {"current_steps": 9045, "total_steps": 38160, "loss": 0.397, "lr": 0.0009439060086985658, "epoch": 4.740566037735849, "percentage": 23.7, "elapsed_time": "0:22:59", "remaining_time": "1:14:00", "throughput": 4284.37, "total_tokens": 5909968} {"current_steps": 9050, "total_steps": 38160, "loss": 0.3636, "lr": 0.000943800719677139, "epoch": 4.743186582809225, "percentage": 23.72, "elapsed_time": "0:23:00", "remaining_time": "1:13:59", "throughput": 4284.27, "total_tokens": 5912624} {"current_steps": 9055, "total_steps": 38160, "loss": 0.4183, "lr": 0.0009436953378176649, "epoch": 4.7458071278826, "percentage": 23.73, "elapsed_time": "0:23:00", "remaining_time": "1:13:58", "throughput": 4284.36, "total_tokens": 5915824} {"current_steps": 9060, "total_steps": 38160, "loss": 0.4792, "lr": 0.0009435898631421879, "epoch": 4.748427672955975, "percentage": 23.74, "elapsed_time": "0:23:01", "remaining_time": "1:13:57", "throughput": 4284.76, "total_tokens": 5920048} {"current_steps": 9065, "total_steps": 38160, "loss": 0.5703, "lr": 0.0009434842956727724, "epoch": 4.75104821802935, "percentage": 23.76, "elapsed_time": "0:23:02", "remaining_time": "1:13:56", "throughput": 4284.77, "total_tokens": 5923088} {"current_steps": 9070, "total_steps": 38160, "loss": 0.5059, "lr": 0.0009433786354315017, "epoch": 4.753668763102725, "percentage": 23.77, "elapsed_time": "0:23:03", "remaining_time": "1:13:55", "throughput": 4284.72, "total_tokens": 5925872} {"current_steps": 9075, "total_steps": 38160, "loss": 0.5468, "lr": 0.0009432728824404789, "epoch": 4.7562893081761, "percentage": 23.78, "elapsed_time": "0:23:03", "remaining_time": "1:13:54", "throughput": 4284.6, "total_tokens": 5928464} {"current_steps": 9080, "total_steps": 38160, "loss": 0.2995, "lr": 0.0009431670367218262, "epoch": 4.758909853249476, "percentage": 23.79, "elapsed_time": "0:23:04", "remaining_time": "1:13:53", "throughput": 4284.59, "total_tokens": 5931344} {"current_steps": 9085, "total_steps": 38160, "loss": 0.5674, "lr": 0.0009430610982976852, "epoch": 4.761530398322851, "percentage": 23.81, "elapsed_time": "0:23:05", "remaining_time": "1:13:52", "throughput": 4284.57, "total_tokens": 5934224} {"current_steps": 9090, "total_steps": 38160, "loss": 0.4035, "lr": 0.0009429550671902171, "epoch": 4.764150943396227, "percentage": 23.82, "elapsed_time": "0:23:05", "remaining_time": "1:13:51", "throughput": 4284.64, "total_tokens": 5937424} {"current_steps": 9095, "total_steps": 38160, "loss": 0.4042, "lr": 0.0009428489434216028, "epoch": 4.766771488469602, "percentage": 23.83, "elapsed_time": "0:23:06", "remaining_time": "1:13:50", "throughput": 4284.72, "total_tokens": 5940624} {"current_steps": 9100, "total_steps": 38160, "loss": 0.4398, "lr": 0.0009427427270140415, "epoch": 4.769392033542977, "percentage": 23.85, "elapsed_time": "0:23:07", "remaining_time": "1:13:49", "throughput": 4284.58, "total_tokens": 5943184} {"current_steps": 9105, "total_steps": 38160, "loss": 0.4656, "lr": 0.0009426364179897529, "epoch": 4.772012578616352, "percentage": 23.86, "elapsed_time": "0:23:07", "remaining_time": "1:13:48", "throughput": 4284.42, "total_tokens": 5945680} {"current_steps": 9110, "total_steps": 38160, "loss": 0.3865, "lr": 0.0009425300163709756, "epoch": 4.7746331236897275, "percentage": 23.87, "elapsed_time": "0:23:08", "remaining_time": "1:13:47", "throughput": 4284.46, "total_tokens": 5948816} {"current_steps": 9115, "total_steps": 38160, "loss": 0.4289, "lr": 0.0009424235221799673, "epoch": 4.777253668763103, "percentage": 23.89, "elapsed_time": "0:23:09", "remaining_time": "1:13:46", "throughput": 4284.52, "total_tokens": 5951984} {"current_steps": 9120, "total_steps": 38160, "loss": 0.5561, "lr": 0.0009423169354390058, "epoch": 4.779874213836478, "percentage": 23.9, "elapsed_time": "0:23:09", "remaining_time": "1:13:45", "throughput": 4284.52, "total_tokens": 5954864} {"current_steps": 9125, "total_steps": 38160, "loss": 0.444, "lr": 0.0009422102561703875, "epoch": 4.782494758909853, "percentage": 23.91, "elapsed_time": "0:23:10", "remaining_time": "1:13:44", "throughput": 4284.51, "total_tokens": 5957744} {"current_steps": 9130, "total_steps": 38160, "loss": 0.4988, "lr": 0.0009421034843964287, "epoch": 4.785115303983228, "percentage": 23.93, "elapsed_time": "0:23:11", "remaining_time": "1:13:43", "throughput": 4284.6, "total_tokens": 5961008} {"current_steps": 9135, "total_steps": 38160, "loss": 0.3293, "lr": 0.0009419966201394646, "epoch": 4.787735849056604, "percentage": 23.94, "elapsed_time": "0:23:11", "remaining_time": "1:13:42", "throughput": 4284.74, "total_tokens": 5964336} {"current_steps": 9140, "total_steps": 38160, "loss": 0.4264, "lr": 0.0009418896634218503, "epoch": 4.790356394129979, "percentage": 23.95, "elapsed_time": "0:23:12", "remaining_time": "1:13:42", "throughput": 4284.93, "total_tokens": 5967920} {"current_steps": 9145, "total_steps": 38160, "loss": 0.4554, "lr": 0.0009417826142659596, "epoch": 4.7929769392033545, "percentage": 23.96, "elapsed_time": "0:23:13", "remaining_time": "1:13:41", "throughput": 4285.13, "total_tokens": 5971440} {"current_steps": 9150, "total_steps": 38160, "loss": 0.4621, "lr": 0.0009416754726941863, "epoch": 4.79559748427673, "percentage": 23.98, "elapsed_time": "0:23:14", "remaining_time": "1:13:40", "throughput": 4285.02, "total_tokens": 5974096} {"current_steps": 9155, "total_steps": 38160, "loss": 0.5267, "lr": 0.0009415682387289428, "epoch": 4.798218029350105, "percentage": 23.99, "elapsed_time": "0:23:14", "remaining_time": "1:13:39", "throughput": 4284.9, "total_tokens": 5976624} {"current_steps": 9160, "total_steps": 38160, "loss": 0.5588, "lr": 0.0009414609123926616, "epoch": 4.80083857442348, "percentage": 24.0, "elapsed_time": "0:23:15", "remaining_time": "1:13:38", "throughput": 4285.14, "total_tokens": 5980336} {"current_steps": 9165, "total_steps": 38160, "loss": 0.5216, "lr": 0.000941353493707794, "epoch": 4.803459119496855, "percentage": 24.02, "elapsed_time": "0:23:16", "remaining_time": "1:13:37", "throughput": 4285.05, "total_tokens": 5982992} {"current_steps": 9170, "total_steps": 38160, "loss": 0.5732, "lr": 0.0009412459826968107, "epoch": 4.80607966457023, "percentage": 24.03, "elapsed_time": "0:23:16", "remaining_time": "1:13:36", "throughput": 4285.16, "total_tokens": 5986320} {"current_steps": 9175, "total_steps": 38160, "loss": 0.338, "lr": 0.0009411383793822017, "epoch": 4.808700209643606, "percentage": 24.04, "elapsed_time": "0:23:17", "remaining_time": "1:13:35", "throughput": 4285.41, "total_tokens": 5990032} {"current_steps": 9180, "total_steps": 38160, "loss": 0.5469, "lr": 0.0009410306837864766, "epoch": 4.811320754716981, "percentage": 24.06, "elapsed_time": "0:23:18", "remaining_time": "1:13:34", "throughput": 4285.45, "total_tokens": 5993136} {"current_steps": 9185, "total_steps": 38160, "loss": 0.5557, "lr": 0.000940922895932164, "epoch": 4.813941299790356, "percentage": 24.07, "elapsed_time": "0:23:19", "remaining_time": "1:13:33", "throughput": 4285.5, "total_tokens": 5996304} {"current_steps": 9190, "total_steps": 38160, "loss": 0.4584, "lr": 0.0009408150158418119, "epoch": 4.816561844863732, "percentage": 24.08, "elapsed_time": "0:23:19", "remaining_time": "1:13:32", "throughput": 4285.42, "total_tokens": 5998992} {"current_steps": 9195, "total_steps": 38160, "loss": 0.4241, "lr": 0.0009407070435379876, "epoch": 4.819182389937107, "percentage": 24.1, "elapsed_time": "0:23:20", "remaining_time": "1:13:31", "throughput": 4285.43, "total_tokens": 6001904} {"current_steps": 9200, "total_steps": 38160, "loss": 0.4763, "lr": 0.0009405989790432776, "epoch": 4.821802935010482, "percentage": 24.11, "elapsed_time": "0:23:21", "remaining_time": "1:13:30", "throughput": 4285.45, "total_tokens": 6004912} {"current_steps": 9205, "total_steps": 38160, "loss": 0.548, "lr": 0.0009404908223802877, "epoch": 4.8244234800838575, "percentage": 24.12, "elapsed_time": "0:23:21", "remaining_time": "1:13:29", "throughput": 4285.38, "total_tokens": 6007696} {"current_steps": 9210, "total_steps": 38160, "loss": 0.473, "lr": 0.0009403825735716433, "epoch": 4.827044025157233, "percentage": 24.14, "elapsed_time": "0:23:22", "remaining_time": "1:13:28", "throughput": 4285.35, "total_tokens": 6010544} {"current_steps": 9215, "total_steps": 38160, "loss": 0.4895, "lr": 0.0009402742326399887, "epoch": 4.829664570230608, "percentage": 24.15, "elapsed_time": "0:23:23", "remaining_time": "1:13:27", "throughput": 4285.24, "total_tokens": 6013136} {"current_steps": 9220, "total_steps": 38160, "loss": 0.425, "lr": 0.0009401657996079873, "epoch": 4.832285115303983, "percentage": 24.16, "elapsed_time": "0:23:23", "remaining_time": "1:13:26", "throughput": 4285.32, "total_tokens": 6016336} {"current_steps": 9225, "total_steps": 38160, "loss": 0.5385, "lr": 0.0009400572744983224, "epoch": 4.834905660377358, "percentage": 24.17, "elapsed_time": "0:23:24", "remaining_time": "1:13:25", "throughput": 4285.26, "total_tokens": 6019120} {"current_steps": 9230, "total_steps": 38160, "loss": 0.7082, "lr": 0.0009399486573336963, "epoch": 4.837526205450734, "percentage": 24.19, "elapsed_time": "0:23:25", "remaining_time": "1:13:24", "throughput": 4285.11, "total_tokens": 6021616} {"current_steps": 9235, "total_steps": 38160, "loss": 0.4318, "lr": 0.00093983994813683, "epoch": 4.840146750524109, "percentage": 24.2, "elapsed_time": "0:23:25", "remaining_time": "1:13:23", "throughput": 4285.04, "total_tokens": 6024272} {"current_steps": 9240, "total_steps": 38160, "loss": 0.4526, "lr": 0.0009397311469304648, "epoch": 4.8427672955974845, "percentage": 24.21, "elapsed_time": "0:23:26", "remaining_time": "1:13:22", "throughput": 4285.15, "total_tokens": 6027440} {"current_steps": 9245, "total_steps": 38160, "loss": 0.3895, "lr": 0.0009396222537373602, "epoch": 4.84538784067086, "percentage": 24.23, "elapsed_time": "0:23:27", "remaining_time": "1:13:22", "throughput": 4285.9, "total_tokens": 6032784} {"current_steps": 9250, "total_steps": 38160, "loss": 0.4847, "lr": 0.0009395132685802956, "epoch": 4.848008385744235, "percentage": 24.24, "elapsed_time": "0:23:28", "remaining_time": "1:13:21", "throughput": 4285.85, "total_tokens": 6035600} {"current_steps": 9255, "total_steps": 38160, "loss": 0.6629, "lr": 0.0009394041914820695, "epoch": 4.85062893081761, "percentage": 24.25, "elapsed_time": "0:23:29", "remaining_time": "1:13:20", "throughput": 4286.13, "total_tokens": 6039408} {"current_steps": 9260, "total_steps": 38160, "loss": 0.4246, "lr": 0.0009392950224654994, "epoch": 4.853249475890985, "percentage": 24.27, "elapsed_time": "0:23:29", "remaining_time": "1:13:19", "throughput": 4286.18, "total_tokens": 6042448} {"current_steps": 9265, "total_steps": 38160, "loss": 0.5344, "lr": 0.0009391857615534225, "epoch": 4.85587002096436, "percentage": 24.28, "elapsed_time": "0:23:30", "remaining_time": "1:13:19", "throughput": 4286.38, "total_tokens": 6046032} {"current_steps": 9270, "total_steps": 38160, "loss": 0.5089, "lr": 0.0009390764087686948, "epoch": 4.8584905660377355, "percentage": 24.29, "elapsed_time": "0:23:31", "remaining_time": "1:13:17", "throughput": 4286.28, "total_tokens": 6048656} {"current_steps": 9275, "total_steps": 38160, "loss": 0.704, "lr": 0.0009389669641341916, "epoch": 4.861111111111111, "percentage": 24.31, "elapsed_time": "0:23:31", "remaining_time": "1:13:17", "throughput": 4286.47, "total_tokens": 6052176} {"current_steps": 9280, "total_steps": 38160, "loss": 0.4414, "lr": 0.0009388574276728075, "epoch": 4.863731656184486, "percentage": 24.32, "elapsed_time": "0:23:32", "remaining_time": "1:13:16", "throughput": 4286.31, "total_tokens": 6054704} {"current_steps": 9285, "total_steps": 38160, "loss": 0.5621, "lr": 0.0009387477994074562, "epoch": 4.866352201257862, "percentage": 24.33, "elapsed_time": "0:23:33", "remaining_time": "1:13:14", "throughput": 4286.11, "total_tokens": 6057040} {"current_steps": 9290, "total_steps": 38160, "loss": 0.4349, "lr": 0.0009386380793610707, "epoch": 4.868972746331237, "percentage": 24.34, "elapsed_time": "0:23:33", "remaining_time": "1:13:13", "throughput": 4286.19, "total_tokens": 6060272} {"current_steps": 9295, "total_steps": 38160, "loss": 0.4657, "lr": 0.0009385282675566034, "epoch": 4.871593291404612, "percentage": 24.36, "elapsed_time": "0:23:34", "remaining_time": "1:13:13", "throughput": 4286.38, "total_tokens": 6063792} {"current_steps": 9300, "total_steps": 38160, "loss": 0.3357, "lr": 0.0009384183640170255, "epoch": 4.8742138364779874, "percentage": 24.37, "elapsed_time": "0:23:35", "remaining_time": "1:13:12", "throughput": 4286.57, "total_tokens": 6067312} {"current_steps": 9305, "total_steps": 38160, "loss": 0.5249, "lr": 0.0009383083687653275, "epoch": 4.876834381551363, "percentage": 24.38, "elapsed_time": "0:23:36", "remaining_time": "1:13:11", "throughput": 4286.66, "total_tokens": 6070544} {"current_steps": 9310, "total_steps": 38160, "loss": 0.3973, "lr": 0.0009381982818245193, "epoch": 4.879454926624738, "percentage": 24.4, "elapsed_time": "0:23:36", "remaining_time": "1:13:10", "throughput": 4286.76, "total_tokens": 6073904} {"current_steps": 9315, "total_steps": 38160, "loss": 0.4625, "lr": 0.0009380881032176299, "epoch": 4.882075471698113, "percentage": 24.41, "elapsed_time": "0:23:37", "remaining_time": "1:13:09", "throughput": 4286.93, "total_tokens": 6077392} {"current_steps": 9320, "total_steps": 38160, "loss": 0.4369, "lr": 0.0009379778329677071, "epoch": 4.884696016771488, "percentage": 24.42, "elapsed_time": "0:23:38", "remaining_time": "1:13:09", "throughput": 4287.11, "total_tokens": 6080880} {"current_steps": 9325, "total_steps": 38160, "loss": 0.4491, "lr": 0.0009378674710978184, "epoch": 4.887316561844864, "percentage": 24.44, "elapsed_time": "0:23:39", "remaining_time": "1:13:08", "throughput": 4287.2, "total_tokens": 6084144} {"current_steps": 9330, "total_steps": 38160, "loss": 0.4101, "lr": 0.0009377570176310503, "epoch": 4.889937106918239, "percentage": 24.45, "elapsed_time": "0:23:39", "remaining_time": "1:13:07", "throughput": 4287.4, "total_tokens": 6087792} {"current_steps": 9335, "total_steps": 38160, "loss": 0.4615, "lr": 0.0009376464725905082, "epoch": 4.8925576519916145, "percentage": 24.46, "elapsed_time": "0:23:40", "remaining_time": "1:13:07", "throughput": 4287.87, "total_tokens": 6092240} {"current_steps": 9340, "total_steps": 38160, "loss": 0.5572, "lr": 0.000937535835999317, "epoch": 4.89517819706499, "percentage": 24.48, "elapsed_time": "0:23:41", "remaining_time": "1:13:06", "throughput": 4288.09, "total_tokens": 6095920} {"current_steps": 9345, "total_steps": 38160, "loss": 0.4483, "lr": 0.0009374251078806206, "epoch": 4.897798742138365, "percentage": 24.49, "elapsed_time": "0:23:42", "remaining_time": "1:13:07", "throughput": 4289.3, "total_tokens": 6102960} {"current_steps": 9350, "total_steps": 38160, "loss": 0.4874, "lr": 0.000937314288257582, "epoch": 4.90041928721174, "percentage": 24.5, "elapsed_time": "0:23:43", "remaining_time": "1:13:06", "throughput": 4289.44, "total_tokens": 6106320} {"current_steps": 9355, "total_steps": 38160, "loss": 0.5013, "lr": 0.0009372033771533835, "epoch": 4.903039832285115, "percentage": 24.52, "elapsed_time": "0:23:44", "remaining_time": "1:13:05", "throughput": 4289.37, "total_tokens": 6109104} {"current_steps": 9360, "total_steps": 38160, "loss": 0.5138, "lr": 0.0009370923745912264, "epoch": 4.90566037735849, "percentage": 24.53, "elapsed_time": "0:23:44", "remaining_time": "1:13:04", "throughput": 4289.45, "total_tokens": 6112368} {"current_steps": 9365, "total_steps": 38160, "loss": 0.4453, "lr": 0.000936981280594331, "epoch": 4.9082809224318655, "percentage": 24.54, "elapsed_time": "0:23:45", "remaining_time": "1:13:03", "throughput": 4289.28, "total_tokens": 6114800} {"current_steps": 9370, "total_steps": 38160, "loss": 0.5098, "lr": 0.0009368700951859371, "epoch": 4.910901467505241, "percentage": 24.55, "elapsed_time": "0:23:46", "remaining_time": "1:13:02", "throughput": 4289.08, "total_tokens": 6117232} {"current_steps": 9375, "total_steps": 38160, "loss": 0.5369, "lr": 0.0009367588183893035, "epoch": 4.913522012578616, "percentage": 24.57, "elapsed_time": "0:23:46", "remaining_time": "1:13:01", "throughput": 4289.04, "total_tokens": 6120112} {"current_steps": 9380, "total_steps": 38160, "loss": 0.4261, "lr": 0.0009366474502277076, "epoch": 4.916142557651992, "percentage": 24.58, "elapsed_time": "0:23:47", "remaining_time": "1:13:00", "throughput": 4289.32, "total_tokens": 6123984} {"current_steps": 9385, "total_steps": 38160, "loss": 0.3763, "lr": 0.0009365359907244469, "epoch": 4.918763102725367, "percentage": 24.59, "elapsed_time": "0:23:48", "remaining_time": "1:12:59", "throughput": 4289.53, "total_tokens": 6127568} {"current_steps": 9390, "total_steps": 38160, "loss": 0.3541, "lr": 0.0009364244399028372, "epoch": 4.921383647798742, "percentage": 24.61, "elapsed_time": "0:23:49", "remaining_time": "1:12:58", "throughput": 4289.62, "total_tokens": 6130800} {"current_steps": 9395, "total_steps": 38160, "loss": 0.5279, "lr": 0.0009363127977862136, "epoch": 4.924004192872117, "percentage": 24.62, "elapsed_time": "0:23:49", "remaining_time": "1:12:58", "throughput": 4289.77, "total_tokens": 6134224} {"current_steps": 9400, "total_steps": 38160, "loss": 0.5962, "lr": 0.0009362010643979304, "epoch": 4.926624737945493, "percentage": 24.63, "elapsed_time": "0:23:50", "remaining_time": "1:12:57", "throughput": 4289.68, "total_tokens": 6136912} {"current_steps": 9405, "total_steps": 38160, "loss": 0.4571, "lr": 0.000936089239761361, "epoch": 4.929245283018868, "percentage": 24.65, "elapsed_time": "0:23:51", "remaining_time": "1:12:56", "throughput": 4290.19, "total_tokens": 6141552} {"current_steps": 9410, "total_steps": 38160, "loss": 0.5087, "lr": 0.0009359773238998978, "epoch": 4.931865828092243, "percentage": 24.66, "elapsed_time": "0:23:52", "remaining_time": "1:12:55", "throughput": 4290.13, "total_tokens": 6144336} {"current_steps": 9415, "total_steps": 38160, "loss": 0.4275, "lr": 0.0009358653168369524, "epoch": 4.934486373165618, "percentage": 24.67, "elapsed_time": "0:23:52", "remaining_time": "1:12:54", "throughput": 4290.16, "total_tokens": 6147472} {"current_steps": 9420, "total_steps": 38160, "loss": 0.5455, "lr": 0.0009357532185959554, "epoch": 4.937106918238994, "percentage": 24.69, "elapsed_time": "0:23:53", "remaining_time": "1:12:53", "throughput": 4290.2, "total_tokens": 6150544} {"current_steps": 9425, "total_steps": 38160, "loss": 0.4983, "lr": 0.0009356410292003562, "epoch": 4.939727463312369, "percentage": 24.7, "elapsed_time": "0:23:54", "remaining_time": "1:12:53", "throughput": 4290.42, "total_tokens": 6154192} {"current_steps": 9430, "total_steps": 38160, "loss": 0.5044, "lr": 0.0009355287486736239, "epoch": 4.9423480083857445, "percentage": 24.71, "elapsed_time": "0:23:55", "remaining_time": "1:12:52", "throughput": 4290.36, "total_tokens": 6156880} {"current_steps": 9435, "total_steps": 38160, "loss": 0.4157, "lr": 0.0009354163770392461, "epoch": 4.94496855345912, "percentage": 24.72, "elapsed_time": "0:23:55", "remaining_time": "1:12:51", "throughput": 4290.49, "total_tokens": 6160240} {"current_steps": 9440, "total_steps": 38160, "loss": 0.4332, "lr": 0.0009353039143207295, "epoch": 4.947589098532495, "percentage": 24.74, "elapsed_time": "0:23:56", "remaining_time": "1:12:50", "throughput": 4290.76, "total_tokens": 6164048} {"current_steps": 9445, "total_steps": 38160, "loss": 0.4615, "lr": 0.0009351913605416007, "epoch": 4.95020964360587, "percentage": 24.75, "elapsed_time": "0:23:57", "remaining_time": "1:12:49", "throughput": 4290.62, "total_tokens": 6166576} {"current_steps": 9450, "total_steps": 38160, "loss": 0.484, "lr": 0.000935078715725404, "epoch": 4.952830188679245, "percentage": 24.76, "elapsed_time": "0:23:57", "remaining_time": "1:12:48", "throughput": 4290.7, "total_tokens": 6169808} {"current_steps": 9455, "total_steps": 38160, "loss": 0.45, "lr": 0.0009349659798957034, "epoch": 4.95545073375262, "percentage": 24.78, "elapsed_time": "0:23:58", "remaining_time": "1:12:47", "throughput": 4290.52, "total_tokens": 6172176} {"current_steps": 9460, "total_steps": 38160, "loss": 0.4605, "lr": 0.0009348531530760823, "epoch": 4.9580712788259955, "percentage": 24.79, "elapsed_time": "0:23:59", "remaining_time": "1:12:46", "throughput": 4290.52, "total_tokens": 6175120} {"current_steps": 9465, "total_steps": 38160, "loss": 0.3572, "lr": 0.0009347402352901426, "epoch": 4.960691823899371, "percentage": 24.8, "elapsed_time": "0:24:00", "remaining_time": "1:12:45", "throughput": 4290.74, "total_tokens": 6178832} {"current_steps": 9470, "total_steps": 38160, "loss": 0.4784, "lr": 0.0009346272265615057, "epoch": 4.963312368972746, "percentage": 24.82, "elapsed_time": "0:24:00", "remaining_time": "1:12:44", "throughput": 4290.88, "total_tokens": 6182224} {"current_steps": 9475, "total_steps": 38160, "loss": 0.4827, "lr": 0.0009345141269138112, "epoch": 4.965932914046122, "percentage": 24.83, "elapsed_time": "0:24:01", "remaining_time": "1:12:44", "throughput": 4290.94, "total_tokens": 6185392} {"current_steps": 9480, "total_steps": 38160, "loss": 0.5156, "lr": 0.0009344009363707186, "epoch": 4.968553459119497, "percentage": 24.84, "elapsed_time": "0:24:02", "remaining_time": "1:12:43", "throughput": 4291.12, "total_tokens": 6188848} {"current_steps": 9485, "total_steps": 38160, "loss": 0.4994, "lr": 0.000934287654955906, "epoch": 4.971174004192872, "percentage": 24.86, "elapsed_time": "0:24:02", "remaining_time": "1:12:42", "throughput": 4291.1, "total_tokens": 6191760} {"current_steps": 9490, "total_steps": 38160, "loss": 0.6476, "lr": 0.0009341742826930708, "epoch": 4.973794549266247, "percentage": 24.87, "elapsed_time": "0:24:03", "remaining_time": "1:12:41", "throughput": 4291.13, "total_tokens": 6194864} {"current_steps": 9495, "total_steps": 38160, "loss": 0.4756, "lr": 0.0009340608196059289, "epoch": 4.976415094339623, "percentage": 24.88, "elapsed_time": "0:24:04", "remaining_time": "1:12:40", "throughput": 4291.08, "total_tokens": 6197648} {"current_steps": 9500, "total_steps": 38160, "loss": 0.4437, "lr": 0.0009339472657182155, "epoch": 4.979035639412998, "percentage": 24.9, "elapsed_time": "0:24:05", "remaining_time": "1:12:39", "throughput": 4291.14, "total_tokens": 6200816} {"current_steps": 9505, "total_steps": 38160, "loss": 0.4466, "lr": 0.0009338336210536848, "epoch": 4.981656184486373, "percentage": 24.91, "elapsed_time": "0:24:05", "remaining_time": "1:12:38", "throughput": 4291.02, "total_tokens": 6203344} {"current_steps": 9510, "total_steps": 38160, "loss": 0.3441, "lr": 0.0009337198856361102, "epoch": 4.984276729559748, "percentage": 24.92, "elapsed_time": "0:24:06", "remaining_time": "1:12:37", "throughput": 4291.17, "total_tokens": 6206768} {"current_steps": 9515, "total_steps": 38160, "loss": 0.4892, "lr": 0.0009336060594892834, "epoch": 4.986897274633124, "percentage": 24.93, "elapsed_time": "0:24:07", "remaining_time": "1:12:36", "throughput": 4291.01, "total_tokens": 6209168} {"current_steps": 9520, "total_steps": 38160, "loss": 0.5183, "lr": 0.000933492142637016, "epoch": 4.989517819706499, "percentage": 24.95, "elapsed_time": "0:24:07", "remaining_time": "1:12:36", "throughput": 4291.66, "total_tokens": 6214320} {"current_steps": 9525, "total_steps": 38160, "loss": 0.4572, "lr": 0.0009333781351031379, "epoch": 4.9921383647798745, "percentage": 24.96, "elapsed_time": "0:24:08", "remaining_time": "1:12:36", "throughput": 4292.31, "total_tokens": 6219472} {"current_steps": 9530, "total_steps": 38160, "loss": 0.4907, "lr": 0.0009332640369114981, "epoch": 4.99475890985325, "percentage": 24.97, "elapsed_time": "0:24:09", "remaining_time": "1:12:35", "throughput": 4292.46, "total_tokens": 6222800} {"current_steps": 9535, "total_steps": 38160, "loss": 0.5792, "lr": 0.0009331498480859647, "epoch": 4.997379454926625, "percentage": 24.99, "elapsed_time": "0:24:10", "remaining_time": "1:12:34", "throughput": 4292.67, "total_tokens": 6226416} {"current_steps": 9540, "total_steps": 38160, "loss": 0.4158, "lr": 0.0009330355686504247, "epoch": 5.0, "percentage": 25.0, "elapsed_time": "0:24:11", "remaining_time": "1:12:33", "throughput": 4292.18, "total_tokens": 6229240} {"current_steps": 9540, "total_steps": 38160, "eval_loss": 0.48624399304389954, "epoch": 5.0, "percentage": 25.0, "elapsed_time": "0:24:25", "remaining_time": "1:13:15", "throughput": 4251.99, "total_tokens": 6229240} {"current_steps": 9545, "total_steps": 38160, "loss": 0.4261, "lr": 0.0009329211986287842, "epoch": 5.002620545073375, "percentage": 25.01, "elapsed_time": "0:24:27", "remaining_time": "1:13:19", "throughput": 4247.58, "total_tokens": 6233752} {"current_steps": 9550, "total_steps": 38160, "loss": 0.4472, "lr": 0.0009328067380449678, "epoch": 5.00524109014675, "percentage": 25.03, "elapsed_time": "0:24:28", "remaining_time": "1:13:18", "throughput": 4247.55, "total_tokens": 6236568} {"current_steps": 9555, "total_steps": 38160, "loss": 0.4915, "lr": 0.0009326921869229197, "epoch": 5.0078616352201255, "percentage": 25.04, "elapsed_time": "0:24:28", "remaining_time": "1:13:17", "throughput": 4247.41, "total_tokens": 6239096} {"current_steps": 9560, "total_steps": 38160, "loss": 0.4063, "lr": 0.0009325775452866023, "epoch": 5.010482180293501, "percentage": 25.05, "elapsed_time": "0:24:29", "remaining_time": "1:13:16", "throughput": 4247.26, "total_tokens": 6241688} {"current_steps": 9565, "total_steps": 38160, "loss": 0.4026, "lr": 0.0009324628131599977, "epoch": 5.013102725366877, "percentage": 25.07, "elapsed_time": "0:24:30", "remaining_time": "1:13:15", "throughput": 4247.36, "total_tokens": 6244888} {"current_steps": 9570, "total_steps": 38160, "loss": 0.3987, "lr": 0.0009323479905671064, "epoch": 5.015723270440252, "percentage": 25.08, "elapsed_time": "0:24:30", "remaining_time": "1:13:14", "throughput": 4247.24, "total_tokens": 6247352} {"current_steps": 9575, "total_steps": 38160, "loss": 0.5504, "lr": 0.0009322330775319479, "epoch": 5.018343815513627, "percentage": 25.09, "elapsed_time": "0:24:31", "remaining_time": "1:13:13", "throughput": 4247.17, "total_tokens": 6250136} {"current_steps": 9580, "total_steps": 38160, "loss": 0.5302, "lr": 0.0009321180740785607, "epoch": 5.020964360587002, "percentage": 25.1, "elapsed_time": "0:24:32", "remaining_time": "1:13:12", "throughput": 4247.14, "total_tokens": 6252920} {"current_steps": 9585, "total_steps": 38160, "loss": 0.3786, "lr": 0.0009320029802310023, "epoch": 5.023584905660377, "percentage": 25.12, "elapsed_time": "0:24:32", "remaining_time": "1:13:11", "throughput": 4247.0, "total_tokens": 6255416} {"current_steps": 9590, "total_steps": 38160, "loss": 0.4558, "lr": 0.0009318877960133489, "epoch": 5.026205450733753, "percentage": 25.13, "elapsed_time": "0:24:33", "remaining_time": "1:13:10", "throughput": 4247.09, "total_tokens": 6258584} {"current_steps": 9595, "total_steps": 38160, "loss": 0.5084, "lr": 0.0009317725214496959, "epoch": 5.028825995807128, "percentage": 25.14, "elapsed_time": "0:24:34", "remaining_time": "1:13:10", "throughput": 4248.14, "total_tokens": 6265528} {"current_steps": 9600, "total_steps": 38160, "loss": 0.4801, "lr": 0.0009316571565641574, "epoch": 5.031446540880503, "percentage": 25.16, "elapsed_time": "0:24:35", "remaining_time": "1:13:10", "throughput": 4248.32, "total_tokens": 6269016} {"current_steps": 9605, "total_steps": 38160, "loss": 0.4384, "lr": 0.0009315417013808663, "epoch": 5.034067085953878, "percentage": 25.17, "elapsed_time": "0:24:36", "remaining_time": "1:13:09", "throughput": 4248.41, "total_tokens": 6272216} {"current_steps": 9610, "total_steps": 38160, "loss": 0.4578, "lr": 0.0009314261559239745, "epoch": 5.036687631027253, "percentage": 25.18, "elapsed_time": "0:24:37", "remaining_time": "1:13:08", "throughput": 4248.64, "total_tokens": 6275960} {"current_steps": 9615, "total_steps": 38160, "loss": 0.4425, "lr": 0.000931310520217653, "epoch": 5.039308176100629, "percentage": 25.2, "elapsed_time": "0:24:37", "remaining_time": "1:13:07", "throughput": 4248.61, "total_tokens": 6278744} {"current_steps": 9620, "total_steps": 38160, "loss": 0.5357, "lr": 0.0009311947942860912, "epoch": 5.0419287211740045, "percentage": 25.21, "elapsed_time": "0:24:38", "remaining_time": "1:13:06", "throughput": 4248.65, "total_tokens": 6281880} {"current_steps": 9625, "total_steps": 38160, "loss": 0.5327, "lr": 0.0009310789781534979, "epoch": 5.04454926624738, "percentage": 25.22, "elapsed_time": "0:24:39", "remaining_time": "1:13:05", "throughput": 4248.82, "total_tokens": 6285336} {"current_steps": 9630, "total_steps": 38160, "loss": 0.5292, "lr": 0.0009309630718441003, "epoch": 5.047169811320755, "percentage": 25.24, "elapsed_time": "0:24:40", "remaining_time": "1:13:05", "throughput": 4249.12, "total_tokens": 6289176} {"current_steps": 9635, "total_steps": 38160, "loss": 0.4859, "lr": 0.0009308470753821445, "epoch": 5.04979035639413, "percentage": 25.25, "elapsed_time": "0:24:40", "remaining_time": "1:13:04", "throughput": 4249.34, "total_tokens": 6292824} {"current_steps": 9640, "total_steps": 38160, "loss": 0.3726, "lr": 0.0009307309887918962, "epoch": 5.052410901467505, "percentage": 25.26, "elapsed_time": "0:24:41", "remaining_time": "1:13:03", "throughput": 4249.66, "total_tokens": 6296760} {"current_steps": 9645, "total_steps": 38160, "loss": 0.5158, "lr": 0.000930614812097639, "epoch": 5.05503144654088, "percentage": 25.28, "elapsed_time": "0:24:42", "remaining_time": "1:13:02", "throughput": 4249.85, "total_tokens": 6300280} {"current_steps": 9650, "total_steps": 38160, "loss": 0.4459, "lr": 0.0009304985453236758, "epoch": 5.0576519916142555, "percentage": 25.29, "elapsed_time": "0:24:43", "remaining_time": "1:13:02", "throughput": 4250.12, "total_tokens": 6304056} {"current_steps": 9655, "total_steps": 38160, "loss": 0.3201, "lr": 0.0009303821884943284, "epoch": 5.060272536687631, "percentage": 25.3, "elapsed_time": "0:24:43", "remaining_time": "1:13:01", "throughput": 4250.14, "total_tokens": 6307000} {"current_steps": 9660, "total_steps": 38160, "loss": 0.4337, "lr": 0.0009302657416339371, "epoch": 5.062893081761007, "percentage": 25.31, "elapsed_time": "0:24:44", "remaining_time": "1:13:00", "throughput": 4250.49, "total_tokens": 6311032} {"current_steps": 9665, "total_steps": 38160, "loss": 0.5017, "lr": 0.0009301492047668615, "epoch": 5.065513626834382, "percentage": 25.33, "elapsed_time": "0:24:45", "remaining_time": "1:12:59", "throughput": 4250.75, "total_tokens": 6314680} {"current_steps": 9670, "total_steps": 38160, "loss": 0.3925, "lr": 0.0009300325779174796, "epoch": 5.068134171907757, "percentage": 25.34, "elapsed_time": "0:24:46", "remaining_time": "1:12:58", "throughput": 4250.75, "total_tokens": 6317560} {"current_steps": 9675, "total_steps": 38160, "loss": 0.5882, "lr": 0.0009299158611101885, "epoch": 5.070754716981132, "percentage": 25.35, "elapsed_time": "0:24:47", "remaining_time": "1:12:58", "throughput": 4250.99, "total_tokens": 6321336} {"current_steps": 9680, "total_steps": 38160, "loss": 0.6108, "lr": 0.000929799054369404, "epoch": 5.073375262054507, "percentage": 25.37, "elapsed_time": "0:24:47", "remaining_time": "1:12:57", "throughput": 4251.04, "total_tokens": 6324376} {"current_steps": 9685, "total_steps": 38160, "loss": 0.4614, "lr": 0.0009296821577195606, "epoch": 5.075995807127883, "percentage": 25.38, "elapsed_time": "0:24:48", "remaining_time": "1:12:56", "throughput": 4251.02, "total_tokens": 6327256} {"current_steps": 9690, "total_steps": 38160, "loss": 0.3533, "lr": 0.000929565171185112, "epoch": 5.078616352201258, "percentage": 25.39, "elapsed_time": "0:24:49", "remaining_time": "1:12:55", "throughput": 4251.19, "total_tokens": 6330680} {"current_steps": 9695, "total_steps": 38160, "loss": 0.4809, "lr": 0.0009294480947905304, "epoch": 5.081236897274633, "percentage": 25.41, "elapsed_time": "0:24:50", "remaining_time": "1:12:54", "throughput": 4251.56, "total_tokens": 6334872} {"current_steps": 9700, "total_steps": 38160, "loss": 0.4432, "lr": 0.0009293309285603067, "epoch": 5.083857442348008, "percentage": 25.42, "elapsed_time": "0:24:50", "remaining_time": "1:12:53", "throughput": 4251.56, "total_tokens": 6337752} {"current_steps": 9705, "total_steps": 38160, "loss": 0.4081, "lr": 0.0009292136725189506, "epoch": 5.086477987421383, "percentage": 25.43, "elapsed_time": "0:24:51", "remaining_time": "1:12:52", "throughput": 4251.47, "total_tokens": 6340376} {"current_steps": 9710, "total_steps": 38160, "loss": 0.6092, "lr": 0.0009290963266909912, "epoch": 5.089098532494759, "percentage": 25.45, "elapsed_time": "0:24:52", "remaining_time": "1:12:51", "throughput": 4251.6, "total_tokens": 6343768} {"current_steps": 9715, "total_steps": 38160, "loss": 0.4441, "lr": 0.0009289788911009756, "epoch": 5.0917190775681345, "percentage": 25.46, "elapsed_time": "0:24:52", "remaining_time": "1:12:50", "throughput": 4251.7, "total_tokens": 6346968} {"current_steps": 9720, "total_steps": 38160, "loss": 0.4687, "lr": 0.0009288613657734699, "epoch": 5.09433962264151, "percentage": 25.47, "elapsed_time": "0:24:53", "remaining_time": "1:12:50", "throughput": 4252.4, "total_tokens": 6352280} {"current_steps": 9725, "total_steps": 38160, "loss": 0.4435, "lr": 0.0009287437507330594, "epoch": 5.096960167714885, "percentage": 25.48, "elapsed_time": "0:24:54", "remaining_time": "1:12:49", "throughput": 4252.45, "total_tokens": 6355288} {"current_steps": 9730, "total_steps": 38160, "loss": 0.5776, "lr": 0.0009286260460043475, "epoch": 5.09958071278826, "percentage": 25.5, "elapsed_time": "0:24:55", "remaining_time": "1:12:48", "throughput": 4252.41, "total_tokens": 6358040} {"current_steps": 9735, "total_steps": 38160, "loss": 0.3595, "lr": 0.0009285082516119567, "epoch": 5.102201257861635, "percentage": 25.51, "elapsed_time": "0:24:55", "remaining_time": "1:12:47", "throughput": 4252.41, "total_tokens": 6360984} {"current_steps": 9740, "total_steps": 38160, "loss": 0.4192, "lr": 0.0009283903675805285, "epoch": 5.10482180293501, "percentage": 25.52, "elapsed_time": "0:24:56", "remaining_time": "1:12:46", "throughput": 4252.33, "total_tokens": 6363736} {"current_steps": 9745, "total_steps": 38160, "loss": 0.4745, "lr": 0.0009282723939347227, "epoch": 5.1074423480083855, "percentage": 25.54, "elapsed_time": "0:24:57", "remaining_time": "1:12:45", "throughput": 4252.12, "total_tokens": 6365944} {"current_steps": 9750, "total_steps": 38160, "loss": 0.3449, "lr": 0.0009281543306992181, "epoch": 5.110062893081761, "percentage": 25.55, "elapsed_time": "0:24:58", "remaining_time": "1:12:44", "throughput": 4252.63, "total_tokens": 6370488} {"current_steps": 9755, "total_steps": 38160, "loss": 0.4838, "lr": 0.0009280361778987121, "epoch": 5.112683438155136, "percentage": 25.56, "elapsed_time": "0:24:58", "remaining_time": "1:12:44", "throughput": 4252.84, "total_tokens": 6374008} {"current_steps": 9760, "total_steps": 38160, "loss": 0.5512, "lr": 0.0009279179355579211, "epoch": 5.115303983228512, "percentage": 25.58, "elapsed_time": "0:24:59", "remaining_time": "1:12:43", "throughput": 4253.08, "total_tokens": 6377688} {"current_steps": 9765, "total_steps": 38160, "loss": 0.403, "lr": 0.0009277996037015798, "epoch": 5.117924528301887, "percentage": 25.59, "elapsed_time": "0:25:00", "remaining_time": "1:12:42", "throughput": 4253.44, "total_tokens": 6381752} {"current_steps": 9770, "total_steps": 38160, "loss": 0.4527, "lr": 0.000927681182354442, "epoch": 5.120545073375262, "percentage": 25.6, "elapsed_time": "0:25:01", "remaining_time": "1:12:41", "throughput": 4253.43, "total_tokens": 6384600} {"current_steps": 9775, "total_steps": 38160, "loss": 0.6011, "lr": 0.0009275626715412802, "epoch": 5.123165618448637, "percentage": 25.62, "elapsed_time": "0:25:01", "remaining_time": "1:12:41", "throughput": 4253.85, "total_tokens": 6388888} {"current_steps": 9780, "total_steps": 38160, "loss": 0.4759, "lr": 0.0009274440712868853, "epoch": 5.1257861635220126, "percentage": 25.63, "elapsed_time": "0:25:02", "remaining_time": "1:12:40", "throughput": 4253.99, "total_tokens": 6392248} {"current_steps": 9785, "total_steps": 38160, "loss": 0.4852, "lr": 0.0009273253816160673, "epoch": 5.128406708595388, "percentage": 25.64, "elapsed_time": "0:25:03", "remaining_time": "1:12:39", "throughput": 4253.99, "total_tokens": 6395160} {"current_steps": 9790, "total_steps": 38160, "loss": 0.5621, "lr": 0.0009272066025536545, "epoch": 5.131027253668763, "percentage": 25.66, "elapsed_time": "0:25:03", "remaining_time": "1:12:38", "throughput": 4253.93, "total_tokens": 6397912} {"current_steps": 9795, "total_steps": 38160, "loss": 0.5703, "lr": 0.0009270877341244945, "epoch": 5.133647798742138, "percentage": 25.67, "elapsed_time": "0:25:04", "remaining_time": "1:12:37", "throughput": 4253.76, "total_tokens": 6400280} {"current_steps": 9800, "total_steps": 38160, "loss": 0.463, "lr": 0.0009269687763534529, "epoch": 5.136268343815513, "percentage": 25.68, "elapsed_time": "0:25:05", "remaining_time": "1:12:36", "throughput": 4254.14, "total_tokens": 6404440} {"current_steps": 9805, "total_steps": 38160, "loss": 0.7031, "lr": 0.0009268497292654143, "epoch": 5.138888888888889, "percentage": 25.69, "elapsed_time": "0:25:06", "remaining_time": "1:12:35", "throughput": 4254.0, "total_tokens": 6406872} {"current_steps": 9810, "total_steps": 38160, "loss": 0.4429, "lr": 0.0009267305928852823, "epoch": 5.1415094339622645, "percentage": 25.71, "elapsed_time": "0:25:06", "remaining_time": "1:12:34", "throughput": 4254.45, "total_tokens": 6411288} {"current_steps": 9815, "total_steps": 38160, "loss": 0.4672, "lr": 0.0009266113672379786, "epoch": 5.14412997903564, "percentage": 25.72, "elapsed_time": "0:25:07", "remaining_time": "1:12:34", "throughput": 4254.46, "total_tokens": 6414360} {"current_steps": 9820, "total_steps": 38160, "loss": 0.4818, "lr": 0.0009264920523484437, "epoch": 5.146750524109015, "percentage": 25.73, "elapsed_time": "0:25:08", "remaining_time": "1:12:33", "throughput": 4254.53, "total_tokens": 6417624} {"current_steps": 9825, "total_steps": 38160, "loss": 0.548, "lr": 0.0009263726482416374, "epoch": 5.14937106918239, "percentage": 25.75, "elapsed_time": "0:25:09", "remaining_time": "1:12:32", "throughput": 4254.71, "total_tokens": 6421080} {"current_steps": 9830, "total_steps": 38160, "loss": 0.4735, "lr": 0.0009262531549425372, "epoch": 5.151991614255765, "percentage": 25.76, "elapsed_time": "0:25:10", "remaining_time": "1:12:32", "throughput": 4255.26, "total_tokens": 6425752} {"current_steps": 9835, "total_steps": 38160, "loss": 0.4318, "lr": 0.0009261335724761402, "epoch": 5.15461215932914, "percentage": 25.77, "elapsed_time": "0:25:10", "remaining_time": "1:12:31", "throughput": 4255.36, "total_tokens": 6429016} {"current_steps": 9840, "total_steps": 38160, "loss": 0.5319, "lr": 0.0009260139008674612, "epoch": 5.1572327044025155, "percentage": 25.79, "elapsed_time": "0:25:11", "remaining_time": "1:12:30", "throughput": 4255.43, "total_tokens": 6432056} {"current_steps": 9845, "total_steps": 38160, "loss": 0.4592, "lr": 0.0009258941401415344, "epoch": 5.159853249475891, "percentage": 25.8, "elapsed_time": "0:25:12", "remaining_time": "1:12:29", "throughput": 4255.6, "total_tokens": 6435448} {"current_steps": 9850, "total_steps": 38160, "loss": 0.3822, "lr": 0.0009257742903234123, "epoch": 5.162473794549266, "percentage": 25.81, "elapsed_time": "0:25:12", "remaining_time": "1:12:28", "throughput": 4255.64, "total_tokens": 6438520} {"current_steps": 9855, "total_steps": 38160, "loss": 0.4497, "lr": 0.0009256543514381664, "epoch": 5.165094339622642, "percentage": 25.83, "elapsed_time": "0:25:13", "remaining_time": "1:12:27", "throughput": 4255.52, "total_tokens": 6440984} {"current_steps": 9860, "total_steps": 38160, "loss": 0.5196, "lr": 0.0009255343235108859, "epoch": 5.167714884696017, "percentage": 25.84, "elapsed_time": "0:25:14", "remaining_time": "1:12:26", "throughput": 4255.53, "total_tokens": 6443992} {"current_steps": 9865, "total_steps": 38160, "loss": 0.4055, "lr": 0.00092541420656668, "epoch": 5.170335429769392, "percentage": 25.85, "elapsed_time": "0:25:14", "remaining_time": "1:12:25", "throughput": 4255.43, "total_tokens": 6446552} {"current_steps": 9870, "total_steps": 38160, "loss": 0.4551, "lr": 0.0009252940006306753, "epoch": 5.172955974842767, "percentage": 25.86, "elapsed_time": "0:25:15", "remaining_time": "1:12:23", "throughput": 4255.32, "total_tokens": 6449080} {"current_steps": 9875, "total_steps": 38160, "loss": 0.4532, "lr": 0.0009251737057280179, "epoch": 5.1755765199161425, "percentage": 25.88, "elapsed_time": "0:25:16", "remaining_time": "1:12:23", "throughput": 4255.6, "total_tokens": 6452856} {"current_steps": 9880, "total_steps": 38160, "loss": 0.4998, "lr": 0.0009250533218838717, "epoch": 5.178197064989518, "percentage": 25.89, "elapsed_time": "0:25:17", "remaining_time": "1:12:22", "throughput": 4255.73, "total_tokens": 6456184} {"current_steps": 9885, "total_steps": 38160, "loss": 0.3471, "lr": 0.0009249328491234199, "epoch": 5.180817610062893, "percentage": 25.9, "elapsed_time": "0:25:17", "remaining_time": "1:12:21", "throughput": 4255.83, "total_tokens": 6459512} {"current_steps": 9890, "total_steps": 38160, "loss": 0.5506, "lr": 0.0009248122874718638, "epoch": 5.183438155136268, "percentage": 25.92, "elapsed_time": "0:25:18", "remaining_time": "1:12:20", "throughput": 4255.8, "total_tokens": 6462360} {"current_steps": 9895, "total_steps": 38160, "loss": 0.4987, "lr": 0.0009246916369544238, "epoch": 5.186058700209643, "percentage": 25.93, "elapsed_time": "0:25:19", "remaining_time": "1:12:19", "throughput": 4255.77, "total_tokens": 6465144} {"current_steps": 9900, "total_steps": 38160, "loss": 0.577, "lr": 0.0009245708975963386, "epoch": 5.188679245283019, "percentage": 25.94, "elapsed_time": "0:25:19", "remaining_time": "1:12:18", "throughput": 4255.75, "total_tokens": 6467864} {"current_steps": 9905, "total_steps": 38160, "loss": 0.3328, "lr": 0.0009244500694228653, "epoch": 5.191299790356394, "percentage": 25.96, "elapsed_time": "0:25:20", "remaining_time": "1:12:17", "throughput": 4255.98, "total_tokens": 6471512} {"current_steps": 9910, "total_steps": 38160, "loss": 0.3467, "lr": 0.0009243291524592799, "epoch": 5.19392033542977, "percentage": 25.97, "elapsed_time": "0:25:21", "remaining_time": "1:12:16", "throughput": 4256.11, "total_tokens": 6474808} {"current_steps": 9915, "total_steps": 38160, "loss": 0.4129, "lr": 0.0009242081467308766, "epoch": 5.196540880503145, "percentage": 25.98, "elapsed_time": "0:25:21", "remaining_time": "1:12:15", "throughput": 4255.96, "total_tokens": 6477208} {"current_steps": 9920, "total_steps": 38160, "loss": 0.6253, "lr": 0.0009240870522629688, "epoch": 5.19916142557652, "percentage": 26.0, "elapsed_time": "0:25:22", "remaining_time": "1:12:14", "throughput": 4256.27, "total_tokens": 6481144} {"current_steps": 9925, "total_steps": 38160, "loss": 0.415, "lr": 0.0009239658690808879, "epoch": 5.201781970649895, "percentage": 26.01, "elapsed_time": "0:25:23", "remaining_time": "1:12:14", "throughput": 4256.89, "total_tokens": 6486200} {"current_steps": 9930, "total_steps": 38160, "loss": 0.6064, "lr": 0.000923844597209984, "epoch": 5.20440251572327, "percentage": 26.02, "elapsed_time": "0:25:24", "remaining_time": "1:12:13", "throughput": 4257.07, "total_tokens": 6489656} {"current_steps": 9935, "total_steps": 38160, "loss": 0.4977, "lr": 0.0009237232366756258, "epoch": 5.2070230607966455, "percentage": 26.04, "elapsed_time": "0:25:25", "remaining_time": "1:12:12", "throughput": 4257.03, "total_tokens": 6492440} {"current_steps": 9940, "total_steps": 38160, "loss": 0.3635, "lr": 0.0009236017875032007, "epoch": 5.209643605870021, "percentage": 26.05, "elapsed_time": "0:25:25", "remaining_time": "1:12:11", "throughput": 4256.96, "total_tokens": 6495096} {"current_steps": 9945, "total_steps": 38160, "loss": 0.4362, "lr": 0.0009234802497181143, "epoch": 5.212264150943396, "percentage": 26.06, "elapsed_time": "0:25:26", "remaining_time": "1:12:11", "throughput": 4257.39, "total_tokens": 6499384} {"current_steps": 9950, "total_steps": 38160, "loss": 0.5211, "lr": 0.0009233586233457909, "epoch": 5.214884696016772, "percentage": 26.07, "elapsed_time": "0:25:27", "remaining_time": "1:12:10", "throughput": 4257.45, "total_tokens": 6502584} {"current_steps": 9955, "total_steps": 38160, "loss": 0.4431, "lr": 0.0009232369084116736, "epoch": 5.217505241090147, "percentage": 26.09, "elapsed_time": "0:25:28", "remaining_time": "1:12:09", "throughput": 4257.61, "total_tokens": 6505944} {"current_steps": 9960, "total_steps": 38160, "loss": 0.4969, "lr": 0.0009231151049412234, "epoch": 5.220125786163522, "percentage": 26.1, "elapsed_time": "0:25:28", "remaining_time": "1:12:08", "throughput": 4257.56, "total_tokens": 6508696} {"current_steps": 9965, "total_steps": 38160, "loss": 0.3665, "lr": 0.0009229932129599205, "epoch": 5.222746331236897, "percentage": 26.11, "elapsed_time": "0:25:29", "remaining_time": "1:12:07", "throughput": 4257.62, "total_tokens": 6511768} {"current_steps": 9970, "total_steps": 38160, "loss": 0.4543, "lr": 0.0009228712324932634, "epoch": 5.2253668763102725, "percentage": 26.13, "elapsed_time": "0:25:30", "remaining_time": "1:12:06", "throughput": 4257.85, "total_tokens": 6515480} {"current_steps": 9975, "total_steps": 38160, "loss": 0.3893, "lr": 0.0009227491635667685, "epoch": 5.227987421383648, "percentage": 26.14, "elapsed_time": "0:25:31", "remaining_time": "1:12:06", "throughput": 4258.19, "total_tokens": 6519448} {"current_steps": 9980, "total_steps": 38160, "loss": 0.4689, "lr": 0.0009226270062059717, "epoch": 5.230607966457023, "percentage": 26.15, "elapsed_time": "0:25:31", "remaining_time": "1:12:05", "throughput": 4258.25, "total_tokens": 6522584} {"current_steps": 9985, "total_steps": 38160, "loss": 0.3149, "lr": 0.0009225047604364267, "epoch": 5.233228511530398, "percentage": 26.17, "elapsed_time": "0:25:32", "remaining_time": "1:12:04", "throughput": 4258.85, "total_tokens": 6527576} {"current_steps": 9990, "total_steps": 38160, "loss": 0.4459, "lr": 0.0009223824262837062, "epoch": 5.235849056603773, "percentage": 26.18, "elapsed_time": "0:25:33", "remaining_time": "1:12:03", "throughput": 4258.88, "total_tokens": 6530520} {"current_steps": 9995, "total_steps": 38160, "loss": 0.3584, "lr": 0.0009222600037734008, "epoch": 5.238469601677149, "percentage": 26.19, "elapsed_time": "0:25:34", "remaining_time": "1:12:02", "throughput": 4258.92, "total_tokens": 6533560} {"current_steps": 10000, "total_steps": 38160, "loss": 0.4315, "lr": 0.00092213749293112, "epoch": 5.241090146750524, "percentage": 26.21, "elapsed_time": "0:25:34", "remaining_time": "1:12:01", "throughput": 4258.76, "total_tokens": 6535992} {"current_steps": 10005, "total_steps": 38160, "loss": 0.4457, "lr": 0.0009220148937824917, "epoch": 5.2437106918239, "percentage": 26.22, "elapsed_time": "0:25:35", "remaining_time": "1:12:00", "throughput": 4258.88, "total_tokens": 6539416} {"current_steps": 10010, "total_steps": 38160, "loss": 0.4206, "lr": 0.0009218922063531623, "epoch": 5.246331236897275, "percentage": 26.23, "elapsed_time": "0:25:36", "remaining_time": "1:12:00", "throughput": 4259.06, "total_tokens": 6542968} {"current_steps": 10015, "total_steps": 38160, "loss": 0.4583, "lr": 0.0009217694306687963, "epoch": 5.24895178197065, "percentage": 26.24, "elapsed_time": "0:25:37", "remaining_time": "1:11:59", "throughput": 4259.24, "total_tokens": 6546488} {"current_steps": 10020, "total_steps": 38160, "loss": 0.4309, "lr": 0.0009216465667550774, "epoch": 5.251572327044025, "percentage": 26.26, "elapsed_time": "0:25:37", "remaining_time": "1:11:58", "throughput": 4259.22, "total_tokens": 6549400} {"current_steps": 10025, "total_steps": 38160, "loss": 0.3653, "lr": 0.0009215236146377071, "epoch": 5.2541928721174, "percentage": 26.27, "elapsed_time": "0:25:38", "remaining_time": "1:11:57", "throughput": 4259.02, "total_tokens": 6551736} {"current_steps": 10030, "total_steps": 38160, "loss": 0.3758, "lr": 0.0009214005743424056, "epoch": 5.256813417190775, "percentage": 26.28, "elapsed_time": "0:25:39", "remaining_time": "1:11:56", "throughput": 4259.19, "total_tokens": 6555256} {"current_steps": 10035, "total_steps": 38160, "loss": 0.6313, "lr": 0.0009212774458949116, "epoch": 5.259433962264151, "percentage": 26.3, "elapsed_time": "0:25:39", "remaining_time": "1:11:55", "throughput": 4259.02, "total_tokens": 6557624} {"current_steps": 10040, "total_steps": 38160, "loss": 0.4393, "lr": 0.000921154229320982, "epoch": 5.262054507337526, "percentage": 26.31, "elapsed_time": "0:25:40", "remaining_time": "1:11:54", "throughput": 4259.52, "total_tokens": 6562008} {"current_steps": 10045, "total_steps": 38160, "loss": 0.4068, "lr": 0.0009210309246463924, "epoch": 5.264675052410902, "percentage": 26.32, "elapsed_time": "0:25:41", "remaining_time": "1:11:53", "throughput": 4259.34, "total_tokens": 6564376} {"current_steps": 10050, "total_steps": 38160, "loss": 0.5323, "lr": 0.0009209075318969369, "epoch": 5.267295597484277, "percentage": 26.34, "elapsed_time": "0:25:41", "remaining_time": "1:11:52", "throughput": 4259.32, "total_tokens": 6567192} {"current_steps": 10055, "total_steps": 38160, "loss": 0.5932, "lr": 0.0009207840510984276, "epoch": 5.269916142557652, "percentage": 26.35, "elapsed_time": "0:25:42", "remaining_time": "1:11:51", "throughput": 4259.52, "total_tokens": 6570712} {"current_steps": 10060, "total_steps": 38160, "loss": 0.4839, "lr": 0.0009206604822766953, "epoch": 5.272536687631027, "percentage": 26.36, "elapsed_time": "0:25:43", "remaining_time": "1:11:51", "throughput": 4259.76, "total_tokens": 6574424} {"current_steps": 10065, "total_steps": 38160, "loss": 0.5865, "lr": 0.0009205368254575892, "epoch": 5.2751572327044025, "percentage": 26.38, "elapsed_time": "0:25:44", "remaining_time": "1:11:49", "throughput": 4259.64, "total_tokens": 6576920} {"current_steps": 10070, "total_steps": 38160, "loss": 0.4653, "lr": 0.000920413080666977, "epoch": 5.277777777777778, "percentage": 26.39, "elapsed_time": "0:25:44", "remaining_time": "1:11:49", "throughput": 4259.79, "total_tokens": 6580408} {"current_steps": 10075, "total_steps": 38160, "loss": 0.4813, "lr": 0.0009202892479307448, "epoch": 5.280398322851153, "percentage": 26.4, "elapsed_time": "0:25:45", "remaining_time": "1:11:48", "throughput": 4259.98, "total_tokens": 6583928} {"current_steps": 10080, "total_steps": 38160, "loss": 0.4509, "lr": 0.0009201653272747967, "epoch": 5.283018867924528, "percentage": 26.42, "elapsed_time": "0:25:46", "remaining_time": "1:11:47", "throughput": 4260.08, "total_tokens": 6587064} {"current_steps": 10085, "total_steps": 38160, "loss": 0.4531, "lr": 0.0009200413187250558, "epoch": 5.285639412997903, "percentage": 26.43, "elapsed_time": "0:25:47", "remaining_time": "1:11:46", "throughput": 4260.41, "total_tokens": 6591096} {"current_steps": 10090, "total_steps": 38160, "loss": 0.4938, "lr": 0.000919917222307463, "epoch": 5.288259958071279, "percentage": 26.44, "elapsed_time": "0:25:47", "remaining_time": "1:11:45", "throughput": 4260.43, "total_tokens": 6594168} {"current_steps": 10095, "total_steps": 38160, "loss": 0.4878, "lr": 0.000919793038047978, "epoch": 5.290880503144654, "percentage": 26.45, "elapsed_time": "0:25:48", "remaining_time": "1:11:44", "throughput": 4260.53, "total_tokens": 6597432} {"current_steps": 10100, "total_steps": 38160, "loss": 0.4187, "lr": 0.0009196687659725787, "epoch": 5.29350104821803, "percentage": 26.47, "elapsed_time": "0:25:49", "remaining_time": "1:11:44", "throughput": 4260.8, "total_tokens": 6601464} {"current_steps": 10105, "total_steps": 38160, "loss": 0.3815, "lr": 0.0009195444061072612, "epoch": 5.296121593291405, "percentage": 26.48, "elapsed_time": "0:25:50", "remaining_time": "1:11:43", "throughput": 4260.8, "total_tokens": 6604376} {"current_steps": 10110, "total_steps": 38160, "loss": 0.4704, "lr": 0.0009194199584780405, "epoch": 5.29874213836478, "percentage": 26.49, "elapsed_time": "0:25:50", "remaining_time": "1:11:42", "throughput": 4261.06, "total_tokens": 6608184} {"current_steps": 10115, "total_steps": 38160, "loss": 0.4824, "lr": 0.0009192954231109496, "epoch": 5.301362683438155, "percentage": 26.51, "elapsed_time": "0:25:51", "remaining_time": "1:11:42", "throughput": 4261.36, "total_tokens": 6612152} {"current_steps": 10120, "total_steps": 38160, "loss": 0.5781, "lr": 0.0009191708000320396, "epoch": 5.30398322851153, "percentage": 26.52, "elapsed_time": "0:25:52", "remaining_time": "1:11:41", "throughput": 4261.46, "total_tokens": 6615448} {"current_steps": 10125, "total_steps": 38160, "loss": 0.4489, "lr": 0.0009190460892673805, "epoch": 5.306603773584905, "percentage": 26.53, "elapsed_time": "0:25:53", "remaining_time": "1:11:40", "throughput": 4261.64, "total_tokens": 6619000} {"current_steps": 10130, "total_steps": 38160, "loss": 0.3415, "lr": 0.0009189212908430601, "epoch": 5.309224318658281, "percentage": 26.55, "elapsed_time": "0:25:54", "remaining_time": "1:11:40", "throughput": 4262.09, "total_tokens": 6623416} {"current_steps": 10135, "total_steps": 38160, "loss": 0.4512, "lr": 0.0009187964047851851, "epoch": 5.311844863731656, "percentage": 26.56, "elapsed_time": "0:25:54", "remaining_time": "1:11:39", "throughput": 4262.29, "total_tokens": 6626968} {"current_steps": 10140, "total_steps": 38160, "loss": 0.4003, "lr": 0.0009186714311198801, "epoch": 5.314465408805032, "percentage": 26.57, "elapsed_time": "0:25:55", "remaining_time": "1:11:38", "throughput": 4262.28, "total_tokens": 6629912} {"current_steps": 10145, "total_steps": 38160, "loss": 0.4407, "lr": 0.000918546369873288, "epoch": 5.317085953878407, "percentage": 26.59, "elapsed_time": "0:25:56", "remaining_time": "1:11:37", "throughput": 4262.51, "total_tokens": 6633560} {"current_steps": 10150, "total_steps": 38160, "loss": 0.4284, "lr": 0.0009184212210715704, "epoch": 5.319706498951782, "percentage": 26.6, "elapsed_time": "0:25:56", "remaining_time": "1:11:36", "throughput": 4262.59, "total_tokens": 6636760} {"current_steps": 10155, "total_steps": 38160, "loss": 0.3926, "lr": 0.0009182959847409072, "epoch": 5.322327044025157, "percentage": 26.61, "elapsed_time": "0:25:57", "remaining_time": "1:11:35", "throughput": 4262.72, "total_tokens": 6639992} {"current_steps": 10160, "total_steps": 38160, "loss": 0.4852, "lr": 0.0009181706609074959, "epoch": 5.3249475890985325, "percentage": 26.62, "elapsed_time": "0:25:58", "remaining_time": "1:11:34", "throughput": 4262.74, "total_tokens": 6643096} {"current_steps": 10165, "total_steps": 38160, "loss": 0.4444, "lr": 0.0009180452495975531, "epoch": 5.327568134171908, "percentage": 26.64, "elapsed_time": "0:25:59", "remaining_time": "1:11:34", "throughput": 4262.92, "total_tokens": 6646616} {"current_steps": 10170, "total_steps": 38160, "loss": 0.5052, "lr": 0.0009179197508373134, "epoch": 5.330188679245283, "percentage": 26.65, "elapsed_time": "0:25:59", "remaining_time": "1:11:33", "throughput": 4263.02, "total_tokens": 6649848} {"current_steps": 10175, "total_steps": 38160, "loss": 0.4064, "lr": 0.0009177941646530299, "epoch": 5.332809224318658, "percentage": 26.66, "elapsed_time": "0:26:00", "remaining_time": "1:11:32", "throughput": 4262.99, "total_tokens": 6652696} {"current_steps": 10180, "total_steps": 38160, "loss": 0.4521, "lr": 0.0009176684910709733, "epoch": 5.335429769392033, "percentage": 26.68, "elapsed_time": "0:26:01", "remaining_time": "1:11:31", "throughput": 4263.02, "total_tokens": 6655640} {"current_steps": 10185, "total_steps": 38160, "loss": 0.396, "lr": 0.0009175427301174338, "epoch": 5.338050314465409, "percentage": 26.69, "elapsed_time": "0:26:01", "remaining_time": "1:11:30", "throughput": 4263.11, "total_tokens": 6658776} {"current_steps": 10190, "total_steps": 38160, "loss": 0.5795, "lr": 0.0009174168818187183, "epoch": 5.340670859538784, "percentage": 26.7, "elapsed_time": "0:26:02", "remaining_time": "1:11:29", "throughput": 4263.03, "total_tokens": 6661464} {"current_steps": 10195, "total_steps": 38160, "loss": 0.4151, "lr": 0.0009172909462011536, "epoch": 5.34329140461216, "percentage": 26.72, "elapsed_time": "0:26:03", "remaining_time": "1:11:28", "throughput": 4263.02, "total_tokens": 6664280} {"current_steps": 10200, "total_steps": 38160, "loss": 0.5149, "lr": 0.0009171649232910835, "epoch": 5.345911949685535, "percentage": 26.73, "elapsed_time": "0:26:04", "remaining_time": "1:11:27", "throughput": 4263.14, "total_tokens": 6667672} {"current_steps": 10205, "total_steps": 38160, "loss": 0.5786, "lr": 0.0009170388131148707, "epoch": 5.34853249475891, "percentage": 26.74, "elapsed_time": "0:26:04", "remaining_time": "1:11:26", "throughput": 4263.14, "total_tokens": 6670648} {"current_steps": 10210, "total_steps": 38160, "loss": 0.5549, "lr": 0.000916912615698896, "epoch": 5.351153039832285, "percentage": 26.76, "elapsed_time": "0:26:05", "remaining_time": "1:11:25", "throughput": 4263.07, "total_tokens": 6673368} {"current_steps": 10215, "total_steps": 38160, "loss": 0.4429, "lr": 0.0009167863310695585, "epoch": 5.35377358490566, "percentage": 26.77, "elapsed_time": "0:26:06", "remaining_time": "1:11:24", "throughput": 4263.31, "total_tokens": 6677016} {"current_steps": 10220, "total_steps": 38160, "loss": 0.5635, "lr": 0.0009166599592532756, "epoch": 5.356394129979035, "percentage": 26.78, "elapsed_time": "0:26:06", "remaining_time": "1:11:23", "throughput": 4263.37, "total_tokens": 6680152} {"current_steps": 10225, "total_steps": 38160, "loss": 0.4059, "lr": 0.0009165335002764828, "epoch": 5.359014675052411, "percentage": 26.8, "elapsed_time": "0:26:07", "remaining_time": "1:11:23", "throughput": 4264.14, "total_tokens": 6686040} {"current_steps": 10230, "total_steps": 38160, "loss": 0.5144, "lr": 0.0009164069541656337, "epoch": 5.361635220125786, "percentage": 26.81, "elapsed_time": "0:26:08", "remaining_time": "1:11:22", "throughput": 4264.28, "total_tokens": 6689400} {"current_steps": 10235, "total_steps": 38160, "loss": 0.4517, "lr": 0.0009162803209472004, "epoch": 5.364255765199162, "percentage": 26.82, "elapsed_time": "0:26:09", "remaining_time": "1:11:21", "throughput": 4264.28, "total_tokens": 6692376} {"current_steps": 10240, "total_steps": 38160, "loss": 0.4127, "lr": 0.000916153600647673, "epoch": 5.366876310272537, "percentage": 26.83, "elapsed_time": "0:26:10", "remaining_time": "1:11:20", "throughput": 4264.36, "total_tokens": 6695480} {"current_steps": 10245, "total_steps": 38160, "loss": 0.4711, "lr": 0.0009160267932935602, "epoch": 5.369496855345912, "percentage": 26.85, "elapsed_time": "0:26:10", "remaining_time": "1:11:20", "throughput": 4264.42, "total_tokens": 6698680} {"current_steps": 10250, "total_steps": 38160, "loss": 0.4617, "lr": 0.0009158998989113885, "epoch": 5.372117400419287, "percentage": 26.86, "elapsed_time": "0:26:11", "remaining_time": "1:11:19", "throughput": 4264.47, "total_tokens": 6701784} {"current_steps": 10255, "total_steps": 38160, "loss": 0.5377, "lr": 0.0009157729175277028, "epoch": 5.3747379454926625, "percentage": 26.87, "elapsed_time": "0:26:12", "remaining_time": "1:11:18", "throughput": 4264.83, "total_tokens": 6705976} {"current_steps": 10260, "total_steps": 38160, "loss": 0.3522, "lr": 0.0009156458491690662, "epoch": 5.377358490566038, "percentage": 26.89, "elapsed_time": "0:26:13", "remaining_time": "1:11:17", "throughput": 4264.85, "total_tokens": 6708920} {"current_steps": 10265, "total_steps": 38160, "loss": 0.4509, "lr": 0.0009155186938620599, "epoch": 5.379979035639413, "percentage": 26.9, "elapsed_time": "0:26:13", "remaining_time": "1:11:16", "throughput": 4264.85, "total_tokens": 6711864} {"current_steps": 10270, "total_steps": 38160, "loss": 0.4908, "lr": 0.0009153914516332833, "epoch": 5.382599580712788, "percentage": 26.91, "elapsed_time": "0:26:14", "remaining_time": "1:11:15", "throughput": 4264.89, "total_tokens": 6714904} {"current_steps": 10275, "total_steps": 38160, "loss": 0.4165, "lr": 0.000915264122509354, "epoch": 5.385220125786163, "percentage": 26.93, "elapsed_time": "0:26:15", "remaining_time": "1:11:14", "throughput": 4264.85, "total_tokens": 6717752} {"current_steps": 10280, "total_steps": 38160, "loss": 0.4897, "lr": 0.0009151367065169078, "epoch": 5.387840670859539, "percentage": 26.94, "elapsed_time": "0:26:15", "remaining_time": "1:11:13", "throughput": 4264.81, "total_tokens": 6720568} {"current_steps": 10285, "total_steps": 38160, "loss": 0.4085, "lr": 0.0009150092036825989, "epoch": 5.390461215932914, "percentage": 26.95, "elapsed_time": "0:26:16", "remaining_time": "1:11:12", "throughput": 4264.81, "total_tokens": 6723480} {"current_steps": 10290, "total_steps": 38160, "loss": 0.3847, "lr": 0.0009148816140330991, "epoch": 5.3930817610062896, "percentage": 26.97, "elapsed_time": "0:26:17", "remaining_time": "1:11:12", "throughput": 4265.55, "total_tokens": 6729400} {"current_steps": 10295, "total_steps": 38160, "loss": 0.4325, "lr": 0.000914753937595099, "epoch": 5.395702306079665, "percentage": 26.98, "elapsed_time": "0:26:18", "remaining_time": "1:11:11", "throughput": 4265.44, "total_tokens": 6731960} {"current_steps": 10300, "total_steps": 38160, "loss": 0.4409, "lr": 0.0009146261743953068, "epoch": 5.39832285115304, "percentage": 26.99, "elapsed_time": "0:26:18", "remaining_time": "1:11:10", "throughput": 4265.39, "total_tokens": 6734648} {"current_steps": 10305, "total_steps": 38160, "loss": 0.4219, "lr": 0.0009144983244604493, "epoch": 5.400943396226415, "percentage": 27.0, "elapsed_time": "0:26:19", "remaining_time": "1:11:09", "throughput": 4265.34, "total_tokens": 6737368} {"current_steps": 10310, "total_steps": 38160, "loss": 0.6237, "lr": 0.0009143703878172712, "epoch": 5.40356394129979, "percentage": 27.02, "elapsed_time": "0:26:20", "remaining_time": "1:11:08", "throughput": 4265.53, "total_tokens": 6740952} {"current_steps": 10315, "total_steps": 38160, "loss": 0.5113, "lr": 0.0009142423644925353, "epoch": 5.406184486373165, "percentage": 27.03, "elapsed_time": "0:26:20", "remaining_time": "1:11:07", "throughput": 4265.48, "total_tokens": 6743640} {"current_steps": 10320, "total_steps": 38160, "loss": 0.4414, "lr": 0.0009141142545130228, "epoch": 5.408805031446541, "percentage": 27.04, "elapsed_time": "0:26:21", "remaining_time": "1:11:06", "throughput": 4265.39, "total_tokens": 6746264} {"current_steps": 10325, "total_steps": 38160, "loss": 0.4236, "lr": 0.0009139860579055326, "epoch": 5.411425576519916, "percentage": 27.06, "elapsed_time": "0:26:22", "remaining_time": "1:11:05", "throughput": 4265.5, "total_tokens": 6749592} {"current_steps": 10330, "total_steps": 38160, "loss": 0.5489, "lr": 0.0009138577746968821, "epoch": 5.414046121593292, "percentage": 27.07, "elapsed_time": "0:26:23", "remaining_time": "1:11:04", "throughput": 4265.45, "total_tokens": 6752280} {"current_steps": 10335, "total_steps": 38160, "loss": 0.3772, "lr": 0.0009137294049139066, "epoch": 5.416666666666667, "percentage": 27.08, "elapsed_time": "0:26:23", "remaining_time": "1:11:04", "throughput": 4265.68, "total_tokens": 6755960} {"current_steps": 10340, "total_steps": 38160, "loss": 0.4885, "lr": 0.0009136009485834598, "epoch": 5.419287211740042, "percentage": 27.1, "elapsed_time": "0:26:24", "remaining_time": "1:11:03", "throughput": 4266.07, "total_tokens": 6760312} {"current_steps": 10345, "total_steps": 38160, "loss": 0.4416, "lr": 0.0009134724057324131, "epoch": 5.421907756813417, "percentage": 27.11, "elapsed_time": "0:26:25", "remaining_time": "1:11:02", "throughput": 4265.86, "total_tokens": 6762616} {"current_steps": 10350, "total_steps": 38160, "loss": 0.4981, "lr": 0.0009133437763876562, "epoch": 5.4245283018867925, "percentage": 27.12, "elapsed_time": "0:26:26", "remaining_time": "1:11:01", "throughput": 4265.99, "total_tokens": 6766040} {"current_steps": 10355, "total_steps": 38160, "loss": 0.4289, "lr": 0.000913215060576097, "epoch": 5.427148846960168, "percentage": 27.14, "elapsed_time": "0:26:26", "remaining_time": "1:11:00", "throughput": 4265.87, "total_tokens": 6768568} {"current_steps": 10360, "total_steps": 38160, "loss": 0.476, "lr": 0.0009130862583246613, "epoch": 5.429769392033543, "percentage": 27.15, "elapsed_time": "0:26:27", "remaining_time": "1:10:59", "throughput": 4265.8, "total_tokens": 6771288} {"current_steps": 10365, "total_steps": 38160, "loss": 0.5702, "lr": 0.0009129573696602932, "epoch": 5.432389937106918, "percentage": 27.16, "elapsed_time": "0:26:28", "remaining_time": "1:10:58", "throughput": 4265.75, "total_tokens": 6774104} {"current_steps": 10370, "total_steps": 38160, "loss": 0.4235, "lr": 0.0009128283946099546, "epoch": 5.435010482180293, "percentage": 27.18, "elapsed_time": "0:26:28", "remaining_time": "1:10:57", "throughput": 4265.81, "total_tokens": 6777240} {"current_steps": 10375, "total_steps": 38160, "loss": 0.364, "lr": 0.0009126993332006256, "epoch": 5.437631027253669, "percentage": 27.19, "elapsed_time": "0:26:29", "remaining_time": "1:10:56", "throughput": 4265.98, "total_tokens": 6780856} {"current_steps": 10380, "total_steps": 38160, "loss": 0.6181, "lr": 0.0009125701854593045, "epoch": 5.440251572327044, "percentage": 27.2, "elapsed_time": "0:26:30", "remaining_time": "1:10:55", "throughput": 4265.97, "total_tokens": 6783736} {"current_steps": 10385, "total_steps": 38160, "loss": 0.4893, "lr": 0.0009124409514130073, "epoch": 5.4428721174004195, "percentage": 27.21, "elapsed_time": "0:26:31", "remaining_time": "1:10:55", "throughput": 4266.5, "total_tokens": 6788472} {"current_steps": 10390, "total_steps": 38160, "loss": 0.6174, "lr": 0.0009123116310887686, "epoch": 5.445492662473795, "percentage": 27.23, "elapsed_time": "0:26:31", "remaining_time": "1:10:54", "throughput": 4266.4, "total_tokens": 6791032} {"current_steps": 10395, "total_steps": 38160, "loss": 0.5302, "lr": 0.0009121822245136404, "epoch": 5.44811320754717, "percentage": 27.24, "elapsed_time": "0:26:32", "remaining_time": "1:10:53", "throughput": 4266.61, "total_tokens": 6794680} {"current_steps": 10400, "total_steps": 38160, "loss": 0.4262, "lr": 0.0009120527317146934, "epoch": 5.450733752620545, "percentage": 27.25, "elapsed_time": "0:26:33", "remaining_time": "1:10:52", "throughput": 4266.72, "total_tokens": 6798072} {"current_steps": 10405, "total_steps": 38160, "loss": 0.7979, "lr": 0.0009119231527190158, "epoch": 5.45335429769392, "percentage": 27.27, "elapsed_time": "0:26:34", "remaining_time": "1:10:52", "throughput": 4267.08, "total_tokens": 6802296} {"current_steps": 10410, "total_steps": 38160, "loss": 0.5096, "lr": 0.0009117934875537141, "epoch": 5.455974842767295, "percentage": 27.28, "elapsed_time": "0:26:35", "remaining_time": "1:10:51", "throughput": 4267.58, "total_tokens": 6807000} {"current_steps": 10415, "total_steps": 38160, "loss": 0.5165, "lr": 0.0009116637362459129, "epoch": 5.4585953878406706, "percentage": 27.29, "elapsed_time": "0:26:35", "remaining_time": "1:10:50", "throughput": 4267.59, "total_tokens": 6809944} {"current_steps": 10420, "total_steps": 38160, "loss": 0.399, "lr": 0.0009115338988227546, "epoch": 5.461215932914046, "percentage": 27.31, "elapsed_time": "0:26:36", "remaining_time": "1:10:50", "throughput": 4267.62, "total_tokens": 6812984} {"current_steps": 10425, "total_steps": 38160, "loss": 0.4316, "lr": 0.0009114039753113997, "epoch": 5.463836477987422, "percentage": 27.32, "elapsed_time": "0:26:37", "remaining_time": "1:10:49", "throughput": 4267.85, "total_tokens": 6816728} {"current_steps": 10430, "total_steps": 38160, "loss": 0.6604, "lr": 0.0009112739657390265, "epoch": 5.466457023060797, "percentage": 27.33, "elapsed_time": "0:26:37", "remaining_time": "1:10:48", "throughput": 4267.75, "total_tokens": 6819352} {"current_steps": 10435, "total_steps": 38160, "loss": 0.6169, "lr": 0.0009111438701328319, "epoch": 5.469077568134172, "percentage": 27.35, "elapsed_time": "0:26:38", "remaining_time": "1:10:47", "throughput": 4267.88, "total_tokens": 6822776} {"current_steps": 10440, "total_steps": 38160, "loss": 0.4206, "lr": 0.0009110136885200302, "epoch": 5.471698113207547, "percentage": 27.36, "elapsed_time": "0:26:39", "remaining_time": "1:10:46", "throughput": 4267.97, "total_tokens": 6826040} {"current_steps": 10445, "total_steps": 38160, "loss": 0.4876, "lr": 0.000910883420927854, "epoch": 5.4743186582809225, "percentage": 27.37, "elapsed_time": "0:26:40", "remaining_time": "1:10:45", "throughput": 4268.18, "total_tokens": 6829752} {"current_steps": 10450, "total_steps": 38160, "loss": 0.4001, "lr": 0.0009107530673835536, "epoch": 5.476939203354298, "percentage": 27.38, "elapsed_time": "0:26:40", "remaining_time": "1:10:44", "throughput": 4268.18, "total_tokens": 6832728} {"current_steps": 10455, "total_steps": 38160, "loss": 0.4229, "lr": 0.0009106226279143979, "epoch": 5.479559748427673, "percentage": 27.4, "elapsed_time": "0:26:41", "remaining_time": "1:10:43", "throughput": 4268.01, "total_tokens": 6835096} {"current_steps": 10460, "total_steps": 38160, "loss": 0.3768, "lr": 0.0009104921025476728, "epoch": 5.482180293501048, "percentage": 27.41, "elapsed_time": "0:26:42", "remaining_time": "1:10:42", "throughput": 4267.88, "total_tokens": 6837592} {"current_steps": 10465, "total_steps": 38160, "loss": 0.5051, "lr": 0.0009103614913106832, "epoch": 5.484800838574423, "percentage": 27.42, "elapsed_time": "0:26:42", "remaining_time": "1:10:41", "throughput": 4267.93, "total_tokens": 6840664} {"current_steps": 10470, "total_steps": 38160, "loss": 0.5292, "lr": 0.0009102307942307511, "epoch": 5.487421383647799, "percentage": 27.44, "elapsed_time": "0:26:43", "remaining_time": "1:10:40", "throughput": 4268.06, "total_tokens": 6843992} {"current_steps": 10475, "total_steps": 38160, "loss": 0.4982, "lr": 0.000910100011335217, "epoch": 5.490041928721174, "percentage": 27.45, "elapsed_time": "0:26:44", "remaining_time": "1:10:39", "throughput": 4267.88, "total_tokens": 6846296} {"current_steps": 10480, "total_steps": 38160, "loss": 0.5054, "lr": 0.0009099691426514392, "epoch": 5.4926624737945495, "percentage": 27.46, "elapsed_time": "0:26:44", "remaining_time": "1:10:38", "throughput": 4268.04, "total_tokens": 6849784} {"current_steps": 10485, "total_steps": 38160, "loss": 0.6087, "lr": 0.0009098381882067941, "epoch": 5.495283018867925, "percentage": 27.48, "elapsed_time": "0:26:45", "remaining_time": "1:10:38", "throughput": 4268.46, "total_tokens": 6854296} {"current_steps": 10490, "total_steps": 38160, "loss": 0.5438, "lr": 0.0009097071480286756, "epoch": 5.4979035639413, "percentage": 27.49, "elapsed_time": "0:26:46", "remaining_time": "1:10:37", "throughput": 4268.54, "total_tokens": 6857528} {"current_steps": 10495, "total_steps": 38160, "loss": 0.4728, "lr": 0.0009095760221444959, "epoch": 5.500524109014675, "percentage": 27.5, "elapsed_time": "0:26:47", "remaining_time": "1:10:36", "throughput": 4268.71, "total_tokens": 6861112} {"current_steps": 10500, "total_steps": 38160, "loss": 0.406, "lr": 0.000909444810581685, "epoch": 5.50314465408805, "percentage": 27.52, "elapsed_time": "0:26:48", "remaining_time": "1:10:36", "throughput": 4269.02, "total_tokens": 6865144} {"current_steps": 10505, "total_steps": 38160, "loss": 0.5627, "lr": 0.000909313513367691, "epoch": 5.505765199161425, "percentage": 27.53, "elapsed_time": "0:26:49", "remaining_time": "1:10:35", "throughput": 4269.48, "total_tokens": 6869720} {"current_steps": 10510, "total_steps": 38160, "loss": 0.4775, "lr": 0.0009091821305299798, "epoch": 5.5083857442348005, "percentage": 27.54, "elapsed_time": "0:26:49", "remaining_time": "1:10:34", "throughput": 4269.48, "total_tokens": 6872696} {"current_steps": 10515, "total_steps": 38160, "loss": 0.4248, "lr": 0.000909050662096035, "epoch": 5.511006289308176, "percentage": 27.56, "elapsed_time": "0:26:50", "remaining_time": "1:10:33", "throughput": 4269.41, "total_tokens": 6875384} {"current_steps": 10520, "total_steps": 38160, "loss": 0.3664, "lr": 0.0009089191080933583, "epoch": 5.513626834381551, "percentage": 27.57, "elapsed_time": "0:26:51", "remaining_time": "1:10:33", "throughput": 4269.7, "total_tokens": 6879352} {"current_steps": 10525, "total_steps": 38160, "loss": 0.4417, "lr": 0.0009087874685494695, "epoch": 5.516247379454927, "percentage": 27.58, "elapsed_time": "0:26:51", "remaining_time": "1:10:32", "throughput": 4269.96, "total_tokens": 6883128} {"current_steps": 10530, "total_steps": 38160, "loss": 0.4209, "lr": 0.0009086557434919059, "epoch": 5.518867924528302, "percentage": 27.59, "elapsed_time": "0:26:52", "remaining_time": "1:10:31", "throughput": 4270.0, "total_tokens": 6886200} {"current_steps": 10535, "total_steps": 38160, "loss": 0.3855, "lr": 0.0009085239329482231, "epoch": 5.521488469601677, "percentage": 27.61, "elapsed_time": "0:26:53", "remaining_time": "1:10:30", "throughput": 4270.05, "total_tokens": 6889336} {"current_steps": 10540, "total_steps": 38160, "loss": 0.5176, "lr": 0.0009083920369459941, "epoch": 5.524109014675052, "percentage": 27.62, "elapsed_time": "0:26:54", "remaining_time": "1:10:30", "throughput": 4270.3, "total_tokens": 6893208} {"current_steps": 10545, "total_steps": 38160, "loss": 0.4688, "lr": 0.00090826005551281, "epoch": 5.526729559748428, "percentage": 27.63, "elapsed_time": "0:26:55", "remaining_time": "1:10:30", "throughput": 4271.2, "total_tokens": 6899896} {"current_steps": 10550, "total_steps": 38160, "loss": 0.4948, "lr": 0.0009081279886762802, "epoch": 5.529350104821803, "percentage": 27.65, "elapsed_time": "0:26:56", "remaining_time": "1:10:29", "throughput": 4271.36, "total_tokens": 6903416} {"current_steps": 10555, "total_steps": 38160, "loss": 0.4657, "lr": 0.0009079958364640313, "epoch": 5.531970649895178, "percentage": 27.66, "elapsed_time": "0:26:56", "remaining_time": "1:10:28", "throughput": 4271.48, "total_tokens": 6906776} {"current_steps": 10560, "total_steps": 38160, "loss": 0.4397, "lr": 0.0009078635989037081, "epoch": 5.534591194968553, "percentage": 27.67, "elapsed_time": "0:26:57", "remaining_time": "1:10:27", "throughput": 4271.47, "total_tokens": 6909784} {"current_steps": 10565, "total_steps": 38160, "loss": 0.5912, "lr": 0.000907731276022973, "epoch": 5.537211740041929, "percentage": 27.69, "elapsed_time": "0:26:58", "remaining_time": "1:10:27", "throughput": 4271.51, "total_tokens": 6912856} {"current_steps": 10570, "total_steps": 38160, "loss": 0.7328, "lr": 0.0009075988678495066, "epoch": 5.539832285115304, "percentage": 27.7, "elapsed_time": "0:26:59", "remaining_time": "1:10:26", "throughput": 4271.56, "total_tokens": 6915896} {"current_steps": 10575, "total_steps": 38160, "loss": 0.444, "lr": 0.0009074663744110073, "epoch": 5.5424528301886795, "percentage": 27.71, "elapsed_time": "0:26:59", "remaining_time": "1:10:25", "throughput": 4271.54, "total_tokens": 6918744} {"current_steps": 10580, "total_steps": 38160, "loss": 0.3911, "lr": 0.0009073337957351911, "epoch": 5.545073375262055, "percentage": 27.73, "elapsed_time": "0:27:00", "remaining_time": "1:10:24", "throughput": 4271.51, "total_tokens": 6921528} {"current_steps": 10585, "total_steps": 38160, "loss": 0.5298, "lr": 0.0009072011318497919, "epoch": 5.54769392033543, "percentage": 27.74, "elapsed_time": "0:27:01", "remaining_time": "1:10:23", "throughput": 4271.52, "total_tokens": 6924504} {"current_steps": 10590, "total_steps": 38160, "loss": 0.4389, "lr": 0.0009070683827825615, "epoch": 5.550314465408805, "percentage": 27.75, "elapsed_time": "0:27:01", "remaining_time": "1:10:22", "throughput": 4271.63, "total_tokens": 6927832} {"current_steps": 10595, "total_steps": 38160, "loss": 0.5439, "lr": 0.0009069355485612695, "epoch": 5.55293501048218, "percentage": 27.76, "elapsed_time": "0:27:02", "remaining_time": "1:10:21", "throughput": 4271.54, "total_tokens": 6930520} {"current_steps": 10600, "total_steps": 38160, "loss": 0.4478, "lr": 0.0009068026292137034, "epoch": 5.555555555555555, "percentage": 27.78, "elapsed_time": "0:27:03", "remaining_time": "1:10:21", "throughput": 4272.16, "total_tokens": 6935736} {"current_steps": 10605, "total_steps": 38160, "loss": 0.4281, "lr": 0.0009066696247676682, "epoch": 5.5581761006289305, "percentage": 27.79, "elapsed_time": "0:27:04", "remaining_time": "1:10:20", "throughput": 4272.17, "total_tokens": 6938744} {"current_steps": 10610, "total_steps": 38160, "loss": 0.4111, "lr": 0.0009065365352509871, "epoch": 5.560796645702306, "percentage": 27.8, "elapsed_time": "0:27:04", "remaining_time": "1:10:19", "throughput": 4272.23, "total_tokens": 6941848} {"current_steps": 10615, "total_steps": 38160, "loss": 0.4999, "lr": 0.0009064033606915008, "epoch": 5.563417190775681, "percentage": 27.82, "elapsed_time": "0:27:05", "remaining_time": "1:10:18", "throughput": 4272.16, "total_tokens": 6944504} {"current_steps": 10620, "total_steps": 38160, "loss": 0.5342, "lr": 0.000906270101117068, "epoch": 5.566037735849057, "percentage": 27.83, "elapsed_time": "0:27:06", "remaining_time": "1:10:17", "throughput": 4272.48, "total_tokens": 6948632} {"current_steps": 10625, "total_steps": 38160, "loss": 0.4253, "lr": 0.0009061367565555649, "epoch": 5.568658280922432, "percentage": 27.84, "elapsed_time": "0:27:07", "remaining_time": "1:10:16", "throughput": 4272.47, "total_tokens": 6951672} {"current_steps": 10630, "total_steps": 38160, "loss": 0.5009, "lr": 0.000906003327034886, "epoch": 5.571278825995807, "percentage": 27.86, "elapsed_time": "0:27:07", "remaining_time": "1:10:15", "throughput": 4272.76, "total_tokens": 6955544} {"current_steps": 10635, "total_steps": 38160, "loss": 0.4987, "lr": 0.0009058698125829428, "epoch": 5.573899371069182, "percentage": 27.87, "elapsed_time": "0:27:08", "remaining_time": "1:10:15", "throughput": 4272.82, "total_tokens": 6958712} {"current_steps": 10640, "total_steps": 38160, "loss": 0.4114, "lr": 0.0009057362132276653, "epoch": 5.576519916142558, "percentage": 27.88, "elapsed_time": "0:27:09", "remaining_time": "1:10:13", "throughput": 4272.72, "total_tokens": 6961304} {"current_steps": 10645, "total_steps": 38160, "loss": 0.5046, "lr": 0.0009056025289970009, "epoch": 5.579140461215933, "percentage": 27.9, "elapsed_time": "0:27:09", "remaining_time": "1:10:12", "throughput": 4272.58, "total_tokens": 6963704} {"current_steps": 10650, "total_steps": 38160, "loss": 0.5066, "lr": 0.0009054687599189148, "epoch": 5.581761006289308, "percentage": 27.91, "elapsed_time": "0:27:10", "remaining_time": "1:10:11", "throughput": 4272.53, "total_tokens": 6966488} {"current_steps": 10655, "total_steps": 38160, "loss": 0.7508, "lr": 0.0009053349060213899, "epoch": 5.584381551362683, "percentage": 27.92, "elapsed_time": "0:27:11", "remaining_time": "1:10:11", "throughput": 4272.8, "total_tokens": 6970360} {"current_steps": 10660, "total_steps": 38160, "loss": 0.5078, "lr": 0.0009052009673324269, "epoch": 5.587002096436059, "percentage": 27.94, "elapsed_time": "0:27:11", "remaining_time": "1:10:10", "throughput": 4272.7, "total_tokens": 6972952} {"current_steps": 10665, "total_steps": 38160, "loss": 0.3782, "lr": 0.0009050669438800445, "epoch": 5.589622641509434, "percentage": 27.95, "elapsed_time": "0:27:12", "remaining_time": "1:10:09", "throughput": 4272.97, "total_tokens": 6976888} {"current_steps": 10670, "total_steps": 38160, "loss": 0.576, "lr": 0.0009049328356922786, "epoch": 5.5922431865828095, "percentage": 27.96, "elapsed_time": "0:27:13", "remaining_time": "1:10:08", "throughput": 4272.92, "total_tokens": 6979608} {"current_steps": 10675, "total_steps": 38160, "loss": 0.5047, "lr": 0.0009047986427971831, "epoch": 5.594863731656185, "percentage": 27.97, "elapsed_time": "0:27:14", "remaining_time": "1:10:07", "throughput": 4273.25, "total_tokens": 6983704} {"current_steps": 10680, "total_steps": 38160, "loss": 0.6341, "lr": 0.0009046643652228297, "epoch": 5.59748427672956, "percentage": 27.99, "elapsed_time": "0:27:14", "remaining_time": "1:10:06", "throughput": 4273.3, "total_tokens": 6986808} {"current_steps": 10685, "total_steps": 38160, "loss": 0.5021, "lr": 0.0009045300029973079, "epoch": 5.600104821802935, "percentage": 28.0, "elapsed_time": "0:27:15", "remaining_time": "1:10:05", "throughput": 4273.3, "total_tokens": 6989784} {"current_steps": 10690, "total_steps": 38160, "loss": 0.3977, "lr": 0.0009043955561487245, "epoch": 5.60272536687631, "percentage": 28.01, "elapsed_time": "0:27:16", "remaining_time": "1:10:05", "throughput": 4273.37, "total_tokens": 6992952} {"current_steps": 10695, "total_steps": 38160, "loss": 0.4012, "lr": 0.0009042610247052044, "epoch": 5.605345911949685, "percentage": 28.03, "elapsed_time": "0:27:17", "remaining_time": "1:10:04", "throughput": 4273.42, "total_tokens": 6996056} {"current_steps": 10700, "total_steps": 38160, "loss": 0.4507, "lr": 0.0009041264086948899, "epoch": 5.6079664570230605, "percentage": 28.04, "elapsed_time": "0:27:17", "remaining_time": "1:10:03", "throughput": 4273.67, "total_tokens": 6999960} {"current_steps": 10705, "total_steps": 38160, "loss": 0.4946, "lr": 0.0009039917081459414, "epoch": 5.610587002096436, "percentage": 28.05, "elapsed_time": "0:27:18", "remaining_time": "1:10:02", "throughput": 4273.86, "total_tokens": 7003608} {"current_steps": 10710, "total_steps": 38160, "loss": 0.4232, "lr": 0.0009038569230865363, "epoch": 5.613207547169811, "percentage": 28.07, "elapsed_time": "0:27:19", "remaining_time": "1:10:01", "throughput": 4273.92, "total_tokens": 7006680} {"current_steps": 10715, "total_steps": 38160, "loss": 0.4802, "lr": 0.0009037220535448705, "epoch": 5.615828092243187, "percentage": 28.08, "elapsed_time": "0:27:20", "remaining_time": "1:10:00", "throughput": 4273.88, "total_tokens": 7009592} {"current_steps": 10720, "total_steps": 38160, "loss": 0.4115, "lr": 0.0009035870995491571, "epoch": 5.618448637316562, "percentage": 28.09, "elapsed_time": "0:27:20", "remaining_time": "1:09:59", "throughput": 4273.73, "total_tokens": 7011960} {"current_steps": 10725, "total_steps": 38160, "loss": 0.4254, "lr": 0.0009034520611276265, "epoch": 5.621069182389937, "percentage": 28.11, "elapsed_time": "0:27:21", "remaining_time": "1:09:58", "throughput": 4273.86, "total_tokens": 7015384} {"current_steps": 10730, "total_steps": 38160, "loss": 0.5356, "lr": 0.0009033169383085278, "epoch": 5.623689727463312, "percentage": 28.12, "elapsed_time": "0:27:22", "remaining_time": "1:09:58", "throughput": 4274.31, "total_tokens": 7019928} {"current_steps": 10735, "total_steps": 38160, "loss": 0.4037, "lr": 0.0009031817311201268, "epoch": 5.626310272536688, "percentage": 28.13, "elapsed_time": "0:27:23", "remaining_time": "1:09:57", "throughput": 4274.45, "total_tokens": 7023384} {"current_steps": 10740, "total_steps": 38160, "loss": 0.4207, "lr": 0.0009030464395907074, "epoch": 5.628930817610063, "percentage": 28.14, "elapsed_time": "0:27:23", "remaining_time": "1:09:56", "throughput": 4274.44, "total_tokens": 7026296} {"current_steps": 10745, "total_steps": 38160, "loss": 0.3764, "lr": 0.0009029110637485711, "epoch": 5.631551362683438, "percentage": 28.16, "elapsed_time": "0:27:24", "remaining_time": "1:09:55", "throughput": 4274.46, "total_tokens": 7029304} {"current_steps": 10750, "total_steps": 38160, "loss": 0.3777, "lr": 0.0009027756036220368, "epoch": 5.634171907756813, "percentage": 28.17, "elapsed_time": "0:27:25", "remaining_time": "1:09:54", "throughput": 4274.38, "total_tokens": 7031960} {"current_steps": 10755, "total_steps": 38160, "loss": 0.4087, "lr": 0.0009026400592394415, "epoch": 5.636792452830189, "percentage": 28.18, "elapsed_time": "0:27:25", "remaining_time": "1:09:53", "throughput": 4274.38, "total_tokens": 7035000} {"current_steps": 10760, "total_steps": 38160, "loss": 0.46, "lr": 0.0009025044306291393, "epoch": 5.639412997903564, "percentage": 28.2, "elapsed_time": "0:27:26", "remaining_time": "1:09:53", "throughput": 4274.47, "total_tokens": 7038392} {"current_steps": 10765, "total_steps": 38160, "loss": 0.4294, "lr": 0.0009023687178195022, "epoch": 5.6420335429769395, "percentage": 28.21, "elapsed_time": "0:27:27", "remaining_time": "1:09:52", "throughput": 4274.54, "total_tokens": 7041528} {"current_steps": 10770, "total_steps": 38160, "loss": 0.3869, "lr": 0.0009022329208389196, "epoch": 5.644654088050315, "percentage": 28.22, "elapsed_time": "0:27:28", "remaining_time": "1:09:51", "throughput": 4274.78, "total_tokens": 7045304} {"current_steps": 10775, "total_steps": 38160, "loss": 0.4966, "lr": 0.000902097039715799, "epoch": 5.64727463312369, "percentage": 28.24, "elapsed_time": "0:27:29", "remaining_time": "1:09:51", "throughput": 4275.23, "total_tokens": 7049880} {"current_steps": 10780, "total_steps": 38160, "loss": 0.3368, "lr": 0.0009019610744785651, "epoch": 5.649895178197065, "percentage": 28.25, "elapsed_time": "0:27:29", "remaining_time": "1:09:49", "throughput": 4275.08, "total_tokens": 7052312} {"current_steps": 10785, "total_steps": 38160, "loss": 0.3918, "lr": 0.0009018250251556603, "epoch": 5.65251572327044, "percentage": 28.26, "elapsed_time": "0:27:30", "remaining_time": "1:09:48", "throughput": 4275.15, "total_tokens": 7055448} {"current_steps": 10790, "total_steps": 38160, "loss": 0.4923, "lr": 0.0009016888917755445, "epoch": 5.655136268343815, "percentage": 28.28, "elapsed_time": "0:27:31", "remaining_time": "1:09:48", "throughput": 4275.17, "total_tokens": 7058520} {"current_steps": 10795, "total_steps": 38160, "loss": 0.3836, "lr": 0.0009015526743666951, "epoch": 5.6577568134171905, "percentage": 28.29, "elapsed_time": "0:27:31", "remaining_time": "1:09:47", "throughput": 4275.1, "total_tokens": 7061208} {"current_steps": 10800, "total_steps": 38160, "loss": 0.3714, "lr": 0.0009014163729576074, "epoch": 5.660377358490566, "percentage": 28.3, "elapsed_time": "0:27:32", "remaining_time": "1:09:46", "throughput": 4275.37, "total_tokens": 7065080} {"current_steps": 10805, "total_steps": 38160, "loss": 0.4087, "lr": 0.0009012799875767943, "epoch": 5.662997903563941, "percentage": 28.31, "elapsed_time": "0:27:33", "remaining_time": "1:09:45", "throughput": 4275.32, "total_tokens": 7067864} {"current_steps": 10810, "total_steps": 38160, "loss": 0.4081, "lr": 0.0009011435182527856, "epoch": 5.665618448637317, "percentage": 28.33, "elapsed_time": "0:27:33", "remaining_time": "1:09:44", "throughput": 4275.13, "total_tokens": 7070200} {"current_steps": 10815, "total_steps": 38160, "loss": 0.4394, "lr": 0.0009010069650141295, "epoch": 5.668238993710692, "percentage": 28.34, "elapsed_time": "0:27:34", "remaining_time": "1:09:43", "throughput": 4275.18, "total_tokens": 7073304} {"current_steps": 10820, "total_steps": 38160, "loss": 0.3678, "lr": 0.0009008703278893913, "epoch": 5.670859538784067, "percentage": 28.35, "elapsed_time": "0:27:35", "remaining_time": "1:09:42", "throughput": 4275.36, "total_tokens": 7076824} {"current_steps": 10825, "total_steps": 38160, "loss": 0.6282, "lr": 0.0009007336069071537, "epoch": 5.673480083857442, "percentage": 28.37, "elapsed_time": "0:27:36", "remaining_time": "1:09:41", "throughput": 4275.57, "total_tokens": 7080504} {"current_steps": 10830, "total_steps": 38160, "loss": 0.4127, "lr": 0.0009005968020960175, "epoch": 5.676100628930818, "percentage": 28.38, "elapsed_time": "0:27:36", "remaining_time": "1:09:40", "throughput": 4275.41, "total_tokens": 7082840} {"current_steps": 10835, "total_steps": 38160, "loss": 0.514, "lr": 0.0009004599134846004, "epoch": 5.678721174004193, "percentage": 28.39, "elapsed_time": "0:27:37", "remaining_time": "1:09:39", "throughput": 4275.46, "total_tokens": 7086008} {"current_steps": 10840, "total_steps": 38160, "loss": 0.456, "lr": 0.0009003229411015382, "epoch": 5.681341719077568, "percentage": 28.41, "elapsed_time": "0:27:38", "remaining_time": "1:09:38", "throughput": 4275.42, "total_tokens": 7088760} {"current_steps": 10845, "total_steps": 38160, "loss": 0.5384, "lr": 0.0009001858849754838, "epoch": 5.683962264150943, "percentage": 28.42, "elapsed_time": "0:27:38", "remaining_time": "1:09:37", "throughput": 4275.4, "total_tokens": 7091672} {"current_steps": 10850, "total_steps": 38160, "loss": 0.4719, "lr": 0.0009000487451351078, "epoch": 5.686582809224319, "percentage": 28.43, "elapsed_time": "0:27:39", "remaining_time": "1:09:37", "throughput": 4275.69, "total_tokens": 7095608} {"current_steps": 10855, "total_steps": 38160, "loss": 0.4353, "lr": 0.0008999115216090985, "epoch": 5.689203354297694, "percentage": 28.45, "elapsed_time": "0:27:40", "remaining_time": "1:09:36", "throughput": 4275.64, "total_tokens": 7098456} {"current_steps": 10860, "total_steps": 38160, "loss": 0.4764, "lr": 0.0008997742144261612, "epoch": 5.6918238993710695, "percentage": 28.46, "elapsed_time": "0:27:40", "remaining_time": "1:09:35", "throughput": 4275.63, "total_tokens": 7101304} {"current_steps": 10865, "total_steps": 38160, "loss": 0.4442, "lr": 0.000899636823615019, "epoch": 5.694444444444445, "percentage": 28.47, "elapsed_time": "0:27:41", "remaining_time": "1:09:34", "throughput": 4275.9, "total_tokens": 7105176} {"current_steps": 10870, "total_steps": 38160, "loss": 0.7117, "lr": 0.0008994993492044127, "epoch": 5.69706498951782, "percentage": 28.49, "elapsed_time": "0:27:42", "remaining_time": "1:09:33", "throughput": 4276.12, "total_tokens": 7109080} {"current_steps": 10875, "total_steps": 38160, "loss": 0.5641, "lr": 0.0008993617912231003, "epoch": 5.699685534591195, "percentage": 28.5, "elapsed_time": "0:27:43", "remaining_time": "1:09:33", "throughput": 4276.25, "total_tokens": 7112504} {"current_steps": 10880, "total_steps": 38160, "loss": 0.478, "lr": 0.0008992241496998572, "epoch": 5.70230607966457, "percentage": 28.51, "elapsed_time": "0:27:43", "remaining_time": "1:09:32", "throughput": 4276.34, "total_tokens": 7115768} {"current_steps": 10885, "total_steps": 38160, "loss": 0.5118, "lr": 0.0008990864246634767, "epoch": 5.704926624737945, "percentage": 28.52, "elapsed_time": "0:27:44", "remaining_time": "1:09:31", "throughput": 4276.35, "total_tokens": 7118712} {"current_steps": 10890, "total_steps": 38160, "loss": 0.3243, "lr": 0.0008989486161427691, "epoch": 5.7075471698113205, "percentage": 28.54, "elapsed_time": "0:27:45", "remaining_time": "1:09:30", "throughput": 4276.32, "total_tokens": 7121624} {"current_steps": 10895, "total_steps": 38160, "loss": 0.663, "lr": 0.0008988107241665624, "epoch": 5.710167714884696, "percentage": 28.55, "elapsed_time": "0:27:46", "remaining_time": "1:09:29", "throughput": 4276.36, "total_tokens": 7124696} {"current_steps": 10900, "total_steps": 38160, "loss": 0.6733, "lr": 0.0008986727487637022, "epoch": 5.712788259958071, "percentage": 28.56, "elapsed_time": "0:27:46", "remaining_time": "1:09:28", "throughput": 4276.52, "total_tokens": 7128216} {"current_steps": 10905, "total_steps": 38160, "loss": 0.5192, "lr": 0.0008985346899630513, "epoch": 5.715408805031447, "percentage": 28.58, "elapsed_time": "0:27:47", "remaining_time": "1:09:27", "throughput": 4276.48, "total_tokens": 7131064} {"current_steps": 10910, "total_steps": 38160, "loss": 0.5687, "lr": 0.0008983965477934899, "epoch": 5.718029350104822, "percentage": 28.59, "elapsed_time": "0:27:48", "remaining_time": "1:09:26", "throughput": 4276.41, "total_tokens": 7133784} {"current_steps": 10915, "total_steps": 38160, "loss": 0.4093, "lr": 0.0008982583222839158, "epoch": 5.720649895178197, "percentage": 28.6, "elapsed_time": "0:27:48", "remaining_time": "1:09:25", "throughput": 4276.64, "total_tokens": 7137496} {"current_steps": 10920, "total_steps": 38160, "loss": 0.5077, "lr": 0.0008981200134632444, "epoch": 5.723270440251572, "percentage": 28.62, "elapsed_time": "0:27:49", "remaining_time": "1:09:25", "throughput": 4276.69, "total_tokens": 7140792} {"current_steps": 10925, "total_steps": 38160, "loss": 0.3682, "lr": 0.000897981621360408, "epoch": 5.725890985324948, "percentage": 28.63, "elapsed_time": "0:27:50", "remaining_time": "1:09:24", "throughput": 4276.7, "total_tokens": 7143768} {"current_steps": 10930, "total_steps": 38160, "loss": 0.432, "lr": 0.0008978431460043569, "epoch": 5.728511530398323, "percentage": 28.64, "elapsed_time": "0:27:51", "remaining_time": "1:09:23", "throughput": 4276.72, "total_tokens": 7146904} {"current_steps": 10935, "total_steps": 38160, "loss": 0.4631, "lr": 0.0008977045874240585, "epoch": 5.731132075471698, "percentage": 28.66, "elapsed_time": "0:27:51", "remaining_time": "1:09:22", "throughput": 4276.7, "total_tokens": 7149816} {"current_steps": 10940, "total_steps": 38160, "loss": 0.4463, "lr": 0.0008975659456484977, "epoch": 5.733752620545073, "percentage": 28.67, "elapsed_time": "0:27:52", "remaining_time": "1:09:21", "throughput": 4276.68, "total_tokens": 7152760} {"current_steps": 10945, "total_steps": 38160, "loss": 0.5189, "lr": 0.0008974272207066767, "epoch": 5.736373165618449, "percentage": 28.68, "elapsed_time": "0:27:53", "remaining_time": "1:09:20", "throughput": 4276.64, "total_tokens": 7155576} {"current_steps": 10950, "total_steps": 38160, "loss": 0.5425, "lr": 0.0008972884126276152, "epoch": 5.738993710691824, "percentage": 28.69, "elapsed_time": "0:27:53", "remaining_time": "1:09:19", "throughput": 4276.38, "total_tokens": 7157688} {"current_steps": 10955, "total_steps": 38160, "loss": 0.4439, "lr": 0.0008971495214403502, "epoch": 5.7416142557651995, "percentage": 28.71, "elapsed_time": "0:27:54", "remaining_time": "1:09:18", "throughput": 4276.39, "total_tokens": 7160696} {"current_steps": 10960, "total_steps": 38160, "loss": 0.3907, "lr": 0.0008970105471739364, "epoch": 5.744234800838575, "percentage": 28.72, "elapsed_time": "0:27:55", "remaining_time": "1:09:18", "throughput": 4276.94, "total_tokens": 7165720} {"current_steps": 10965, "total_steps": 38160, "loss": 0.4039, "lr": 0.0008968714898574454, "epoch": 5.74685534591195, "percentage": 28.73, "elapsed_time": "0:27:56", "remaining_time": "1:09:17", "throughput": 4277.17, "total_tokens": 7169496} {"current_steps": 10970, "total_steps": 38160, "loss": 0.5426, "lr": 0.0008967323495199665, "epoch": 5.749475890985325, "percentage": 28.75, "elapsed_time": "0:27:56", "remaining_time": "1:09:16", "throughput": 4277.33, "total_tokens": 7172984} {"current_steps": 10975, "total_steps": 38160, "loss": 0.3941, "lr": 0.0008965931261906061, "epoch": 5.7520964360587, "percentage": 28.76, "elapsed_time": "0:27:57", "remaining_time": "1:09:15", "throughput": 4277.54, "total_tokens": 7176664} {"current_steps": 10980, "total_steps": 38160, "loss": 0.426, "lr": 0.0008964538198984885, "epoch": 5.754716981132075, "percentage": 28.77, "elapsed_time": "0:27:58", "remaining_time": "1:09:14", "throughput": 4277.52, "total_tokens": 7179544} {"current_steps": 10985, "total_steps": 38160, "loss": 0.4529, "lr": 0.0008963144306727547, "epoch": 5.7573375262054505, "percentage": 28.79, "elapsed_time": "0:27:59", "remaining_time": "1:09:13", "throughput": 4277.57, "total_tokens": 7182680} {"current_steps": 10990, "total_steps": 38160, "loss": 0.6472, "lr": 0.0008961749585425634, "epoch": 5.759958071278826, "percentage": 28.8, "elapsed_time": "0:27:59", "remaining_time": "1:09:13", "throughput": 4277.62, "total_tokens": 7185880} {"current_steps": 10995, "total_steps": 38160, "loss": 0.4404, "lr": 0.0008960354035370905, "epoch": 5.762578616352201, "percentage": 28.81, "elapsed_time": "0:28:00", "remaining_time": "1:09:12", "throughput": 4277.59, "total_tokens": 7188760} {"current_steps": 11000, "total_steps": 38160, "loss": 0.4819, "lr": 0.0008958957656855294, "epoch": 5.765199161425577, "percentage": 28.83, "elapsed_time": "0:28:01", "remaining_time": "1:09:11", "throughput": 4277.87, "total_tokens": 7192632} {"current_steps": 11005, "total_steps": 38160, "loss": 0.4353, "lr": 0.0008957560450170907, "epoch": 5.767819706498952, "percentage": 28.84, "elapsed_time": "0:28:02", "remaining_time": "1:09:10", "throughput": 4277.87, "total_tokens": 7195576} {"current_steps": 11010, "total_steps": 38160, "loss": 0.5292, "lr": 0.0008956162415610025, "epoch": 5.770440251572327, "percentage": 28.85, "elapsed_time": "0:28:02", "remaining_time": "1:09:09", "throughput": 4278.14, "total_tokens": 7199512} {"current_steps": 11015, "total_steps": 38160, "loss": 0.5609, "lr": 0.00089547635534651, "epoch": 5.773060796645702, "percentage": 28.87, "elapsed_time": "0:28:03", "remaining_time": "1:09:08", "throughput": 4278.06, "total_tokens": 7202168} {"current_steps": 11020, "total_steps": 38160, "loss": 0.4451, "lr": 0.0008953363864028758, "epoch": 5.7756813417190775, "percentage": 28.88, "elapsed_time": "0:28:04", "remaining_time": "1:09:08", "throughput": 4278.36, "total_tokens": 7206200} {"current_steps": 11025, "total_steps": 38160, "loss": 0.5304, "lr": 0.0008951963347593796, "epoch": 5.778301886792453, "percentage": 28.89, "elapsed_time": "0:28:05", "remaining_time": "1:09:07", "throughput": 4278.56, "total_tokens": 7209848} {"current_steps": 11030, "total_steps": 38160, "loss": 0.4836, "lr": 0.0008950562004453191, "epoch": 5.780922431865828, "percentage": 28.9, "elapsed_time": "0:28:05", "remaining_time": "1:09:06", "throughput": 4278.85, "total_tokens": 7213848} {"current_steps": 11035, "total_steps": 38160, "loss": 0.2964, "lr": 0.0008949159834900082, "epoch": 5.783542976939203, "percentage": 28.92, "elapsed_time": "0:28:06", "remaining_time": "1:09:05", "throughput": 4278.92, "total_tokens": 7217048} {"current_steps": 11040, "total_steps": 38160, "loss": 0.4228, "lr": 0.0008947756839227792, "epoch": 5.786163522012579, "percentage": 28.93, "elapsed_time": "0:28:07", "remaining_time": "1:09:05", "throughput": 4279.03, "total_tokens": 7220344} {"current_steps": 11045, "total_steps": 38160, "loss": 0.4384, "lr": 0.0008946353017729809, "epoch": 5.788784067085954, "percentage": 28.94, "elapsed_time": "0:28:08", "remaining_time": "1:09:04", "throughput": 4278.95, "total_tokens": 7222936} {"current_steps": 11050, "total_steps": 38160, "loss": 0.4354, "lr": 0.0008944948370699798, "epoch": 5.7914046121593294, "percentage": 28.96, "elapsed_time": "0:28:08", "remaining_time": "1:09:03", "throughput": 4278.99, "total_tokens": 7226040} {"current_steps": 11055, "total_steps": 38160, "loss": 0.4812, "lr": 0.0008943542898431593, "epoch": 5.794025157232705, "percentage": 28.97, "elapsed_time": "0:28:09", "remaining_time": "1:09:02", "throughput": 4279.22, "total_tokens": 7229752} {"current_steps": 11060, "total_steps": 38160, "loss": 0.4029, "lr": 0.0008942136601219205, "epoch": 5.79664570230608, "percentage": 28.98, "elapsed_time": "0:28:10", "remaining_time": "1:09:01", "throughput": 4279.16, "total_tokens": 7232504} {"current_steps": 11065, "total_steps": 38160, "loss": 0.4121, "lr": 0.0008940729479356813, "epoch": 5.799266247379455, "percentage": 29.0, "elapsed_time": "0:28:10", "remaining_time": "1:09:00", "throughput": 4279.25, "total_tokens": 7235928} {"current_steps": 11070, "total_steps": 38160, "loss": 0.45, "lr": 0.0008939321533138774, "epoch": 5.80188679245283, "percentage": 29.01, "elapsed_time": "0:28:11", "remaining_time": "1:08:59", "throughput": 4279.18, "total_tokens": 7238616} {"current_steps": 11075, "total_steps": 38160, "loss": 0.5843, "lr": 0.0008937912762859611, "epoch": 5.804507337526205, "percentage": 29.02, "elapsed_time": "0:28:12", "remaining_time": "1:08:58", "throughput": 4279.34, "total_tokens": 7242200} {"current_steps": 11080, "total_steps": 38160, "loss": 0.422, "lr": 0.0008936503168814024, "epoch": 5.8071278825995805, "percentage": 29.04, "elapsed_time": "0:28:13", "remaining_time": "1:08:57", "throughput": 4279.42, "total_tokens": 7245400} {"current_steps": 11085, "total_steps": 38160, "loss": 0.4229, "lr": 0.0008935092751296885, "epoch": 5.809748427672956, "percentage": 29.05, "elapsed_time": "0:28:13", "remaining_time": "1:08:56", "throughput": 4279.32, "total_tokens": 7247960} {"current_steps": 11090, "total_steps": 38160, "loss": 0.4178, "lr": 0.0008933681510603235, "epoch": 5.812368972746331, "percentage": 29.06, "elapsed_time": "0:28:14", "remaining_time": "1:08:56", "throughput": 4279.49, "total_tokens": 7251512} {"current_steps": 11095, "total_steps": 38160, "loss": 0.4262, "lr": 0.0008932269447028292, "epoch": 5.814989517819707, "percentage": 29.07, "elapsed_time": "0:28:15", "remaining_time": "1:08:54", "throughput": 4279.3, "total_tokens": 7253784} {"current_steps": 11100, "total_steps": 38160, "loss": 0.5427, "lr": 0.0008930856560867442, "epoch": 5.817610062893082, "percentage": 29.09, "elapsed_time": "0:28:15", "remaining_time": "1:08:54", "throughput": 4279.35, "total_tokens": 7256824} {"current_steps": 11105, "total_steps": 38160, "loss": 0.5621, "lr": 0.0008929442852416245, "epoch": 5.820230607966457, "percentage": 29.1, "elapsed_time": "0:28:16", "remaining_time": "1:08:53", "throughput": 4279.41, "total_tokens": 7259928} {"current_steps": 11110, "total_steps": 38160, "loss": 0.5909, "lr": 0.0008928028321970433, "epoch": 5.822851153039832, "percentage": 29.11, "elapsed_time": "0:28:17", "remaining_time": "1:08:52", "throughput": 4279.38, "total_tokens": 7262680} {"current_steps": 11115, "total_steps": 38160, "loss": 0.5574, "lr": 0.0008926612969825909, "epoch": 5.8254716981132075, "percentage": 29.13, "elapsed_time": "0:28:17", "remaining_time": "1:08:51", "throughput": 4279.34, "total_tokens": 7265432} {"current_steps": 11120, "total_steps": 38160, "loss": 0.3929, "lr": 0.000892519679627875, "epoch": 5.828092243186583, "percentage": 29.14, "elapsed_time": "0:28:18", "remaining_time": "1:08:50", "throughput": 4279.29, "total_tokens": 7268120} {"current_steps": 11125, "total_steps": 38160, "loss": 0.5152, "lr": 0.00089237798016252, "epoch": 5.830712788259958, "percentage": 29.15, "elapsed_time": "0:28:19", "remaining_time": "1:08:49", "throughput": 4279.32, "total_tokens": 7271160} {"current_steps": 11130, "total_steps": 38160, "loss": 0.6891, "lr": 0.0008922361986161682, "epoch": 5.833333333333333, "percentage": 29.17, "elapsed_time": "0:28:19", "remaining_time": "1:08:48", "throughput": 4279.68, "total_tokens": 7275416} {"current_steps": 11135, "total_steps": 38160, "loss": 0.4436, "lr": 0.0008920943350184785, "epoch": 5.835953878406709, "percentage": 29.18, "elapsed_time": "0:28:20", "remaining_time": "1:08:47", "throughput": 4279.67, "total_tokens": 7278360} {"current_steps": 11140, "total_steps": 38160, "loss": 0.5912, "lr": 0.0008919523893991271, "epoch": 5.838574423480084, "percentage": 29.19, "elapsed_time": "0:28:21", "remaining_time": "1:08:46", "throughput": 4279.82, "total_tokens": 7281752} {"current_steps": 11145, "total_steps": 38160, "loss": 0.5289, "lr": 0.0008918103617878075, "epoch": 5.841194968553459, "percentage": 29.21, "elapsed_time": "0:28:22", "remaining_time": "1:08:45", "throughput": 4279.75, "total_tokens": 7284472} {"current_steps": 11150, "total_steps": 38160, "loss": 0.4683, "lr": 0.0008916682522142302, "epoch": 5.843815513626835, "percentage": 29.22, "elapsed_time": "0:28:22", "remaining_time": "1:08:44", "throughput": 4279.76, "total_tokens": 7287448} {"current_steps": 11155, "total_steps": 38160, "loss": 0.4345, "lr": 0.000891526060708123, "epoch": 5.84643605870021, "percentage": 29.23, "elapsed_time": "0:28:23", "remaining_time": "1:08:43", "throughput": 4279.87, "total_tokens": 7290776} {"current_steps": 11160, "total_steps": 38160, "loss": 0.4834, "lr": 0.0008913837872992306, "epoch": 5.849056603773585, "percentage": 29.25, "elapsed_time": "0:28:24", "remaining_time": "1:08:43", "throughput": 4279.89, "total_tokens": 7293752} {"current_steps": 11165, "total_steps": 38160, "loss": 0.6157, "lr": 0.000891241432017315, "epoch": 5.85167714884696, "percentage": 29.26, "elapsed_time": "0:28:24", "remaining_time": "1:08:42", "throughput": 4279.95, "total_tokens": 7296856} {"current_steps": 11170, "total_steps": 38160, "loss": 0.5377, "lr": 0.0008910989948921555, "epoch": 5.854297693920335, "percentage": 29.27, "elapsed_time": "0:28:25", "remaining_time": "1:08:41", "throughput": 4280.01, "total_tokens": 7299992} {"current_steps": 11175, "total_steps": 38160, "loss": 0.582, "lr": 0.000890956475953548, "epoch": 5.8569182389937104, "percentage": 29.28, "elapsed_time": "0:28:26", "remaining_time": "1:08:40", "throughput": 4279.98, "total_tokens": 7302808} {"current_steps": 11180, "total_steps": 38160, "loss": 0.6008, "lr": 0.0008908138752313061, "epoch": 5.859538784067086, "percentage": 29.3, "elapsed_time": "0:28:27", "remaining_time": "1:08:39", "throughput": 4280.04, "total_tokens": 7306040} {"current_steps": 11185, "total_steps": 38160, "loss": 0.4098, "lr": 0.0008906711927552601, "epoch": 5.862159329140461, "percentage": 29.31, "elapsed_time": "0:28:27", "remaining_time": "1:08:38", "throughput": 4279.98, "total_tokens": 7308760} {"current_steps": 11190, "total_steps": 38160, "loss": 0.4474, "lr": 0.0008905284285552575, "epoch": 5.864779874213837, "percentage": 29.32, "elapsed_time": "0:28:28", "remaining_time": "1:08:37", "throughput": 4279.82, "total_tokens": 7311128} {"current_steps": 11195, "total_steps": 38160, "loss": 0.51, "lr": 0.0008903855826611631, "epoch": 5.867400419287212, "percentage": 29.34, "elapsed_time": "0:28:29", "remaining_time": "1:08:36", "throughput": 4279.91, "total_tokens": 7314424} {"current_steps": 11200, "total_steps": 38160, "loss": 0.4654, "lr": 0.0008902426551028586, "epoch": 5.870020964360587, "percentage": 29.35, "elapsed_time": "0:28:29", "remaining_time": "1:08:35", "throughput": 4280.0, "total_tokens": 7317656} {"current_steps": 11205, "total_steps": 38160, "loss": 0.5562, "lr": 0.0008900996459102428, "epoch": 5.872641509433962, "percentage": 29.36, "elapsed_time": "0:28:30", "remaining_time": "1:08:34", "throughput": 4280.23, "total_tokens": 7321432} {"current_steps": 11210, "total_steps": 38160, "loss": 0.5058, "lr": 0.0008899565551132315, "epoch": 5.8752620545073375, "percentage": 29.38, "elapsed_time": "0:28:31", "remaining_time": "1:08:34", "throughput": 4280.41, "total_tokens": 7325016} {"current_steps": 11215, "total_steps": 38160, "loss": 0.4113, "lr": 0.0008898133827417578, "epoch": 5.877882599580713, "percentage": 29.39, "elapsed_time": "0:28:31", "remaining_time": "1:08:33", "throughput": 4280.34, "total_tokens": 7327704} {"current_steps": 11220, "total_steps": 38160, "loss": 0.3972, "lr": 0.0008896701288257716, "epoch": 5.880503144654088, "percentage": 29.4, "elapsed_time": "0:28:32", "remaining_time": "1:08:32", "throughput": 4280.5, "total_tokens": 7331288} {"current_steps": 11225, "total_steps": 38160, "loss": 0.4082, "lr": 0.00088952679339524, "epoch": 5.883123689727463, "percentage": 29.42, "elapsed_time": "0:28:33", "remaining_time": "1:08:31", "throughput": 4280.36, "total_tokens": 7333784} {"current_steps": 11230, "total_steps": 38160, "loss": 0.5052, "lr": 0.0008893833764801473, "epoch": 5.885744234800838, "percentage": 29.43, "elapsed_time": "0:28:34", "remaining_time": "1:08:30", "throughput": 4280.28, "total_tokens": 7336440} {"current_steps": 11235, "total_steps": 38160, "loss": 0.5028, "lr": 0.0008892398781104945, "epoch": 5.888364779874214, "percentage": 29.44, "elapsed_time": "0:28:35", "remaining_time": "1:08:30", "throughput": 4281.05, "total_tokens": 7342360} {"current_steps": 11240, "total_steps": 38160, "loss": 0.4241, "lr": 0.0008890962983162997, "epoch": 5.890985324947589, "percentage": 29.45, "elapsed_time": "0:28:35", "remaining_time": "1:08:29", "throughput": 4280.88, "total_tokens": 7344664} {"current_steps": 11245, "total_steps": 38160, "loss": 0.4587, "lr": 0.0008889526371275987, "epoch": 5.893605870020965, "percentage": 29.47, "elapsed_time": "0:28:36", "remaining_time": "1:08:28", "throughput": 4280.91, "total_tokens": 7347736} {"current_steps": 11250, "total_steps": 38160, "loss": 0.5503, "lr": 0.0008888088945744432, "epoch": 5.89622641509434, "percentage": 29.48, "elapsed_time": "0:28:37", "remaining_time": "1:08:27", "throughput": 4280.89, "total_tokens": 7350584} {"current_steps": 11255, "total_steps": 38160, "loss": 0.4344, "lr": 0.0008886650706869027, "epoch": 5.898846960167715, "percentage": 29.49, "elapsed_time": "0:28:37", "remaining_time": "1:08:26", "throughput": 4280.83, "total_tokens": 7353368} {"current_steps": 11260, "total_steps": 38160, "loss": 0.437, "lr": 0.0008885211654950636, "epoch": 5.90146750524109, "percentage": 29.51, "elapsed_time": "0:28:38", "remaining_time": "1:08:25", "throughput": 4281.0, "total_tokens": 7356952} {"current_steps": 11265, "total_steps": 38160, "loss": 0.6152, "lr": 0.0008883771790290291, "epoch": 5.904088050314465, "percentage": 29.52, "elapsed_time": "0:28:39", "remaining_time": "1:08:24", "throughput": 4281.1, "total_tokens": 7360280} {"current_steps": 11270, "total_steps": 38160, "loss": 0.424, "lr": 0.0008882331113189197, "epoch": 5.90670859538784, "percentage": 29.53, "elapsed_time": "0:28:39", "remaining_time": "1:08:23", "throughput": 4281.12, "total_tokens": 7363352} {"current_steps": 11275, "total_steps": 38160, "loss": 0.3943, "lr": 0.0008880889623948724, "epoch": 5.909329140461216, "percentage": 29.55, "elapsed_time": "0:28:40", "remaining_time": "1:08:22", "throughput": 4281.07, "total_tokens": 7366104} {"current_steps": 11280, "total_steps": 38160, "loss": 0.4557, "lr": 0.000887944732287042, "epoch": 5.911949685534591, "percentage": 29.56, "elapsed_time": "0:28:41", "remaining_time": "1:08:21", "throughput": 4281.05, "total_tokens": 7368952} {"current_steps": 11285, "total_steps": 38160, "loss": 0.4602, "lr": 0.0008878004210255995, "epoch": 5.914570230607967, "percentage": 29.57, "elapsed_time": "0:28:42", "remaining_time": "1:08:20", "throughput": 4281.1, "total_tokens": 7372120} {"current_steps": 11290, "total_steps": 38160, "loss": 0.3098, "lr": 0.0008876560286407329, "epoch": 5.917190775681342, "percentage": 29.59, "elapsed_time": "0:28:42", "remaining_time": "1:08:20", "throughput": 4281.28, "total_tokens": 7375768} {"current_steps": 11295, "total_steps": 38160, "loss": 0.4483, "lr": 0.000887511555162648, "epoch": 5.919811320754717, "percentage": 29.6, "elapsed_time": "0:28:43", "remaining_time": "1:08:19", "throughput": 4281.24, "total_tokens": 7378520} {"current_steps": 11300, "total_steps": 38160, "loss": 0.4288, "lr": 0.0008873670006215666, "epoch": 5.922431865828092, "percentage": 29.61, "elapsed_time": "0:28:44", "remaining_time": "1:08:18", "throughput": 4281.19, "total_tokens": 7381304} {"current_steps": 11305, "total_steps": 38160, "loss": 0.3978, "lr": 0.0008872223650477281, "epoch": 5.9250524109014675, "percentage": 29.63, "elapsed_time": "0:28:44", "remaining_time": "1:08:17", "throughput": 4281.28, "total_tokens": 7384632} {"current_steps": 11310, "total_steps": 38160, "loss": 0.526, "lr": 0.0008870776484713882, "epoch": 5.927672955974843, "percentage": 29.64, "elapsed_time": "0:28:45", "remaining_time": "1:08:16", "throughput": 4281.24, "total_tokens": 7387320} {"current_steps": 11315, "total_steps": 38160, "loss": 0.4415, "lr": 0.0008869328509228205, "epoch": 5.930293501048218, "percentage": 29.65, "elapsed_time": "0:28:46", "remaining_time": "1:08:15", "throughput": 4281.25, "total_tokens": 7390328} {"current_steps": 11320, "total_steps": 38160, "loss": 0.4505, "lr": 0.0008867879724323147, "epoch": 5.932914046121593, "percentage": 29.66, "elapsed_time": "0:28:46", "remaining_time": "1:08:14", "throughput": 4281.44, "total_tokens": 7393976} {"current_steps": 11325, "total_steps": 38160, "loss": 0.5664, "lr": 0.0008866430130301777, "epoch": 5.935534591194968, "percentage": 29.68, "elapsed_time": "0:28:47", "remaining_time": "1:08:13", "throughput": 4281.45, "total_tokens": 7396984} {"current_steps": 11330, "total_steps": 38160, "loss": 0.5457, "lr": 0.0008864979727467335, "epoch": 5.938155136268344, "percentage": 29.69, "elapsed_time": "0:28:48", "remaining_time": "1:08:12", "throughput": 4281.42, "total_tokens": 7399832} {"current_steps": 11335, "total_steps": 38160, "loss": 0.5273, "lr": 0.000886352851612323, "epoch": 5.940775681341719, "percentage": 29.7, "elapsed_time": "0:28:49", "remaining_time": "1:08:11", "throughput": 4281.52, "total_tokens": 7403064} {"current_steps": 11340, "total_steps": 38160, "loss": 0.5641, "lr": 0.0008862076496573034, "epoch": 5.943396226415095, "percentage": 29.72, "elapsed_time": "0:28:49", "remaining_time": "1:08:10", "throughput": 4281.37, "total_tokens": 7405432} {"current_steps": 11345, "total_steps": 38160, "loss": 0.3942, "lr": 0.0008860623669120496, "epoch": 5.94601677148847, "percentage": 29.73, "elapsed_time": "0:28:50", "remaining_time": "1:08:09", "throughput": 4281.2, "total_tokens": 7407800} {"current_steps": 11350, "total_steps": 38160, "loss": 0.4601, "lr": 0.0008859170034069533, "epoch": 5.948637316561845, "percentage": 29.74, "elapsed_time": "0:28:50", "remaining_time": "1:08:08", "throughput": 4281.14, "total_tokens": 7410552} {"current_steps": 11355, "total_steps": 38160, "loss": 0.5205, "lr": 0.0008857715591724225, "epoch": 5.95125786163522, "percentage": 29.76, "elapsed_time": "0:28:51", "remaining_time": "1:08:07", "throughput": 4281.25, "total_tokens": 7413912} {"current_steps": 11360, "total_steps": 38160, "loss": 0.5179, "lr": 0.0008856260342388827, "epoch": 5.953878406708595, "percentage": 29.77, "elapsed_time": "0:28:52", "remaining_time": "1:08:07", "throughput": 4281.38, "total_tokens": 7417400} {"current_steps": 11365, "total_steps": 38160, "loss": 0.4656, "lr": 0.0008854804286367758, "epoch": 5.95649895178197, "percentage": 29.78, "elapsed_time": "0:28:53", "remaining_time": "1:08:06", "throughput": 4281.37, "total_tokens": 7420344} {"current_steps": 11370, "total_steps": 38160, "loss": 0.4086, "lr": 0.0008853347423965612, "epoch": 5.959119496855346, "percentage": 29.8, "elapsed_time": "0:28:53", "remaining_time": "1:08:05", "throughput": 4281.38, "total_tokens": 7423288} {"current_steps": 11375, "total_steps": 38160, "loss": 0.4152, "lr": 0.0008851889755487146, "epoch": 5.961740041928721, "percentage": 29.81, "elapsed_time": "0:28:54", "remaining_time": "1:08:05", "throughput": 4281.99, "total_tokens": 7428536} {"current_steps": 11380, "total_steps": 38160, "loss": 0.5324, "lr": 0.0008850431281237288, "epoch": 5.964360587002097, "percentage": 29.82, "elapsed_time": "0:28:55", "remaining_time": "1:08:04", "throughput": 4282.06, "total_tokens": 7431736} {"current_steps": 11385, "total_steps": 38160, "loss": 0.5942, "lr": 0.0008848972001521134, "epoch": 5.966981132075472, "percentage": 29.83, "elapsed_time": "0:28:56", "remaining_time": "1:08:03", "throughput": 4281.91, "total_tokens": 7434136} {"current_steps": 11390, "total_steps": 38160, "loss": 0.5001, "lr": 0.0008847511916643948, "epoch": 5.969601677148847, "percentage": 29.85, "elapsed_time": "0:28:56", "remaining_time": "1:08:02", "throughput": 4281.91, "total_tokens": 7437112} {"current_steps": 11395, "total_steps": 38160, "loss": 0.4516, "lr": 0.0008846051026911164, "epoch": 5.972222222222222, "percentage": 29.86, "elapsed_time": "0:28:57", "remaining_time": "1:08:01", "throughput": 4281.92, "total_tokens": 7440120} {"current_steps": 11400, "total_steps": 38160, "loss": 0.6278, "lr": 0.0008844589332628383, "epoch": 5.9748427672955975, "percentage": 29.87, "elapsed_time": "0:28:58", "remaining_time": "1:08:00", "throughput": 4282.07, "total_tokens": 7443608} {"current_steps": 11405, "total_steps": 38160, "loss": 0.4145, "lr": 0.0008843126834101376, "epoch": 5.977463312368973, "percentage": 29.89, "elapsed_time": "0:28:59", "remaining_time": "1:07:59", "throughput": 4282.13, "total_tokens": 7446808} {"current_steps": 11410, "total_steps": 38160, "loss": 0.3683, "lr": 0.000884166353163608, "epoch": 5.980083857442348, "percentage": 29.9, "elapsed_time": "0:28:59", "remaining_time": "1:07:58", "throughput": 4282.14, "total_tokens": 7449880} {"current_steps": 11415, "total_steps": 38160, "loss": 0.5175, "lr": 0.0008840199425538599, "epoch": 5.982704402515723, "percentage": 29.91, "elapsed_time": "0:29:00", "remaining_time": "1:07:58", "throughput": 4282.47, "total_tokens": 7454040} {"current_steps": 11420, "total_steps": 38160, "loss": 0.5049, "lr": 0.0008838734516115213, "epoch": 5.985324947589098, "percentage": 29.93, "elapsed_time": "0:29:01", "remaining_time": "1:07:57", "throughput": 4282.47, "total_tokens": 7456984} {"current_steps": 11425, "total_steps": 38160, "loss": 0.4272, "lr": 0.0008837268803672359, "epoch": 5.987945492662474, "percentage": 29.94, "elapsed_time": "0:29:02", "remaining_time": "1:07:56", "throughput": 4282.59, "total_tokens": 7460440} {"current_steps": 11430, "total_steps": 38160, "loss": 0.4139, "lr": 0.0008835802288516647, "epoch": 5.990566037735849, "percentage": 29.95, "elapsed_time": "0:29:02", "remaining_time": "1:07:56", "throughput": 4283.12, "total_tokens": 7465336} {"current_steps": 11435, "total_steps": 38160, "loss": 0.4585, "lr": 0.0008834334970954861, "epoch": 5.993186582809225, "percentage": 29.97, "elapsed_time": "0:29:03", "remaining_time": "1:07:55", "throughput": 4283.21, "total_tokens": 7468536} {"current_steps": 11440, "total_steps": 38160, "loss": 0.3776, "lr": 0.0008832866851293941, "epoch": 5.9958071278826, "percentage": 29.98, "elapsed_time": "0:29:04", "remaining_time": "1:07:54", "throughput": 4283.31, "total_tokens": 7471928} {"current_steps": 11445, "total_steps": 38160, "loss": 0.4036, "lr": 0.0008831397929841005, "epoch": 5.998427672955975, "percentage": 29.99, "elapsed_time": "0:29:05", "remaining_time": "1:07:53", "throughput": 4283.42, "total_tokens": 7475320} {"current_steps": 11448, "total_steps": 38160, "eval_loss": 0.49057719111442566, "epoch": 6.0, "percentage": 30.0, "elapsed_time": "0:29:19", "remaining_time": "1:08:25", "throughput": 4249.42, "total_tokens": 7476480} {"current_steps": 11450, "total_steps": 38160, "loss": 0.3927, "lr": 0.0008829928206903333, "epoch": 6.00104821802935, "percentage": 30.01, "elapsed_time": "0:29:21", "remaining_time": "1:08:28", "throughput": 4245.33, "total_tokens": 7477440} {"current_steps": 11455, "total_steps": 38160, "loss": 0.4461, "lr": 0.0008828457682788373, "epoch": 6.003668763102725, "percentage": 30.02, "elapsed_time": "0:29:22", "remaining_time": "1:08:27", "throughput": 4245.29, "total_tokens": 7480224} {"current_steps": 11460, "total_steps": 38160, "loss": 0.3373, "lr": 0.0008826986357803743, "epoch": 6.0062893081761, "percentage": 30.03, "elapsed_time": "0:29:22", "remaining_time": "1:08:26", "throughput": 4245.35, "total_tokens": 7483392} {"current_steps": 11465, "total_steps": 38160, "loss": 0.3575, "lr": 0.0008825514232257228, "epoch": 6.008909853249476, "percentage": 30.04, "elapsed_time": "0:29:23", "remaining_time": "1:08:26", "throughput": 4245.44, "total_tokens": 7486688} {"current_steps": 11470, "total_steps": 38160, "loss": 0.4384, "lr": 0.000882404130645678, "epoch": 6.011530398322851, "percentage": 30.06, "elapsed_time": "0:29:24", "remaining_time": "1:08:24", "throughput": 4245.33, "total_tokens": 7489216} {"current_steps": 11475, "total_steps": 38160, "loss": 0.3793, "lr": 0.0008822567580710518, "epoch": 6.014150943396227, "percentage": 30.07, "elapsed_time": "0:29:24", "remaining_time": "1:08:23", "throughput": 4245.3, "total_tokens": 7491968} {"current_steps": 11480, "total_steps": 38160, "loss": 0.4231, "lr": 0.0008821093055326728, "epoch": 6.016771488469602, "percentage": 30.08, "elapsed_time": "0:29:25", "remaining_time": "1:08:23", "throughput": 4245.49, "total_tokens": 7495648} {"current_steps": 11485, "total_steps": 38160, "loss": 0.3416, "lr": 0.0008819617730613863, "epoch": 6.019392033542977, "percentage": 30.1, "elapsed_time": "0:29:26", "remaining_time": "1:08:22", "throughput": 4245.28, "total_tokens": 7497792} {"current_steps": 11490, "total_steps": 38160, "loss": 0.4165, "lr": 0.0008818141606880545, "epoch": 6.022012578616352, "percentage": 30.11, "elapsed_time": "0:29:26", "remaining_time": "1:08:21", "throughput": 4245.3, "total_tokens": 7500736} {"current_steps": 11495, "total_steps": 38160, "loss": 0.4544, "lr": 0.0008816664684435564, "epoch": 6.0246331236897275, "percentage": 30.12, "elapsed_time": "0:29:27", "remaining_time": "1:08:20", "throughput": 4245.51, "total_tokens": 7504480} {"current_steps": 11500, "total_steps": 38160, "loss": 0.555, "lr": 0.0008815186963587873, "epoch": 6.027253668763103, "percentage": 30.14, "elapsed_time": "0:29:28", "remaining_time": "1:08:19", "throughput": 4245.5, "total_tokens": 7507392} {"current_steps": 11505, "total_steps": 38160, "loss": 0.4647, "lr": 0.0008813708444646596, "epoch": 6.029874213836478, "percentage": 30.15, "elapsed_time": "0:29:29", "remaining_time": "1:08:19", "throughput": 4246.11, "total_tokens": 7512896} {"current_steps": 11510, "total_steps": 38160, "loss": 0.5681, "lr": 0.0008812229127921021, "epoch": 6.032494758909853, "percentage": 30.16, "elapsed_time": "0:29:30", "remaining_time": "1:08:18", "throughput": 4246.2, "total_tokens": 7516064} {"current_steps": 11515, "total_steps": 38160, "loss": 0.49, "lr": 0.0008810749013720605, "epoch": 6.035115303983228, "percentage": 30.18, "elapsed_time": "0:29:30", "remaining_time": "1:08:17", "throughput": 4246.1, "total_tokens": 7518560} {"current_steps": 11520, "total_steps": 38160, "loss": 0.3788, "lr": 0.0008809268102354969, "epoch": 6.037735849056604, "percentage": 30.19, "elapsed_time": "0:29:31", "remaining_time": "1:08:16", "throughput": 4246.52, "total_tokens": 7523168} {"current_steps": 11525, "total_steps": 38160, "loss": 0.4558, "lr": 0.0008807786394133905, "epoch": 6.040356394129979, "percentage": 30.2, "elapsed_time": "0:29:32", "remaining_time": "1:08:15", "throughput": 4246.54, "total_tokens": 7526144} {"current_steps": 11530, "total_steps": 38160, "loss": 0.4494, "lr": 0.0008806303889367371, "epoch": 6.0429769392033545, "percentage": 30.21, "elapsed_time": "0:29:33", "remaining_time": "1:08:15", "throughput": 4246.85, "total_tokens": 7530240} {"current_steps": 11535, "total_steps": 38160, "loss": 0.3604, "lr": 0.0008804820588365485, "epoch": 6.04559748427673, "percentage": 30.23, "elapsed_time": "0:29:33", "remaining_time": "1:08:14", "throughput": 4247.16, "total_tokens": 7534304} {"current_steps": 11540, "total_steps": 38160, "loss": 0.6082, "lr": 0.0008803336491438543, "epoch": 6.048218029350105, "percentage": 30.24, "elapsed_time": "0:29:34", "remaining_time": "1:08:13", "throughput": 4247.11, "total_tokens": 7537088} {"current_steps": 11545, "total_steps": 38160, "loss": 0.4887, "lr": 0.0008801851598896995, "epoch": 6.05083857442348, "percentage": 30.25, "elapsed_time": "0:29:35", "remaining_time": "1:08:12", "throughput": 4247.29, "total_tokens": 7540768} {"current_steps": 11550, "total_steps": 38160, "loss": 0.4509, "lr": 0.0008800365911051467, "epoch": 6.053459119496855, "percentage": 30.27, "elapsed_time": "0:29:36", "remaining_time": "1:08:12", "throughput": 4247.36, "total_tokens": 7543968} {"current_steps": 11555, "total_steps": 38160, "loss": 0.3844, "lr": 0.0008798879428212747, "epoch": 6.05607966457023, "percentage": 30.28, "elapsed_time": "0:29:36", "remaining_time": "1:08:11", "throughput": 4247.47, "total_tokens": 7547296} {"current_steps": 11560, "total_steps": 38160, "loss": 0.4765, "lr": 0.0008797392150691792, "epoch": 6.058700209643606, "percentage": 30.29, "elapsed_time": "0:29:37", "remaining_time": "1:08:10", "throughput": 4247.63, "total_tokens": 7550720} {"current_steps": 11565, "total_steps": 38160, "loss": 0.4565, "lr": 0.000879590407879972, "epoch": 6.061320754716981, "percentage": 30.31, "elapsed_time": "0:29:38", "remaining_time": "1:08:09", "throughput": 4247.76, "total_tokens": 7554208} {"current_steps": 11570, "total_steps": 38160, "loss": 0.4437, "lr": 0.0008794415212847822, "epoch": 6.063941299790357, "percentage": 30.32, "elapsed_time": "0:29:39", "remaining_time": "1:08:09", "throughput": 4248.49, "total_tokens": 7560288} {"current_steps": 11575, "total_steps": 38160, "loss": 0.3973, "lr": 0.000879292555314755, "epoch": 6.066561844863732, "percentage": 30.33, "elapsed_time": "0:29:40", "remaining_time": "1:08:08", "throughput": 4248.51, "total_tokens": 7563264} {"current_steps": 11580, "total_steps": 38160, "loss": 0.3984, "lr": 0.0008791435100010524, "epoch": 6.069182389937107, "percentage": 30.35, "elapsed_time": "0:29:40", "remaining_time": "1:08:07", "throughput": 4248.61, "total_tokens": 7566624} {"current_steps": 11585, "total_steps": 38160, "loss": 0.5022, "lr": 0.000878994385374853, "epoch": 6.071802935010482, "percentage": 30.36, "elapsed_time": "0:29:41", "remaining_time": "1:08:07", "throughput": 4248.72, "total_tokens": 7569952} {"current_steps": 11590, "total_steps": 38160, "loss": 0.4367, "lr": 0.0008788451814673521, "epoch": 6.0744234800838575, "percentage": 30.37, "elapsed_time": "0:29:42", "remaining_time": "1:08:06", "throughput": 4249.06, "total_tokens": 7574240} {"current_steps": 11595, "total_steps": 38160, "loss": 0.4496, "lr": 0.0008786958983097613, "epoch": 6.077044025157233, "percentage": 30.39, "elapsed_time": "0:29:43", "remaining_time": "1:08:05", "throughput": 4249.21, "total_tokens": 7577792} {"current_steps": 11600, "total_steps": 38160, "loss": 0.4815, "lr": 0.0008785465359333088, "epoch": 6.079664570230608, "percentage": 30.4, "elapsed_time": "0:29:44", "remaining_time": "1:08:05", "throughput": 4249.4, "total_tokens": 7581440} {"current_steps": 11605, "total_steps": 38160, "loss": 0.3073, "lr": 0.0008783970943692398, "epoch": 6.082285115303983, "percentage": 30.41, "elapsed_time": "0:29:44", "remaining_time": "1:08:04", "throughput": 4249.47, "total_tokens": 7584640} {"current_steps": 11610, "total_steps": 38160, "loss": 0.4496, "lr": 0.0008782475736488156, "epoch": 6.084905660377358, "percentage": 30.42, "elapsed_time": "0:29:45", "remaining_time": "1:08:03", "throughput": 4249.53, "total_tokens": 7587776} {"current_steps": 11615, "total_steps": 38160, "loss": 0.4005, "lr": 0.0008780979738033142, "epoch": 6.087526205450734, "percentage": 30.44, "elapsed_time": "0:29:46", "remaining_time": "1:08:02", "throughput": 4249.75, "total_tokens": 7591520} {"current_steps": 11620, "total_steps": 38160, "loss": 0.4348, "lr": 0.0008779482948640305, "epoch": 6.090146750524109, "percentage": 30.45, "elapsed_time": "0:29:47", "remaining_time": "1:08:01", "throughput": 4249.92, "total_tokens": 7595040} {"current_steps": 11625, "total_steps": 38160, "loss": 0.5604, "lr": 0.0008777985368622752, "epoch": 6.0927672955974845, "percentage": 30.46, "elapsed_time": "0:29:47", "remaining_time": "1:08:00", "throughput": 4249.96, "total_tokens": 7598048} {"current_steps": 11630, "total_steps": 38160, "loss": 0.4277, "lr": 0.0008776486998293762, "epoch": 6.09538784067086, "percentage": 30.48, "elapsed_time": "0:29:48", "remaining_time": "1:07:59", "throughput": 4250.06, "total_tokens": 7601344} {"current_steps": 11635, "total_steps": 38160, "loss": 0.4449, "lr": 0.0008774987837966775, "epoch": 6.098008385744235, "percentage": 30.49, "elapsed_time": "0:29:49", "remaining_time": "1:07:58", "throughput": 4250.08, "total_tokens": 7604256} {"current_steps": 11640, "total_steps": 38160, "loss": 0.4104, "lr": 0.0008773487887955401, "epoch": 6.10062893081761, "percentage": 30.5, "elapsed_time": "0:29:49", "remaining_time": "1:07:58", "throughput": 4250.17, "total_tokens": 7607456} {"current_steps": 11645, "total_steps": 38160, "loss": 0.5189, "lr": 0.000877198714857341, "epoch": 6.103249475890985, "percentage": 30.52, "elapsed_time": "0:29:50", "remaining_time": "1:07:57", "throughput": 4250.45, "total_tokens": 7611456} {"current_steps": 11650, "total_steps": 38160, "loss": 0.4501, "lr": 0.000877048562013474, "epoch": 6.10587002096436, "percentage": 30.53, "elapsed_time": "0:29:51", "remaining_time": "1:07:56", "throughput": 4250.59, "total_tokens": 7614912} {"current_steps": 11655, "total_steps": 38160, "loss": 0.4868, "lr": 0.0008768983302953498, "epoch": 6.1084905660377355, "percentage": 30.54, "elapsed_time": "0:29:52", "remaining_time": "1:07:55", "throughput": 4250.79, "total_tokens": 7618688} {"current_steps": 11660, "total_steps": 38160, "loss": 0.5174, "lr": 0.0008767480197343945, "epoch": 6.111111111111111, "percentage": 30.56, "elapsed_time": "0:29:52", "remaining_time": "1:07:54", "throughput": 4250.72, "total_tokens": 7621280} {"current_steps": 11665, "total_steps": 38160, "loss": 0.5224, "lr": 0.0008765976303620515, "epoch": 6.113731656184487, "percentage": 30.57, "elapsed_time": "0:29:53", "remaining_time": "1:07:54", "throughput": 4251.05, "total_tokens": 7625600} {"current_steps": 11670, "total_steps": 38160, "loss": 0.5304, "lr": 0.0008764471622097809, "epoch": 6.116352201257862, "percentage": 30.58, "elapsed_time": "0:29:54", "remaining_time": "1:07:53", "throughput": 4251.17, "total_tokens": 7628992} {"current_steps": 11675, "total_steps": 38160, "loss": 0.3745, "lr": 0.0008762966153090588, "epoch": 6.118972746331237, "percentage": 30.59, "elapsed_time": "0:29:55", "remaining_time": "1:07:52", "throughput": 4251.17, "total_tokens": 7631904} {"current_steps": 11680, "total_steps": 38160, "loss": 0.4421, "lr": 0.0008761459896913776, "epoch": 6.121593291404612, "percentage": 30.61, "elapsed_time": "0:29:56", "remaining_time": "1:07:51", "throughput": 4251.33, "total_tokens": 7635424} {"current_steps": 11685, "total_steps": 38160, "loss": 0.6252, "lr": 0.0008759952853882466, "epoch": 6.1242138364779874, "percentage": 30.62, "elapsed_time": "0:29:56", "remaining_time": "1:07:50", "throughput": 4251.29, "total_tokens": 7638240} {"current_steps": 11690, "total_steps": 38160, "loss": 0.4187, "lr": 0.0008758445024311917, "epoch": 6.126834381551363, "percentage": 30.63, "elapsed_time": "0:29:57", "remaining_time": "1:07:49", "throughput": 4251.2, "total_tokens": 7640768} {"current_steps": 11695, "total_steps": 38160, "loss": 0.3826, "lr": 0.0008756936408517547, "epoch": 6.129454926624738, "percentage": 30.65, "elapsed_time": "0:29:58", "remaining_time": "1:07:48", "throughput": 4251.26, "total_tokens": 7643904} {"current_steps": 11700, "total_steps": 38160, "loss": 0.439, "lr": 0.000875542700681494, "epoch": 6.132075471698113, "percentage": 30.66, "elapsed_time": "0:29:58", "remaining_time": "1:07:47", "throughput": 4251.24, "total_tokens": 7646720} {"current_steps": 11705, "total_steps": 38160, "loss": 0.3769, "lr": 0.0008753916819519849, "epoch": 6.134696016771488, "percentage": 30.67, "elapsed_time": "0:29:59", "remaining_time": "1:07:46", "throughput": 4251.04, "total_tokens": 7648928} {"current_steps": 11710, "total_steps": 38160, "loss": 0.5477, "lr": 0.0008752405846948186, "epoch": 6.137316561844864, "percentage": 30.69, "elapsed_time": "0:30:00", "remaining_time": "1:07:45", "throughput": 4251.17, "total_tokens": 7652320} {"current_steps": 11715, "total_steps": 38160, "loss": 0.5974, "lr": 0.0008750894089416029, "epoch": 6.139937106918239, "percentage": 30.7, "elapsed_time": "0:30:00", "remaining_time": "1:07:45", "throughput": 4251.38, "total_tokens": 7656096} {"current_steps": 11720, "total_steps": 38160, "loss": 0.4389, "lr": 0.0008749381547239621, "epoch": 6.1425576519916145, "percentage": 30.71, "elapsed_time": "0:30:01", "remaining_time": "1:07:44", "throughput": 4251.48, "total_tokens": 7659328} {"current_steps": 11725, "total_steps": 38160, "loss": 0.3313, "lr": 0.000874786822073537, "epoch": 6.14517819706499, "percentage": 30.73, "elapsed_time": "0:30:02", "remaining_time": "1:07:43", "throughput": 4251.42, "total_tokens": 7661984} {"current_steps": 11730, "total_steps": 38160, "loss": 0.5802, "lr": 0.0008746354110219843, "epoch": 6.147798742138365, "percentage": 30.74, "elapsed_time": "0:30:03", "remaining_time": "1:07:42", "throughput": 4251.61, "total_tokens": 7665728} {"current_steps": 11735, "total_steps": 38160, "loss": 0.4687, "lr": 0.0008744839216009779, "epoch": 6.15041928721174, "percentage": 30.75, "elapsed_time": "0:30:03", "remaining_time": "1:07:41", "throughput": 4251.9, "total_tokens": 7669760} {"current_steps": 11740, "total_steps": 38160, "loss": 0.3484, "lr": 0.0008743323538422072, "epoch": 6.153039832285115, "percentage": 30.77, "elapsed_time": "0:30:04", "remaining_time": "1:07:41", "throughput": 4252.02, "total_tokens": 7673120} {"current_steps": 11745, "total_steps": 38160, "loss": 0.4865, "lr": 0.0008741807077773789, "epoch": 6.15566037735849, "percentage": 30.78, "elapsed_time": "0:30:05", "remaining_time": "1:07:40", "throughput": 4252.1, "total_tokens": 7676384} {"current_steps": 11750, "total_steps": 38160, "loss": 0.4923, "lr": 0.0008740289834382153, "epoch": 6.1582809224318655, "percentage": 30.79, "elapsed_time": "0:30:06", "remaining_time": "1:07:39", "throughput": 4252.13, "total_tokens": 7679424} {"current_steps": 11755, "total_steps": 38160, "loss": 0.4166, "lr": 0.0008738771808564555, "epoch": 6.160901467505241, "percentage": 30.8, "elapsed_time": "0:30:06", "remaining_time": "1:07:38", "throughput": 4252.24, "total_tokens": 7682816} {"current_steps": 11760, "total_steps": 38160, "loss": 0.439, "lr": 0.000873725300063855, "epoch": 6.163522012578617, "percentage": 30.82, "elapsed_time": "0:30:07", "remaining_time": "1:07:38", "throughput": 4252.66, "total_tokens": 7687488} {"current_steps": 11765, "total_steps": 38160, "loss": 0.4401, "lr": 0.0008735733410921853, "epoch": 6.166142557651992, "percentage": 30.83, "elapsed_time": "0:30:08", "remaining_time": "1:07:37", "throughput": 4252.97, "total_tokens": 7691648} {"current_steps": 11770, "total_steps": 38160, "loss": 0.2647, "lr": 0.0008734213039732346, "epoch": 6.168763102725367, "percentage": 30.84, "elapsed_time": "0:30:09", "remaining_time": "1:07:37", "throughput": 4253.55, "total_tokens": 7696928} {"current_steps": 11775, "total_steps": 38160, "loss": 0.3419, "lr": 0.0008732691887388073, "epoch": 6.171383647798742, "percentage": 30.86, "elapsed_time": "0:30:10", "remaining_time": "1:07:36", "throughput": 4253.52, "total_tokens": 7699744} {"current_steps": 11780, "total_steps": 38160, "loss": 0.5722, "lr": 0.0008731169954207243, "epoch": 6.174004192872117, "percentage": 30.87, "elapsed_time": "0:30:10", "remaining_time": "1:07:35", "throughput": 4253.55, "total_tokens": 7702912} {"current_steps": 11785, "total_steps": 38160, "loss": 0.5086, "lr": 0.0008729647240508225, "epoch": 6.176624737945493, "percentage": 30.88, "elapsed_time": "0:30:11", "remaining_time": "1:07:34", "throughput": 4253.73, "total_tokens": 7706560} {"current_steps": 11790, "total_steps": 38160, "loss": 0.6377, "lr": 0.0008728123746609555, "epoch": 6.179245283018868, "percentage": 30.9, "elapsed_time": "0:30:12", "remaining_time": "1:07:33", "throughput": 4253.92, "total_tokens": 7710304} {"current_steps": 11795, "total_steps": 38160, "loss": 0.4569, "lr": 0.000872659947282993, "epoch": 6.181865828092243, "percentage": 30.91, "elapsed_time": "0:30:13", "remaining_time": "1:07:32", "throughput": 4253.94, "total_tokens": 7713184} {"current_steps": 11800, "total_steps": 38160, "loss": 0.6832, "lr": 0.000872507441948821, "epoch": 6.184486373165618, "percentage": 30.92, "elapsed_time": "0:30:13", "remaining_time": "1:07:32", "throughput": 4253.96, "total_tokens": 7716192} {"current_steps": 11805, "total_steps": 38160, "loss": 0.477, "lr": 0.0008723548586903418, "epoch": 6.187106918238993, "percentage": 30.94, "elapsed_time": "0:30:14", "remaining_time": "1:07:31", "throughput": 4254.25, "total_tokens": 7720256} {"current_steps": 11810, "total_steps": 38160, "loss": 0.5111, "lr": 0.0008722021975394745, "epoch": 6.189727463312369, "percentage": 30.95, "elapsed_time": "0:30:15", "remaining_time": "1:07:30", "throughput": 4254.31, "total_tokens": 7723392} {"current_steps": 11815, "total_steps": 38160, "loss": 0.4829, "lr": 0.0008720494585281536, "epoch": 6.1923480083857445, "percentage": 30.96, "elapsed_time": "0:30:16", "remaining_time": "1:07:29", "throughput": 4254.42, "total_tokens": 7726720} {"current_steps": 11820, "total_steps": 38160, "loss": 0.4152, "lr": 0.0008718966416883306, "epoch": 6.19496855345912, "percentage": 30.97, "elapsed_time": "0:30:16", "remaining_time": "1:07:28", "throughput": 4254.34, "total_tokens": 7729248} {"current_steps": 11825, "total_steps": 38160, "loss": 0.517, "lr": 0.0008717437470519729, "epoch": 6.197589098532495, "percentage": 30.99, "elapsed_time": "0:30:17", "remaining_time": "1:07:27", "throughput": 4254.52, "total_tokens": 7732800} {"current_steps": 11830, "total_steps": 38160, "loss": 0.4187, "lr": 0.0008715907746510645, "epoch": 6.20020964360587, "percentage": 31.0, "elapsed_time": "0:30:18", "remaining_time": "1:07:26", "throughput": 4254.62, "total_tokens": 7736032} {"current_steps": 11835, "total_steps": 38160, "loss": 0.4445, "lr": 0.0008714377245176054, "epoch": 6.202830188679245, "percentage": 31.01, "elapsed_time": "0:30:18", "remaining_time": "1:07:25", "throughput": 4254.55, "total_tokens": 7738624} {"current_steps": 11840, "total_steps": 38160, "loss": 0.4904, "lr": 0.0008712845966836119, "epoch": 6.20545073375262, "percentage": 31.03, "elapsed_time": "0:30:19", "remaining_time": "1:07:24", "throughput": 4254.62, "total_tokens": 7741728} {"current_steps": 11845, "total_steps": 38160, "loss": 0.4621, "lr": 0.0008711313911811165, "epoch": 6.2080712788259955, "percentage": 31.04, "elapsed_time": "0:30:20", "remaining_time": "1:07:23", "throughput": 4254.55, "total_tokens": 7744288} {"current_steps": 11850, "total_steps": 38160, "loss": 0.5106, "lr": 0.0008709781080421681, "epoch": 6.210691823899371, "percentage": 31.05, "elapsed_time": "0:30:21", "remaining_time": "1:07:23", "throughput": 4254.83, "total_tokens": 7748448} {"current_steps": 11855, "total_steps": 38160, "loss": 0.4623, "lr": 0.0008708247472988319, "epoch": 6.213312368972747, "percentage": 31.07, "elapsed_time": "0:30:21", "remaining_time": "1:07:22", "throughput": 4255.03, "total_tokens": 7752096} {"current_steps": 11860, "total_steps": 38160, "loss": 0.444, "lr": 0.0008706713089831893, "epoch": 6.215932914046122, "percentage": 31.08, "elapsed_time": "0:30:22", "remaining_time": "1:07:21", "throughput": 4255.05, "total_tokens": 7755104} {"current_steps": 11865, "total_steps": 38160, "loss": 0.4078, "lr": 0.0008705177931273377, "epoch": 6.218553459119497, "percentage": 31.09, "elapsed_time": "0:30:23", "remaining_time": "1:07:20", "throughput": 4255.18, "total_tokens": 7758592} {"current_steps": 11870, "total_steps": 38160, "loss": 0.4699, "lr": 0.0008703641997633907, "epoch": 6.221174004192872, "percentage": 31.11, "elapsed_time": "0:30:24", "remaining_time": "1:07:20", "throughput": 4255.54, "total_tokens": 7762880} {"current_steps": 11875, "total_steps": 38160, "loss": 0.5627, "lr": 0.0008702105289234786, "epoch": 6.223794549266247, "percentage": 31.12, "elapsed_time": "0:30:25", "remaining_time": "1:07:19", "throughput": 4255.82, "total_tokens": 7766944} {"current_steps": 11880, "total_steps": 38160, "loss": 0.3582, "lr": 0.0008700567806397473, "epoch": 6.226415094339623, "percentage": 31.13, "elapsed_time": "0:30:25", "remaining_time": "1:07:18", "throughput": 4256.02, "total_tokens": 7770656} {"current_steps": 11885, "total_steps": 38160, "loss": 0.5546, "lr": 0.0008699029549443595, "epoch": 6.229035639412998, "percentage": 31.15, "elapsed_time": "0:30:26", "remaining_time": "1:07:17", "throughput": 4255.98, "total_tokens": 7773504} {"current_steps": 11890, "total_steps": 38160, "loss": 0.5279, "lr": 0.0008697490518694935, "epoch": 6.231656184486373, "percentage": 31.16, "elapsed_time": "0:30:27", "remaining_time": "1:07:17", "throughput": 4256.18, "total_tokens": 7777216} {"current_steps": 11895, "total_steps": 38160, "loss": 0.5441, "lr": 0.0008695950714473442, "epoch": 6.234276729559748, "percentage": 31.17, "elapsed_time": "0:30:27", "remaining_time": "1:07:16", "throughput": 4256.25, "total_tokens": 7780384} {"current_steps": 11900, "total_steps": 38160, "loss": 0.491, "lr": 0.0008694410137101224, "epoch": 6.236897274633123, "percentage": 31.18, "elapsed_time": "0:30:28", "remaining_time": "1:07:15", "throughput": 4256.38, "total_tokens": 7783776} {"current_steps": 11905, "total_steps": 38160, "loss": 0.5042, "lr": 0.0008692868786900554, "epoch": 6.239517819706499, "percentage": 31.2, "elapsed_time": "0:30:29", "remaining_time": "1:07:14", "throughput": 4256.54, "total_tokens": 7787296} {"current_steps": 11910, "total_steps": 38160, "loss": 0.5633, "lr": 0.0008691326664193865, "epoch": 6.2421383647798745, "percentage": 31.21, "elapsed_time": "0:30:30", "remaining_time": "1:07:13", "throughput": 4256.47, "total_tokens": 7789888} {"current_steps": 11915, "total_steps": 38160, "loss": 0.4247, "lr": 0.000868978376930375, "epoch": 6.24475890985325, "percentage": 31.22, "elapsed_time": "0:30:30", "remaining_time": "1:07:12", "throughput": 4256.58, "total_tokens": 7793280} {"current_steps": 11920, "total_steps": 38160, "loss": 0.452, "lr": 0.0008688240102552965, "epoch": 6.247379454926625, "percentage": 31.24, "elapsed_time": "0:30:31", "remaining_time": "1:07:11", "throughput": 4256.6, "total_tokens": 7796224} {"current_steps": 11925, "total_steps": 38160, "loss": 0.4967, "lr": 0.000868669566426443, "epoch": 6.25, "percentage": 31.25, "elapsed_time": "0:30:32", "remaining_time": "1:07:11", "throughput": 4256.66, "total_tokens": 7799424} {"current_steps": 11930, "total_steps": 38160, "loss": 0.4614, "lr": 0.0008685150454761222, "epoch": 6.252620545073375, "percentage": 31.26, "elapsed_time": "0:30:32", "remaining_time": "1:07:10", "throughput": 4256.71, "total_tokens": 7802528} {"current_steps": 11935, "total_steps": 38160, "loss": 0.4914, "lr": 0.000868360447436658, "epoch": 6.25524109014675, "percentage": 31.28, "elapsed_time": "0:30:33", "remaining_time": "1:07:09", "throughput": 4256.93, "total_tokens": 7806272} {"current_steps": 11940, "total_steps": 38160, "loss": 0.5016, "lr": 0.0008682057723403907, "epoch": 6.2578616352201255, "percentage": 31.29, "elapsed_time": "0:30:34", "remaining_time": "1:07:08", "throughput": 4256.93, "total_tokens": 7809248} {"current_steps": 11945, "total_steps": 38160, "loss": 0.4546, "lr": 0.0008680510202196765, "epoch": 6.260482180293501, "percentage": 31.3, "elapsed_time": "0:30:35", "remaining_time": "1:07:07", "throughput": 4257.26, "total_tokens": 7813536} {"current_steps": 11950, "total_steps": 38160, "loss": 0.4248, "lr": 0.0008678961911068879, "epoch": 6.263102725366876, "percentage": 31.32, "elapsed_time": "0:30:36", "remaining_time": "1:07:07", "throughput": 4257.33, "total_tokens": 7816768} {"current_steps": 11955, "total_steps": 38160, "loss": 0.3611, "lr": 0.0008677412850344133, "epoch": 6.265723270440252, "percentage": 31.33, "elapsed_time": "0:30:36", "remaining_time": "1:07:06", "throughput": 4257.48, "total_tokens": 7820224} {"current_steps": 11960, "total_steps": 38160, "loss": 0.6978, "lr": 0.0008675863020346573, "epoch": 6.268343815513627, "percentage": 31.34, "elapsed_time": "0:30:37", "remaining_time": "1:07:05", "throughput": 4257.46, "total_tokens": 7823104} {"current_steps": 11965, "total_steps": 38160, "loss": 0.4793, "lr": 0.0008674312421400405, "epoch": 6.270964360587002, "percentage": 31.35, "elapsed_time": "0:30:38", "remaining_time": "1:07:04", "throughput": 4257.63, "total_tokens": 7826688} {"current_steps": 11970, "total_steps": 38160, "loss": 0.4137, "lr": 0.0008672761053829997, "epoch": 6.273584905660377, "percentage": 31.37, "elapsed_time": "0:30:39", "remaining_time": "1:07:03", "throughput": 4257.8, "total_tokens": 7830272} {"current_steps": 11975, "total_steps": 38160, "loss": 0.4209, "lr": 0.0008671208917959878, "epoch": 6.276205450733753, "percentage": 31.38, "elapsed_time": "0:30:39", "remaining_time": "1:07:03", "throughput": 4257.95, "total_tokens": 7833824} {"current_steps": 11980, "total_steps": 38160, "loss": 0.4305, "lr": 0.0008669656014114737, "epoch": 6.278825995807128, "percentage": 31.39, "elapsed_time": "0:30:40", "remaining_time": "1:07:02", "throughput": 4258.19, "total_tokens": 7837632} {"current_steps": 11985, "total_steps": 38160, "loss": 0.4343, "lr": 0.0008668102342619424, "epoch": 6.281446540880503, "percentage": 31.41, "elapsed_time": "0:30:41", "remaining_time": "1:07:01", "throughput": 4258.3, "total_tokens": 7840928} {"current_steps": 11990, "total_steps": 38160, "loss": 0.6079, "lr": 0.0008666547903798947, "epoch": 6.284067085953878, "percentage": 31.42, "elapsed_time": "0:30:42", "remaining_time": "1:07:01", "throughput": 4259.11, "total_tokens": 7847680} {"current_steps": 11995, "total_steps": 38160, "loss": 0.4067, "lr": 0.000866499269797848, "epoch": 6.286687631027253, "percentage": 31.43, "elapsed_time": "0:30:43", "remaining_time": "1:07:01", "throughput": 4259.83, "total_tokens": 7853984} {"current_steps": 12000, "total_steps": 38160, "loss": 0.6126, "lr": 0.0008663436725483354, "epoch": 6.289308176100629, "percentage": 31.45, "elapsed_time": "0:30:44", "remaining_time": "1:07:01", "throughput": 4260.0, "total_tokens": 7857600} {"current_steps": 12005, "total_steps": 38160, "loss": 0.5287, "lr": 0.0008661879986639058, "epoch": 6.2919287211740045, "percentage": 31.46, "elapsed_time": "0:30:45", "remaining_time": "1:07:00", "throughput": 4259.97, "total_tokens": 7860448} {"current_steps": 12010, "total_steps": 38160, "loss": 0.4203, "lr": 0.0008660322481771246, "epoch": 6.29454926624738, "percentage": 31.47, "elapsed_time": "0:30:45", "remaining_time": "1:06:59", "throughput": 4259.98, "total_tokens": 7863424} {"current_steps": 12015, "total_steps": 38160, "loss": 0.5744, "lr": 0.0008658764211205731, "epoch": 6.297169811320755, "percentage": 31.49, "elapsed_time": "0:30:46", "remaining_time": "1:06:58", "throughput": 4259.98, "total_tokens": 7866400} {"current_steps": 12020, "total_steps": 38160, "loss": 0.3236, "lr": 0.0008657205175268484, "epoch": 6.29979035639413, "percentage": 31.5, "elapsed_time": "0:30:47", "remaining_time": "1:06:57", "throughput": 4260.23, "total_tokens": 7870240} {"current_steps": 12025, "total_steps": 38160, "loss": 0.4501, "lr": 0.0008655645374285637, "epoch": 6.302410901467505, "percentage": 31.51, "elapsed_time": "0:30:48", "remaining_time": "1:06:56", "throughput": 4260.27, "total_tokens": 7873280} {"current_steps": 12030, "total_steps": 38160, "loss": 0.5623, "lr": 0.0008654084808583485, "epoch": 6.30503144654088, "percentage": 31.53, "elapsed_time": "0:30:48", "remaining_time": "1:06:55", "throughput": 4260.4, "total_tokens": 7876640} {"current_steps": 12035, "total_steps": 38160, "loss": 0.4479, "lr": 0.0008652523478488478, "epoch": 6.3076519916142555, "percentage": 31.54, "elapsed_time": "0:30:49", "remaining_time": "1:06:55", "throughput": 4260.57, "total_tokens": 7880352} {"current_steps": 12040, "total_steps": 38160, "loss": 0.497, "lr": 0.000865096138432723, "epoch": 6.310272536687631, "percentage": 31.55, "elapsed_time": "0:30:50", "remaining_time": "1:06:54", "throughput": 4260.52, "total_tokens": 7883040} {"current_steps": 12045, "total_steps": 38160, "loss": 0.5114, "lr": 0.0008649398526426512, "epoch": 6.312893081761006, "percentage": 31.56, "elapsed_time": "0:30:50", "remaining_time": "1:06:53", "throughput": 4260.54, "total_tokens": 7886112} {"current_steps": 12050, "total_steps": 38160, "loss": 0.4872, "lr": 0.0008647834905113256, "epoch": 6.315513626834382, "percentage": 31.58, "elapsed_time": "0:30:51", "remaining_time": "1:06:52", "throughput": 4260.39, "total_tokens": 7888512} {"current_steps": 12055, "total_steps": 38160, "loss": 0.446, "lr": 0.0008646270520714556, "epoch": 6.318134171907757, "percentage": 31.59, "elapsed_time": "0:30:52", "remaining_time": "1:06:51", "throughput": 4260.34, "total_tokens": 7891296} {"current_steps": 12060, "total_steps": 38160, "loss": 0.5716, "lr": 0.0008644705373557663, "epoch": 6.320754716981132, "percentage": 31.6, "elapsed_time": "0:30:52", "remaining_time": "1:06:49", "throughput": 4260.21, "total_tokens": 7893696} {"current_steps": 12065, "total_steps": 38160, "loss": 0.3955, "lr": 0.0008643139463969985, "epoch": 6.323375262054507, "percentage": 31.62, "elapsed_time": "0:30:53", "remaining_time": "1:06:49", "throughput": 4260.46, "total_tokens": 7897632} {"current_steps": 12070, "total_steps": 38160, "loss": 0.4058, "lr": 0.0008641572792279095, "epoch": 6.325995807127883, "percentage": 31.63, "elapsed_time": "0:30:54", "remaining_time": "1:06:48", "throughput": 4260.31, "total_tokens": 7899936} {"current_steps": 12075, "total_steps": 38160, "loss": 0.4464, "lr": 0.0008640005358812723, "epoch": 6.328616352201258, "percentage": 31.64, "elapsed_time": "0:30:54", "remaining_time": "1:06:47", "throughput": 4260.3, "total_tokens": 7902848} {"current_steps": 12080, "total_steps": 38160, "loss": 0.3901, "lr": 0.0008638437163898756, "epoch": 6.331236897274633, "percentage": 31.66, "elapsed_time": "0:30:55", "remaining_time": "1:06:46", "throughput": 4260.4, "total_tokens": 7906176} {"current_steps": 12085, "total_steps": 38160, "loss": 0.3824, "lr": 0.0008636868207865244, "epoch": 6.333857442348008, "percentage": 31.67, "elapsed_time": "0:30:56", "remaining_time": "1:06:45", "throughput": 4260.48, "total_tokens": 7909408} {"current_steps": 12090, "total_steps": 38160, "loss": 0.3359, "lr": 0.0008635298491040394, "epoch": 6.336477987421383, "percentage": 31.68, "elapsed_time": "0:30:57", "remaining_time": "1:06:44", "throughput": 4260.52, "total_tokens": 7912576} {"current_steps": 12095, "total_steps": 38160, "loss": 0.6443, "lr": 0.0008633728013752574, "epoch": 6.339098532494759, "percentage": 31.7, "elapsed_time": "0:30:57", "remaining_time": "1:06:43", "throughput": 4260.55, "total_tokens": 7915552} {"current_steps": 12100, "total_steps": 38160, "loss": 0.3865, "lr": 0.000863215677633031, "epoch": 6.3417190775681345, "percentage": 31.71, "elapsed_time": "0:30:58", "remaining_time": "1:06:43", "throughput": 4261.05, "total_tokens": 7920384} {"current_steps": 12105, "total_steps": 38160, "loss": 0.4193, "lr": 0.0008630584779102285, "epoch": 6.34433962264151, "percentage": 31.72, "elapsed_time": "0:30:59", "remaining_time": "1:06:42", "throughput": 4261.11, "total_tokens": 7923552} {"current_steps": 12110, "total_steps": 38160, "loss": 0.5047, "lr": 0.0008629012022397344, "epoch": 6.346960167714885, "percentage": 31.73, "elapsed_time": "0:31:00", "remaining_time": "1:06:41", "throughput": 4261.01, "total_tokens": 7926080} {"current_steps": 12115, "total_steps": 38160, "loss": 0.5841, "lr": 0.0008627438506544491, "epoch": 6.34958071278826, "percentage": 31.75, "elapsed_time": "0:31:00", "remaining_time": "1:06:40", "throughput": 4261.02, "total_tokens": 7928992} {"current_steps": 12120, "total_steps": 38160, "loss": 0.5475, "lr": 0.0008625864231872886, "epoch": 6.352201257861635, "percentage": 31.76, "elapsed_time": "0:31:01", "remaining_time": "1:06:39", "throughput": 4261.04, "total_tokens": 7931936} {"current_steps": 12125, "total_steps": 38160, "loss": 0.4309, "lr": 0.000862428919871185, "epoch": 6.35482180293501, "percentage": 31.77, "elapsed_time": "0:31:02", "remaining_time": "1:06:38", "throughput": 4260.91, "total_tokens": 7934368} {"current_steps": 12130, "total_steps": 38160, "loss": 0.4049, "lr": 0.0008622713407390861, "epoch": 6.3574423480083855, "percentage": 31.79, "elapsed_time": "0:31:02", "remaining_time": "1:06:37", "throughput": 4260.85, "total_tokens": 7937088} {"current_steps": 12135, "total_steps": 38160, "loss": 0.4146, "lr": 0.0008621136858239557, "epoch": 6.360062893081761, "percentage": 31.8, "elapsed_time": "0:31:03", "remaining_time": "1:06:36", "throughput": 4260.81, "total_tokens": 7939776} {"current_steps": 12140, "total_steps": 38160, "loss": 0.4455, "lr": 0.0008619559551587736, "epoch": 6.362683438155136, "percentage": 31.81, "elapsed_time": "0:31:04", "remaining_time": "1:06:35", "throughput": 4260.87, "total_tokens": 7942944} {"current_steps": 12145, "total_steps": 38160, "loss": 0.5282, "lr": 0.0008617981487765349, "epoch": 6.365303983228512, "percentage": 31.83, "elapsed_time": "0:31:04", "remaining_time": "1:06:34", "throughput": 4260.97, "total_tokens": 7946336} {"current_steps": 12150, "total_steps": 38160, "loss": 0.4731, "lr": 0.0008616402667102512, "epoch": 6.367924528301887, "percentage": 31.84, "elapsed_time": "0:31:05", "remaining_time": "1:06:34", "throughput": 4261.35, "total_tokens": 7950880} {"current_steps": 12155, "total_steps": 38160, "loss": 0.5522, "lr": 0.0008614823089929495, "epoch": 6.370545073375262, "percentage": 31.85, "elapsed_time": "0:31:06", "remaining_time": "1:06:33", "throughput": 4261.37, "total_tokens": 7953856} {"current_steps": 12160, "total_steps": 38160, "loss": 0.4072, "lr": 0.0008613242756576728, "epoch": 6.373165618448637, "percentage": 31.87, "elapsed_time": "0:31:07", "remaining_time": "1:06:32", "throughput": 4261.35, "total_tokens": 7956672} {"current_steps": 12165, "total_steps": 38160, "loss": 0.4206, "lr": 0.0008611661667374798, "epoch": 6.3757861635220126, "percentage": 31.88, "elapsed_time": "0:31:07", "remaining_time": "1:06:31", "throughput": 4261.35, "total_tokens": 7959552} {"current_steps": 12170, "total_steps": 38160, "loss": 0.4959, "lr": 0.0008610079822654451, "epoch": 6.378406708595388, "percentage": 31.89, "elapsed_time": "0:31:08", "remaining_time": "1:06:30", "throughput": 4261.42, "total_tokens": 7962816} {"current_steps": 12175, "total_steps": 38160, "loss": 0.5339, "lr": 0.0008608497222746591, "epoch": 6.381027253668763, "percentage": 31.91, "elapsed_time": "0:31:09", "remaining_time": "1:06:29", "throughput": 4261.41, "total_tokens": 7965664} {"current_steps": 12180, "total_steps": 38160, "loss": 0.5819, "lr": 0.000860691386798228, "epoch": 6.383647798742138, "percentage": 31.92, "elapsed_time": "0:31:10", "remaining_time": "1:06:28", "throughput": 4261.67, "total_tokens": 7969632} {"current_steps": 12185, "total_steps": 38160, "loss": 0.4403, "lr": 0.000860532975869274, "epoch": 6.386268343815513, "percentage": 31.93, "elapsed_time": "0:31:10", "remaining_time": "1:06:28", "throughput": 4261.85, "total_tokens": 7973216} {"current_steps": 12190, "total_steps": 38160, "loss": 0.4187, "lr": 0.0008603744895209342, "epoch": 6.388888888888889, "percentage": 31.94, "elapsed_time": "0:31:11", "remaining_time": "1:06:27", "throughput": 4261.8, "total_tokens": 7975936} {"current_steps": 12195, "total_steps": 38160, "loss": 0.5019, "lr": 0.0008602159277863628, "epoch": 6.3915094339622645, "percentage": 31.96, "elapsed_time": "0:31:12", "remaining_time": "1:06:26", "throughput": 4261.95, "total_tokens": 7979456} {"current_steps": 12200, "total_steps": 38160, "loss": 0.618, "lr": 0.0008600572906987289, "epoch": 6.39412997903564, "percentage": 31.97, "elapsed_time": "0:31:12", "remaining_time": "1:06:25", "throughput": 4262.0, "total_tokens": 7982528} {"current_steps": 12205, "total_steps": 38160, "loss": 0.5315, "lr": 0.0008598985782912174, "epoch": 6.396750524109015, "percentage": 31.98, "elapsed_time": "0:31:13", "remaining_time": "1:06:24", "throughput": 4261.97, "total_tokens": 7985344} {"current_steps": 12210, "total_steps": 38160, "loss": 0.4276, "lr": 0.0008597397905970293, "epoch": 6.39937106918239, "percentage": 32.0, "elapsed_time": "0:31:14", "remaining_time": "1:06:23", "throughput": 4262.2, "total_tokens": 7989088} {"current_steps": 12215, "total_steps": 38160, "loss": 0.5094, "lr": 0.0008595809276493812, "epoch": 6.401991614255765, "percentage": 32.01, "elapsed_time": "0:31:15", "remaining_time": "1:06:22", "throughput": 4262.37, "total_tokens": 7992736} {"current_steps": 12220, "total_steps": 38160, "loss": 0.5078, "lr": 0.0008594219894815054, "epoch": 6.40461215932914, "percentage": 32.02, "elapsed_time": "0:31:15", "remaining_time": "1:06:21", "throughput": 4262.22, "total_tokens": 7995072} {"current_steps": 12225, "total_steps": 38160, "loss": 0.4947, "lr": 0.0008592629761266497, "epoch": 6.4072327044025155, "percentage": 32.04, "elapsed_time": "0:31:16", "remaining_time": "1:06:20", "throughput": 4262.27, "total_tokens": 7998240} {"current_steps": 12230, "total_steps": 38160, "loss": 0.4595, "lr": 0.0008591038876180784, "epoch": 6.409853249475891, "percentage": 32.05, "elapsed_time": "0:31:17", "remaining_time": "1:06:20", "throughput": 4262.37, "total_tokens": 8001600} {"current_steps": 12235, "total_steps": 38160, "loss": 0.3454, "lr": 0.0008589447239890705, "epoch": 6.412473794549266, "percentage": 32.06, "elapsed_time": "0:31:17", "remaining_time": "1:06:19", "throughput": 4262.28, "total_tokens": 8004128} {"current_steps": 12240, "total_steps": 38160, "loss": 0.4818, "lr": 0.0008587854852729213, "epoch": 6.415094339622642, "percentage": 32.08, "elapsed_time": "0:31:18", "remaining_time": "1:06:18", "throughput": 4262.48, "total_tokens": 8007936} {"current_steps": 12245, "total_steps": 38160, "loss": 0.4537, "lr": 0.000858626171502942, "epoch": 6.417714884696017, "percentage": 32.09, "elapsed_time": "0:31:19", "remaining_time": "1:06:17", "throughput": 4262.65, "total_tokens": 8011488} {"current_steps": 12250, "total_steps": 38160, "loss": 0.4891, "lr": 0.0008584667827124589, "epoch": 6.420335429769392, "percentage": 32.1, "elapsed_time": "0:31:20", "remaining_time": "1:06:16", "throughput": 4262.71, "total_tokens": 8014656} {"current_steps": 12255, "total_steps": 38160, "loss": 0.3967, "lr": 0.0008583073189348145, "epoch": 6.422955974842767, "percentage": 32.11, "elapsed_time": "0:31:20", "remaining_time": "1:06:15", "throughput": 4262.68, "total_tokens": 8017504} {"current_steps": 12260, "total_steps": 38160, "loss": 0.3873, "lr": 0.0008581477802033668, "epoch": 6.4255765199161425, "percentage": 32.13, "elapsed_time": "0:31:21", "remaining_time": "1:06:15", "throughput": 4262.99, "total_tokens": 8021728} {"current_steps": 12265, "total_steps": 38160, "loss": 0.4365, "lr": 0.0008579881665514895, "epoch": 6.428197064989518, "percentage": 32.14, "elapsed_time": "0:31:22", "remaining_time": "1:06:14", "throughput": 4263.02, "total_tokens": 8024832} {"current_steps": 12270, "total_steps": 38160, "loss": 0.4667, "lr": 0.0008578284780125718, "epoch": 6.430817610062893, "percentage": 32.15, "elapsed_time": "0:31:23", "remaining_time": "1:06:13", "throughput": 4263.11, "total_tokens": 8028192} {"current_steps": 12275, "total_steps": 38160, "loss": 0.4987, "lr": 0.0008576687146200189, "epoch": 6.433438155136268, "percentage": 32.17, "elapsed_time": "0:31:23", "remaining_time": "1:06:12", "throughput": 4263.11, "total_tokens": 8031168} {"current_steps": 12280, "total_steps": 38160, "loss": 0.475, "lr": 0.0008575088764072511, "epoch": 6.436058700209643, "percentage": 32.18, "elapsed_time": "0:31:24", "remaining_time": "1:06:11", "throughput": 4263.12, "total_tokens": 8034208} {"current_steps": 12285, "total_steps": 38160, "loss": 0.4589, "lr": 0.0008573489634077054, "epoch": 6.438679245283019, "percentage": 32.19, "elapsed_time": "0:31:25", "remaining_time": "1:06:10", "throughput": 4263.1, "total_tokens": 8037088} {"current_steps": 12290, "total_steps": 38160, "loss": 0.6793, "lr": 0.0008571889756548333, "epoch": 6.441299790356394, "percentage": 32.21, "elapsed_time": "0:31:25", "remaining_time": "1:06:09", "throughput": 4263.1, "total_tokens": 8039968} {"current_steps": 12295, "total_steps": 38160, "loss": 0.4268, "lr": 0.0008570289131821025, "epoch": 6.44392033542977, "percentage": 32.22, "elapsed_time": "0:31:26", "remaining_time": "1:06:08", "throughput": 4263.06, "total_tokens": 8042720} {"current_steps": 12300, "total_steps": 38160, "loss": 0.4571, "lr": 0.0008568687760229963, "epoch": 6.446540880503145, "percentage": 32.23, "elapsed_time": "0:31:27", "remaining_time": "1:06:07", "throughput": 4263.08, "total_tokens": 8045792} {"current_steps": 12305, "total_steps": 38160, "loss": 0.4297, "lr": 0.0008567085642110135, "epoch": 6.44916142557652, "percentage": 32.25, "elapsed_time": "0:31:27", "remaining_time": "1:06:06", "throughput": 4263.02, "total_tokens": 8048512} {"current_steps": 12310, "total_steps": 38160, "loss": 0.4903, "lr": 0.0008565482777796687, "epoch": 6.451781970649895, "percentage": 32.26, "elapsed_time": "0:31:28", "remaining_time": "1:06:05", "throughput": 4262.95, "total_tokens": 8051168} {"current_steps": 12315, "total_steps": 38160, "loss": 0.4204, "lr": 0.0008563879167624919, "epoch": 6.45440251572327, "percentage": 32.27, "elapsed_time": "0:31:29", "remaining_time": "1:06:04", "throughput": 4262.76, "total_tokens": 8053376} {"current_steps": 12320, "total_steps": 38160, "loss": 0.5587, "lr": 0.0008562274811930287, "epoch": 6.4570230607966455, "percentage": 32.29, "elapsed_time": "0:31:29", "remaining_time": "1:06:03", "throughput": 4262.72, "total_tokens": 8056128} {"current_steps": 12325, "total_steps": 38160, "loss": 0.4942, "lr": 0.0008560669711048406, "epoch": 6.459643605870021, "percentage": 32.3, "elapsed_time": "0:31:30", "remaining_time": "1:06:02", "throughput": 4262.78, "total_tokens": 8059232} {"current_steps": 12330, "total_steps": 38160, "loss": 0.4686, "lr": 0.0008559063865315042, "epoch": 6.462264150943396, "percentage": 32.31, "elapsed_time": "0:31:31", "remaining_time": "1:06:02", "throughput": 4262.91, "total_tokens": 8062688} {"current_steps": 12335, "total_steps": 38160, "loss": 0.4893, "lr": 0.0008557457275066122, "epoch": 6.464884696016772, "percentage": 32.32, "elapsed_time": "0:31:32", "remaining_time": "1:06:01", "throughput": 4262.97, "total_tokens": 8065952} {"current_steps": 12340, "total_steps": 38160, "loss": 0.4974, "lr": 0.0008555849940637725, "epoch": 6.467505241090147, "percentage": 32.34, "elapsed_time": "0:31:32", "remaining_time": "1:06:00", "throughput": 4262.99, "total_tokens": 8068960} {"current_steps": 12345, "total_steps": 38160, "loss": 0.4267, "lr": 0.000855424186236609, "epoch": 6.470125786163522, "percentage": 32.35, "elapsed_time": "0:31:33", "remaining_time": "1:05:59", "throughput": 4262.97, "total_tokens": 8071776} {"current_steps": 12350, "total_steps": 38160, "loss": 0.5787, "lr": 0.0008552633040587605, "epoch": 6.472746331236897, "percentage": 32.36, "elapsed_time": "0:31:34", "remaining_time": "1:05:58", "throughput": 4262.75, "total_tokens": 8073856} {"current_steps": 12355, "total_steps": 38160, "loss": 0.5713, "lr": 0.0008551023475638819, "epoch": 6.4753668763102725, "percentage": 32.38, "elapsed_time": "0:31:34", "remaining_time": "1:05:57", "throughput": 4262.83, "total_tokens": 8077248} {"current_steps": 12360, "total_steps": 38160, "loss": 0.3526, "lr": 0.0008549413167856432, "epoch": 6.477987421383648, "percentage": 32.39, "elapsed_time": "0:31:35", "remaining_time": "1:05:56", "throughput": 4263.02, "total_tokens": 8080992} {"current_steps": 12365, "total_steps": 38160, "loss": 0.526, "lr": 0.0008547802117577307, "epoch": 6.480607966457023, "percentage": 32.4, "elapsed_time": "0:31:36", "remaining_time": "1:05:55", "throughput": 4263.06, "total_tokens": 8084096} {"current_steps": 12370, "total_steps": 38160, "loss": 0.5003, "lr": 0.0008546190325138454, "epoch": 6.483228511530398, "percentage": 32.42, "elapsed_time": "0:31:37", "remaining_time": "1:05:55", "throughput": 4263.08, "total_tokens": 8087072} {"current_steps": 12375, "total_steps": 38160, "loss": 0.4288, "lr": 0.000854457779087704, "epoch": 6.485849056603773, "percentage": 32.43, "elapsed_time": "0:31:37", "remaining_time": "1:05:54", "throughput": 4263.29, "total_tokens": 8090912} {"current_steps": 12380, "total_steps": 38160, "loss": 0.439, "lr": 0.0008542964515130392, "epoch": 6.488469601677149, "percentage": 32.44, "elapsed_time": "0:31:38", "remaining_time": "1:05:53", "throughput": 4263.18, "total_tokens": 8093408} {"current_steps": 12385, "total_steps": 38160, "loss": 0.455, "lr": 0.0008541350498235989, "epoch": 6.491090146750524, "percentage": 32.46, "elapsed_time": "0:31:39", "remaining_time": "1:05:52", "throughput": 4263.21, "total_tokens": 8096480} {"current_steps": 12390, "total_steps": 38160, "loss": 0.4421, "lr": 0.0008539735740531462, "epoch": 6.4937106918239, "percentage": 32.47, "elapsed_time": "0:31:39", "remaining_time": "1:05:51", "throughput": 4263.16, "total_tokens": 8099200} {"current_steps": 12395, "total_steps": 38160, "loss": 0.5148, "lr": 0.0008538120242354602, "epoch": 6.496331236897275, "percentage": 32.48, "elapsed_time": "0:31:40", "remaining_time": "1:05:50", "throughput": 4263.19, "total_tokens": 8102272} {"current_steps": 12400, "total_steps": 38160, "loss": 0.3485, "lr": 0.0008536504004043353, "epoch": 6.49895178197065, "percentage": 32.49, "elapsed_time": "0:31:41", "remaining_time": "1:05:49", "throughput": 4263.25, "total_tokens": 8105440} {"current_steps": 12405, "total_steps": 38160, "loss": 0.4898, "lr": 0.0008534887025935811, "epoch": 6.501572327044025, "percentage": 32.51, "elapsed_time": "0:31:41", "remaining_time": "1:05:48", "throughput": 4263.23, "total_tokens": 8108320} {"current_steps": 12410, "total_steps": 38160, "loss": 0.5698, "lr": 0.0008533269308370233, "epoch": 6.5041928721174, "percentage": 32.52, "elapsed_time": "0:31:42", "remaining_time": "1:05:47", "throughput": 4263.34, "total_tokens": 8111744} {"current_steps": 12415, "total_steps": 38160, "loss": 0.4451, "lr": 0.0008531650851685025, "epoch": 6.506813417190775, "percentage": 32.53, "elapsed_time": "0:31:43", "remaining_time": "1:05:47", "throughput": 4263.37, "total_tokens": 8114848} {"current_steps": 12420, "total_steps": 38160, "loss": 0.4037, "lr": 0.000853003165621875, "epoch": 6.509433962264151, "percentage": 32.55, "elapsed_time": "0:31:44", "remaining_time": "1:05:46", "throughput": 4263.29, "total_tokens": 8117504} {"current_steps": 12425, "total_steps": 38160, "loss": 0.3773, "lr": 0.0008528411722310126, "epoch": 6.512054507337526, "percentage": 32.56, "elapsed_time": "0:31:44", "remaining_time": "1:05:45", "throughput": 4263.54, "total_tokens": 8121344} {"current_steps": 12430, "total_steps": 38160, "loss": 0.5454, "lr": 0.0008526791050298022, "epoch": 6.514675052410902, "percentage": 32.57, "elapsed_time": "0:31:45", "remaining_time": "1:05:44", "throughput": 4263.53, "total_tokens": 8124288} {"current_steps": 12435, "total_steps": 38160, "loss": 0.4847, "lr": 0.0008525169640521467, "epoch": 6.517295597484277, "percentage": 32.59, "elapsed_time": "0:31:46", "remaining_time": "1:05:43", "throughput": 4263.61, "total_tokens": 8127552} {"current_steps": 12440, "total_steps": 38160, "loss": 0.5407, "lr": 0.0008523547493319641, "epoch": 6.519916142557652, "percentage": 32.6, "elapsed_time": "0:31:47", "remaining_time": "1:05:42", "throughput": 4263.8, "total_tokens": 8131264} {"current_steps": 12445, "total_steps": 38160, "loss": 0.4146, "lr": 0.0008521924609031877, "epoch": 6.522536687631027, "percentage": 32.61, "elapsed_time": "0:31:47", "remaining_time": "1:05:41", "throughput": 4263.86, "total_tokens": 8134432} {"current_steps": 12450, "total_steps": 38160, "loss": 0.5407, "lr": 0.0008520300987997667, "epoch": 6.5251572327044025, "percentage": 32.63, "elapsed_time": "0:31:48", "remaining_time": "1:05:41", "throughput": 4263.8, "total_tokens": 8137152} {"current_steps": 12455, "total_steps": 38160, "loss": 0.4049, "lr": 0.000851867663055665, "epoch": 6.527777777777778, "percentage": 32.64, "elapsed_time": "0:31:49", "remaining_time": "1:05:40", "throughput": 4263.88, "total_tokens": 8140512} {"current_steps": 12460, "total_steps": 38160, "loss": 0.5617, "lr": 0.0008517051537048625, "epoch": 6.530398322851153, "percentage": 32.65, "elapsed_time": "0:31:49", "remaining_time": "1:05:39", "throughput": 4264.06, "total_tokens": 8144160} {"current_steps": 12465, "total_steps": 38160, "loss": 0.3608, "lr": 0.0008515425707813544, "epoch": 6.533018867924528, "percentage": 32.67, "elapsed_time": "0:31:50", "remaining_time": "1:05:39", "throughput": 4264.58, "total_tokens": 8149184} {"current_steps": 12470, "total_steps": 38160, "loss": 0.6247, "lr": 0.0008513799143191512, "epoch": 6.535639412997903, "percentage": 32.68, "elapsed_time": "0:31:51", "remaining_time": "1:05:38", "throughput": 4264.61, "total_tokens": 8152224} {"current_steps": 12475, "total_steps": 38160, "loss": 0.4639, "lr": 0.0008512171843522786, "epoch": 6.538259958071279, "percentage": 32.69, "elapsed_time": "0:31:52", "remaining_time": "1:05:37", "throughput": 4264.64, "total_tokens": 8155232} {"current_steps": 12480, "total_steps": 38160, "loss": 0.426, "lr": 0.000851054380914778, "epoch": 6.540880503144654, "percentage": 32.7, "elapsed_time": "0:31:52", "remaining_time": "1:05:36", "throughput": 4264.49, "total_tokens": 8157536} {"current_steps": 12485, "total_steps": 38160, "loss": 0.4337, "lr": 0.0008508915040407057, "epoch": 6.54350104821803, "percentage": 32.72, "elapsed_time": "0:31:53", "remaining_time": "1:05:35", "throughput": 4264.34, "total_tokens": 8159872} {"current_steps": 12490, "total_steps": 38160, "loss": 0.4741, "lr": 0.0008507285537641342, "epoch": 6.546121593291405, "percentage": 32.73, "elapsed_time": "0:31:54", "remaining_time": "1:05:34", "throughput": 4264.59, "total_tokens": 8163872} {"current_steps": 12495, "total_steps": 38160, "loss": 0.4351, "lr": 0.0008505655301191504, "epoch": 6.54874213836478, "percentage": 32.74, "elapsed_time": "0:31:55", "remaining_time": "1:05:33", "throughput": 4264.69, "total_tokens": 8167168} {"current_steps": 12500, "total_steps": 38160, "loss": 0.3674, "lr": 0.0008504024331398572, "epoch": 6.551362683438155, "percentage": 32.76, "elapsed_time": "0:31:55", "remaining_time": "1:05:32", "throughput": 4264.91, "total_tokens": 8171040} {"current_steps": 12505, "total_steps": 38160, "loss": 0.3588, "lr": 0.0008502392628603727, "epoch": 6.55398322851153, "percentage": 32.77, "elapsed_time": "0:31:56", "remaining_time": "1:05:32", "throughput": 4265.0, "total_tokens": 8174336} {"current_steps": 12510, "total_steps": 38160, "loss": 0.4093, "lr": 0.0008500760193148301, "epoch": 6.556603773584905, "percentage": 32.78, "elapsed_time": "0:31:57", "remaining_time": "1:05:31", "throughput": 4265.24, "total_tokens": 8178144} {"current_steps": 12515, "total_steps": 38160, "loss": 0.4664, "lr": 0.0008499127025373781, "epoch": 6.559224318658281, "percentage": 32.8, "elapsed_time": "0:31:58", "remaining_time": "1:05:30", "throughput": 4265.38, "total_tokens": 8181664} {"current_steps": 12520, "total_steps": 38160, "loss": 0.6175, "lr": 0.0008497493125621807, "epoch": 6.561844863731656, "percentage": 32.81, "elapsed_time": "0:31:58", "remaining_time": "1:05:29", "throughput": 4265.55, "total_tokens": 8185344} {"current_steps": 12525, "total_steps": 38160, "loss": 0.4386, "lr": 0.0008495858494234173, "epoch": 6.564465408805032, "percentage": 32.82, "elapsed_time": "0:31:59", "remaining_time": "1:05:28", "throughput": 4265.42, "total_tokens": 8187840} {"current_steps": 12530, "total_steps": 38160, "loss": 0.3959, "lr": 0.0008494223131552825, "epoch": 6.567085953878407, "percentage": 32.84, "elapsed_time": "0:32:00", "remaining_time": "1:05:28", "throughput": 4265.6, "total_tokens": 8191520} {"current_steps": 12535, "total_steps": 38160, "loss": 0.3352, "lr": 0.0008492587037919864, "epoch": 6.569706498951782, "percentage": 32.85, "elapsed_time": "0:32:01", "remaining_time": "1:05:27", "throughput": 4265.74, "total_tokens": 8194976} {"current_steps": 12540, "total_steps": 38160, "loss": 0.4572, "lr": 0.0008490950213677537, "epoch": 6.572327044025157, "percentage": 32.86, "elapsed_time": "0:32:01", "remaining_time": "1:05:26", "throughput": 4265.68, "total_tokens": 8197600} {"current_steps": 12545, "total_steps": 38160, "loss": 0.4097, "lr": 0.0008489312659168254, "epoch": 6.5749475890985325, "percentage": 32.87, "elapsed_time": "0:32:02", "remaining_time": "1:05:25", "throughput": 4265.65, "total_tokens": 8200448} {"current_steps": 12550, "total_steps": 38160, "loss": 0.4976, "lr": 0.0008487674374734569, "epoch": 6.577568134171908, "percentage": 32.89, "elapsed_time": "0:32:03", "remaining_time": "1:05:24", "throughput": 4265.63, "total_tokens": 8203328} {"current_steps": 12555, "total_steps": 38160, "loss": 0.4853, "lr": 0.0008486035360719197, "epoch": 6.580188679245283, "percentage": 32.9, "elapsed_time": "0:32:04", "remaining_time": "1:05:24", "throughput": 4266.13, "total_tokens": 8208480} {"current_steps": 12560, "total_steps": 38160, "loss": 0.3859, "lr": 0.0008484395617464997, "epoch": 6.582809224318658, "percentage": 32.91, "elapsed_time": "0:32:04", "remaining_time": "1:05:23", "throughput": 4266.12, "total_tokens": 8211424} {"current_steps": 12565, "total_steps": 38160, "loss": 0.4486, "lr": 0.0008482755145314986, "epoch": 6.585429769392033, "percentage": 32.93, "elapsed_time": "0:32:05", "remaining_time": "1:05:22", "throughput": 4266.24, "total_tokens": 8214848} {"current_steps": 12570, "total_steps": 38160, "loss": 0.4242, "lr": 0.0008481113944612331, "epoch": 6.588050314465409, "percentage": 32.94, "elapsed_time": "0:32:06", "remaining_time": "1:05:21", "throughput": 4266.17, "total_tokens": 8217568} {"current_steps": 12575, "total_steps": 38160, "loss": 0.5092, "lr": 0.0008479472015700356, "epoch": 6.590670859538784, "percentage": 32.95, "elapsed_time": "0:32:06", "remaining_time": "1:05:20", "throughput": 4266.22, "total_tokens": 8220672} {"current_steps": 12580, "total_steps": 38160, "loss": 0.4371, "lr": 0.0008477829358922529, "epoch": 6.59329140461216, "percentage": 32.97, "elapsed_time": "0:32:07", "remaining_time": "1:05:19", "throughput": 4266.31, "total_tokens": 8224032} {"current_steps": 12585, "total_steps": 38160, "loss": 0.5699, "lr": 0.0008476185974622477, "epoch": 6.595911949685535, "percentage": 32.98, "elapsed_time": "0:32:08", "remaining_time": "1:05:19", "throughput": 4266.52, "total_tokens": 8227872} {"current_steps": 12590, "total_steps": 38160, "loss": 0.5244, "lr": 0.0008474541863143978, "epoch": 6.59853249475891, "percentage": 32.99, "elapsed_time": "0:32:09", "remaining_time": "1:05:18", "throughput": 4266.5, "total_tokens": 8230720} {"current_steps": 12595, "total_steps": 38160, "loss": 0.4564, "lr": 0.0008472897024830961, "epoch": 6.601153039832285, "percentage": 33.01, "elapsed_time": "0:32:09", "remaining_time": "1:05:17", "throughput": 4266.61, "total_tokens": 8234080} {"current_steps": 12600, "total_steps": 38160, "loss": 0.534, "lr": 0.0008471251460027508, "epoch": 6.60377358490566, "percentage": 33.02, "elapsed_time": "0:32:10", "remaining_time": "1:05:16", "throughput": 4266.73, "total_tokens": 8237568} {"current_steps": 12605, "total_steps": 38160, "loss": 0.4218, "lr": 0.0008469605169077852, "epoch": 6.606394129979035, "percentage": 33.03, "elapsed_time": "0:32:11", "remaining_time": "1:05:15", "throughput": 4266.72, "total_tokens": 8240544} {"current_steps": 12610, "total_steps": 38160, "loss": 0.4703, "lr": 0.0008467958152326377, "epoch": 6.609014675052411, "percentage": 33.05, "elapsed_time": "0:32:12", "remaining_time": "1:05:14", "throughput": 4266.7, "total_tokens": 8243488} {"current_steps": 12615, "total_steps": 38160, "loss": 0.4656, "lr": 0.0008466310410117622, "epoch": 6.611635220125786, "percentage": 33.06, "elapsed_time": "0:32:12", "remaining_time": "1:05:13", "throughput": 4266.65, "total_tokens": 8246208} {"current_steps": 12620, "total_steps": 38160, "loss": 0.5373, "lr": 0.0008464661942796275, "epoch": 6.614255765199162, "percentage": 33.07, "elapsed_time": "0:32:13", "remaining_time": "1:05:12", "throughput": 4266.79, "total_tokens": 8249728} {"current_steps": 12625, "total_steps": 38160, "loss": 0.5101, "lr": 0.0008463012750707175, "epoch": 6.616876310272537, "percentage": 33.08, "elapsed_time": "0:32:14", "remaining_time": "1:05:11", "throughput": 4266.73, "total_tokens": 8252512} {"current_steps": 12630, "total_steps": 38160, "loss": 0.4263, "lr": 0.0008461362834195316, "epoch": 6.619496855345912, "percentage": 33.1, "elapsed_time": "0:32:14", "remaining_time": "1:05:10", "throughput": 4266.64, "total_tokens": 8255136} {"current_steps": 12635, "total_steps": 38160, "loss": 0.8086, "lr": 0.0008459712193605842, "epoch": 6.622117400419287, "percentage": 33.11, "elapsed_time": "0:32:15", "remaining_time": "1:05:10", "throughput": 4266.65, "total_tokens": 8258112} {"current_steps": 12640, "total_steps": 38160, "loss": 0.5408, "lr": 0.0008458060829284048, "epoch": 6.6247379454926625, "percentage": 33.12, "elapsed_time": "0:32:16", "remaining_time": "1:05:09", "throughput": 4266.72, "total_tokens": 8261312} {"current_steps": 12645, "total_steps": 38160, "loss": 0.3626, "lr": 0.0008456408741575378, "epoch": 6.627358490566038, "percentage": 33.14, "elapsed_time": "0:32:16", "remaining_time": "1:05:08", "throughput": 4266.79, "total_tokens": 8264608} {"current_steps": 12650, "total_steps": 38160, "loss": 0.5325, "lr": 0.0008454755930825435, "epoch": 6.629979035639413, "percentage": 33.15, "elapsed_time": "0:32:17", "remaining_time": "1:05:07", "throughput": 4266.74, "total_tokens": 8267328} {"current_steps": 12655, "total_steps": 38160, "loss": 0.5578, "lr": 0.0008453102397379963, "epoch": 6.632599580712788, "percentage": 33.16, "elapsed_time": "0:32:18", "remaining_time": "1:05:06", "throughput": 4266.67, "total_tokens": 8269984} {"current_steps": 12660, "total_steps": 38160, "loss": 0.485, "lr": 0.0008451448141584868, "epoch": 6.635220125786163, "percentage": 33.18, "elapsed_time": "0:32:19", "remaining_time": "1:05:05", "throughput": 4266.8, "total_tokens": 8273472} {"current_steps": 12665, "total_steps": 38160, "loss": 0.4392, "lr": 0.0008449793163786194, "epoch": 6.637840670859539, "percentage": 33.19, "elapsed_time": "0:32:19", "remaining_time": "1:05:04", "throughput": 4266.77, "total_tokens": 8276320} {"current_steps": 12670, "total_steps": 38160, "loss": 0.5848, "lr": 0.0008448137464330149, "epoch": 6.640461215932914, "percentage": 33.2, "elapsed_time": "0:32:20", "remaining_time": "1:05:03", "throughput": 4266.76, "total_tokens": 8279200} {"current_steps": 12675, "total_steps": 38160, "loss": 0.5031, "lr": 0.0008446481043563086, "epoch": 6.6430817610062896, "percentage": 33.22, "elapsed_time": "0:32:21", "remaining_time": "1:05:02", "throughput": 4266.81, "total_tokens": 8282400} {"current_steps": 12680, "total_steps": 38160, "loss": 0.3477, "lr": 0.0008444823901831507, "epoch": 6.645702306079665, "percentage": 33.23, "elapsed_time": "0:32:21", "remaining_time": "1:05:02", "throughput": 4266.9, "total_tokens": 8285728} {"current_steps": 12685, "total_steps": 38160, "loss": 0.3524, "lr": 0.0008443166039482067, "epoch": 6.64832285115304, "percentage": 33.24, "elapsed_time": "0:32:22", "remaining_time": "1:05:01", "throughput": 4266.91, "total_tokens": 8288704} {"current_steps": 12690, "total_steps": 38160, "loss": 0.4862, "lr": 0.0008441507456861575, "epoch": 6.650943396226415, "percentage": 33.25, "elapsed_time": "0:32:23", "remaining_time": "1:05:00", "throughput": 4266.96, "total_tokens": 8291904} {"current_steps": 12695, "total_steps": 38160, "loss": 0.4708, "lr": 0.0008439848154316985, "epoch": 6.65356394129979, "percentage": 33.27, "elapsed_time": "0:32:24", "remaining_time": "1:04:59", "throughput": 4267.12, "total_tokens": 8295488} {"current_steps": 12700, "total_steps": 38160, "loss": 0.4571, "lr": 0.0008438188132195406, "epoch": 6.656184486373165, "percentage": 33.28, "elapsed_time": "0:32:24", "remaining_time": "1:04:58", "throughput": 4267.23, "total_tokens": 8298784} {"current_steps": 12705, "total_steps": 38160, "loss": 0.4955, "lr": 0.0008436527390844094, "epoch": 6.658805031446541, "percentage": 33.29, "elapsed_time": "0:32:25", "remaining_time": "1:04:57", "throughput": 4267.15, "total_tokens": 8301376} {"current_steps": 12710, "total_steps": 38160, "loss": 0.6671, "lr": 0.0008434865930610458, "epoch": 6.661425576519916, "percentage": 33.31, "elapsed_time": "0:32:26", "remaining_time": "1:04:56", "throughput": 4267.2, "total_tokens": 8304544} {"current_steps": 12715, "total_steps": 38160, "loss": 0.5489, "lr": 0.0008433203751842057, "epoch": 6.664046121593291, "percentage": 33.32, "elapsed_time": "0:32:26", "remaining_time": "1:04:55", "throughput": 4267.14, "total_tokens": 8307232} {"current_steps": 12720, "total_steps": 38160, "loss": 0.5288, "lr": 0.0008431540854886598, "epoch": 6.666666666666667, "percentage": 33.33, "elapsed_time": "0:32:27", "remaining_time": "1:04:55", "throughput": 4267.27, "total_tokens": 8310816} {"current_steps": 12725, "total_steps": 38160, "loss": 0.4737, "lr": 0.0008429877240091941, "epoch": 6.669287211740042, "percentage": 33.35, "elapsed_time": "0:32:28", "remaining_time": "1:04:54", "throughput": 4267.26, "total_tokens": 8313632} {"current_steps": 12730, "total_steps": 38160, "loss": 0.3869, "lr": 0.0008428212907806097, "epoch": 6.671907756813417, "percentage": 33.36, "elapsed_time": "0:32:28", "remaining_time": "1:04:53", "throughput": 4267.22, "total_tokens": 8316416} {"current_steps": 12735, "total_steps": 38160, "loss": 0.4943, "lr": 0.0008426547858377222, "epoch": 6.6745283018867925, "percentage": 33.37, "elapsed_time": "0:32:29", "remaining_time": "1:04:52", "throughput": 4267.6, "total_tokens": 8321056} {"current_steps": 12740, "total_steps": 38160, "loss": 0.3601, "lr": 0.0008424882092153629, "epoch": 6.677148846960168, "percentage": 33.39, "elapsed_time": "0:32:30", "remaining_time": "1:04:51", "throughput": 4267.6, "total_tokens": 8324064} {"current_steps": 12745, "total_steps": 38160, "loss": 0.519, "lr": 0.0008423215609483774, "epoch": 6.679769392033543, "percentage": 33.4, "elapsed_time": "0:32:31", "remaining_time": "1:04:50", "throughput": 4267.5, "total_tokens": 8326592} {"current_steps": 12750, "total_steps": 38160, "loss": 0.3981, "lr": 0.0008421548410716269, "epoch": 6.682389937106918, "percentage": 33.41, "elapsed_time": "0:32:31", "remaining_time": "1:04:49", "throughput": 4267.37, "total_tokens": 8328992} {"current_steps": 12755, "total_steps": 38160, "loss": 0.5012, "lr": 0.0008419880496199869, "epoch": 6.685010482180293, "percentage": 33.43, "elapsed_time": "0:32:32", "remaining_time": "1:04:49", "throughput": 4267.49, "total_tokens": 8332448} {"current_steps": 12760, "total_steps": 38160, "loss": 0.4498, "lr": 0.0008418211866283488, "epoch": 6.687631027253669, "percentage": 33.44, "elapsed_time": "0:32:33", "remaining_time": "1:04:48", "throughput": 4267.45, "total_tokens": 8335136} {"current_steps": 12765, "total_steps": 38160, "loss": 0.5852, "lr": 0.0008416542521316182, "epoch": 6.690251572327044, "percentage": 33.45, "elapsed_time": "0:32:33", "remaining_time": "1:04:47", "throughput": 4267.6, "total_tokens": 8338688} {"current_steps": 12770, "total_steps": 38160, "loss": 0.5659, "lr": 0.0008414872461647156, "epoch": 6.6928721174004195, "percentage": 33.46, "elapsed_time": "0:32:34", "remaining_time": "1:04:46", "throughput": 4267.74, "total_tokens": 8342208} {"current_steps": 12775, "total_steps": 38160, "loss": 0.455, "lr": 0.0008413201687625772, "epoch": 6.695492662473795, "percentage": 33.48, "elapsed_time": "0:32:35", "remaining_time": "1:04:45", "throughput": 4267.75, "total_tokens": 8345088} {"current_steps": 12780, "total_steps": 38160, "loss": 0.4646, "lr": 0.0008411530199601534, "epoch": 6.69811320754717, "percentage": 33.49, "elapsed_time": "0:32:36", "remaining_time": "1:04:44", "throughput": 4267.81, "total_tokens": 8348192} {"current_steps": 12785, "total_steps": 38160, "loss": 0.4273, "lr": 0.0008409857997924097, "epoch": 6.700733752620545, "percentage": 33.5, "elapsed_time": "0:32:36", "remaining_time": "1:04:43", "throughput": 4267.9, "total_tokens": 8351488} {"current_steps": 12790, "total_steps": 38160, "loss": 0.4284, "lr": 0.0008408185082943271, "epoch": 6.70335429769392, "percentage": 33.52, "elapsed_time": "0:32:37", "remaining_time": "1:04:42", "throughput": 4267.77, "total_tokens": 8353856} {"current_steps": 12795, "total_steps": 38160, "loss": 0.3141, "lr": 0.0008406511455009007, "epoch": 6.705974842767295, "percentage": 33.53, "elapsed_time": "0:32:38", "remaining_time": "1:04:41", "throughput": 4267.95, "total_tokens": 8357568} {"current_steps": 12800, "total_steps": 38160, "loss": 0.4492, "lr": 0.000840483711447141, "epoch": 6.7085953878406706, "percentage": 33.54, "elapsed_time": "0:32:38", "remaining_time": "1:04:40", "throughput": 4267.78, "total_tokens": 8359808} {"current_steps": 12805, "total_steps": 38160, "loss": 0.369, "lr": 0.0008403162061680736, "epoch": 6.711215932914046, "percentage": 33.56, "elapsed_time": "0:32:39", "remaining_time": "1:04:40", "throughput": 4267.92, "total_tokens": 8363424} {"current_steps": 12810, "total_steps": 38160, "loss": 0.4346, "lr": 0.0008401486296987382, "epoch": 6.713836477987421, "percentage": 33.57, "elapsed_time": "0:32:40", "remaining_time": "1:04:39", "throughput": 4267.75, "total_tokens": 8365696} {"current_steps": 12815, "total_steps": 38160, "loss": 0.4805, "lr": 0.0008399809820741901, "epoch": 6.716457023060797, "percentage": 33.58, "elapsed_time": "0:32:41", "remaining_time": "1:04:38", "throughput": 4268.14, "total_tokens": 8370240} {"current_steps": 12820, "total_steps": 38160, "loss": 0.4243, "lr": 0.0008398132633294993, "epoch": 6.719077568134172, "percentage": 33.6, "elapsed_time": "0:32:42", "remaining_time": "1:04:38", "throughput": 4269.09, "total_tokens": 8377792} {"current_steps": 12825, "total_steps": 38160, "loss": 0.4334, "lr": 0.0008396454734997506, "epoch": 6.721698113207547, "percentage": 33.61, "elapsed_time": "0:32:43", "remaining_time": "1:04:37", "throughput": 4269.03, "total_tokens": 8380448} {"current_steps": 12830, "total_steps": 38160, "loss": 0.3984, "lr": 0.0008394776126200436, "epoch": 6.7243186582809225, "percentage": 33.62, "elapsed_time": "0:32:44", "remaining_time": "1:04:37", "throughput": 4269.44, "total_tokens": 8385248} {"current_steps": 12835, "total_steps": 38160, "loss": 0.3701, "lr": 0.0008393096807254931, "epoch": 6.726939203354298, "percentage": 33.63, "elapsed_time": "0:32:44", "remaining_time": "1:04:36", "throughput": 4269.4, "total_tokens": 8387968} {"current_steps": 12840, "total_steps": 38160, "loss": 0.4932, "lr": 0.0008391416778512284, "epoch": 6.729559748427673, "percentage": 33.65, "elapsed_time": "0:32:45", "remaining_time": "1:04:35", "throughput": 4269.44, "total_tokens": 8391008} {"current_steps": 12845, "total_steps": 38160, "loss": 0.5, "lr": 0.0008389736040323939, "epoch": 6.732180293501048, "percentage": 33.66, "elapsed_time": "0:32:46", "remaining_time": "1:04:34", "throughput": 4269.69, "total_tokens": 8395008} {"current_steps": 12850, "total_steps": 38160, "loss": 0.4612, "lr": 0.0008388054593041485, "epoch": 6.734800838574423, "percentage": 33.67, "elapsed_time": "0:32:46", "remaining_time": "1:04:33", "throughput": 4269.56, "total_tokens": 8397376} {"current_steps": 12855, "total_steps": 38160, "loss": 0.3939, "lr": 0.0008386372437016665, "epoch": 6.737421383647799, "percentage": 33.69, "elapsed_time": "0:32:47", "remaining_time": "1:04:33", "throughput": 4269.66, "total_tokens": 8400704} {"current_steps": 12860, "total_steps": 38160, "loss": 0.5059, "lr": 0.0008384689572601364, "epoch": 6.740041928721174, "percentage": 33.7, "elapsed_time": "0:32:48", "remaining_time": "1:04:32", "throughput": 4269.81, "total_tokens": 8404384} {"current_steps": 12865, "total_steps": 38160, "loss": 0.5303, "lr": 0.000838300600014762, "epoch": 6.7426624737945495, "percentage": 33.71, "elapsed_time": "0:32:48", "remaining_time": "1:04:31", "throughput": 4269.75, "total_tokens": 8407072} {"current_steps": 12870, "total_steps": 38160, "loss": 0.4351, "lr": 0.0008381321720007613, "epoch": 6.745283018867925, "percentage": 33.73, "elapsed_time": "0:32:49", "remaining_time": "1:04:30", "throughput": 4269.92, "total_tokens": 8410816} {"current_steps": 12875, "total_steps": 38160, "loss": 0.4234, "lr": 0.0008379636732533681, "epoch": 6.7479035639413, "percentage": 33.74, "elapsed_time": "0:32:50", "remaining_time": "1:04:29", "throughput": 4269.9, "total_tokens": 8413632} {"current_steps": 12880, "total_steps": 38160, "loss": 0.4237, "lr": 0.0008377951038078302, "epoch": 6.750524109014675, "percentage": 33.75, "elapsed_time": "0:32:51", "remaining_time": "1:04:28", "throughput": 4269.94, "total_tokens": 8416864} {"current_steps": 12885, "total_steps": 38160, "loss": 0.5016, "lr": 0.0008376264636994102, "epoch": 6.75314465408805, "percentage": 33.77, "elapsed_time": "0:32:51", "remaining_time": "1:04:28", "throughput": 4270.19, "total_tokens": 8420800} {"current_steps": 12890, "total_steps": 38160, "loss": 0.378, "lr": 0.000837457752963386, "epoch": 6.755765199161425, "percentage": 33.78, "elapsed_time": "0:32:52", "remaining_time": "1:04:27", "throughput": 4270.13, "total_tokens": 8423520} {"current_steps": 12895, "total_steps": 38160, "loss": 0.5011, "lr": 0.0008372889716350496, "epoch": 6.7583857442348005, "percentage": 33.79, "elapsed_time": "0:32:53", "remaining_time": "1:04:26", "throughput": 4270.14, "total_tokens": 8426496} {"current_steps": 12900, "total_steps": 38160, "loss": 0.4165, "lr": 0.0008371201197497084, "epoch": 6.761006289308176, "percentage": 33.81, "elapsed_time": "0:32:54", "remaining_time": "1:04:25", "throughput": 4270.27, "total_tokens": 8430048} {"current_steps": 12905, "total_steps": 38160, "loss": 0.5303, "lr": 0.0008369511973426842, "epoch": 6.763626834381551, "percentage": 33.82, "elapsed_time": "0:32:54", "remaining_time": "1:04:24", "throughput": 4270.27, "total_tokens": 8432960} {"current_steps": 12910, "total_steps": 38160, "loss": 0.438, "lr": 0.0008367822044493138, "epoch": 6.766247379454927, "percentage": 33.83, "elapsed_time": "0:32:55", "remaining_time": "1:04:23", "throughput": 4270.43, "total_tokens": 8436544} {"current_steps": 12915, "total_steps": 38160, "loss": 0.3973, "lr": 0.0008366131411049483, "epoch": 6.768867924528302, "percentage": 33.84, "elapsed_time": "0:32:56", "remaining_time": "1:04:23", "throughput": 4270.5, "total_tokens": 8439840} {"current_steps": 12920, "total_steps": 38160, "loss": 0.3551, "lr": 0.000836444007344954, "epoch": 6.771488469601677, "percentage": 33.86, "elapsed_time": "0:32:57", "remaining_time": "1:04:22", "throughput": 4270.57, "total_tokens": 8443104} {"current_steps": 12925, "total_steps": 38160, "loss": 0.4947, "lr": 0.0008362748032047119, "epoch": 6.774109014675052, "percentage": 33.87, "elapsed_time": "0:32:57", "remaining_time": "1:04:21", "throughput": 4270.66, "total_tokens": 8446528} {"current_steps": 12930, "total_steps": 38160, "loss": 0.3979, "lr": 0.0008361055287196171, "epoch": 6.776729559748428, "percentage": 33.88, "elapsed_time": "0:32:58", "remaining_time": "1:04:20", "throughput": 4270.55, "total_tokens": 8449024} {"current_steps": 12935, "total_steps": 38160, "loss": 0.453, "lr": 0.0008359361839250803, "epoch": 6.779350104821803, "percentage": 33.9, "elapsed_time": "0:32:59", "remaining_time": "1:04:19", "throughput": 4270.82, "total_tokens": 8453184} {"current_steps": 12940, "total_steps": 38160, "loss": 0.4247, "lr": 0.0008357667688565265, "epoch": 6.781970649895178, "percentage": 33.91, "elapsed_time": "0:32:59", "remaining_time": "1:04:18", "throughput": 4270.75, "total_tokens": 8455776} {"current_steps": 12945, "total_steps": 38160, "loss": 0.4501, "lr": 0.0008355972835493951, "epoch": 6.784591194968553, "percentage": 33.92, "elapsed_time": "0:33:00", "remaining_time": "1:04:17", "throughput": 4270.68, "total_tokens": 8458528} {"current_steps": 12950, "total_steps": 38160, "loss": 0.4506, "lr": 0.0008354277280391408, "epoch": 6.787211740041929, "percentage": 33.94, "elapsed_time": "0:33:01", "remaining_time": "1:04:17", "throughput": 4270.88, "total_tokens": 8462240} {"current_steps": 12955, "total_steps": 38160, "loss": 0.5828, "lr": 0.0008352581023612324, "epoch": 6.789832285115304, "percentage": 33.95, "elapsed_time": "0:33:02", "remaining_time": "1:04:16", "throughput": 4270.97, "total_tokens": 8465568} {"current_steps": 12960, "total_steps": 38160, "loss": 0.4564, "lr": 0.0008350884065511541, "epoch": 6.7924528301886795, "percentage": 33.96, "elapsed_time": "0:33:02", "remaining_time": "1:04:15", "throughput": 4270.95, "total_tokens": 8468384} {"current_steps": 12965, "total_steps": 38160, "loss": 0.4886, "lr": 0.0008349186406444038, "epoch": 6.795073375262055, "percentage": 33.98, "elapsed_time": "0:33:03", "remaining_time": "1:04:14", "throughput": 4270.93, "total_tokens": 8471232} {"current_steps": 12970, "total_steps": 38160, "loss": 0.4386, "lr": 0.0008347488046764949, "epoch": 6.79769392033543, "percentage": 33.99, "elapsed_time": "0:33:04", "remaining_time": "1:04:13", "throughput": 4271.02, "total_tokens": 8474624} {"current_steps": 12975, "total_steps": 38160, "loss": 0.4101, "lr": 0.0008345788986829551, "epoch": 6.800314465408805, "percentage": 34.0, "elapsed_time": "0:33:04", "remaining_time": "1:04:12", "throughput": 4271.19, "total_tokens": 8478240} {"current_steps": 12980, "total_steps": 38160, "loss": 0.3734, "lr": 0.0008344089226993268, "epoch": 6.80293501048218, "percentage": 34.01, "elapsed_time": "0:33:05", "remaining_time": "1:04:12", "throughput": 4271.22, "total_tokens": 8481408} {"current_steps": 12985, "total_steps": 38160, "loss": 0.4287, "lr": 0.000834238876761167, "epoch": 6.805555555555555, "percentage": 34.03, "elapsed_time": "0:33:06", "remaining_time": "1:04:11", "throughput": 4271.31, "total_tokens": 8484672} {"current_steps": 12990, "total_steps": 38160, "loss": 0.3833, "lr": 0.0008340687609040473, "epoch": 6.8081761006289305, "percentage": 34.04, "elapsed_time": "0:33:07", "remaining_time": "1:04:10", "throughput": 4271.39, "total_tokens": 8488032} {"current_steps": 12995, "total_steps": 38160, "loss": 0.366, "lr": 0.0008338985751635542, "epoch": 6.810796645702306, "percentage": 34.05, "elapsed_time": "0:33:07", "remaining_time": "1:04:09", "throughput": 4271.56, "total_tokens": 8491648} {"current_steps": 13000, "total_steps": 38160, "loss": 0.5727, "lr": 0.0008337283195752883, "epoch": 6.813417190775681, "percentage": 34.07, "elapsed_time": "0:33:08", "remaining_time": "1:04:08", "throughput": 4271.5, "total_tokens": 8494336} {"current_steps": 13005, "total_steps": 38160, "loss": 0.3979, "lr": 0.0008335579941748654, "epoch": 6.816037735849057, "percentage": 34.08, "elapsed_time": "0:33:09", "remaining_time": "1:04:07", "throughput": 4271.64, "total_tokens": 8497888} {"current_steps": 13010, "total_steps": 38160, "loss": 0.4999, "lr": 0.0008333875989979156, "epoch": 6.818658280922432, "percentage": 34.09, "elapsed_time": "0:33:10", "remaining_time": "1:04:07", "throughput": 4271.6, "total_tokens": 8500704} {"current_steps": 13015, "total_steps": 38160, "loss": 0.587, "lr": 0.0008332171340800835, "epoch": 6.821278825995807, "percentage": 34.11, "elapsed_time": "0:33:10", "remaining_time": "1:04:06", "throughput": 4271.64, "total_tokens": 8503872} {"current_steps": 13020, "total_steps": 38160, "loss": 0.5176, "lr": 0.0008330465994570287, "epoch": 6.823899371069182, "percentage": 34.12, "elapsed_time": "0:33:11", "remaining_time": "1:04:05", "throughput": 4271.62, "total_tokens": 8506816} {"current_steps": 13025, "total_steps": 38160, "loss": 0.5645, "lr": 0.0008328759951644247, "epoch": 6.826519916142558, "percentage": 34.13, "elapsed_time": "0:33:12", "remaining_time": "1:04:04", "throughput": 4271.73, "total_tokens": 8510272} {"current_steps": 13030, "total_steps": 38160, "loss": 0.5247, "lr": 0.0008327053212379603, "epoch": 6.829140461215933, "percentage": 34.15, "elapsed_time": "0:33:13", "remaining_time": "1:04:03", "throughput": 4272.12, "total_tokens": 8514784} {"current_steps": 13035, "total_steps": 38160, "loss": 0.4952, "lr": 0.0008325345777133382, "epoch": 6.831761006289308, "percentage": 34.16, "elapsed_time": "0:33:13", "remaining_time": "1:04:03", "throughput": 4272.12, "total_tokens": 8517728} {"current_steps": 13040, "total_steps": 38160, "loss": 0.4174, "lr": 0.0008323637646262763, "epoch": 6.834381551362683, "percentage": 34.17, "elapsed_time": "0:33:14", "remaining_time": "1:04:02", "throughput": 4272.09, "total_tokens": 8520608} {"current_steps": 13045, "total_steps": 38160, "loss": 0.5401, "lr": 0.0008321928820125067, "epoch": 6.837002096436059, "percentage": 34.19, "elapsed_time": "0:33:15", "remaining_time": "1:04:01", "throughput": 4272.06, "total_tokens": 8523360} {"current_steps": 13050, "total_steps": 38160, "loss": 0.4711, "lr": 0.000832021929907776, "epoch": 6.839622641509434, "percentage": 34.2, "elapsed_time": "0:33:15", "remaining_time": "1:04:00", "throughput": 4272.19, "total_tokens": 8526976} {"current_steps": 13055, "total_steps": 38160, "loss": 0.5583, "lr": 0.0008318509083478454, "epoch": 6.8422431865828095, "percentage": 34.21, "elapsed_time": "0:33:16", "remaining_time": "1:03:59", "throughput": 4272.34, "total_tokens": 8530624} {"current_steps": 13060, "total_steps": 38160, "loss": 0.4108, "lr": 0.0008316798173684907, "epoch": 6.844863731656185, "percentage": 34.22, "elapsed_time": "0:33:17", "remaining_time": "1:03:59", "throughput": 4272.74, "total_tokens": 8535424} {"current_steps": 13065, "total_steps": 38160, "loss": 0.4234, "lr": 0.0008315086570055024, "epoch": 6.84748427672956, "percentage": 34.24, "elapsed_time": "0:33:18", "remaining_time": "1:03:58", "throughput": 4272.67, "total_tokens": 8538112} {"current_steps": 13070, "total_steps": 38160, "loss": 0.6007, "lr": 0.000831337427294685, "epoch": 6.850104821802935, "percentage": 34.25, "elapsed_time": "0:33:19", "remaining_time": "1:03:57", "throughput": 4272.79, "total_tokens": 8541696} {"current_steps": 13075, "total_steps": 38160, "loss": 0.4002, "lr": 0.0008311661282718579, "epoch": 6.85272536687631, "percentage": 34.26, "elapsed_time": "0:33:19", "remaining_time": "1:03:56", "throughput": 4272.85, "total_tokens": 8544832} {"current_steps": 13080, "total_steps": 38160, "loss": 0.471, "lr": 0.0008309947599728549, "epoch": 6.855345911949685, "percentage": 34.28, "elapsed_time": "0:33:20", "remaining_time": "1:03:55", "throughput": 4272.73, "total_tokens": 8547328} {"current_steps": 13085, "total_steps": 38160, "loss": 0.3947, "lr": 0.0008308233224335243, "epoch": 6.8579664570230605, "percentage": 34.29, "elapsed_time": "0:33:21", "remaining_time": "1:03:54", "throughput": 4272.8, "total_tokens": 8550592} {"current_steps": 13090, "total_steps": 38160, "loss": 0.4411, "lr": 0.0008306518156897289, "epoch": 6.860587002096436, "percentage": 34.3, "elapsed_time": "0:33:21", "remaining_time": "1:03:53", "throughput": 4272.77, "total_tokens": 8553408} {"current_steps": 13095, "total_steps": 38160, "loss": 0.487, "lr": 0.0008304802397773459, "epoch": 6.863207547169811, "percentage": 34.32, "elapsed_time": "0:33:22", "remaining_time": "1:03:53", "throughput": 4272.86, "total_tokens": 8556768} {"current_steps": 13100, "total_steps": 38160, "loss": 0.4347, "lr": 0.0008303085947322672, "epoch": 6.865828092243187, "percentage": 34.33, "elapsed_time": "0:33:23", "remaining_time": "1:03:52", "throughput": 4273.03, "total_tokens": 8560416} {"current_steps": 13105, "total_steps": 38160, "loss": 0.4715, "lr": 0.0008301368805903988, "epoch": 6.868448637316562, "percentage": 34.34, "elapsed_time": "0:33:24", "remaining_time": "1:03:51", "throughput": 4273.03, "total_tokens": 8563424} {"current_steps": 13110, "total_steps": 38160, "loss": 0.3709, "lr": 0.0008299650973876611, "epoch": 6.871069182389937, "percentage": 34.36, "elapsed_time": "0:33:24", "remaining_time": "1:03:50", "throughput": 4273.08, "total_tokens": 8566560} {"current_steps": 13115, "total_steps": 38160, "loss": 0.3944, "lr": 0.0008297932451599898, "epoch": 6.873689727463312, "percentage": 34.37, "elapsed_time": "0:33:25", "remaining_time": "1:03:49", "throughput": 4273.19, "total_tokens": 8570080} {"current_steps": 13120, "total_steps": 38160, "loss": 0.5727, "lr": 0.0008296213239433339, "epoch": 6.876310272536688, "percentage": 34.38, "elapsed_time": "0:33:26", "remaining_time": "1:03:48", "throughput": 4273.12, "total_tokens": 8572704} {"current_steps": 13125, "total_steps": 38160, "loss": 0.549, "lr": 0.0008294493337736577, "epoch": 6.878930817610063, "percentage": 34.39, "elapsed_time": "0:33:26", "remaining_time": "1:03:48", "throughput": 4273.15, "total_tokens": 8575872} {"current_steps": 13130, "total_steps": 38160, "loss": 0.4289, "lr": 0.0008292772746869392, "epoch": 6.881551362683438, "percentage": 34.41, "elapsed_time": "0:33:27", "remaining_time": "1:03:47", "throughput": 4273.27, "total_tokens": 8579392} {"current_steps": 13135, "total_steps": 38160, "loss": 0.5037, "lr": 0.0008291051467191717, "epoch": 6.884171907756813, "percentage": 34.42, "elapsed_time": "0:33:28", "remaining_time": "1:03:46", "throughput": 4273.21, "total_tokens": 8582144} {"current_steps": 13140, "total_steps": 38160, "loss": 0.3473, "lr": 0.000828932949906362, "epoch": 6.886792452830189, "percentage": 34.43, "elapsed_time": "0:33:29", "remaining_time": "1:03:45", "throughput": 4273.24, "total_tokens": 8585184} {"current_steps": 13145, "total_steps": 38160, "loss": 0.7568, "lr": 0.0008287606842845319, "epoch": 6.889412997903564, "percentage": 34.45, "elapsed_time": "0:33:29", "remaining_time": "1:03:44", "throughput": 4273.22, "total_tokens": 8588128} {"current_steps": 13150, "total_steps": 38160, "loss": 0.4803, "lr": 0.0008285883498897174, "epoch": 6.8920335429769395, "percentage": 34.46, "elapsed_time": "0:33:30", "remaining_time": "1:03:43", "throughput": 4273.2, "total_tokens": 8591008} {"current_steps": 13155, "total_steps": 38160, "loss": 0.614, "lr": 0.0008284159467579686, "epoch": 6.894654088050315, "percentage": 34.47, "elapsed_time": "0:33:31", "remaining_time": "1:03:42", "throughput": 4273.36, "total_tokens": 8594592} {"current_steps": 13160, "total_steps": 38160, "loss": 0.6831, "lr": 0.0008282434749253507, "epoch": 6.89727463312369, "percentage": 34.49, "elapsed_time": "0:33:31", "remaining_time": "1:03:42", "throughput": 4273.5, "total_tokens": 8598112} {"current_steps": 13165, "total_steps": 38160, "loss": 0.5119, "lr": 0.0008280709344279426, "epoch": 6.899895178197065, "percentage": 34.5, "elapsed_time": "0:33:32", "remaining_time": "1:03:41", "throughput": 4273.76, "total_tokens": 8602272} {"current_steps": 13170, "total_steps": 38160, "loss": 0.3943, "lr": 0.0008278983253018377, "epoch": 6.90251572327044, "percentage": 34.51, "elapsed_time": "0:33:33", "remaining_time": "1:03:40", "throughput": 4273.89, "total_tokens": 8605760} {"current_steps": 13175, "total_steps": 38160, "loss": 0.408, "lr": 0.0008277256475831443, "epoch": 6.905136268343815, "percentage": 34.53, "elapsed_time": "0:33:34", "remaining_time": "1:03:39", "throughput": 4273.97, "total_tokens": 8609056} {"current_steps": 13180, "total_steps": 38160, "loss": 0.541, "lr": 0.0008275529013079841, "epoch": 6.9077568134171905, "percentage": 34.54, "elapsed_time": "0:33:35", "remaining_time": "1:03:39", "throughput": 4274.07, "total_tokens": 8612480} {"current_steps": 13185, "total_steps": 38160, "loss": 0.3311, "lr": 0.0008273800865124941, "epoch": 6.910377358490566, "percentage": 34.55, "elapsed_time": "0:33:35", "remaining_time": "1:03:38", "throughput": 4274.11, "total_tokens": 8615584} {"current_steps": 13190, "total_steps": 38160, "loss": 0.4079, "lr": 0.0008272072032328246, "epoch": 6.912997903563941, "percentage": 34.56, "elapsed_time": "0:33:36", "remaining_time": "1:03:37", "throughput": 4274.16, "total_tokens": 8618816} {"current_steps": 13195, "total_steps": 38160, "loss": 0.4603, "lr": 0.0008270342515051414, "epoch": 6.915618448637317, "percentage": 34.58, "elapsed_time": "0:33:37", "remaining_time": "1:03:36", "throughput": 4274.24, "total_tokens": 8622176} {"current_steps": 13200, "total_steps": 38160, "loss": 0.4483, "lr": 0.0008268612313656238, "epoch": 6.918238993710692, "percentage": 34.59, "elapsed_time": "0:33:38", "remaining_time": "1:03:35", "throughput": 4274.42, "total_tokens": 8625984} {"current_steps": 13205, "total_steps": 38160, "loss": 0.6036, "lr": 0.0008266881428504655, "epoch": 6.920859538784067, "percentage": 34.6, "elapsed_time": "0:33:38", "remaining_time": "1:03:35", "throughput": 4274.44, "total_tokens": 8629056} {"current_steps": 13210, "total_steps": 38160, "loss": 0.4053, "lr": 0.000826514985995875, "epoch": 6.923480083857442, "percentage": 34.62, "elapsed_time": "0:33:39", "remaining_time": "1:03:34", "throughput": 4274.74, "total_tokens": 8633312} {"current_steps": 13215, "total_steps": 38160, "loss": 0.5571, "lr": 0.0008263417608380743, "epoch": 6.926100628930818, "percentage": 34.63, "elapsed_time": "0:33:40", "remaining_time": "1:03:33", "throughput": 4274.98, "total_tokens": 8637376} {"current_steps": 13220, "total_steps": 38160, "loss": 0.4371, "lr": 0.0008261684674133003, "epoch": 6.928721174004193, "percentage": 34.64, "elapsed_time": "0:33:41", "remaining_time": "1:03:32", "throughput": 4275.05, "total_tokens": 8640544} {"current_steps": 13225, "total_steps": 38160, "loss": 0.5609, "lr": 0.0008259951057578041, "epoch": 6.931341719077568, "percentage": 34.66, "elapsed_time": "0:33:41", "remaining_time": "1:03:32", "throughput": 4275.17, "total_tokens": 8644032} {"current_steps": 13230, "total_steps": 38160, "loss": 0.384, "lr": 0.000825821675907851, "epoch": 6.933962264150943, "percentage": 34.67, "elapsed_time": "0:33:42", "remaining_time": "1:03:31", "throughput": 4275.04, "total_tokens": 8646432} {"current_steps": 13235, "total_steps": 38160, "loss": 0.4962, "lr": 0.0008256481778997205, "epoch": 6.936582809224319, "percentage": 34.68, "elapsed_time": "0:33:43", "remaining_time": "1:03:30", "throughput": 4275.05, "total_tokens": 8649472} {"current_steps": 13240, "total_steps": 38160, "loss": 0.4478, "lr": 0.0008254746117697062, "epoch": 6.939203354297694, "percentage": 34.7, "elapsed_time": "0:33:43", "remaining_time": "1:03:29", "throughput": 4275.16, "total_tokens": 8652864} {"current_steps": 13245, "total_steps": 38160, "loss": 0.4661, "lr": 0.0008253009775541165, "epoch": 6.9418238993710695, "percentage": 34.71, "elapsed_time": "0:33:44", "remaining_time": "1:03:28", "throughput": 4275.42, "total_tokens": 8657024} {"current_steps": 13250, "total_steps": 38160, "loss": 0.4481, "lr": 0.0008251272752892733, "epoch": 6.944444444444445, "percentage": 34.72, "elapsed_time": "0:33:45", "remaining_time": "1:03:27", "throughput": 4275.4, "total_tokens": 8659872} {"current_steps": 13255, "total_steps": 38160, "loss": 0.4459, "lr": 0.0008249535050115135, "epoch": 6.94706498951782, "percentage": 34.74, "elapsed_time": "0:33:46", "remaining_time": "1:03:26", "throughput": 4275.33, "total_tokens": 8662528} {"current_steps": 13260, "total_steps": 38160, "loss": 0.457, "lr": 0.0008247796667571879, "epoch": 6.949685534591195, "percentage": 34.75, "elapsed_time": "0:33:46", "remaining_time": "1:03:26", "throughput": 4275.46, "total_tokens": 8665920} {"current_steps": 13265, "total_steps": 38160, "loss": 0.5489, "lr": 0.000824605760562661, "epoch": 6.95230607966457, "percentage": 34.76, "elapsed_time": "0:33:47", "remaining_time": "1:03:25", "throughput": 4275.38, "total_tokens": 8668480} {"current_steps": 13270, "total_steps": 38160, "loss": 0.4582, "lr": 0.0008244317864643125, "epoch": 6.954926624737945, "percentage": 34.77, "elapsed_time": "0:33:48", "remaining_time": "1:03:24", "throughput": 4275.57, "total_tokens": 8672224} {"current_steps": 13275, "total_steps": 38160, "loss": 0.4802, "lr": 0.0008242577444985355, "epoch": 6.9575471698113205, "percentage": 34.79, "elapsed_time": "0:33:49", "remaining_time": "1:03:23", "throughput": 4275.6, "total_tokens": 8675296} {"current_steps": 13280, "total_steps": 38160, "loss": 0.4226, "lr": 0.0008240836347017375, "epoch": 6.960167714884696, "percentage": 34.8, "elapsed_time": "0:33:49", "remaining_time": "1:03:22", "throughput": 4275.63, "total_tokens": 8678272} {"current_steps": 13285, "total_steps": 38160, "loss": 0.575, "lr": 0.0008239094571103408, "epoch": 6.962788259958071, "percentage": 34.81, "elapsed_time": "0:33:50", "remaining_time": "1:03:21", "throughput": 4275.73, "total_tokens": 8681568} {"current_steps": 13290, "total_steps": 38160, "loss": 0.5061, "lr": 0.0008237352117607808, "epoch": 6.965408805031447, "percentage": 34.83, "elapsed_time": "0:33:51", "remaining_time": "1:03:20", "throughput": 4275.73, "total_tokens": 8684544} {"current_steps": 13295, "total_steps": 38160, "loss": 0.4313, "lr": 0.000823560898689508, "epoch": 6.968029350104822, "percentage": 34.84, "elapsed_time": "0:33:51", "remaining_time": "1:03:19", "throughput": 4275.62, "total_tokens": 8687072} {"current_steps": 13300, "total_steps": 38160, "loss": 0.4524, "lr": 0.0008233865179329865, "epoch": 6.970649895178197, "percentage": 34.85, "elapsed_time": "0:33:52", "remaining_time": "1:03:19", "throughput": 4275.72, "total_tokens": 8690496} {"current_steps": 13305, "total_steps": 38160, "loss": 0.3862, "lr": 0.0008232120695276948, "epoch": 6.973270440251572, "percentage": 34.87, "elapsed_time": "0:33:53", "remaining_time": "1:03:18", "throughput": 4275.69, "total_tokens": 8693376} {"current_steps": 13310, "total_steps": 38160, "loss": 0.5463, "lr": 0.0008230375535101255, "epoch": 6.975890985324948, "percentage": 34.88, "elapsed_time": "0:33:53", "remaining_time": "1:03:17", "throughput": 4275.7, "total_tokens": 8696384} {"current_steps": 13315, "total_steps": 38160, "loss": 0.5672, "lr": 0.0008228629699167855, "epoch": 6.978511530398323, "percentage": 34.89, "elapsed_time": "0:33:54", "remaining_time": "1:03:16", "throughput": 4275.7, "total_tokens": 8699264} {"current_steps": 13320, "total_steps": 38160, "loss": 0.4689, "lr": 0.0008226883187841957, "epoch": 6.981132075471698, "percentage": 34.91, "elapsed_time": "0:33:55", "remaining_time": "1:03:15", "throughput": 4275.6, "total_tokens": 8701760} {"current_steps": 13325, "total_steps": 38160, "loss": 0.3358, "lr": 0.0008225136001488908, "epoch": 6.983752620545073, "percentage": 34.92, "elapsed_time": "0:33:55", "remaining_time": "1:03:14", "throughput": 4275.54, "total_tokens": 8704352} {"current_steps": 13330, "total_steps": 38160, "loss": 0.4029, "lr": 0.0008223388140474205, "epoch": 6.986373165618449, "percentage": 34.93, "elapsed_time": "0:33:56", "remaining_time": "1:03:13", "throughput": 4275.37, "total_tokens": 8706560} {"current_steps": 13335, "total_steps": 38160, "loss": 0.4408, "lr": 0.0008221639605163476, "epoch": 6.988993710691824, "percentage": 34.94, "elapsed_time": "0:33:57", "remaining_time": "1:03:12", "throughput": 4275.33, "total_tokens": 8709408} {"current_steps": 13340, "total_steps": 38160, "loss": 0.4355, "lr": 0.0008219890395922495, "epoch": 6.9916142557651995, "percentage": 34.96, "elapsed_time": "0:33:57", "remaining_time": "1:03:11", "throughput": 4275.57, "total_tokens": 8713440} {"current_steps": 13345, "total_steps": 38160, "loss": 0.4241, "lr": 0.0008218140513117178, "epoch": 6.994234800838575, "percentage": 34.97, "elapsed_time": "0:33:58", "remaining_time": "1:03:10", "throughput": 4275.57, "total_tokens": 8716352} {"current_steps": 13350, "total_steps": 38160, "loss": 0.4044, "lr": 0.0008216389957113582, "epoch": 6.99685534591195, "percentage": 34.98, "elapsed_time": "0:33:59", "remaining_time": "1:03:09", "throughput": 4275.5, "total_tokens": 8718944} {"current_steps": 13355, "total_steps": 38160, "loss": 0.425, "lr": 0.0008214638728277899, "epoch": 6.999475890985325, "percentage": 35.0, "elapsed_time": "0:34:00", "remaining_time": "1:03:09", "throughput": 4275.61, "total_tokens": 8722304} {"current_steps": 13356, "total_steps": 38160, "eval_loss": 0.4845752716064453, "epoch": 7.0, "percentage": 35.0, "elapsed_time": "0:34:14", "remaining_time": "1:03:34", "throughput": 4246.53, "total_tokens": 8722408} {"current_steps": 13360, "total_steps": 38160, "loss": 0.3979, "lr": 0.0008212886826976469, "epoch": 7.0020964360587, "percentage": 35.01, "elapsed_time": "0:34:16", "remaining_time": "1:03:37", "throughput": 4243.19, "total_tokens": 8725256} {"current_steps": 13365, "total_steps": 38160, "loss": 0.5, "lr": 0.0008211134253575769, "epoch": 7.004716981132075, "percentage": 35.02, "elapsed_time": "0:34:17", "remaining_time": "1:03:36", "throughput": 4243.54, "total_tokens": 8729704} {"current_steps": 13370, "total_steps": 38160, "loss": 0.4194, "lr": 0.000820938100844242, "epoch": 7.0073375262054505, "percentage": 35.04, "elapsed_time": "0:34:18", "remaining_time": "1:03:36", "throughput": 4244.04, "total_tokens": 8734888} {"current_steps": 13375, "total_steps": 38160, "loss": 0.4624, "lr": 0.0008207627091943177, "epoch": 7.009958071278826, "percentage": 35.05, "elapsed_time": "0:34:18", "remaining_time": "1:03:35", "throughput": 4244.25, "total_tokens": 8738728} {"current_steps": 13380, "total_steps": 38160, "loss": 0.4605, "lr": 0.000820587250444494, "epoch": 7.012578616352202, "percentage": 35.06, "elapsed_time": "0:34:19", "remaining_time": "1:03:34", "throughput": 4244.39, "total_tokens": 8742248} {"current_steps": 13385, "total_steps": 38160, "loss": 0.454, "lr": 0.0008204117246314752, "epoch": 7.015199161425577, "percentage": 35.08, "elapsed_time": "0:34:20", "remaining_time": "1:03:33", "throughput": 4244.5, "total_tokens": 8745672} {"current_steps": 13390, "total_steps": 38160, "loss": 0.3518, "lr": 0.0008202361317919788, "epoch": 7.017819706498952, "percentage": 35.09, "elapsed_time": "0:34:21", "remaining_time": "1:03:33", "throughput": 4244.78, "total_tokens": 8749768} {"current_steps": 13395, "total_steps": 38160, "loss": 0.3888, "lr": 0.0008200604719627373, "epoch": 7.020440251572327, "percentage": 35.1, "elapsed_time": "0:34:22", "remaining_time": "1:03:32", "throughput": 4245.01, "total_tokens": 8753864} {"current_steps": 13400, "total_steps": 38160, "loss": 0.3908, "lr": 0.0008198847451804964, "epoch": 7.023060796645702, "percentage": 35.12, "elapsed_time": "0:34:22", "remaining_time": "1:03:31", "throughput": 4245.12, "total_tokens": 8757256} {"current_steps": 13405, "total_steps": 38160, "loss": 0.3507, "lr": 0.0008197089514820162, "epoch": 7.0256813417190775, "percentage": 35.13, "elapsed_time": "0:34:23", "remaining_time": "1:03:30", "throughput": 4245.24, "total_tokens": 8760808} {"current_steps": 13410, "total_steps": 38160, "loss": 0.3022, "lr": 0.0008195330909040708, "epoch": 7.028301886792453, "percentage": 35.14, "elapsed_time": "0:34:24", "remaining_time": "1:03:30", "throughput": 4245.67, "total_tokens": 8765896} {"current_steps": 13415, "total_steps": 38160, "loss": 0.56, "lr": 0.0008193571634834483, "epoch": 7.030922431865828, "percentage": 35.15, "elapsed_time": "0:34:25", "remaining_time": "1:03:29", "throughput": 4245.59, "total_tokens": 8768488} {"current_steps": 13420, "total_steps": 38160, "loss": 0.3781, "lr": 0.0008191811692569506, "epoch": 7.033542976939203, "percentage": 35.17, "elapsed_time": "0:34:25", "remaining_time": "1:03:28", "throughput": 4245.42, "total_tokens": 8770664} {"current_steps": 13425, "total_steps": 38160, "loss": 0.4088, "lr": 0.0008190051082613936, "epoch": 7.036163522012578, "percentage": 35.18, "elapsed_time": "0:34:26", "remaining_time": "1:03:27", "throughput": 4245.46, "total_tokens": 8773768} {"current_steps": 13430, "total_steps": 38160, "loss": 0.5192, "lr": 0.0008188289805336074, "epoch": 7.038784067085954, "percentage": 35.19, "elapsed_time": "0:34:27", "remaining_time": "1:03:27", "throughput": 4245.81, "total_tokens": 8778280} {"current_steps": 13435, "total_steps": 38160, "loss": 0.5352, "lr": 0.0008186527861104359, "epoch": 7.0414046121593294, "percentage": 35.21, "elapsed_time": "0:34:28", "remaining_time": "1:03:26", "throughput": 4245.82, "total_tokens": 8781256} {"current_steps": 13440, "total_steps": 38160, "loss": 0.387, "lr": 0.0008184765250287369, "epoch": 7.044025157232705, "percentage": 35.22, "elapsed_time": "0:34:28", "remaining_time": "1:03:25", "throughput": 4245.77, "total_tokens": 8783976} {"current_steps": 13445, "total_steps": 38160, "loss": 0.4082, "lr": 0.0008183001973253823, "epoch": 7.04664570230608, "percentage": 35.23, "elapsed_time": "0:34:29", "remaining_time": "1:03:24", "throughput": 4245.6, "total_tokens": 8786184} {"current_steps": 13450, "total_steps": 38160, "loss": 0.4156, "lr": 0.0008181238030372576, "epoch": 7.049266247379455, "percentage": 35.25, "elapsed_time": "0:34:30", "remaining_time": "1:03:23", "throughput": 4245.67, "total_tokens": 8789512} {"current_steps": 13455, "total_steps": 38160, "loss": 0.4668, "lr": 0.0008179473422012628, "epoch": 7.05188679245283, "percentage": 35.26, "elapsed_time": "0:34:30", "remaining_time": "1:03:22", "throughput": 4245.73, "total_tokens": 8792680} {"current_steps": 13460, "total_steps": 38160, "loss": 0.3294, "lr": 0.0008177708148543114, "epoch": 7.054507337526205, "percentage": 35.27, "elapsed_time": "0:34:31", "remaining_time": "1:03:21", "throughput": 4245.86, "total_tokens": 8796104} {"current_steps": 13465, "total_steps": 38160, "loss": 0.5598, "lr": 0.0008175942210333307, "epoch": 7.0571278825995805, "percentage": 35.29, "elapsed_time": "0:34:32", "remaining_time": "1:03:20", "throughput": 4245.86, "total_tokens": 8799112} {"current_steps": 13470, "total_steps": 38160, "loss": 0.5034, "lr": 0.0008174175607752626, "epoch": 7.059748427672956, "percentage": 35.3, "elapsed_time": "0:34:33", "remaining_time": "1:03:20", "throughput": 4246.13, "total_tokens": 8803272} {"current_steps": 13475, "total_steps": 38160, "loss": 0.523, "lr": 0.0008172408341170617, "epoch": 7.062368972746331, "percentage": 35.31, "elapsed_time": "0:34:34", "remaining_time": "1:03:19", "throughput": 4246.38, "total_tokens": 8807304} {"current_steps": 13480, "total_steps": 38160, "loss": 0.4976, "lr": 0.0008170640410956976, "epoch": 7.064989517819707, "percentage": 35.32, "elapsed_time": "0:34:34", "remaining_time": "1:03:18", "throughput": 4246.34, "total_tokens": 8810024} {"current_steps": 13485, "total_steps": 38160, "loss": 0.5882, "lr": 0.0008168871817481536, "epoch": 7.067610062893082, "percentage": 35.34, "elapsed_time": "0:34:35", "remaining_time": "1:03:17", "throughput": 4246.34, "total_tokens": 8812936} {"current_steps": 13490, "total_steps": 38160, "loss": 0.4028, "lr": 0.0008167102561114261, "epoch": 7.070230607966457, "percentage": 35.35, "elapsed_time": "0:34:36", "remaining_time": "1:03:16", "throughput": 4246.35, "total_tokens": 8815912} {"current_steps": 13495, "total_steps": 38160, "loss": 0.3742, "lr": 0.0008165332642225265, "epoch": 7.072851153039832, "percentage": 35.36, "elapsed_time": "0:34:36", "remaining_time": "1:03:15", "throughput": 4246.5, "total_tokens": 8819528} {"current_steps": 13500, "total_steps": 38160, "loss": 0.4625, "lr": 0.0008163562061184791, "epoch": 7.0754716981132075, "percentage": 35.38, "elapsed_time": "0:34:37", "remaining_time": "1:03:14", "throughput": 4246.44, "total_tokens": 8822152} {"current_steps": 13505, "total_steps": 38160, "loss": 0.422, "lr": 0.0008161790818363227, "epoch": 7.078092243186583, "percentage": 35.39, "elapsed_time": "0:34:38", "remaining_time": "1:03:14", "throughput": 4246.46, "total_tokens": 8825160} {"current_steps": 13510, "total_steps": 38160, "loss": 0.6775, "lr": 0.0008160018914131094, "epoch": 7.080712788259958, "percentage": 35.4, "elapsed_time": "0:34:38", "remaining_time": "1:03:13", "throughput": 4246.5, "total_tokens": 8828264} {"current_steps": 13515, "total_steps": 38160, "loss": 0.4619, "lr": 0.0008158246348859057, "epoch": 7.083333333333333, "percentage": 35.42, "elapsed_time": "0:34:39", "remaining_time": "1:03:12", "throughput": 4246.59, "total_tokens": 8831560} {"current_steps": 13520, "total_steps": 38160, "loss": 0.4193, "lr": 0.0008156473122917913, "epoch": 7.085953878406708, "percentage": 35.43, "elapsed_time": "0:34:40", "remaining_time": "1:03:11", "throughput": 4246.59, "total_tokens": 8834408} {"current_steps": 13525, "total_steps": 38160, "loss": 0.4431, "lr": 0.0008154699236678604, "epoch": 7.088574423480084, "percentage": 35.44, "elapsed_time": "0:34:41", "remaining_time": "1:03:10", "throughput": 4246.61, "total_tokens": 8837448} {"current_steps": 13530, "total_steps": 38160, "loss": 0.3974, "lr": 0.0008152924690512205, "epoch": 7.091194968553459, "percentage": 35.46, "elapsed_time": "0:34:41", "remaining_time": "1:03:09", "throughput": 4246.62, "total_tokens": 8840392} {"current_steps": 13535, "total_steps": 38160, "loss": 0.3343, "lr": 0.0008151149484789932, "epoch": 7.093815513626835, "percentage": 35.47, "elapsed_time": "0:34:42", "remaining_time": "1:03:08", "throughput": 4246.74, "total_tokens": 8843816} {"current_steps": 13540, "total_steps": 38160, "loss": 0.6094, "lr": 0.0008149373619883136, "epoch": 7.09643605870021, "percentage": 35.48, "elapsed_time": "0:34:43", "remaining_time": "1:03:08", "throughput": 4246.88, "total_tokens": 8847368} {"current_steps": 13545, "total_steps": 38160, "loss": 0.5352, "lr": 0.0008147597096163308, "epoch": 7.099056603773585, "percentage": 35.5, "elapsed_time": "0:34:43", "remaining_time": "1:03:07", "throughput": 4246.93, "total_tokens": 8850536} {"current_steps": 13550, "total_steps": 38160, "loss": 0.4685, "lr": 0.0008145819914002079, "epoch": 7.10167714884696, "percentage": 35.51, "elapsed_time": "0:34:44", "remaining_time": "1:03:06", "throughput": 4246.98, "total_tokens": 8853672} {"current_steps": 13555, "total_steps": 38160, "loss": 0.449, "lr": 0.0008144042073771214, "epoch": 7.104297693920335, "percentage": 35.52, "elapsed_time": "0:34:45", "remaining_time": "1:03:05", "throughput": 4247.0, "total_tokens": 8856712} {"current_steps": 13560, "total_steps": 38160, "loss": 0.3542, "lr": 0.0008142263575842615, "epoch": 7.1069182389937104, "percentage": 35.53, "elapsed_time": "0:34:46", "remaining_time": "1:03:04", "throughput": 4247.01, "total_tokens": 8859656} {"current_steps": 13565, "total_steps": 38160, "loss": 0.4207, "lr": 0.0008140484420588323, "epoch": 7.109538784067086, "percentage": 35.55, "elapsed_time": "0:34:46", "remaining_time": "1:03:03", "throughput": 4247.12, "total_tokens": 8863144} {"current_steps": 13570, "total_steps": 38160, "loss": 0.4047, "lr": 0.000813870460838052, "epoch": 7.112159329140461, "percentage": 35.56, "elapsed_time": "0:34:47", "remaining_time": "1:03:02", "throughput": 4247.13, "total_tokens": 8866216} {"current_steps": 13575, "total_steps": 38160, "loss": 0.5419, "lr": 0.0008136924139591522, "epoch": 7.114779874213837, "percentage": 35.57, "elapsed_time": "0:34:48", "remaining_time": "1:03:02", "throughput": 4247.23, "total_tokens": 8869640} {"current_steps": 13580, "total_steps": 38160, "loss": 0.4117, "lr": 0.0008135143014593782, "epoch": 7.117400419287212, "percentage": 35.59, "elapsed_time": "0:34:48", "remaining_time": "1:03:01", "throughput": 4247.2, "total_tokens": 8872392} {"current_steps": 13585, "total_steps": 38160, "loss": 0.3064, "lr": 0.000813336123375989, "epoch": 7.120020964360587, "percentage": 35.6, "elapsed_time": "0:34:49", "remaining_time": "1:03:00", "throughput": 4247.06, "total_tokens": 8874728} {"current_steps": 13590, "total_steps": 38160, "loss": 0.5211, "lr": 0.0008131578797462575, "epoch": 7.122641509433962, "percentage": 35.61, "elapsed_time": "0:34:50", "remaining_time": "1:02:59", "throughput": 4246.98, "total_tokens": 8877256} {"current_steps": 13595, "total_steps": 38160, "loss": 0.5817, "lr": 0.0008129795706074703, "epoch": 7.1252620545073375, "percentage": 35.63, "elapsed_time": "0:34:50", "remaining_time": "1:02:58", "throughput": 4247.02, "total_tokens": 8880392} {"current_steps": 13600, "total_steps": 38160, "loss": 0.3781, "lr": 0.0008128011959969277, "epoch": 7.127882599580713, "percentage": 35.64, "elapsed_time": "0:34:51", "remaining_time": "1:02:57", "throughput": 4247.12, "total_tokens": 8883656} {"current_steps": 13605, "total_steps": 38160, "loss": 0.3675, "lr": 0.0008126227559519434, "epoch": 7.130503144654088, "percentage": 35.65, "elapsed_time": "0:34:52", "remaining_time": "1:02:57", "throughput": 4247.62, "total_tokens": 8889320} {"current_steps": 13610, "total_steps": 38160, "loss": 0.4786, "lr": 0.0008124442505098452, "epoch": 7.133123689727463, "percentage": 35.67, "elapsed_time": "0:34:53", "remaining_time": "1:02:56", "throughput": 4247.67, "total_tokens": 8892424} {"current_steps": 13615, "total_steps": 38160, "loss": 0.4225, "lr": 0.0008122656797079744, "epoch": 7.135744234800838, "percentage": 35.68, "elapsed_time": "0:34:54", "remaining_time": "1:02:55", "throughput": 4247.75, "total_tokens": 8895784} {"current_steps": 13620, "total_steps": 38160, "loss": 0.5608, "lr": 0.0008120870435836858, "epoch": 7.138364779874214, "percentage": 35.69, "elapsed_time": "0:34:54", "remaining_time": "1:02:54", "throughput": 4247.81, "total_tokens": 8899016} {"current_steps": 13625, "total_steps": 38160, "loss": 0.578, "lr": 0.0008119083421743481, "epoch": 7.140985324947589, "percentage": 35.7, "elapsed_time": "0:34:55", "remaining_time": "1:02:53", "throughput": 4247.64, "total_tokens": 8901224} {"current_steps": 13630, "total_steps": 38160, "loss": 0.4202, "lr": 0.0008117295755173437, "epoch": 7.143605870020965, "percentage": 35.72, "elapsed_time": "0:34:56", "remaining_time": "1:02:52", "throughput": 4247.7, "total_tokens": 8904392} {"current_steps": 13635, "total_steps": 38160, "loss": 0.4185, "lr": 0.0008115507436500687, "epoch": 7.14622641509434, "percentage": 35.73, "elapsed_time": "0:34:57", "remaining_time": "1:02:51", "throughput": 4247.93, "total_tokens": 8908264} {"current_steps": 13640, "total_steps": 38160, "loss": 0.5655, "lr": 0.0008113718466099322, "epoch": 7.148846960167715, "percentage": 35.74, "elapsed_time": "0:34:57", "remaining_time": "1:02:51", "throughput": 4247.94, "total_tokens": 8911208} {"current_steps": 13645, "total_steps": 38160, "loss": 0.4688, "lr": 0.0008111928844343579, "epoch": 7.15146750524109, "percentage": 35.76, "elapsed_time": "0:34:58", "remaining_time": "1:02:50", "throughput": 4248.11, "total_tokens": 8914792} {"current_steps": 13650, "total_steps": 38160, "loss": 0.417, "lr": 0.0008110138571607823, "epoch": 7.154088050314465, "percentage": 35.77, "elapsed_time": "0:34:59", "remaining_time": "1:02:49", "throughput": 4248.1, "total_tokens": 8917640} {"current_steps": 13655, "total_steps": 38160, "loss": 0.4516, "lr": 0.0008108347648266563, "epoch": 7.15670859538784, "percentage": 35.78, "elapsed_time": "0:34:59", "remaining_time": "1:02:48", "throughput": 4248.11, "total_tokens": 8920616} {"current_steps": 13660, "total_steps": 38160, "loss": 0.385, "lr": 0.0008106556074694434, "epoch": 7.159329140461216, "percentage": 35.8, "elapsed_time": "0:35:00", "remaining_time": "1:02:47", "throughput": 4248.28, "total_tokens": 8924360} {"current_steps": 13665, "total_steps": 38160, "loss": 0.4403, "lr": 0.0008104763851266216, "epoch": 7.161949685534591, "percentage": 35.81, "elapsed_time": "0:35:01", "remaining_time": "1:02:46", "throughput": 4248.39, "total_tokens": 8927752} {"current_steps": 13670, "total_steps": 38160, "loss": 0.3781, "lr": 0.0008102970978356822, "epoch": 7.164570230607967, "percentage": 35.82, "elapsed_time": "0:35:02", "remaining_time": "1:02:45", "throughput": 4248.37, "total_tokens": 8930568} {"current_steps": 13675, "total_steps": 38160, "loss": 0.4839, "lr": 0.00081011774563413, "epoch": 7.167190775681342, "percentage": 35.84, "elapsed_time": "0:35:02", "remaining_time": "1:02:44", "throughput": 4248.26, "total_tokens": 8933000} {"current_steps": 13680, "total_steps": 38160, "loss": 0.5104, "lr": 0.0008099383285594835, "epoch": 7.169811320754717, "percentage": 35.85, "elapsed_time": "0:35:03", "remaining_time": "1:02:44", "throughput": 4248.34, "total_tokens": 8936264} {"current_steps": 13685, "total_steps": 38160, "loss": 0.3367, "lr": 0.0008097588466492746, "epoch": 7.172431865828092, "percentage": 35.86, "elapsed_time": "0:35:04", "remaining_time": "1:02:43", "throughput": 4248.43, "total_tokens": 8939656} {"current_steps": 13690, "total_steps": 38160, "loss": 0.6069, "lr": 0.0008095792999410487, "epoch": 7.1750524109014675, "percentage": 35.88, "elapsed_time": "0:35:04", "remaining_time": "1:02:42", "throughput": 4248.42, "total_tokens": 8942408} {"current_steps": 13695, "total_steps": 38160, "loss": 0.4029, "lr": 0.0008093996884723653, "epoch": 7.177672955974843, "percentage": 35.89, "elapsed_time": "0:35:05", "remaining_time": "1:02:41", "throughput": 4248.58, "total_tokens": 8946088} {"current_steps": 13700, "total_steps": 38160, "loss": 0.4336, "lr": 0.0008092200122807969, "epoch": 7.180293501048218, "percentage": 35.9, "elapsed_time": "0:35:06", "remaining_time": "1:02:40", "throughput": 4248.5, "total_tokens": 8948680} {"current_steps": 13705, "total_steps": 38160, "loss": 0.4216, "lr": 0.0008090402714039295, "epoch": 7.182914046121593, "percentage": 35.91, "elapsed_time": "0:35:06", "remaining_time": "1:02:39", "throughput": 4248.38, "total_tokens": 8951080} {"current_steps": 13710, "total_steps": 38160, "loss": 0.4107, "lr": 0.0008088604658793632, "epoch": 7.185534591194968, "percentage": 35.93, "elapsed_time": "0:35:07", "remaining_time": "1:02:38", "throughput": 4248.44, "total_tokens": 8954248} {"current_steps": 13715, "total_steps": 38160, "loss": 0.503, "lr": 0.0008086805957447111, "epoch": 7.188155136268344, "percentage": 35.94, "elapsed_time": "0:35:08", "remaining_time": "1:02:37", "throughput": 4248.42, "total_tokens": 8957000} {"current_steps": 13720, "total_steps": 38160, "loss": 0.3878, "lr": 0.0008085006610376, "epoch": 7.190775681341719, "percentage": 35.95, "elapsed_time": "0:35:09", "remaining_time": "1:02:36", "throughput": 4248.43, "total_tokens": 8959944} {"current_steps": 13725, "total_steps": 38160, "loss": 0.4422, "lr": 0.0008083206617956702, "epoch": 7.193396226415095, "percentage": 35.97, "elapsed_time": "0:35:09", "remaining_time": "1:02:35", "throughput": 4248.45, "total_tokens": 8962984} {"current_steps": 13730, "total_steps": 38160, "loss": 0.5427, "lr": 0.0008081405980565755, "epoch": 7.19601677148847, "percentage": 35.98, "elapsed_time": "0:35:10", "remaining_time": "1:02:35", "throughput": 4248.4, "total_tokens": 8965672} {"current_steps": 13735, "total_steps": 38160, "loss": 0.6026, "lr": 0.0008079604698579829, "epoch": 7.198637316561845, "percentage": 35.99, "elapsed_time": "0:35:11", "remaining_time": "1:02:34", "throughput": 4248.43, "total_tokens": 8968680} {"current_steps": 13740, "total_steps": 38160, "loss": 0.373, "lr": 0.0008077802772375736, "epoch": 7.20125786163522, "percentage": 36.01, "elapsed_time": "0:35:11", "remaining_time": "1:02:33", "throughput": 4248.53, "total_tokens": 8972136} {"current_steps": 13745, "total_steps": 38160, "loss": 0.5153, "lr": 0.0008076000202330416, "epoch": 7.203878406708595, "percentage": 36.02, "elapsed_time": "0:35:12", "remaining_time": "1:02:32", "throughput": 4248.67, "total_tokens": 8975688} {"current_steps": 13750, "total_steps": 38160, "loss": 0.335, "lr": 0.0008074196988820945, "epoch": 7.20649895178197, "percentage": 36.03, "elapsed_time": "0:35:13", "remaining_time": "1:02:31", "throughput": 4248.72, "total_tokens": 8978792} {"current_steps": 13755, "total_steps": 38160, "loss": 0.5204, "lr": 0.0008072393132224539, "epoch": 7.209119496855346, "percentage": 36.05, "elapsed_time": "0:35:13", "remaining_time": "1:02:30", "throughput": 4248.73, "total_tokens": 8981768} {"current_steps": 13760, "total_steps": 38160, "loss": 0.6547, "lr": 0.0008070588632918541, "epoch": 7.211740041928721, "percentage": 36.06, "elapsed_time": "0:35:14", "remaining_time": "1:02:29", "throughput": 4248.66, "total_tokens": 8984328} {"current_steps": 13765, "total_steps": 38160, "loss": 0.4848, "lr": 0.000806878349128043, "epoch": 7.214360587002097, "percentage": 36.07, "elapsed_time": "0:35:15", "remaining_time": "1:02:28", "throughput": 4248.61, "total_tokens": 8987016} {"current_steps": 13770, "total_steps": 38160, "loss": 0.5999, "lr": 0.0008066977707687826, "epoch": 7.216981132075472, "percentage": 36.08, "elapsed_time": "0:35:16", "remaining_time": "1:02:28", "throughput": 4249.12, "total_tokens": 8992264} {"current_steps": 13775, "total_steps": 38160, "loss": 0.5009, "lr": 0.0008065171282518473, "epoch": 7.219601677148847, "percentage": 36.1, "elapsed_time": "0:35:16", "remaining_time": "1:02:27", "throughput": 4249.16, "total_tokens": 8995368} {"current_steps": 13780, "total_steps": 38160, "loss": 0.4163, "lr": 0.0008063364216150257, "epoch": 7.222222222222222, "percentage": 36.11, "elapsed_time": "0:35:17", "remaining_time": "1:02:26", "throughput": 4249.12, "total_tokens": 8998120} {"current_steps": 13785, "total_steps": 38160, "loss": 0.376, "lr": 0.0008061556508961199, "epoch": 7.2248427672955975, "percentage": 36.12, "elapsed_time": "0:35:18", "remaining_time": "1:02:25", "throughput": 4249.27, "total_tokens": 9001768} {"current_steps": 13790, "total_steps": 38160, "loss": 0.6137, "lr": 0.0008059748161329443, "epoch": 7.227463312368973, "percentage": 36.14, "elapsed_time": "0:35:19", "remaining_time": "1:02:24", "throughput": 4249.19, "total_tokens": 9004328} {"current_steps": 13795, "total_steps": 38160, "loss": 0.6264, "lr": 0.0008057939173633282, "epoch": 7.230083857442348, "percentage": 36.15, "elapsed_time": "0:35:19", "remaining_time": "1:02:24", "throughput": 4249.26, "total_tokens": 9007688} {"current_steps": 13800, "total_steps": 38160, "loss": 0.5459, "lr": 0.0008056129546251132, "epoch": 7.232704402515723, "percentage": 36.16, "elapsed_time": "0:35:20", "remaining_time": "1:02:23", "throughput": 4249.35, "total_tokens": 9011112} {"current_steps": 13805, "total_steps": 38160, "loss": 0.4775, "lr": 0.0008054319279561546, "epoch": 7.235324947589098, "percentage": 36.18, "elapsed_time": "0:35:21", "remaining_time": "1:02:22", "throughput": 4249.32, "total_tokens": 9013864} {"current_steps": 13810, "total_steps": 38160, "loss": 0.5129, "lr": 0.0008052508373943214, "epoch": 7.237945492662474, "percentage": 36.19, "elapsed_time": "0:35:21", "remaining_time": "1:02:21", "throughput": 4249.36, "total_tokens": 9017000} {"current_steps": 13815, "total_steps": 38160, "loss": 0.415, "lr": 0.0008050696829774954, "epoch": 7.240566037735849, "percentage": 36.2, "elapsed_time": "0:35:22", "remaining_time": "1:02:20", "throughput": 4249.55, "total_tokens": 9020744} {"current_steps": 13820, "total_steps": 38160, "loss": 0.5997, "lr": 0.0008048884647435721, "epoch": 7.243186582809225, "percentage": 36.22, "elapsed_time": "0:35:23", "remaining_time": "1:02:20", "throughput": 4249.85, "total_tokens": 9025064} {"current_steps": 13825, "total_steps": 38160, "loss": 0.3856, "lr": 0.0008047071827304604, "epoch": 7.2458071278826, "percentage": 36.23, "elapsed_time": "0:35:24", "remaining_time": "1:02:19", "throughput": 4249.76, "total_tokens": 9027688} {"current_steps": 13830, "total_steps": 38160, "loss": 0.5433, "lr": 0.0008045258369760824, "epoch": 7.248427672955975, "percentage": 36.24, "elapsed_time": "0:35:24", "remaining_time": "1:02:18", "throughput": 4249.73, "total_tokens": 9030472} {"current_steps": 13835, "total_steps": 38160, "loss": 0.3711, "lr": 0.0008043444275183735, "epoch": 7.25104821802935, "percentage": 36.26, "elapsed_time": "0:35:25", "remaining_time": "1:02:17", "throughput": 4249.85, "total_tokens": 9033992} {"current_steps": 13840, "total_steps": 38160, "loss": 0.5021, "lr": 0.0008041629543952824, "epoch": 7.253668763102725, "percentage": 36.27, "elapsed_time": "0:35:26", "remaining_time": "1:02:16", "throughput": 4249.86, "total_tokens": 9037000} {"current_steps": 13845, "total_steps": 38160, "loss": 0.4431, "lr": 0.0008039814176447714, "epoch": 7.2562893081761, "percentage": 36.28, "elapsed_time": "0:35:27", "remaining_time": "1:02:15", "throughput": 4249.91, "total_tokens": 9040232} {"current_steps": 13850, "total_steps": 38160, "loss": 0.4879, "lr": 0.0008037998173048157, "epoch": 7.258909853249476, "percentage": 36.29, "elapsed_time": "0:35:27", "remaining_time": "1:02:14", "throughput": 4249.92, "total_tokens": 9043112} {"current_steps": 13855, "total_steps": 38160, "loss": 0.4535, "lr": 0.0008036181534134044, "epoch": 7.261530398322851, "percentage": 36.31, "elapsed_time": "0:35:28", "remaining_time": "1:02:13", "throughput": 4249.82, "total_tokens": 9045672} {"current_steps": 13860, "total_steps": 38160, "loss": 0.4151, "lr": 0.0008034364260085391, "epoch": 7.264150943396227, "percentage": 36.32, "elapsed_time": "0:35:29", "remaining_time": "1:02:12", "throughput": 4249.71, "total_tokens": 9048072} {"current_steps": 13865, "total_steps": 38160, "loss": 0.5385, "lr": 0.0008032546351282353, "epoch": 7.266771488469602, "percentage": 36.33, "elapsed_time": "0:35:29", "remaining_time": "1:02:11", "throughput": 4249.73, "total_tokens": 9051080} {"current_steps": 13870, "total_steps": 38160, "loss": 0.5325, "lr": 0.0008030727808105215, "epoch": 7.269392033542977, "percentage": 36.35, "elapsed_time": "0:35:30", "remaining_time": "1:02:11", "throughput": 4249.68, "total_tokens": 9053864} {"current_steps": 13875, "total_steps": 38160, "loss": 0.3619, "lr": 0.0008028908630934397, "epoch": 7.272012578616352, "percentage": 36.36, "elapsed_time": "0:35:31", "remaining_time": "1:02:10", "throughput": 4249.84, "total_tokens": 9057544} {"current_steps": 13880, "total_steps": 38160, "loss": 0.4853, "lr": 0.0008027088820150447, "epoch": 7.2746331236897275, "percentage": 36.37, "elapsed_time": "0:35:31", "remaining_time": "1:02:09", "throughput": 4249.9, "total_tokens": 9060776} {"current_steps": 13885, "total_steps": 38160, "loss": 0.3885, "lr": 0.0008025268376134054, "epoch": 7.277253668763103, "percentage": 36.39, "elapsed_time": "0:35:32", "remaining_time": "1:02:08", "throughput": 4250.09, "total_tokens": 9064648} {"current_steps": 13890, "total_steps": 38160, "loss": 0.387, "lr": 0.0008023447299266027, "epoch": 7.279874213836478, "percentage": 36.4, "elapsed_time": "0:35:33", "remaining_time": "1:02:07", "throughput": 4250.11, "total_tokens": 9067688} {"current_steps": 13895, "total_steps": 38160, "loss": 0.5866, "lr": 0.0008021625589927321, "epoch": 7.282494758909853, "percentage": 36.41, "elapsed_time": "0:35:34", "remaining_time": "1:02:07", "throughput": 4250.27, "total_tokens": 9071368} {"current_steps": 13900, "total_steps": 38160, "loss": 0.4685, "lr": 0.0008019803248499013, "epoch": 7.285115303983228, "percentage": 36.43, "elapsed_time": "0:35:34", "remaining_time": "1:02:06", "throughput": 4250.24, "total_tokens": 9074120} {"current_steps": 13905, "total_steps": 38160, "loss": 0.3884, "lr": 0.0008017980275362318, "epoch": 7.287735849056604, "percentage": 36.44, "elapsed_time": "0:35:35", "remaining_time": "1:02:05", "throughput": 4250.42, "total_tokens": 9077896} {"current_steps": 13910, "total_steps": 38160, "loss": 0.4161, "lr": 0.000801615667089858, "epoch": 7.290356394129979, "percentage": 36.45, "elapsed_time": "0:35:36", "remaining_time": "1:02:04", "throughput": 4250.45, "total_tokens": 9080968} {"current_steps": 13915, "total_steps": 38160, "loss": 0.3435, "lr": 0.0008014332435489275, "epoch": 7.2929769392033545, "percentage": 36.46, "elapsed_time": "0:35:37", "remaining_time": "1:02:03", "throughput": 4250.57, "total_tokens": 9084456} {"current_steps": 13920, "total_steps": 38160, "loss": 0.452, "lr": 0.0008012507569516016, "epoch": 7.29559748427673, "percentage": 36.48, "elapsed_time": "0:35:37", "remaining_time": "1:02:02", "throughput": 4250.46, "total_tokens": 9086856} {"current_steps": 13925, "total_steps": 38160, "loss": 0.5027, "lr": 0.0008010682073360541, "epoch": 7.298218029350105, "percentage": 36.49, "elapsed_time": "0:35:38", "remaining_time": "1:02:01", "throughput": 4250.45, "total_tokens": 9089768} {"current_steps": 13930, "total_steps": 38160, "loss": 0.3939, "lr": 0.0008008855947404724, "epoch": 7.30083857442348, "percentage": 36.5, "elapsed_time": "0:35:39", "remaining_time": "1:02:00", "throughput": 4250.37, "total_tokens": 9092424} {"current_steps": 13935, "total_steps": 38160, "loss": 0.668, "lr": 0.000800702919203057, "epoch": 7.303459119496855, "percentage": 36.52, "elapsed_time": "0:35:39", "remaining_time": "1:02:00", "throughput": 4250.37, "total_tokens": 9095304} {"current_steps": 13940, "total_steps": 38160, "loss": 0.5238, "lr": 0.0008005201807620214, "epoch": 7.30607966457023, "percentage": 36.53, "elapsed_time": "0:35:40", "remaining_time": "1:01:59", "throughput": 4250.38, "total_tokens": 9098248} {"current_steps": 13945, "total_steps": 38160, "loss": 0.5002, "lr": 0.0008003373794555926, "epoch": 7.308700209643606, "percentage": 36.54, "elapsed_time": "0:35:41", "remaining_time": "1:01:58", "throughput": 4250.51, "total_tokens": 9101768} {"current_steps": 13950, "total_steps": 38160, "loss": 0.3494, "lr": 0.0008001545153220104, "epoch": 7.311320754716981, "percentage": 36.56, "elapsed_time": "0:35:42", "remaining_time": "1:01:57", "throughput": 4250.6, "total_tokens": 9105128} {"current_steps": 13955, "total_steps": 38160, "loss": 0.3947, "lr": 0.000799971588399528, "epoch": 7.313941299790357, "percentage": 36.57, "elapsed_time": "0:35:42", "remaining_time": "1:01:56", "throughput": 4250.79, "total_tokens": 9108936} {"current_steps": 13960, "total_steps": 38160, "loss": 0.4747, "lr": 0.0007997885987264115, "epoch": 7.316561844863732, "percentage": 36.58, "elapsed_time": "0:35:43", "remaining_time": "1:01:55", "throughput": 4250.77, "total_tokens": 9111784} {"current_steps": 13965, "total_steps": 38160, "loss": 0.4762, "lr": 0.0007996055463409403, "epoch": 7.319182389937107, "percentage": 36.6, "elapsed_time": "0:35:44", "remaining_time": "1:01:55", "throughput": 4250.94, "total_tokens": 9115464} {"current_steps": 13970, "total_steps": 38160, "loss": 0.4112, "lr": 0.000799422431281407, "epoch": 7.321802935010482, "percentage": 36.61, "elapsed_time": "0:35:45", "remaining_time": "1:01:54", "throughput": 4250.92, "total_tokens": 9118280} {"current_steps": 13975, "total_steps": 38160, "loss": 0.4459, "lr": 0.000799239253586117, "epoch": 7.3244234800838575, "percentage": 36.62, "elapsed_time": "0:35:45", "remaining_time": "1:01:53", "throughput": 4251.21, "total_tokens": 9122728} {"current_steps": 13980, "total_steps": 38160, "loss": 0.3985, "lr": 0.0007990560132933891, "epoch": 7.327044025157233, "percentage": 36.64, "elapsed_time": "0:35:46", "remaining_time": "1:01:53", "throughput": 4251.46, "total_tokens": 9126856} {"current_steps": 13985, "total_steps": 38160, "loss": 0.3756, "lr": 0.0007988727104415549, "epoch": 7.329664570230608, "percentage": 36.65, "elapsed_time": "0:35:47", "remaining_time": "1:01:52", "throughput": 4251.47, "total_tokens": 9129864} {"current_steps": 13990, "total_steps": 38160, "loss": 0.4402, "lr": 0.0007986893450689594, "epoch": 7.332285115303983, "percentage": 36.66, "elapsed_time": "0:35:48", "remaining_time": "1:01:51", "throughput": 4251.52, "total_tokens": 9133064} {"current_steps": 13995, "total_steps": 38160, "loss": 0.3877, "lr": 0.0007985059172139606, "epoch": 7.334905660377358, "percentage": 36.67, "elapsed_time": "0:35:48", "remaining_time": "1:01:50", "throughput": 4251.59, "total_tokens": 9136264} {"current_steps": 14000, "total_steps": 38160, "loss": 0.4467, "lr": 0.0007983224269149296, "epoch": 7.337526205450734, "percentage": 36.69, "elapsed_time": "0:35:49", "remaining_time": "1:01:49", "throughput": 4251.56, "total_tokens": 9139016} {"current_steps": 14005, "total_steps": 38160, "loss": 0.5598, "lr": 0.00079813887421025, "epoch": 7.340146750524109, "percentage": 36.7, "elapsed_time": "0:35:50", "remaining_time": "1:01:48", "throughput": 4251.51, "total_tokens": 9141704} {"current_steps": 14010, "total_steps": 38160, "loss": 0.3992, "lr": 0.0007979552591383195, "epoch": 7.3427672955974845, "percentage": 36.71, "elapsed_time": "0:35:50", "remaining_time": "1:01:47", "throughput": 4251.5, "total_tokens": 9144616} {"current_steps": 14015, "total_steps": 38160, "loss": 0.4889, "lr": 0.0007977715817375481, "epoch": 7.34538784067086, "percentage": 36.73, "elapsed_time": "0:35:51", "remaining_time": "1:01:46", "throughput": 4251.68, "total_tokens": 9148456} {"current_steps": 14020, "total_steps": 38160, "loss": 0.5465, "lr": 0.0007975878420463588, "epoch": 7.348008385744235, "percentage": 36.74, "elapsed_time": "0:35:52", "remaining_time": "1:01:46", "throughput": 4251.59, "total_tokens": 9151016} {"current_steps": 14025, "total_steps": 38160, "loss": 0.5864, "lr": 0.0007974040401031882, "epoch": 7.35062893081761, "percentage": 36.75, "elapsed_time": "0:35:53", "remaining_time": "1:01:45", "throughput": 4251.8, "total_tokens": 9155016} {"current_steps": 14030, "total_steps": 38160, "loss": 0.454, "lr": 0.0007972201759464851, "epoch": 7.353249475890985, "percentage": 36.77, "elapsed_time": "0:35:53", "remaining_time": "1:01:44", "throughput": 4251.76, "total_tokens": 9157800} {"current_steps": 14035, "total_steps": 38160, "loss": 0.4266, "lr": 0.0007970362496147121, "epoch": 7.35587002096436, "percentage": 36.78, "elapsed_time": "0:35:54", "remaining_time": "1:01:43", "throughput": 4251.99, "total_tokens": 9161736} {"current_steps": 14040, "total_steps": 38160, "loss": 0.4099, "lr": 0.0007968522611463447, "epoch": 7.3584905660377355, "percentage": 36.79, "elapsed_time": "0:35:55", "remaining_time": "1:01:42", "throughput": 4252.02, "total_tokens": 9164872} {"current_steps": 14045, "total_steps": 38160, "loss": 0.4867, "lr": 0.0007966682105798708, "epoch": 7.361111111111111, "percentage": 36.81, "elapsed_time": "0:35:56", "remaining_time": "1:01:42", "throughput": 4252.21, "total_tokens": 9168712} {"current_steps": 14050, "total_steps": 38160, "loss": 0.4604, "lr": 0.0007964840979537918, "epoch": 7.363731656184487, "percentage": 36.82, "elapsed_time": "0:35:56", "remaining_time": "1:01:41", "throughput": 4252.2, "total_tokens": 9171592} {"current_steps": 14055, "total_steps": 38160, "loss": 0.4576, "lr": 0.0007962999233066219, "epoch": 7.366352201257862, "percentage": 36.83, "elapsed_time": "0:35:57", "remaining_time": "1:01:40", "throughput": 4252.44, "total_tokens": 9175688} {"current_steps": 14060, "total_steps": 38160, "loss": 0.3578, "lr": 0.0007961156866768885, "epoch": 7.368972746331237, "percentage": 36.84, "elapsed_time": "0:35:58", "remaining_time": "1:01:40", "throughput": 4252.79, "total_tokens": 9180232} {"current_steps": 14065, "total_steps": 38160, "loss": 0.5708, "lr": 0.0007959313881031317, "epoch": 7.371593291404612, "percentage": 36.86, "elapsed_time": "0:35:59", "remaining_time": "1:01:39", "throughput": 4252.82, "total_tokens": 9183304} {"current_steps": 14070, "total_steps": 38160, "loss": 0.4826, "lr": 0.0007957470276239048, "epoch": 7.3742138364779874, "percentage": 36.87, "elapsed_time": "0:35:59", "remaining_time": "1:01:38", "throughput": 4252.73, "total_tokens": 9185832} {"current_steps": 14075, "total_steps": 38160, "loss": 0.4624, "lr": 0.0007955626052777735, "epoch": 7.376834381551363, "percentage": 36.88, "elapsed_time": "0:36:00", "remaining_time": "1:01:37", "throughput": 4252.74, "total_tokens": 9188872} {"current_steps": 14080, "total_steps": 38160, "loss": 0.4817, "lr": 0.0007953781211033173, "epoch": 7.379454926624738, "percentage": 36.9, "elapsed_time": "0:36:01", "remaining_time": "1:01:36", "throughput": 4252.8, "total_tokens": 9192072} {"current_steps": 14085, "total_steps": 38160, "loss": 0.3604, "lr": 0.000795193575139128, "epoch": 7.382075471698113, "percentage": 36.91, "elapsed_time": "0:36:02", "remaining_time": "1:01:35", "throughput": 4253.0, "total_tokens": 9195848} {"current_steps": 14090, "total_steps": 38160, "loss": 0.5585, "lr": 0.0007950089674238106, "epoch": 7.384696016771488, "percentage": 36.92, "elapsed_time": "0:36:02", "remaining_time": "1:01:34", "throughput": 4252.94, "total_tokens": 9198472} {"current_steps": 14095, "total_steps": 38160, "loss": 0.4458, "lr": 0.0007948242979959828, "epoch": 7.387316561844864, "percentage": 36.94, "elapsed_time": "0:36:03", "remaining_time": "1:01:33", "throughput": 4252.98, "total_tokens": 9201576} {"current_steps": 14100, "total_steps": 38160, "loss": 0.4058, "lr": 0.0007946395668942754, "epoch": 7.389937106918239, "percentage": 36.95, "elapsed_time": "0:36:04", "remaining_time": "1:01:33", "throughput": 4253.03, "total_tokens": 9204712} {"current_steps": 14105, "total_steps": 38160, "loss": 0.4595, "lr": 0.0007944547741573319, "epoch": 7.3925576519916145, "percentage": 36.96, "elapsed_time": "0:36:04", "remaining_time": "1:01:32", "throughput": 4253.07, "total_tokens": 9207816} {"current_steps": 14110, "total_steps": 38160, "loss": 0.4377, "lr": 0.0007942699198238091, "epoch": 7.39517819706499, "percentage": 36.98, "elapsed_time": "0:36:05", "remaining_time": "1:01:31", "throughput": 4253.21, "total_tokens": 9211432} {"current_steps": 14115, "total_steps": 38160, "loss": 0.4214, "lr": 0.0007940850039323763, "epoch": 7.397798742138365, "percentage": 36.99, "elapsed_time": "0:36:06", "remaining_time": "1:01:30", "throughput": 4253.16, "total_tokens": 9214248} {"current_steps": 14120, "total_steps": 38160, "loss": 0.4728, "lr": 0.0007939000265217156, "epoch": 7.40041928721174, "percentage": 37.0, "elapsed_time": "0:36:07", "remaining_time": "1:01:29", "throughput": 4253.08, "total_tokens": 9216904} {"current_steps": 14125, "total_steps": 38160, "loss": 0.446, "lr": 0.0007937149876305226, "epoch": 7.403039832285115, "percentage": 37.02, "elapsed_time": "0:36:07", "remaining_time": "1:01:28", "throughput": 4253.1, "total_tokens": 9219880} {"current_steps": 14130, "total_steps": 38160, "loss": 0.5436, "lr": 0.000793529887297505, "epoch": 7.40566037735849, "percentage": 37.03, "elapsed_time": "0:36:08", "remaining_time": "1:01:28", "throughput": 4253.5, "total_tokens": 9224808} {"current_steps": 14135, "total_steps": 38160, "loss": 0.5174, "lr": 0.0007933447255613835, "epoch": 7.4082809224318655, "percentage": 37.04, "elapsed_time": "0:36:09", "remaining_time": "1:01:27", "throughput": 4253.67, "total_tokens": 9228552} {"current_steps": 14140, "total_steps": 38160, "loss": 0.3931, "lr": 0.0007931595024608924, "epoch": 7.410901467505241, "percentage": 37.05, "elapsed_time": "0:36:10", "remaining_time": "1:01:26", "throughput": 4253.91, "total_tokens": 9232680} {"current_steps": 14145, "total_steps": 38160, "loss": 0.4198, "lr": 0.0007929742180347776, "epoch": 7.413522012578617, "percentage": 37.07, "elapsed_time": "0:36:11", "remaining_time": "1:01:25", "throughput": 4253.87, "total_tokens": 9235400} {"current_steps": 14150, "total_steps": 38160, "loss": 0.4846, "lr": 0.0007927888723217991, "epoch": 7.416142557651992, "percentage": 37.08, "elapsed_time": "0:36:11", "remaining_time": "1:01:25", "throughput": 4253.8, "total_tokens": 9238056} {"current_steps": 14155, "total_steps": 38160, "loss": 0.3454, "lr": 0.0007926034653607288, "epoch": 7.418763102725367, "percentage": 37.09, "elapsed_time": "0:36:12", "remaining_time": "1:01:24", "throughput": 4253.87, "total_tokens": 9241288} {"current_steps": 14160, "total_steps": 38160, "loss": 0.5136, "lr": 0.0007924179971903516, "epoch": 7.421383647798742, "percentage": 37.11, "elapsed_time": "0:36:13", "remaining_time": "1:01:23", "throughput": 4253.99, "total_tokens": 9244872} {"current_steps": 14165, "total_steps": 38160, "loss": 0.4677, "lr": 0.0007922324678494655, "epoch": 7.424004192872117, "percentage": 37.12, "elapsed_time": "0:36:13", "remaining_time": "1:01:22", "throughput": 4253.98, "total_tokens": 9247784} {"current_steps": 14170, "total_steps": 38160, "loss": 0.425, "lr": 0.0007920468773768811, "epoch": 7.426624737945493, "percentage": 37.13, "elapsed_time": "0:36:14", "remaining_time": "1:01:22", "throughput": 4254.44, "total_tokens": 9252904} {"current_steps": 14175, "total_steps": 38160, "loss": 0.395, "lr": 0.0007918612258114217, "epoch": 7.429245283018868, "percentage": 37.15, "elapsed_time": "0:36:15", "remaining_time": "1:01:21", "throughput": 4254.46, "total_tokens": 9255944} {"current_steps": 14180, "total_steps": 38160, "loss": 0.4965, "lr": 0.0007916755131919238, "epoch": 7.431865828092243, "percentage": 37.16, "elapsed_time": "0:36:16", "remaining_time": "1:01:20", "throughput": 4254.35, "total_tokens": 9258376} {"current_steps": 14185, "total_steps": 38160, "loss": 0.4408, "lr": 0.000791489739557236, "epoch": 7.434486373165618, "percentage": 37.17, "elapsed_time": "0:36:16", "remaining_time": "1:01:19", "throughput": 4254.4, "total_tokens": 9261640} {"current_steps": 14190, "total_steps": 38160, "loss": 0.506, "lr": 0.0007913039049462203, "epoch": 7.437106918238994, "percentage": 37.19, "elapsed_time": "0:36:17", "remaining_time": "1:01:18", "throughput": 4254.42, "total_tokens": 9264712} {"current_steps": 14195, "total_steps": 38160, "loss": 0.425, "lr": 0.0007911180093977511, "epoch": 7.439727463312369, "percentage": 37.2, "elapsed_time": "0:36:18", "remaining_time": "1:01:17", "throughput": 4254.7, "total_tokens": 9268936} {"current_steps": 14200, "total_steps": 38160, "loss": 0.6974, "lr": 0.0007909320529507154, "epoch": 7.4423480083857445, "percentage": 37.21, "elapsed_time": "0:36:19", "remaining_time": "1:01:17", "throughput": 4254.78, "total_tokens": 9272328} {"current_steps": 14205, "total_steps": 38160, "loss": 0.3399, "lr": 0.0007907460356440134, "epoch": 7.44496855345912, "percentage": 37.22, "elapsed_time": "0:36:20", "remaining_time": "1:01:16", "throughput": 4254.85, "total_tokens": 9275592} {"current_steps": 14210, "total_steps": 38160, "loss": 0.4793, "lr": 0.0007905599575165577, "epoch": 7.447589098532495, "percentage": 37.24, "elapsed_time": "0:36:20", "remaining_time": "1:01:15", "throughput": 4255.03, "total_tokens": 9279336} {"current_steps": 14215, "total_steps": 38160, "loss": 0.3435, "lr": 0.0007903738186072739, "epoch": 7.45020964360587, "percentage": 37.25, "elapsed_time": "0:36:21", "remaining_time": "1:01:14", "throughput": 4255.02, "total_tokens": 9282280} {"current_steps": 14220, "total_steps": 38160, "loss": 0.457, "lr": 0.0007901876189550999, "epoch": 7.452830188679245, "percentage": 37.26, "elapsed_time": "0:36:22", "remaining_time": "1:01:13", "throughput": 4255.18, "total_tokens": 9285960} {"current_steps": 14225, "total_steps": 38160, "loss": 0.3265, "lr": 0.0007900013585989867, "epoch": 7.45545073375262, "percentage": 37.28, "elapsed_time": "0:36:23", "remaining_time": "1:01:13", "throughput": 4255.7, "total_tokens": 9291464} {"current_steps": 14230, "total_steps": 38160, "loss": 0.4238, "lr": 0.0007898150375778979, "epoch": 7.4580712788259955, "percentage": 37.29, "elapsed_time": "0:36:24", "remaining_time": "1:01:12", "throughput": 4255.9, "total_tokens": 9295432} {"current_steps": 14235, "total_steps": 38160, "loss": 0.4215, "lr": 0.0007896286559308095, "epoch": 7.460691823899371, "percentage": 37.3, "elapsed_time": "0:36:24", "remaining_time": "1:01:12", "throughput": 4255.92, "total_tokens": 9298600} {"current_steps": 14240, "total_steps": 38160, "loss": 0.3796, "lr": 0.0007894422136967105, "epoch": 7.463312368972747, "percentage": 37.32, "elapsed_time": "0:36:25", "remaining_time": "1:01:11", "throughput": 4255.9, "total_tokens": 9301416} {"current_steps": 14245, "total_steps": 38160, "loss": 0.4368, "lr": 0.0007892557109146026, "epoch": 7.465932914046122, "percentage": 37.33, "elapsed_time": "0:36:26", "remaining_time": "1:01:10", "throughput": 4255.89, "total_tokens": 9304328} {"current_steps": 14250, "total_steps": 38160, "loss": 0.3973, "lr": 0.0007890691476234999, "epoch": 7.468553459119497, "percentage": 37.34, "elapsed_time": "0:36:26", "remaining_time": "1:01:09", "throughput": 4255.84, "total_tokens": 9307016} {"current_steps": 14255, "total_steps": 38160, "loss": 0.4734, "lr": 0.0007888825238624294, "epoch": 7.471174004192872, "percentage": 37.36, "elapsed_time": "0:36:27", "remaining_time": "1:01:08", "throughput": 4255.96, "total_tokens": 9310504} {"current_steps": 14260, "total_steps": 38160, "loss": 0.4044, "lr": 0.0007886958396704307, "epoch": 7.473794549266247, "percentage": 37.37, "elapsed_time": "0:36:28", "remaining_time": "1:01:07", "throughput": 4255.98, "total_tokens": 9313512} {"current_steps": 14265, "total_steps": 38160, "loss": 0.4804, "lr": 0.0007885090950865559, "epoch": 7.476415094339623, "percentage": 37.38, "elapsed_time": "0:36:29", "remaining_time": "1:01:06", "throughput": 4256.13, "total_tokens": 9317128} {"current_steps": 14270, "total_steps": 38160, "loss": 0.7895, "lr": 0.0007883222901498701, "epoch": 7.479035639412998, "percentage": 37.4, "elapsed_time": "0:36:29", "remaining_time": "1:01:05", "throughput": 4256.02, "total_tokens": 9319560} {"current_steps": 14275, "total_steps": 38160, "loss": 0.4505, "lr": 0.0007881354248994503, "epoch": 7.481656184486373, "percentage": 37.41, "elapsed_time": "0:36:30", "remaining_time": "1:01:05", "throughput": 4256.03, "total_tokens": 9322504} {"current_steps": 14280, "total_steps": 38160, "loss": 0.4168, "lr": 0.0007879484993743869, "epoch": 7.484276729559748, "percentage": 37.42, "elapsed_time": "0:36:31", "remaining_time": "1:01:04", "throughput": 4256.16, "total_tokens": 9325992} {"current_steps": 14285, "total_steps": 38160, "loss": 0.4474, "lr": 0.0007877615136137827, "epoch": 7.486897274633124, "percentage": 37.43, "elapsed_time": "0:36:31", "remaining_time": "1:01:03", "throughput": 4256.09, "total_tokens": 9328520} {"current_steps": 14290, "total_steps": 38160, "loss": 0.4135, "lr": 0.0007875744676567527, "epoch": 7.489517819706499, "percentage": 37.45, "elapsed_time": "0:36:32", "remaining_time": "1:01:02", "throughput": 4255.94, "total_tokens": 9330760} {"current_steps": 14295, "total_steps": 38160, "loss": 0.5899, "lr": 0.0007873873615424248, "epoch": 7.4921383647798745, "percentage": 37.46, "elapsed_time": "0:36:33", "remaining_time": "1:01:01", "throughput": 4255.85, "total_tokens": 9333256} {"current_steps": 14300, "total_steps": 38160, "loss": 0.5415, "lr": 0.0007872001953099396, "epoch": 7.49475890985325, "percentage": 37.47, "elapsed_time": "0:36:33", "remaining_time": "1:01:00", "throughput": 4256.08, "total_tokens": 9337352} {"current_steps": 14305, "total_steps": 38160, "loss": 0.5921, "lr": 0.0007870129689984501, "epoch": 7.497379454926625, "percentage": 37.49, "elapsed_time": "0:36:34", "remaining_time": "1:00:59", "throughput": 4256.05, "total_tokens": 9340104} {"current_steps": 14310, "total_steps": 38160, "loss": 0.4686, "lr": 0.000786825682647122, "epoch": 7.5, "percentage": 37.5, "elapsed_time": "0:36:35", "remaining_time": "1:00:58", "throughput": 4256.01, "total_tokens": 9342888} {"current_steps": 14315, "total_steps": 38160, "loss": 0.4156, "lr": 0.0007866383362951332, "epoch": 7.502620545073375, "percentage": 37.51, "elapsed_time": "0:36:35", "remaining_time": "1:00:57", "throughput": 4255.91, "total_tokens": 9345320} {"current_steps": 14320, "total_steps": 38160, "loss": 0.4879, "lr": 0.0007864509299816746, "epoch": 7.50524109014675, "percentage": 37.53, "elapsed_time": "0:36:36", "remaining_time": "1:00:56", "throughput": 4255.98, "total_tokens": 9348648} {"current_steps": 14325, "total_steps": 38160, "loss": 0.5179, "lr": 0.0007862634637459496, "epoch": 7.5078616352201255, "percentage": 37.54, "elapsed_time": "0:36:37", "remaining_time": "1:00:55", "throughput": 4255.86, "total_tokens": 9351112} {"current_steps": 14330, "total_steps": 38160, "loss": 0.5272, "lr": 0.0007860759376271737, "epoch": 7.510482180293501, "percentage": 37.55, "elapsed_time": "0:36:37", "remaining_time": "1:00:55", "throughput": 4255.93, "total_tokens": 9354280} {"current_steps": 14335, "total_steps": 38160, "loss": 0.5919, "lr": 0.0007858883516645755, "epoch": 7.513102725366876, "percentage": 37.57, "elapsed_time": "0:36:38", "remaining_time": "1:00:54", "throughput": 4255.92, "total_tokens": 9357224} {"current_steps": 14340, "total_steps": 38160, "loss": 0.4844, "lr": 0.0007857007058973957, "epoch": 7.515723270440252, "percentage": 37.58, "elapsed_time": "0:36:39", "remaining_time": "1:00:53", "throughput": 4255.79, "total_tokens": 9359592} {"current_steps": 14345, "total_steps": 38160, "loss": 0.4105, "lr": 0.0007855130003648876, "epoch": 7.518343815513627, "percentage": 37.59, "elapsed_time": "0:36:40", "remaining_time": "1:00:52", "throughput": 4255.97, "total_tokens": 9363400} {"current_steps": 14350, "total_steps": 38160, "loss": 0.3673, "lr": 0.0007853252351063171, "epoch": 7.520964360587002, "percentage": 37.6, "elapsed_time": "0:36:40", "remaining_time": "1:00:51", "throughput": 4255.83, "total_tokens": 9365832} {"current_steps": 14355, "total_steps": 38160, "loss": 0.4456, "lr": 0.0007851374101609627, "epoch": 7.523584905660377, "percentage": 37.62, "elapsed_time": "0:36:41", "remaining_time": "1:00:50", "throughput": 4255.91, "total_tokens": 9369256} {"current_steps": 14360, "total_steps": 38160, "loss": 0.5105, "lr": 0.000784949525568115, "epoch": 7.526205450733753, "percentage": 37.63, "elapsed_time": "0:36:42", "remaining_time": "1:00:49", "throughput": 4255.96, "total_tokens": 9372392} {"current_steps": 14365, "total_steps": 38160, "loss": 0.5253, "lr": 0.0007847615813670776, "epoch": 7.528825995807128, "percentage": 37.64, "elapsed_time": "0:36:42", "remaining_time": "1:00:49", "throughput": 4256.06, "total_tokens": 9375752} {"current_steps": 14370, "total_steps": 38160, "loss": 0.4187, "lr": 0.000784573577597166, "epoch": 7.531446540880503, "percentage": 37.66, "elapsed_time": "0:36:43", "remaining_time": "1:00:48", "throughput": 4256.28, "total_tokens": 9379816} {"current_steps": 14375, "total_steps": 38160, "loss": 0.5662, "lr": 0.0007843855142977086, "epoch": 7.534067085953878, "percentage": 37.67, "elapsed_time": "0:36:44", "remaining_time": "1:00:47", "throughput": 4256.53, "total_tokens": 9383976} {"current_steps": 14380, "total_steps": 38160, "loss": 0.5117, "lr": 0.000784197391508046, "epoch": 7.536687631027254, "percentage": 37.68, "elapsed_time": "0:36:45", "remaining_time": "1:00:46", "throughput": 4256.63, "total_tokens": 9387400} {"current_steps": 14385, "total_steps": 38160, "loss": 0.4547, "lr": 0.0007840092092675313, "epoch": 7.539308176100629, "percentage": 37.7, "elapsed_time": "0:36:46", "remaining_time": "1:00:46", "throughput": 4256.61, "total_tokens": 9390216} {"current_steps": 14390, "total_steps": 38160, "loss": 0.4336, "lr": 0.0007838209676155302, "epoch": 7.5419287211740045, "percentage": 37.71, "elapsed_time": "0:36:46", "remaining_time": "1:00:45", "throughput": 4256.79, "total_tokens": 9393960} {"current_steps": 14395, "total_steps": 38160, "loss": 0.3266, "lr": 0.0007836326665914209, "epoch": 7.54454926624738, "percentage": 37.72, "elapsed_time": "0:36:47", "remaining_time": "1:00:44", "throughput": 4256.89, "total_tokens": 9397416} {"current_steps": 14400, "total_steps": 38160, "loss": 0.4449, "lr": 0.0007834443062345932, "epoch": 7.547169811320755, "percentage": 37.74, "elapsed_time": "0:36:48", "remaining_time": "1:00:43", "throughput": 4256.86, "total_tokens": 9400232} {"current_steps": 14405, "total_steps": 38160, "loss": 0.456, "lr": 0.0007832558865844507, "epoch": 7.54979035639413, "percentage": 37.75, "elapsed_time": "0:36:48", "remaining_time": "1:00:42", "throughput": 4256.72, "total_tokens": 9402568} {"current_steps": 14410, "total_steps": 38160, "loss": 0.434, "lr": 0.0007830674076804083, "epoch": 7.552410901467505, "percentage": 37.76, "elapsed_time": "0:36:49", "remaining_time": "1:00:41", "throughput": 4256.58, "total_tokens": 9404904} {"current_steps": 14415, "total_steps": 38160, "loss": 0.4495, "lr": 0.0007828788695618934, "epoch": 7.55503144654088, "percentage": 37.78, "elapsed_time": "0:36:50", "remaining_time": "1:00:40", "throughput": 4256.56, "total_tokens": 9407720} {"current_steps": 14420, "total_steps": 38160, "loss": 0.5566, "lr": 0.0007826902722683462, "epoch": 7.5576519916142555, "percentage": 37.79, "elapsed_time": "0:36:50", "remaining_time": "1:00:39", "throughput": 4256.49, "total_tokens": 9410280} {"current_steps": 14425, "total_steps": 38160, "loss": 0.4576, "lr": 0.0007825016158392193, "epoch": 7.560272536687631, "percentage": 37.8, "elapsed_time": "0:36:51", "remaining_time": "1:00:38", "throughput": 4256.45, "total_tokens": 9413032} {"current_steps": 14430, "total_steps": 38160, "loss": 0.4294, "lr": 0.0007823129003139773, "epoch": 7.562893081761006, "percentage": 37.81, "elapsed_time": "0:36:52", "remaining_time": "1:00:37", "throughput": 4256.56, "total_tokens": 9416488} {"current_steps": 14435, "total_steps": 38160, "loss": 0.4144, "lr": 0.0007821241257320972, "epoch": 7.565513626834382, "percentage": 37.83, "elapsed_time": "0:36:52", "remaining_time": "1:00:37", "throughput": 4256.61, "total_tokens": 9419720} {"current_steps": 14440, "total_steps": 38160, "loss": 0.5558, "lr": 0.0007819352921330689, "epoch": 7.568134171907757, "percentage": 37.84, "elapsed_time": "0:36:53", "remaining_time": "1:00:36", "throughput": 4256.67, "total_tokens": 9422824} {"current_steps": 14445, "total_steps": 38160, "loss": 0.4359, "lr": 0.0007817463995563938, "epoch": 7.570754716981132, "percentage": 37.85, "elapsed_time": "0:36:54", "remaining_time": "1:00:35", "throughput": 4256.77, "total_tokens": 9426248} {"current_steps": 14450, "total_steps": 38160, "loss": 0.4692, "lr": 0.0007815574480415864, "epoch": 7.573375262054507, "percentage": 37.87, "elapsed_time": "0:36:55", "remaining_time": "1:00:34", "throughput": 4256.74, "total_tokens": 9429032} {"current_steps": 14455, "total_steps": 38160, "loss": 0.4284, "lr": 0.0007813684376281729, "epoch": 7.575995807127883, "percentage": 37.88, "elapsed_time": "0:36:55", "remaining_time": "1:00:33", "throughput": 4256.84, "total_tokens": 9432520} {"current_steps": 14460, "total_steps": 38160, "loss": 0.5969, "lr": 0.0007811793683556922, "epoch": 7.578616352201258, "percentage": 37.89, "elapsed_time": "0:36:56", "remaining_time": "1:00:32", "throughput": 4256.88, "total_tokens": 9435592} {"current_steps": 14465, "total_steps": 38160, "loss": 0.6081, "lr": 0.0007809902402636957, "epoch": 7.581236897274633, "percentage": 37.91, "elapsed_time": "0:36:57", "remaining_time": "1:00:32", "throughput": 4257.15, "total_tokens": 9439784} {"current_steps": 14470, "total_steps": 38160, "loss": 0.4261, "lr": 0.0007808010533917464, "epoch": 7.583857442348008, "percentage": 37.92, "elapsed_time": "0:36:58", "remaining_time": "1:00:31", "throughput": 4257.09, "total_tokens": 9442408} {"current_steps": 14475, "total_steps": 38160, "loss": 0.418, "lr": 0.0007806118077794205, "epoch": 7.586477987421384, "percentage": 37.93, "elapsed_time": "0:36:58", "remaining_time": "1:00:30", "throughput": 4257.04, "total_tokens": 9445096} {"current_steps": 14480, "total_steps": 38160, "loss": 0.4032, "lr": 0.0007804225034663058, "epoch": 7.589098532494759, "percentage": 37.95, "elapsed_time": "0:36:59", "remaining_time": "1:00:29", "throughput": 4257.29, "total_tokens": 9449224} {"current_steps": 14485, "total_steps": 38160, "loss": 0.446, "lr": 0.0007802331404920024, "epoch": 7.5917190775681345, "percentage": 37.96, "elapsed_time": "0:37:00", "remaining_time": "1:00:29", "throughput": 4257.92, "total_tokens": 9455784} {"current_steps": 14490, "total_steps": 38160, "loss": 0.424, "lr": 0.0007800437188961232, "epoch": 7.59433962264151, "percentage": 37.97, "elapsed_time": "0:37:01", "remaining_time": "1:00:29", "throughput": 4258.53, "total_tokens": 9461704} {"current_steps": 14495, "total_steps": 38160, "loss": 0.3536, "lr": 0.0007798542387182929, "epoch": 7.596960167714885, "percentage": 37.98, "elapsed_time": "0:37:02", "remaining_time": "1:00:28", "throughput": 4258.54, "total_tokens": 9464744} {"current_steps": 14500, "total_steps": 38160, "loss": 0.5024, "lr": 0.0007796646999981488, "epoch": 7.59958071278826, "percentage": 38.0, "elapsed_time": "0:37:03", "remaining_time": "1:00:27", "throughput": 4258.64, "total_tokens": 9468168} {"current_steps": 14505, "total_steps": 38160, "loss": 0.4426, "lr": 0.0007794751027753397, "epoch": 7.602201257861635, "percentage": 38.01, "elapsed_time": "0:37:03", "remaining_time": "1:00:26", "throughput": 4258.54, "total_tokens": 9470600} {"current_steps": 14510, "total_steps": 38160, "loss": 0.4476, "lr": 0.0007792854470895278, "epoch": 7.60482180293501, "percentage": 38.02, "elapsed_time": "0:37:04", "remaining_time": "1:00:25", "throughput": 4258.55, "total_tokens": 9473608} {"current_steps": 14515, "total_steps": 38160, "loss": 0.4809, "lr": 0.0007790957329803865, "epoch": 7.6074423480083855, "percentage": 38.04, "elapsed_time": "0:37:05", "remaining_time": "1:00:24", "throughput": 4258.42, "total_tokens": 9475976} {"current_steps": 14520, "total_steps": 38160, "loss": 0.4107, "lr": 0.0007789059604876019, "epoch": 7.610062893081761, "percentage": 38.05, "elapsed_time": "0:37:06", "remaining_time": "1:00:24", "throughput": 4258.58, "total_tokens": 9479624} {"current_steps": 14525, "total_steps": 38160, "loss": 0.5807, "lr": 0.0007787161296508724, "epoch": 7.612683438155136, "percentage": 38.06, "elapsed_time": "0:37:06", "remaining_time": "1:00:23", "throughput": 4258.5, "total_tokens": 9482216} {"current_steps": 14530, "total_steps": 38160, "loss": 0.4659, "lr": 0.0007785262405099083, "epoch": 7.615303983228512, "percentage": 38.08, "elapsed_time": "0:37:07", "remaining_time": "1:00:22", "throughput": 4258.42, "total_tokens": 9484744} {"current_steps": 14535, "total_steps": 38160, "loss": 0.3513, "lr": 0.0007783362931044322, "epoch": 7.617924528301887, "percentage": 38.09, "elapsed_time": "0:37:07", "remaining_time": "1:00:21", "throughput": 4258.37, "total_tokens": 9487528} {"current_steps": 14540, "total_steps": 38160, "loss": 0.3818, "lr": 0.0007781462874741793, "epoch": 7.620545073375262, "percentage": 38.1, "elapsed_time": "0:37:08", "remaining_time": "1:00:20", "throughput": 4258.47, "total_tokens": 9490856} {"current_steps": 14545, "total_steps": 38160, "loss": 0.4826, "lr": 0.000777956223658896, "epoch": 7.623165618448637, "percentage": 38.12, "elapsed_time": "0:37:09", "remaining_time": "1:00:19", "throughput": 4258.48, "total_tokens": 9493832} {"current_steps": 14550, "total_steps": 38160, "loss": 0.3662, "lr": 0.000777766101698342, "epoch": 7.6257861635220126, "percentage": 38.13, "elapsed_time": "0:37:10", "remaining_time": "1:00:18", "throughput": 4258.5, "total_tokens": 9496872} {"current_steps": 14555, "total_steps": 38160, "loss": 0.5816, "lr": 0.0007775759216322882, "epoch": 7.628406708595388, "percentage": 38.14, "elapsed_time": "0:37:10", "remaining_time": "1:00:17", "throughput": 4258.58, "total_tokens": 9500072} {"current_steps": 14560, "total_steps": 38160, "loss": 0.4558, "lr": 0.0007773856835005187, "epoch": 7.631027253668763, "percentage": 38.16, "elapsed_time": "0:37:11", "remaining_time": "1:00:16", "throughput": 4258.54, "total_tokens": 9502792} {"current_steps": 14565, "total_steps": 38160, "loss": 0.3356, "lr": 0.0007771953873428285, "epoch": 7.633647798742138, "percentage": 38.17, "elapsed_time": "0:37:12", "remaining_time": "1:00:15", "throughput": 4258.45, "total_tokens": 9505320} {"current_steps": 14570, "total_steps": 38160, "loss": 0.429, "lr": 0.0007770050331990259, "epoch": 7.636268343815514, "percentage": 38.18, "elapsed_time": "0:37:12", "remaining_time": "1:00:15", "throughput": 4258.46, "total_tokens": 9508232} {"current_steps": 14575, "total_steps": 38160, "loss": 0.4504, "lr": 0.0007768146211089304, "epoch": 7.638888888888889, "percentage": 38.19, "elapsed_time": "0:37:13", "remaining_time": "1:00:14", "throughput": 4258.49, "total_tokens": 9511304} {"current_steps": 14580, "total_steps": 38160, "loss": 0.519, "lr": 0.0007766241511123744, "epoch": 7.6415094339622645, "percentage": 38.21, "elapsed_time": "0:37:14", "remaining_time": "1:00:13", "throughput": 4258.65, "total_tokens": 9514952} {"current_steps": 14585, "total_steps": 38160, "loss": 0.404, "lr": 0.0007764336232492018, "epoch": 7.64412997903564, "percentage": 38.22, "elapsed_time": "0:37:15", "remaining_time": "1:00:12", "throughput": 4258.95, "total_tokens": 9519272} {"current_steps": 14590, "total_steps": 38160, "loss": 0.494, "lr": 0.0007762430375592689, "epoch": 7.646750524109015, "percentage": 38.23, "elapsed_time": "0:37:15", "remaining_time": "1:00:12", "throughput": 4259.12, "total_tokens": 9523112} {"current_steps": 14595, "total_steps": 38160, "loss": 0.4281, "lr": 0.0007760523940824441, "epoch": 7.64937106918239, "percentage": 38.25, "elapsed_time": "0:37:16", "remaining_time": "1:00:11", "throughput": 4259.28, "total_tokens": 9526792} {"current_steps": 14600, "total_steps": 38160, "loss": 0.5249, "lr": 0.0007758616928586077, "epoch": 7.651991614255765, "percentage": 38.26, "elapsed_time": "0:37:17", "remaining_time": "1:00:10", "throughput": 4259.28, "total_tokens": 9529736} {"current_steps": 14605, "total_steps": 38160, "loss": 0.4032, "lr": 0.0007756709339276527, "epoch": 7.65461215932914, "percentage": 38.27, "elapsed_time": "0:37:18", "remaining_time": "1:00:09", "throughput": 4259.36, "total_tokens": 9532968} {"current_steps": 14610, "total_steps": 38160, "loss": 0.4101, "lr": 0.0007754801173294831, "epoch": 7.6572327044025155, "percentage": 38.29, "elapsed_time": "0:37:18", "remaining_time": "1:00:09", "throughput": 4259.66, "total_tokens": 9537320} {"current_steps": 14615, "total_steps": 38160, "loss": 0.5201, "lr": 0.0007752892431040158, "epoch": 7.659853249475891, "percentage": 38.3, "elapsed_time": "0:37:19", "remaining_time": "1:00:08", "throughput": 4259.74, "total_tokens": 9540680} {"current_steps": 14620, "total_steps": 38160, "loss": 0.6766, "lr": 0.0007750983112911796, "epoch": 7.662473794549266, "percentage": 38.31, "elapsed_time": "0:37:20", "remaining_time": "1:00:07", "throughput": 4259.81, "total_tokens": 9543944} {"current_steps": 14625, "total_steps": 38160, "loss": 0.3875, "lr": 0.0007749073219309151, "epoch": 7.665094339622642, "percentage": 38.33, "elapsed_time": "0:37:21", "remaining_time": "1:00:06", "throughput": 4259.78, "total_tokens": 9546728} {"current_steps": 14630, "total_steps": 38160, "loss": 0.4825, "lr": 0.0007747162750631751, "epoch": 7.667714884696017, "percentage": 38.34, "elapsed_time": "0:37:21", "remaining_time": "1:00:05", "throughput": 4259.9, "total_tokens": 9550280} {"current_steps": 14635, "total_steps": 38160, "loss": 0.5362, "lr": 0.0007745251707279246, "epoch": 7.670335429769392, "percentage": 38.35, "elapsed_time": "0:37:22", "remaining_time": "1:00:04", "throughput": 4259.75, "total_tokens": 9552488} {"current_steps": 14640, "total_steps": 38160, "loss": 0.366, "lr": 0.0007743340089651403, "epoch": 7.672955974842767, "percentage": 38.36, "elapsed_time": "0:37:23", "remaining_time": "1:00:03", "throughput": 4259.74, "total_tokens": 9555304} {"current_steps": 14645, "total_steps": 38160, "loss": 0.5468, "lr": 0.0007741427898148111, "epoch": 7.6755765199161425, "percentage": 38.38, "elapsed_time": "0:37:24", "remaining_time": "1:00:03", "throughput": 4260.09, "total_tokens": 9560008} {"current_steps": 14650, "total_steps": 38160, "loss": 0.3873, "lr": 0.0007739515133169379, "epoch": 7.678197064989518, "percentage": 38.39, "elapsed_time": "0:37:24", "remaining_time": "1:00:02", "throughput": 4260.06, "total_tokens": 9562792} {"current_steps": 14655, "total_steps": 38160, "loss": 0.3965, "lr": 0.0007737601795115334, "epoch": 7.680817610062893, "percentage": 38.4, "elapsed_time": "0:37:25", "remaining_time": "1:00:01", "throughput": 4259.99, "total_tokens": 9565416} {"current_steps": 14660, "total_steps": 38160, "loss": 0.4329, "lr": 0.0007735687884386226, "epoch": 7.683438155136268, "percentage": 38.42, "elapsed_time": "0:37:26", "remaining_time": "1:00:00", "throughput": 4259.99, "total_tokens": 9568296} {"current_steps": 14665, "total_steps": 38160, "loss": 0.5181, "lr": 0.0007733773401382424, "epoch": 7.686058700209644, "percentage": 38.43, "elapsed_time": "0:37:26", "remaining_time": "0:59:59", "throughput": 4260.08, "total_tokens": 9571624} {"current_steps": 14670, "total_steps": 38160, "loss": 0.5434, "lr": 0.0007731858346504414, "epoch": 7.688679245283019, "percentage": 38.44, "elapsed_time": "0:37:27", "remaining_time": "0:59:58", "throughput": 4260.12, "total_tokens": 9574728} {"current_steps": 14675, "total_steps": 38160, "loss": 0.3496, "lr": 0.0007729942720152805, "epoch": 7.691299790356394, "percentage": 38.46, "elapsed_time": "0:37:28", "remaining_time": "0:59:57", "throughput": 4260.03, "total_tokens": 9577192} {"current_steps": 14680, "total_steps": 38160, "loss": 0.404, "lr": 0.0007728026522728324, "epoch": 7.69392033542977, "percentage": 38.47, "elapsed_time": "0:37:29", "remaining_time": "0:59:57", "throughput": 4260.37, "total_tokens": 9581928} {"current_steps": 14685, "total_steps": 38160, "loss": 0.7131, "lr": 0.0007726109754631817, "epoch": 7.696540880503145, "percentage": 38.48, "elapsed_time": "0:37:29", "remaining_time": "0:59:56", "throughput": 4260.41, "total_tokens": 9585096} {"current_steps": 14690, "total_steps": 38160, "loss": 0.4912, "lr": 0.000772419241626425, "epoch": 7.69916142557652, "percentage": 38.5, "elapsed_time": "0:37:30", "remaining_time": "0:59:55", "throughput": 4260.48, "total_tokens": 9588360} {"current_steps": 14695, "total_steps": 38160, "loss": 0.503, "lr": 0.000772227450802671, "epoch": 7.701781970649895, "percentage": 38.51, "elapsed_time": "0:37:31", "remaining_time": "0:59:54", "throughput": 4260.49, "total_tokens": 9591304} {"current_steps": 14700, "total_steps": 38160, "loss": 0.4175, "lr": 0.0007720356030320399, "epoch": 7.70440251572327, "percentage": 38.52, "elapsed_time": "0:37:31", "remaining_time": "0:59:53", "throughput": 4260.39, "total_tokens": 9593704} {"current_steps": 14705, "total_steps": 38160, "loss": 0.6132, "lr": 0.0007718436983546642, "epoch": 7.7070230607966455, "percentage": 38.54, "elapsed_time": "0:37:32", "remaining_time": "0:59:53", "throughput": 4260.53, "total_tokens": 9597416} {"current_steps": 14710, "total_steps": 38160, "loss": 0.4834, "lr": 0.0007716517368106882, "epoch": 7.709643605870021, "percentage": 38.55, "elapsed_time": "0:37:33", "remaining_time": "0:59:52", "throughput": 4260.52, "total_tokens": 9600264} {"current_steps": 14715, "total_steps": 38160, "loss": 0.5582, "lr": 0.000771459718440268, "epoch": 7.712264150943396, "percentage": 38.56, "elapsed_time": "0:37:34", "remaining_time": "0:59:51", "throughput": 4260.63, "total_tokens": 9603880} {"current_steps": 14720, "total_steps": 38160, "loss": 0.5076, "lr": 0.0007712676432835717, "epoch": 7.714884696016772, "percentage": 38.57, "elapsed_time": "0:37:34", "remaining_time": "0:59:50", "throughput": 4260.72, "total_tokens": 9607144} {"current_steps": 14725, "total_steps": 38160, "loss": 0.392, "lr": 0.0007710755113807794, "epoch": 7.717505241090147, "percentage": 38.59, "elapsed_time": "0:37:35", "remaining_time": "0:59:49", "throughput": 4260.78, "total_tokens": 9610312} {"current_steps": 14730, "total_steps": 38160, "loss": 0.4196, "lr": 0.0007708833227720824, "epoch": 7.720125786163522, "percentage": 38.6, "elapsed_time": "0:37:36", "remaining_time": "0:59:48", "throughput": 4260.78, "total_tokens": 9613224} {"current_steps": 14735, "total_steps": 38160, "loss": 0.5381, "lr": 0.0007706910774976848, "epoch": 7.722746331236897, "percentage": 38.61, "elapsed_time": "0:37:36", "remaining_time": "0:59:47", "throughput": 4260.85, "total_tokens": 9616456} {"current_steps": 14740, "total_steps": 38160, "loss": 0.5206, "lr": 0.0007704987755978021, "epoch": 7.7253668763102725, "percentage": 38.63, "elapsed_time": "0:37:37", "remaining_time": "0:59:47", "throughput": 4261.04, "total_tokens": 9620328} {"current_steps": 14745, "total_steps": 38160, "loss": 0.4048, "lr": 0.0007703064171126615, "epoch": 7.727987421383648, "percentage": 38.64, "elapsed_time": "0:37:38", "remaining_time": "0:59:46", "throughput": 4261.01, "total_tokens": 9623016} {"current_steps": 14750, "total_steps": 38160, "loss": 0.5056, "lr": 0.0007701140020825022, "epoch": 7.730607966457023, "percentage": 38.65, "elapsed_time": "0:37:39", "remaining_time": "0:59:45", "throughput": 4260.99, "total_tokens": 9625800} {"current_steps": 14755, "total_steps": 38160, "loss": 0.6275, "lr": 0.0007699215305475753, "epoch": 7.733228511530398, "percentage": 38.67, "elapsed_time": "0:37:39", "remaining_time": "0:59:44", "throughput": 4261.07, "total_tokens": 9629032} {"current_steps": 14760, "total_steps": 38160, "loss": 0.4863, "lr": 0.0007697290025481436, "epoch": 7.735849056603773, "percentage": 38.68, "elapsed_time": "0:37:40", "remaining_time": "0:59:43", "throughput": 4261.32, "total_tokens": 9633160} {"current_steps": 14765, "total_steps": 38160, "loss": 0.565, "lr": 0.0007695364181244819, "epoch": 7.738469601677149, "percentage": 38.69, "elapsed_time": "0:37:41", "remaining_time": "0:59:43", "throughput": 4261.54, "total_tokens": 9637160} {"current_steps": 14770, "total_steps": 38160, "loss": 0.5996, "lr": 0.0007693437773168764, "epoch": 7.741090146750524, "percentage": 38.71, "elapsed_time": "0:37:42", "remaining_time": "0:59:42", "throughput": 4261.58, "total_tokens": 9640264} {"current_steps": 14775, "total_steps": 38160, "loss": 0.6013, "lr": 0.0007691510801656256, "epoch": 7.7437106918239, "percentage": 38.72, "elapsed_time": "0:37:42", "remaining_time": "0:59:41", "throughput": 4261.7, "total_tokens": 9643816} {"current_steps": 14780, "total_steps": 38160, "loss": 0.3735, "lr": 0.0007689583267110395, "epoch": 7.746331236897275, "percentage": 38.73, "elapsed_time": "0:37:43", "remaining_time": "0:59:40", "throughput": 4261.77, "total_tokens": 9647112} {"current_steps": 14785, "total_steps": 38160, "loss": 0.3795, "lr": 0.0007687655169934398, "epoch": 7.74895178197065, "percentage": 38.74, "elapsed_time": "0:37:44", "remaining_time": "0:59:39", "throughput": 4261.84, "total_tokens": 9650248} {"current_steps": 14790, "total_steps": 38160, "loss": 0.5907, "lr": 0.0007685726510531603, "epoch": 7.751572327044025, "percentage": 38.76, "elapsed_time": "0:37:44", "remaining_time": "0:59:38", "throughput": 4261.74, "total_tokens": 9652680} {"current_steps": 14795, "total_steps": 38160, "loss": 0.3552, "lr": 0.0007683797289305463, "epoch": 7.7541928721174, "percentage": 38.77, "elapsed_time": "0:37:45", "remaining_time": "0:59:38", "throughput": 4261.82, "total_tokens": 9655976} {"current_steps": 14800, "total_steps": 38160, "loss": 0.5961, "lr": 0.0007681867506659548, "epoch": 7.756813417190775, "percentage": 38.78, "elapsed_time": "0:37:46", "remaining_time": "0:59:37", "throughput": 4261.79, "total_tokens": 9658664} {"current_steps": 14805, "total_steps": 38160, "loss": 0.5973, "lr": 0.0007679937162997546, "epoch": 7.759433962264151, "percentage": 38.8, "elapsed_time": "0:37:47", "remaining_time": "0:59:36", "throughput": 4261.82, "total_tokens": 9661736} {"current_steps": 14810, "total_steps": 38160, "loss": 0.3508, "lr": 0.0007678006258723264, "epoch": 7.762054507337526, "percentage": 38.81, "elapsed_time": "0:37:47", "remaining_time": "0:59:35", "throughput": 4261.87, "total_tokens": 9664904} {"current_steps": 14815, "total_steps": 38160, "loss": 0.4612, "lr": 0.0007676074794240626, "epoch": 7.764675052410902, "percentage": 38.82, "elapsed_time": "0:37:48", "remaining_time": "0:59:34", "throughput": 4261.86, "total_tokens": 9667816} {"current_steps": 14820, "total_steps": 38160, "loss": 0.3764, "lr": 0.000767414276995367, "epoch": 7.767295597484277, "percentage": 38.84, "elapsed_time": "0:37:49", "remaining_time": "0:59:33", "throughput": 4261.96, "total_tokens": 9671208} {"current_steps": 14825, "total_steps": 38160, "loss": 0.3575, "lr": 0.0007672210186266555, "epoch": 7.769916142557652, "percentage": 38.85, "elapsed_time": "0:37:49", "remaining_time": "0:59:32", "throughput": 4261.92, "total_tokens": 9673864} {"current_steps": 14830, "total_steps": 38160, "loss": 0.4257, "lr": 0.0007670277043583556, "epoch": 7.772536687631027, "percentage": 38.86, "elapsed_time": "0:37:50", "remaining_time": "0:59:32", "throughput": 4262.11, "total_tokens": 9677768} {"current_steps": 14835, "total_steps": 38160, "loss": 0.4373, "lr": 0.0007668343342309063, "epoch": 7.7751572327044025, "percentage": 38.88, "elapsed_time": "0:37:51", "remaining_time": "0:59:31", "throughput": 4262.3, "total_tokens": 9681640} {"current_steps": 14840, "total_steps": 38160, "loss": 0.3746, "lr": 0.0007666409082847586, "epoch": 7.777777777777778, "percentage": 38.89, "elapsed_time": "0:37:52", "remaining_time": "0:59:30", "throughput": 4262.44, "total_tokens": 9685192} {"current_steps": 14845, "total_steps": 38160, "loss": 0.4786, "lr": 0.0007664474265603747, "epoch": 7.780398322851153, "percentage": 38.9, "elapsed_time": "0:37:52", "remaining_time": "0:59:29", "throughput": 4262.49, "total_tokens": 9688392} {"current_steps": 14850, "total_steps": 38160, "loss": 0.4205, "lr": 0.0007662538890982291, "epoch": 7.783018867924528, "percentage": 38.92, "elapsed_time": "0:37:53", "remaining_time": "0:59:28", "throughput": 4262.52, "total_tokens": 9691528} {"current_steps": 14855, "total_steps": 38160, "loss": 0.3919, "lr": 0.0007660602959388075, "epoch": 7.785639412997903, "percentage": 38.93, "elapsed_time": "0:37:54", "remaining_time": "0:59:28", "throughput": 4262.49, "total_tokens": 9694248} {"current_steps": 14860, "total_steps": 38160, "loss": 0.5012, "lr": 0.0007658666471226073, "epoch": 7.788259958071279, "percentage": 38.94, "elapsed_time": "0:37:55", "remaining_time": "0:59:27", "throughput": 4262.51, "total_tokens": 9697288} {"current_steps": 14865, "total_steps": 38160, "loss": 0.6352, "lr": 0.0007656729426901377, "epoch": 7.790880503144654, "percentage": 38.95, "elapsed_time": "0:37:55", "remaining_time": "0:59:26", "throughput": 4262.7, "total_tokens": 9701000} {"current_steps": 14870, "total_steps": 38160, "loss": 0.4089, "lr": 0.0007654791826819194, "epoch": 7.79350104821803, "percentage": 38.97, "elapsed_time": "0:37:56", "remaining_time": "0:59:25", "throughput": 4262.72, "total_tokens": 9704008} {"current_steps": 14875, "total_steps": 38160, "loss": 0.3573, "lr": 0.0007652853671384847, "epoch": 7.796121593291405, "percentage": 38.98, "elapsed_time": "0:37:57", "remaining_time": "0:59:24", "throughput": 4262.81, "total_tokens": 9707336} {"current_steps": 14880, "total_steps": 38160, "loss": 0.2923, "lr": 0.0007650914961003781, "epoch": 7.79874213836478, "percentage": 38.99, "elapsed_time": "0:37:57", "remaining_time": "0:59:23", "throughput": 4262.65, "total_tokens": 9709480} {"current_steps": 14885, "total_steps": 38160, "loss": 0.5359, "lr": 0.0007648975696081546, "epoch": 7.801362683438155, "percentage": 39.01, "elapsed_time": "0:37:58", "remaining_time": "0:59:22", "throughput": 4262.77, "total_tokens": 9712936} {"current_steps": 14890, "total_steps": 38160, "loss": 0.4165, "lr": 0.0007647035877023816, "epoch": 7.80398322851153, "percentage": 39.02, "elapsed_time": "0:37:59", "remaining_time": "0:59:21", "throughput": 4262.68, "total_tokens": 9715432} {"current_steps": 14895, "total_steps": 38160, "loss": 0.5161, "lr": 0.0007645095504236381, "epoch": 7.806603773584905, "percentage": 39.03, "elapsed_time": "0:37:59", "remaining_time": "0:59:20", "throughput": 4262.67, "total_tokens": 9718280} {"current_steps": 14900, "total_steps": 38160, "loss": 0.3823, "lr": 0.0007643154578125142, "epoch": 7.809224318658281, "percentage": 39.05, "elapsed_time": "0:38:00", "remaining_time": "0:59:20", "throughput": 4262.78, "total_tokens": 9721736} {"current_steps": 14905, "total_steps": 38160, "loss": 0.5444, "lr": 0.0007641213099096121, "epoch": 7.811844863731656, "percentage": 39.06, "elapsed_time": "0:38:01", "remaining_time": "0:59:19", "throughput": 4262.77, "total_tokens": 9724616} {"current_steps": 14910, "total_steps": 38160, "loss": 0.5207, "lr": 0.0007639271067555452, "epoch": 7.814465408805032, "percentage": 39.07, "elapsed_time": "0:38:02", "remaining_time": "0:59:18", "throughput": 4263.03, "total_tokens": 9728648} {"current_steps": 14915, "total_steps": 38160, "loss": 0.6143, "lr": 0.0007637328483909385, "epoch": 7.817085953878407, "percentage": 39.09, "elapsed_time": "0:38:02", "remaining_time": "0:59:17", "throughput": 4263.15, "total_tokens": 9732168} {"current_steps": 14920, "total_steps": 38160, "loss": 0.4861, "lr": 0.000763538534856429, "epoch": 7.819706498951782, "percentage": 39.1, "elapsed_time": "0:38:03", "remaining_time": "0:59:17", "throughput": 4263.22, "total_tokens": 9735432} {"current_steps": 14925, "total_steps": 38160, "loss": 0.5795, "lr": 0.0007633441661926643, "epoch": 7.822327044025157, "percentage": 39.11, "elapsed_time": "0:38:04", "remaining_time": "0:59:16", "throughput": 4263.18, "total_tokens": 9738088} {"current_steps": 14930, "total_steps": 38160, "loss": 0.4821, "lr": 0.0007631497424403046, "epoch": 7.8249475890985325, "percentage": 39.12, "elapsed_time": "0:38:05", "remaining_time": "0:59:15", "throughput": 4263.68, "total_tokens": 9743816} {"current_steps": 14935, "total_steps": 38160, "loss": 0.4123, "lr": 0.000762955263640021, "epoch": 7.827568134171908, "percentage": 39.14, "elapsed_time": "0:38:06", "remaining_time": "0:59:14", "throughput": 4263.78, "total_tokens": 9747272} {"current_steps": 14940, "total_steps": 38160, "loss": 0.4136, "lr": 0.0007627607298324961, "epoch": 7.830188679245283, "percentage": 39.15, "elapsed_time": "0:38:06", "remaining_time": "0:59:14", "throughput": 4263.95, "total_tokens": 9751016} {"current_steps": 14945, "total_steps": 38160, "loss": 0.5296, "lr": 0.0007625661410584244, "epoch": 7.832809224318658, "percentage": 39.16, "elapsed_time": "0:38:07", "remaining_time": "0:59:13", "throughput": 4263.95, "total_tokens": 9753992} {"current_steps": 14950, "total_steps": 38160, "loss": 0.4042, "lr": 0.0007623714973585113, "epoch": 7.835429769392033, "percentage": 39.18, "elapsed_time": "0:38:08", "remaining_time": "0:59:12", "throughput": 4263.83, "total_tokens": 9756456} {"current_steps": 14955, "total_steps": 38160, "loss": 0.4797, "lr": 0.0007621767987734743, "epoch": 7.838050314465409, "percentage": 39.19, "elapsed_time": "0:38:08", "remaining_time": "0:59:11", "throughput": 4264.0, "total_tokens": 9760264} {"current_steps": 14960, "total_steps": 38160, "loss": 0.559, "lr": 0.000761982045344042, "epoch": 7.840670859538784, "percentage": 39.2, "elapsed_time": "0:38:09", "remaining_time": "0:59:10", "throughput": 4264.13, "total_tokens": 9763848} {"current_steps": 14965, "total_steps": 38160, "loss": 0.4204, "lr": 0.0007617872371109549, "epoch": 7.84329140461216, "percentage": 39.22, "elapsed_time": "0:38:10", "remaining_time": "0:59:10", "throughput": 4264.15, "total_tokens": 9766824} {"current_steps": 14970, "total_steps": 38160, "loss": 0.3736, "lr": 0.0007615923741149643, "epoch": 7.845911949685535, "percentage": 39.23, "elapsed_time": "0:38:11", "remaining_time": "0:59:09", "throughput": 4264.46, "total_tokens": 9771368} {"current_steps": 14975, "total_steps": 38160, "loss": 0.3151, "lr": 0.0007613974563968333, "epoch": 7.84853249475891, "percentage": 39.24, "elapsed_time": "0:38:12", "remaining_time": "0:59:08", "throughput": 4264.44, "total_tokens": 9774248} {"current_steps": 14980, "total_steps": 38160, "loss": 0.4397, "lr": 0.0007612024839973368, "epoch": 7.851153039832285, "percentage": 39.26, "elapsed_time": "0:38:12", "remaining_time": "0:59:07", "throughput": 4264.39, "total_tokens": 9776936} {"current_steps": 14985, "total_steps": 38160, "loss": 0.3944, "lr": 0.0007610074569572605, "epoch": 7.85377358490566, "percentage": 39.27, "elapsed_time": "0:38:13", "remaining_time": "0:59:06", "throughput": 4264.42, "total_tokens": 9780104} {"current_steps": 14990, "total_steps": 38160, "loss": 0.3567, "lr": 0.0007608123753174019, "epoch": 7.856394129979035, "percentage": 39.28, "elapsed_time": "0:38:14", "remaining_time": "0:59:05", "throughput": 4264.34, "total_tokens": 9782600} {"current_steps": 14995, "total_steps": 38160, "loss": 0.4605, "lr": 0.00076061723911857, "epoch": 7.859014675052411, "percentage": 39.3, "elapsed_time": "0:38:14", "remaining_time": "0:59:05", "throughput": 4264.34, "total_tokens": 9785544} {"current_steps": 15000, "total_steps": 38160, "loss": 0.3478, "lr": 0.0007604220484015849, "epoch": 7.861635220125786, "percentage": 39.31, "elapsed_time": "0:38:15", "remaining_time": "0:59:04", "throughput": 4264.43, "total_tokens": 9788936} {"current_steps": 15005, "total_steps": 38160, "loss": 0.5385, "lr": 0.0007602268032072784, "epoch": 7.864255765199162, "percentage": 39.32, "elapsed_time": "0:38:16", "remaining_time": "0:59:03", "throughput": 4264.47, "total_tokens": 9792136} {"current_steps": 15010, "total_steps": 38160, "loss": 0.5787, "lr": 0.0007600315035764933, "epoch": 7.866876310272537, "percentage": 39.33, "elapsed_time": "0:38:16", "remaining_time": "0:59:02", "throughput": 4264.51, "total_tokens": 9795208} {"current_steps": 15015, "total_steps": 38160, "loss": 0.4236, "lr": 0.0007598361495500844, "epoch": 7.869496855345912, "percentage": 39.35, "elapsed_time": "0:38:17", "remaining_time": "0:59:01", "throughput": 4264.68, "total_tokens": 9799016} {"current_steps": 15020, "total_steps": 38160, "loss": 0.5325, "lr": 0.0007596407411689173, "epoch": 7.872117400419287, "percentage": 39.36, "elapsed_time": "0:38:18", "remaining_time": "0:59:00", "throughput": 4264.76, "total_tokens": 9802248} {"current_steps": 15025, "total_steps": 38160, "loss": 0.5021, "lr": 0.0007594452784738695, "epoch": 7.8747379454926625, "percentage": 39.37, "elapsed_time": "0:38:19", "remaining_time": "0:59:00", "throughput": 4264.97, "total_tokens": 9806184} {"current_steps": 15030, "total_steps": 38160, "loss": 0.4973, "lr": 0.000759249761505829, "epoch": 7.877358490566038, "percentage": 39.39, "elapsed_time": "0:38:19", "remaining_time": "0:58:59", "throughput": 4264.89, "total_tokens": 9808776} {"current_steps": 15035, "total_steps": 38160, "loss": 0.4626, "lr": 0.0007590541903056963, "epoch": 7.879979035639413, "percentage": 39.4, "elapsed_time": "0:38:20", "remaining_time": "0:58:58", "throughput": 4264.97, "total_tokens": 9812008} {"current_steps": 15040, "total_steps": 38160, "loss": 0.4387, "lr": 0.0007588585649143825, "epoch": 7.882599580712788, "percentage": 39.41, "elapsed_time": "0:38:21", "remaining_time": "0:58:57", "throughput": 4265.0, "total_tokens": 9815144} {"current_steps": 15045, "total_steps": 38160, "loss": 0.4566, "lr": 0.0007586628853728099, "epoch": 7.885220125786163, "percentage": 39.43, "elapsed_time": "0:38:21", "remaining_time": "0:58:56", "throughput": 4264.91, "total_tokens": 9817672} {"current_steps": 15050, "total_steps": 38160, "loss": 0.6592, "lr": 0.0007584671517219128, "epoch": 7.887840670859539, "percentage": 39.44, "elapsed_time": "0:38:22", "remaining_time": "0:58:55", "throughput": 4265.01, "total_tokens": 9821128} {"current_steps": 15055, "total_steps": 38160, "loss": 0.4255, "lr": 0.0007582713640026364, "epoch": 7.890461215932914, "percentage": 39.45, "elapsed_time": "0:38:23", "remaining_time": "0:58:55", "throughput": 4265.01, "total_tokens": 9824040} {"current_steps": 15060, "total_steps": 38160, "loss": 0.5073, "lr": 0.000758075522255937, "epoch": 7.8930817610062896, "percentage": 39.47, "elapsed_time": "0:38:24", "remaining_time": "0:58:54", "throughput": 4265.12, "total_tokens": 9827496} {"current_steps": 15065, "total_steps": 38160, "loss": 0.4884, "lr": 0.0007578796265227828, "epoch": 7.895702306079665, "percentage": 39.48, "elapsed_time": "0:38:24", "remaining_time": "0:58:53", "throughput": 4265.17, "total_tokens": 9830728} {"current_steps": 15070, "total_steps": 38160, "loss": 0.4722, "lr": 0.0007576836768441525, "epoch": 7.89832285115304, "percentage": 39.49, "elapsed_time": "0:38:25", "remaining_time": "0:58:52", "throughput": 4265.37, "total_tokens": 9834600} {"current_steps": 15075, "total_steps": 38160, "loss": 0.3636, "lr": 0.0007574876732610369, "epoch": 7.900943396226415, "percentage": 39.5, "elapsed_time": "0:38:26", "remaining_time": "0:58:51", "throughput": 4265.48, "total_tokens": 9837992} {"current_steps": 15080, "total_steps": 38160, "loss": 0.4652, "lr": 0.0007572916158144379, "epoch": 7.90356394129979, "percentage": 39.52, "elapsed_time": "0:38:27", "remaining_time": "0:58:51", "throughput": 4265.58, "total_tokens": 9841384} {"current_steps": 15085, "total_steps": 38160, "loss": 0.4622, "lr": 0.0007570955045453679, "epoch": 7.906184486373165, "percentage": 39.53, "elapsed_time": "0:38:27", "remaining_time": "0:58:50", "throughput": 4265.5, "total_tokens": 9843976} {"current_steps": 15090, "total_steps": 38160, "loss": 0.5002, "lr": 0.0007568993394948516, "epoch": 7.908805031446541, "percentage": 39.54, "elapsed_time": "0:38:28", "remaining_time": "0:58:49", "throughput": 4265.54, "total_tokens": 9847144} {"current_steps": 15095, "total_steps": 38160, "loss": 0.4654, "lr": 0.0007567031207039243, "epoch": 7.911425576519916, "percentage": 39.56, "elapsed_time": "0:38:29", "remaining_time": "0:58:48", "throughput": 4265.62, "total_tokens": 9850536} {"current_steps": 15100, "total_steps": 38160, "loss": 0.3047, "lr": 0.0007565068482136328, "epoch": 7.914046121593291, "percentage": 39.57, "elapsed_time": "0:38:30", "remaining_time": "0:58:47", "throughput": 4265.73, "total_tokens": 9854024} {"current_steps": 15105, "total_steps": 38160, "loss": 0.3969, "lr": 0.000756310522065035, "epoch": 7.916666666666667, "percentage": 39.58, "elapsed_time": "0:38:30", "remaining_time": "0:58:47", "throughput": 4265.88, "total_tokens": 9857640} {"current_steps": 15110, "total_steps": 38160, "loss": 0.5025, "lr": 0.0007561141422992002, "epoch": 7.919287211740042, "percentage": 39.6, "elapsed_time": "0:38:31", "remaining_time": "0:58:46", "throughput": 4265.81, "total_tokens": 9860264} {"current_steps": 15115, "total_steps": 38160, "loss": 0.358, "lr": 0.0007559177089572086, "epoch": 7.921907756813417, "percentage": 39.61, "elapsed_time": "0:38:32", "remaining_time": "0:58:45", "throughput": 4265.96, "total_tokens": 9863912} {"current_steps": 15120, "total_steps": 38160, "loss": 0.5095, "lr": 0.0007557212220801521, "epoch": 7.9245283018867925, "percentage": 39.62, "elapsed_time": "0:38:33", "remaining_time": "0:58:45", "throughput": 4266.55, "total_tokens": 9870408} {"current_steps": 15125, "total_steps": 38160, "loss": 0.6273, "lr": 0.0007555246817091332, "epoch": 7.927148846960168, "percentage": 39.64, "elapsed_time": "0:38:34", "remaining_time": "0:58:44", "throughput": 4266.71, "total_tokens": 9874152} {"current_steps": 15130, "total_steps": 38160, "loss": 0.4722, "lr": 0.0007553280878852663, "epoch": 7.929769392033543, "percentage": 39.65, "elapsed_time": "0:38:34", "remaining_time": "0:58:43", "throughput": 4266.79, "total_tokens": 9877480} {"current_steps": 15135, "total_steps": 38160, "loss": 0.4456, "lr": 0.0007551314406496762, "epoch": 7.932389937106918, "percentage": 39.66, "elapsed_time": "0:38:35", "remaining_time": "0:58:42", "throughput": 4266.91, "total_tokens": 9881032} {"current_steps": 15140, "total_steps": 38160, "loss": 0.3996, "lr": 0.0007549347400434994, "epoch": 7.935010482180293, "percentage": 39.68, "elapsed_time": "0:38:36", "remaining_time": "0:58:42", "throughput": 4267.04, "total_tokens": 9884680} {"current_steps": 15145, "total_steps": 38160, "loss": 0.4667, "lr": 0.0007547379861078835, "epoch": 7.937631027253669, "percentage": 39.69, "elapsed_time": "0:38:37", "remaining_time": "0:58:41", "throughput": 4267.19, "total_tokens": 9888392} {"current_steps": 15150, "total_steps": 38160, "loss": 0.4619, "lr": 0.0007545411788839871, "epoch": 7.940251572327044, "percentage": 39.7, "elapsed_time": "0:38:37", "remaining_time": "0:58:40", "throughput": 4267.13, "total_tokens": 9890952} {"current_steps": 15155, "total_steps": 38160, "loss": 0.3332, "lr": 0.0007543443184129799, "epoch": 7.9428721174004195, "percentage": 39.71, "elapsed_time": "0:38:38", "remaining_time": "0:58:39", "throughput": 4267.11, "total_tokens": 9893704} {"current_steps": 15160, "total_steps": 38160, "loss": 0.4339, "lr": 0.000754147404736043, "epoch": 7.945492662473795, "percentage": 39.73, "elapsed_time": "0:38:39", "remaining_time": "0:58:38", "throughput": 4267.23, "total_tokens": 9897256} {"current_steps": 15165, "total_steps": 38160, "loss": 0.6201, "lr": 0.0007539504378943686, "epoch": 7.94811320754717, "percentage": 39.74, "elapsed_time": "0:38:40", "remaining_time": "0:58:38", "throughput": 4267.41, "total_tokens": 9901160} {"current_steps": 15170, "total_steps": 38160, "loss": 0.4044, "lr": 0.0007537534179291599, "epoch": 7.950733752620545, "percentage": 39.75, "elapsed_time": "0:38:40", "remaining_time": "0:58:37", "throughput": 4267.57, "total_tokens": 9904872} {"current_steps": 15175, "total_steps": 38160, "loss": 0.4659, "lr": 0.000753556344881631, "epoch": 7.95335429769392, "percentage": 39.77, "elapsed_time": "0:38:41", "remaining_time": "0:58:36", "throughput": 4267.66, "total_tokens": 9908232} {"current_steps": 15180, "total_steps": 38160, "loss": 0.4356, "lr": 0.0007533592187930076, "epoch": 7.955974842767295, "percentage": 39.78, "elapsed_time": "0:38:42", "remaining_time": "0:58:35", "throughput": 4267.69, "total_tokens": 9911368} {"current_steps": 15185, "total_steps": 38160, "loss": 0.5555, "lr": 0.000753162039704526, "epoch": 7.9585953878406706, "percentage": 39.79, "elapsed_time": "0:38:43", "remaining_time": "0:58:34", "throughput": 4267.69, "total_tokens": 9914312} {"current_steps": 15190, "total_steps": 38160, "loss": 0.5729, "lr": 0.000752964807657434, "epoch": 7.961215932914046, "percentage": 39.81, "elapsed_time": "0:38:43", "remaining_time": "0:58:34", "throughput": 4267.76, "total_tokens": 9917640} {"current_steps": 15195, "total_steps": 38160, "loss": 0.4466, "lr": 0.0007527675226929902, "epoch": 7.963836477987421, "percentage": 39.82, "elapsed_time": "0:38:44", "remaining_time": "0:58:33", "throughput": 4267.75, "total_tokens": 9920424} {"current_steps": 15200, "total_steps": 38160, "loss": 0.4929, "lr": 0.0007525701848524643, "epoch": 7.966457023060797, "percentage": 39.83, "elapsed_time": "0:38:45", "remaining_time": "0:58:32", "throughput": 4267.64, "total_tokens": 9922856} {"current_steps": 15205, "total_steps": 38160, "loss": 0.4493, "lr": 0.0007523727941771372, "epoch": 7.969077568134172, "percentage": 39.85, "elapsed_time": "0:38:45", "remaining_time": "0:58:31", "throughput": 4267.69, "total_tokens": 9926024} {"current_steps": 15210, "total_steps": 38160, "loss": 0.4954, "lr": 0.0007521753507083009, "epoch": 7.971698113207547, "percentage": 39.86, "elapsed_time": "0:38:46", "remaining_time": "0:58:30", "throughput": 4267.78, "total_tokens": 9929416} {"current_steps": 15215, "total_steps": 38160, "loss": 0.6218, "lr": 0.0007519778544872581, "epoch": 7.9743186582809225, "percentage": 39.87, "elapsed_time": "0:38:47", "remaining_time": "0:58:29", "throughput": 4267.91, "total_tokens": 9933000} {"current_steps": 15220, "total_steps": 38160, "loss": 0.3807, "lr": 0.000751780305555323, "epoch": 7.976939203354298, "percentage": 39.88, "elapsed_time": "0:38:47", "remaining_time": "0:58:28", "throughput": 4267.82, "total_tokens": 9935464} {"current_steps": 15225, "total_steps": 38160, "loss": 0.494, "lr": 0.0007515827039538202, "epoch": 7.979559748427673, "percentage": 39.9, "elapsed_time": "0:38:48", "remaining_time": "0:58:28", "throughput": 4267.88, "total_tokens": 9938760} {"current_steps": 15230, "total_steps": 38160, "loss": 0.4017, "lr": 0.0007513850497240861, "epoch": 7.982180293501048, "percentage": 39.91, "elapsed_time": "0:38:49", "remaining_time": "0:58:27", "throughput": 4268.14, "total_tokens": 9943016} {"current_steps": 15235, "total_steps": 38160, "loss": 0.3163, "lr": 0.0007511873429074676, "epoch": 7.984800838574423, "percentage": 39.92, "elapsed_time": "0:38:50", "remaining_time": "0:58:26", "throughput": 4268.09, "total_tokens": 9945640} {"current_steps": 15240, "total_steps": 38160, "loss": 0.5696, "lr": 0.0007509895835453224, "epoch": 7.987421383647799, "percentage": 39.94, "elapsed_time": "0:38:51", "remaining_time": "0:58:25", "throughput": 4268.32, "total_tokens": 9949672} {"current_steps": 15245, "total_steps": 38160, "loss": 0.4931, "lr": 0.0007507917716790201, "epoch": 7.990041928721174, "percentage": 39.95, "elapsed_time": "0:38:51", "remaining_time": "0:58:25", "throughput": 4268.6, "total_tokens": 9954120} {"current_steps": 15250, "total_steps": 38160, "loss": 0.445, "lr": 0.0007505939073499401, "epoch": 7.9926624737945495, "percentage": 39.96, "elapsed_time": "0:38:52", "remaining_time": "0:58:24", "throughput": 4268.85, "total_tokens": 9958344} {"current_steps": 15255, "total_steps": 38160, "loss": 0.521, "lr": 0.0007503959905994737, "epoch": 7.995283018867925, "percentage": 39.98, "elapsed_time": "0:38:53", "remaining_time": "0:58:23", "throughput": 4268.86, "total_tokens": 9961320} {"current_steps": 15260, "total_steps": 38160, "loss": 0.4785, "lr": 0.0007501980214690227, "epoch": 7.9979035639413, "percentage": 39.99, "elapsed_time": "0:38:54", "remaining_time": "0:58:22", "throughput": 4269.04, "total_tokens": 9965160} {"current_steps": 15264, "total_steps": 38160, "eval_loss": 0.4831865429878235, "epoch": 8.0, "percentage": 40.0, "elapsed_time": "0:39:08", "remaining_time": "0:58:42", "throughput": 4243.76, "total_tokens": 9967176} {"current_steps": 15265, "total_steps": 38160, "loss": 0.6209, "lr": 0.00075, "epoch": 8.000524109014675, "percentage": 40.0, "elapsed_time": "0:39:10", "remaining_time": "0:58:45", "throughput": 4241.05, "total_tokens": 9968520} {"current_steps": 15270, "total_steps": 38160, "loss": 0.3794, "lr": 0.0007498019262338295, "epoch": 8.00314465408805, "percentage": 40.02, "elapsed_time": "0:39:11", "remaining_time": "0:58:44", "throughput": 4241.22, "total_tokens": 9972328} {"current_steps": 15275, "total_steps": 38160, "loss": 0.5855, "lr": 0.0007496038002119459, "epoch": 8.005765199161425, "percentage": 40.03, "elapsed_time": "0:39:12", "remaining_time": "0:58:43", "throughput": 4241.31, "total_tokens": 9975688} {"current_steps": 15280, "total_steps": 38160, "loss": 0.4945, "lr": 0.000749405621975795, "epoch": 8.0083857442348, "percentage": 40.04, "elapsed_time": "0:39:12", "remaining_time": "0:58:42", "throughput": 4241.18, "total_tokens": 9977960} {"current_steps": 15285, "total_steps": 38160, "loss": 0.4301, "lr": 0.0007492073915668334, "epoch": 8.011006289308176, "percentage": 40.06, "elapsed_time": "0:39:13", "remaining_time": "0:58:41", "throughput": 4241.21, "total_tokens": 9981192} {"current_steps": 15290, "total_steps": 38160, "loss": 0.4121, "lr": 0.0007490091090265283, "epoch": 8.01362683438155, "percentage": 40.07, "elapsed_time": "0:39:14", "remaining_time": "0:58:41", "throughput": 4241.12, "total_tokens": 9983624} {"current_steps": 15295, "total_steps": 38160, "loss": 0.5182, "lr": 0.0007488107743963587, "epoch": 8.016247379454926, "percentage": 40.08, "elapsed_time": "0:39:14", "remaining_time": "0:58:40", "throughput": 4241.15, "total_tokens": 9986728} {"current_steps": 15300, "total_steps": 38160, "loss": 0.4628, "lr": 0.0007486123877178136, "epoch": 8.018867924528301, "percentage": 40.09, "elapsed_time": "0:39:15", "remaining_time": "0:58:39", "throughput": 4241.34, "total_tokens": 9990792} {"current_steps": 15305, "total_steps": 38160, "loss": 0.4581, "lr": 0.0007484139490323932, "epoch": 8.021488469601676, "percentage": 40.11, "elapsed_time": "0:39:16", "remaining_time": "0:58:38", "throughput": 4241.41, "total_tokens": 9994056} {"current_steps": 15310, "total_steps": 38160, "loss": 0.4087, "lr": 0.000748215458381609, "epoch": 8.024109014675052, "percentage": 40.12, "elapsed_time": "0:39:17", "remaining_time": "0:58:37", "throughput": 4241.53, "total_tokens": 9997480} {"current_steps": 15315, "total_steps": 38160, "loss": 0.5442, "lr": 0.0007480169158069826, "epoch": 8.026729559748428, "percentage": 40.13, "elapsed_time": "0:39:17", "remaining_time": "0:58:36", "throughput": 4241.51, "total_tokens": 10000296} {"current_steps": 15320, "total_steps": 38160, "loss": 0.44, "lr": 0.0007478183213500468, "epoch": 8.029350104821804, "percentage": 40.15, "elapsed_time": "0:39:18", "remaining_time": "0:58:35", "throughput": 4241.46, "total_tokens": 10002888} {"current_steps": 15325, "total_steps": 38160, "loss": 0.4862, "lr": 0.0007476196750523456, "epoch": 8.031970649895179, "percentage": 40.16, "elapsed_time": "0:39:19", "remaining_time": "0:58:35", "throughput": 4241.56, "total_tokens": 10006216} {"current_steps": 15330, "total_steps": 38160, "loss": 0.4556, "lr": 0.000747420976955433, "epoch": 8.034591194968554, "percentage": 40.17, "elapsed_time": "0:39:19", "remaining_time": "0:58:34", "throughput": 4241.7, "total_tokens": 10009928} {"current_steps": 15335, "total_steps": 38160, "loss": 0.4258, "lr": 0.0007472222271008752, "epoch": 8.03721174004193, "percentage": 40.19, "elapsed_time": "0:39:20", "remaining_time": "0:58:33", "throughput": 4241.55, "total_tokens": 10012072} {"current_steps": 15340, "total_steps": 38160, "loss": 0.465, "lr": 0.0007470234255302478, "epoch": 8.039832285115304, "percentage": 40.2, "elapsed_time": "0:39:21", "remaining_time": "0:58:32", "throughput": 4241.78, "total_tokens": 10016168} {"current_steps": 15345, "total_steps": 38160, "loss": 0.4841, "lr": 0.0007468245722851379, "epoch": 8.04245283018868, "percentage": 40.21, "elapsed_time": "0:39:21", "remaining_time": "0:58:31", "throughput": 4241.7, "total_tokens": 10018664} {"current_steps": 15350, "total_steps": 38160, "loss": 0.3235, "lr": 0.0007466256674071434, "epoch": 8.045073375262055, "percentage": 40.23, "elapsed_time": "0:39:22", "remaining_time": "0:58:30", "throughput": 4241.79, "total_tokens": 10022088} {"current_steps": 15355, "total_steps": 38160, "loss": 0.4337, "lr": 0.000746426710937873, "epoch": 8.04769392033543, "percentage": 40.24, "elapsed_time": "0:39:23", "remaining_time": "0:58:29", "throughput": 4241.67, "total_tokens": 10024456} {"current_steps": 15360, "total_steps": 38160, "loss": 0.4122, "lr": 0.0007462277029189461, "epoch": 8.050314465408805, "percentage": 40.25, "elapsed_time": "0:39:24", "remaining_time": "0:58:29", "throughput": 4241.69, "total_tokens": 10027464} {"current_steps": 15365, "total_steps": 38160, "loss": 0.4893, "lr": 0.0007460286433919928, "epoch": 8.05293501048218, "percentage": 40.26, "elapsed_time": "0:39:24", "remaining_time": "0:58:28", "throughput": 4241.71, "total_tokens": 10030504} {"current_steps": 15370, "total_steps": 38160, "loss": 0.5919, "lr": 0.0007458295323986542, "epoch": 8.055555555555555, "percentage": 40.28, "elapsed_time": "0:39:25", "remaining_time": "0:58:27", "throughput": 4241.74, "total_tokens": 10033512} {"current_steps": 15375, "total_steps": 38160, "loss": 0.4559, "lr": 0.0007456303699805817, "epoch": 8.05817610062893, "percentage": 40.29, "elapsed_time": "0:39:26", "remaining_time": "0:58:26", "throughput": 4241.73, "total_tokens": 10036456} {"current_steps": 15380, "total_steps": 38160, "loss": 0.4119, "lr": 0.0007454311561794386, "epoch": 8.060796645702306, "percentage": 40.3, "elapsed_time": "0:39:26", "remaining_time": "0:58:25", "throughput": 4241.76, "total_tokens": 10039528} {"current_steps": 15385, "total_steps": 38160, "loss": 0.6434, "lr": 0.0007452318910368972, "epoch": 8.06341719077568, "percentage": 40.32, "elapsed_time": "0:39:27", "remaining_time": "0:58:24", "throughput": 4241.69, "total_tokens": 10042152} {"current_steps": 15390, "total_steps": 38160, "loss": 0.3756, "lr": 0.0007450325745946422, "epoch": 8.066037735849056, "percentage": 40.33, "elapsed_time": "0:39:28", "remaining_time": "0:58:23", "throughput": 4241.54, "total_tokens": 10044328} {"current_steps": 15395, "total_steps": 38160, "loss": 0.3869, "lr": 0.0007448332068943681, "epoch": 8.068658280922431, "percentage": 40.34, "elapsed_time": "0:39:28", "remaining_time": "0:58:22", "throughput": 4241.47, "total_tokens": 10046856} {"current_steps": 15400, "total_steps": 38160, "loss": 0.4307, "lr": 0.0007446337879777802, "epoch": 8.071278825995806, "percentage": 40.36, "elapsed_time": "0:39:29", "remaining_time": "0:58:21", "throughput": 4241.45, "total_tokens": 10049576} {"current_steps": 15405, "total_steps": 38160, "loss": 0.3692, "lr": 0.0007444343178865948, "epoch": 8.073899371069182, "percentage": 40.37, "elapsed_time": "0:39:30", "remaining_time": "0:58:20", "throughput": 4241.48, "total_tokens": 10052648} {"current_steps": 15410, "total_steps": 38160, "loss": 0.4333, "lr": 0.0007442347966625389, "epoch": 8.076519916142558, "percentage": 40.38, "elapsed_time": "0:39:30", "remaining_time": "0:58:19", "throughput": 4241.43, "total_tokens": 10055272} {"current_steps": 15415, "total_steps": 38160, "loss": 0.3926, "lr": 0.0007440352243473496, "epoch": 8.079140461215934, "percentage": 40.4, "elapsed_time": "0:39:31", "remaining_time": "0:58:19", "throughput": 4241.41, "total_tokens": 10058056} {"current_steps": 15420, "total_steps": 38160, "loss": 0.4644, "lr": 0.0007438356009827758, "epoch": 8.081761006289309, "percentage": 40.41, "elapsed_time": "0:39:32", "remaining_time": "0:58:18", "throughput": 4241.75, "total_tokens": 10062696} {"current_steps": 15425, "total_steps": 38160, "loss": 0.5034, "lr": 0.0007436359266105759, "epoch": 8.084381551362684, "percentage": 40.42, "elapsed_time": "0:39:33", "remaining_time": "0:58:17", "throughput": 4241.82, "total_tokens": 10065960} {"current_steps": 15430, "total_steps": 38160, "loss": 0.5353, "lr": 0.0007434362012725198, "epoch": 8.08700209643606, "percentage": 40.44, "elapsed_time": "0:39:33", "remaining_time": "0:58:16", "throughput": 4241.85, "total_tokens": 10069000} {"current_steps": 15435, "total_steps": 38160, "loss": 0.3678, "lr": 0.0007432364250103877, "epoch": 8.089622641509434, "percentage": 40.45, "elapsed_time": "0:39:34", "remaining_time": "0:58:16", "throughput": 4242.49, "total_tokens": 10075624} {"current_steps": 15440, "total_steps": 38160, "loss": 0.3361, "lr": 0.0007430365978659704, "epoch": 8.09224318658281, "percentage": 40.46, "elapsed_time": "0:39:35", "remaining_time": "0:58:15", "throughput": 4242.5, "total_tokens": 10078600} {"current_steps": 15445, "total_steps": 38160, "loss": 0.5137, "lr": 0.0007428367198810694, "epoch": 8.094863731656185, "percentage": 40.47, "elapsed_time": "0:39:36", "remaining_time": "0:58:14", "throughput": 4242.57, "total_tokens": 10081736} {"current_steps": 15450, "total_steps": 38160, "loss": 0.444, "lr": 0.0007426367910974973, "epoch": 8.09748427672956, "percentage": 40.49, "elapsed_time": "0:39:37", "remaining_time": "0:58:14", "throughput": 4242.76, "total_tokens": 10085544} {"current_steps": 15455, "total_steps": 38160, "loss": 0.411, "lr": 0.0007424368115570763, "epoch": 8.100104821802935, "percentage": 40.5, "elapsed_time": "0:39:37", "remaining_time": "0:58:13", "throughput": 4242.95, "total_tokens": 10089480} {"current_steps": 15460, "total_steps": 38160, "loss": 0.4239, "lr": 0.0007422367813016405, "epoch": 8.10272536687631, "percentage": 40.51, "elapsed_time": "0:39:38", "remaining_time": "0:58:12", "throughput": 4242.95, "total_tokens": 10092392} {"current_steps": 15465, "total_steps": 38160, "loss": 0.45, "lr": 0.0007420367003730335, "epoch": 8.105345911949685, "percentage": 40.53, "elapsed_time": "0:39:39", "remaining_time": "0:58:11", "throughput": 4243.02, "total_tokens": 10095720} {"current_steps": 15470, "total_steps": 38160, "loss": 0.4406, "lr": 0.0007418365688131103, "epoch": 8.10796645702306, "percentage": 40.54, "elapsed_time": "0:39:40", "remaining_time": "0:58:10", "throughput": 4243.16, "total_tokens": 10099272} {"current_steps": 15475, "total_steps": 38160, "loss": 0.418, "lr": 0.0007416363866637356, "epoch": 8.110587002096436, "percentage": 40.55, "elapsed_time": "0:39:41", "remaining_time": "0:58:10", "throughput": 4243.89, "total_tokens": 10106504} {"current_steps": 15480, "total_steps": 38160, "loss": 0.4964, "lr": 0.0007414361539667857, "epoch": 8.11320754716981, "percentage": 40.57, "elapsed_time": "0:39:42", "remaining_time": "0:58:10", "throughput": 4243.92, "total_tokens": 10109672} {"current_steps": 15485, "total_steps": 38160, "loss": 0.4812, "lr": 0.0007412358707641468, "epoch": 8.115828092243186, "percentage": 40.58, "elapsed_time": "0:39:42", "remaining_time": "0:58:09", "throughput": 4244.03, "total_tokens": 10113192} {"current_steps": 15490, "total_steps": 38160, "loss": 0.4541, "lr": 0.0007410355370977158, "epoch": 8.118448637316561, "percentage": 40.59, "elapsed_time": "0:39:43", "remaining_time": "0:58:08", "throughput": 4244.07, "total_tokens": 10116264} {"current_steps": 15495, "total_steps": 38160, "loss": 0.4878, "lr": 0.0007408351530094005, "epoch": 8.121069182389936, "percentage": 40.61, "elapsed_time": "0:39:44", "remaining_time": "0:58:07", "throughput": 4244.14, "total_tokens": 10119496} {"current_steps": 15500, "total_steps": 38160, "loss": 0.68, "lr": 0.0007406347185411187, "epoch": 8.123689727463312, "percentage": 40.62, "elapsed_time": "0:39:45", "remaining_time": "0:58:06", "throughput": 4244.24, "total_tokens": 10122888} {"current_steps": 15505, "total_steps": 38160, "loss": 0.5411, "lr": 0.0007404342337347992, "epoch": 8.126310272536688, "percentage": 40.63, "elapsed_time": "0:39:45", "remaining_time": "0:58:05", "throughput": 4244.15, "total_tokens": 10125288} {"current_steps": 15510, "total_steps": 38160, "loss": 0.4326, "lr": 0.000740233698632381, "epoch": 8.128930817610064, "percentage": 40.64, "elapsed_time": "0:39:46", "remaining_time": "0:58:05", "throughput": 4244.26, "total_tokens": 10128712} {"current_steps": 15515, "total_steps": 38160, "loss": 0.3991, "lr": 0.0007400331132758136, "epoch": 8.131551362683439, "percentage": 40.66, "elapsed_time": "0:39:47", "remaining_time": "0:58:04", "throughput": 4244.34, "total_tokens": 10132072} {"current_steps": 15520, "total_steps": 38160, "loss": 0.4111, "lr": 0.0007398324777070576, "epoch": 8.134171907756814, "percentage": 40.67, "elapsed_time": "0:39:47", "remaining_time": "0:58:03", "throughput": 4244.46, "total_tokens": 10135592} {"current_steps": 15525, "total_steps": 38160, "loss": 0.3723, "lr": 0.0007396317919680832, "epoch": 8.13679245283019, "percentage": 40.68, "elapsed_time": "0:39:48", "remaining_time": "0:58:02", "throughput": 4244.5, "total_tokens": 10138600} {"current_steps": 15530, "total_steps": 38160, "loss": 0.4405, "lr": 0.0007394310561008717, "epoch": 8.139412997903564, "percentage": 40.7, "elapsed_time": "0:39:49", "remaining_time": "0:58:01", "throughput": 4244.59, "total_tokens": 10141896} {"current_steps": 15535, "total_steps": 38160, "loss": 0.4751, "lr": 0.0007392302701474151, "epoch": 8.14203354297694, "percentage": 40.71, "elapsed_time": "0:39:50", "remaining_time": "0:58:01", "throughput": 4244.83, "total_tokens": 10146024} {"current_steps": 15540, "total_steps": 38160, "loss": 0.3869, "lr": 0.0007390294341497151, "epoch": 8.144654088050315, "percentage": 40.72, "elapsed_time": "0:39:50", "remaining_time": "0:58:00", "throughput": 4244.86, "total_tokens": 10149000} {"current_steps": 15545, "total_steps": 38160, "loss": 0.5363, "lr": 0.0007388285481497845, "epoch": 8.14727463312369, "percentage": 40.74, "elapsed_time": "0:39:51", "remaining_time": "0:57:59", "throughput": 4244.87, "total_tokens": 10151976} {"current_steps": 15550, "total_steps": 38160, "loss": 0.3916, "lr": 0.0007386276121896465, "epoch": 8.149895178197065, "percentage": 40.75, "elapsed_time": "0:39:52", "remaining_time": "0:57:58", "throughput": 4245.12, "total_tokens": 10156104} {"current_steps": 15555, "total_steps": 38160, "loss": 0.3551, "lr": 0.0007384266263113342, "epoch": 8.15251572327044, "percentage": 40.76, "elapsed_time": "0:39:53", "remaining_time": "0:57:57", "throughput": 4245.06, "total_tokens": 10158664} {"current_steps": 15560, "total_steps": 38160, "loss": 0.5179, "lr": 0.0007382255905568919, "epoch": 8.155136268343815, "percentage": 40.78, "elapsed_time": "0:39:53", "remaining_time": "0:57:56", "throughput": 4245.09, "total_tokens": 10161768} {"current_steps": 15565, "total_steps": 38160, "loss": 0.4961, "lr": 0.000738024504968374, "epoch": 8.15775681341719, "percentage": 40.79, "elapsed_time": "0:39:54", "remaining_time": "0:57:56", "throughput": 4245.16, "total_tokens": 10165288} {"current_steps": 15570, "total_steps": 38160, "loss": 0.5998, "lr": 0.0007378233695878449, "epoch": 8.160377358490566, "percentage": 40.8, "elapsed_time": "0:39:55", "remaining_time": "0:57:55", "throughput": 4245.09, "total_tokens": 10167848} {"current_steps": 15575, "total_steps": 38160, "loss": 0.476, "lr": 0.0007376221844573803, "epoch": 8.16299790356394, "percentage": 40.81, "elapsed_time": "0:39:55", "remaining_time": "0:57:54", "throughput": 4245.16, "total_tokens": 10171144} {"current_steps": 15580, "total_steps": 38160, "loss": 0.4065, "lr": 0.0007374209496190656, "epoch": 8.165618448637316, "percentage": 40.83, "elapsed_time": "0:39:56", "remaining_time": "0:57:53", "throughput": 4245.3, "total_tokens": 10174792} {"current_steps": 15585, "total_steps": 38160, "loss": 0.4691, "lr": 0.0007372196651149968, "epoch": 8.168238993710691, "percentage": 40.84, "elapsed_time": "0:39:57", "remaining_time": "0:57:52", "throughput": 4245.34, "total_tokens": 10177864} {"current_steps": 15590, "total_steps": 38160, "loss": 0.552, "lr": 0.0007370183309872805, "epoch": 8.170859538784066, "percentage": 40.85, "elapsed_time": "0:39:58", "remaining_time": "0:57:51", "throughput": 4245.33, "total_tokens": 10180776} {"current_steps": 15595, "total_steps": 38160, "loss": 0.4623, "lr": 0.0007368169472780335, "epoch": 8.173480083857442, "percentage": 40.87, "elapsed_time": "0:39:58", "remaining_time": "0:57:50", "throughput": 4245.29, "total_tokens": 10183528} {"current_steps": 15600, "total_steps": 38160, "loss": 0.366, "lr": 0.0007366155140293828, "epoch": 8.176100628930818, "percentage": 40.88, "elapsed_time": "0:39:59", "remaining_time": "0:57:49", "throughput": 4245.26, "total_tokens": 10186248} {"current_steps": 15605, "total_steps": 38160, "loss": 0.5928, "lr": 0.000736414031283466, "epoch": 8.178721174004194, "percentage": 40.89, "elapsed_time": "0:40:00", "remaining_time": "0:57:49", "throughput": 4245.23, "total_tokens": 10188968} {"current_steps": 15610, "total_steps": 38160, "loss": 0.4208, "lr": 0.000736212499082431, "epoch": 8.181341719077569, "percentage": 40.91, "elapsed_time": "0:40:00", "remaining_time": "0:57:48", "throughput": 4245.32, "total_tokens": 10192328} {"current_steps": 15615, "total_steps": 38160, "loss": 0.3611, "lr": 0.0007360109174684359, "epoch": 8.183962264150944, "percentage": 40.92, "elapsed_time": "0:40:01", "remaining_time": "0:57:47", "throughput": 4245.4, "total_tokens": 10195592} {"current_steps": 15620, "total_steps": 38160, "loss": 0.4956, "lr": 0.0007358092864836497, "epoch": 8.18658280922432, "percentage": 40.93, "elapsed_time": "0:40:02", "remaining_time": "0:57:46", "throughput": 4245.49, "total_tokens": 10199016} {"current_steps": 15625, "total_steps": 38160, "loss": 0.4745, "lr": 0.0007356076061702508, "epoch": 8.189203354297694, "percentage": 40.95, "elapsed_time": "0:40:03", "remaining_time": "0:57:45", "throughput": 4245.53, "total_tokens": 10202152} {"current_steps": 15630, "total_steps": 38160, "loss": 0.4911, "lr": 0.0007354058765704288, "epoch": 8.19182389937107, "percentage": 40.96, "elapsed_time": "0:40:03", "remaining_time": "0:57:44", "throughput": 4245.5, "total_tokens": 10204968} {"current_steps": 15635, "total_steps": 38160, "loss": 0.527, "lr": 0.000735204097726383, "epoch": 8.194444444444445, "percentage": 40.97, "elapsed_time": "0:40:04", "remaining_time": "0:57:44", "throughput": 4245.58, "total_tokens": 10208328} {"current_steps": 15640, "total_steps": 38160, "loss": 0.3167, "lr": 0.0007350022696803233, "epoch": 8.19706498951782, "percentage": 40.99, "elapsed_time": "0:40:05", "remaining_time": "0:57:43", "throughput": 4245.51, "total_tokens": 10210888} {"current_steps": 15645, "total_steps": 38160, "loss": 0.3774, "lr": 0.0007348003924744699, "epoch": 8.199685534591195, "percentage": 41.0, "elapsed_time": "0:40:05", "remaining_time": "0:57:42", "throughput": 4245.47, "total_tokens": 10213544} {"current_steps": 15650, "total_steps": 38160, "loss": 0.388, "lr": 0.000734598466151053, "epoch": 8.20230607966457, "percentage": 41.01, "elapsed_time": "0:40:06", "remaining_time": "0:57:41", "throughput": 4245.6, "total_tokens": 10217096} {"current_steps": 15655, "total_steps": 38160, "loss": 0.4081, "lr": 0.0007343964907523135, "epoch": 8.204926624737945, "percentage": 41.02, "elapsed_time": "0:40:07", "remaining_time": "0:57:40", "throughput": 4245.83, "total_tokens": 10221160} {"current_steps": 15660, "total_steps": 38160, "loss": 0.5196, "lr": 0.0007341944663205023, "epoch": 8.20754716981132, "percentage": 41.04, "elapsed_time": "0:40:07", "remaining_time": "0:57:39", "throughput": 4245.77, "total_tokens": 10223720} {"current_steps": 15665, "total_steps": 38160, "loss": 0.4527, "lr": 0.0007339923928978805, "epoch": 8.210167714884696, "percentage": 41.05, "elapsed_time": "0:40:08", "remaining_time": "0:57:38", "throughput": 4245.8, "total_tokens": 10226760} {"current_steps": 15670, "total_steps": 38160, "loss": 0.4832, "lr": 0.0007337902705267197, "epoch": 8.21278825995807, "percentage": 41.06, "elapsed_time": "0:40:09", "remaining_time": "0:57:37", "throughput": 4245.74, "total_tokens": 10229416} {"current_steps": 15675, "total_steps": 38160, "loss": 0.4444, "lr": 0.0007335880992493016, "epoch": 8.215408805031446, "percentage": 41.08, "elapsed_time": "0:40:10", "remaining_time": "0:57:37", "throughput": 4245.76, "total_tokens": 10232488} {"current_steps": 15680, "total_steps": 38160, "loss": 0.4196, "lr": 0.000733385879107918, "epoch": 8.218029350104821, "percentage": 41.09, "elapsed_time": "0:40:10", "remaining_time": "0:57:36", "throughput": 4245.77, "total_tokens": 10235560} {"current_steps": 15685, "total_steps": 38160, "loss": 0.3684, "lr": 0.000733183610144871, "epoch": 8.220649895178196, "percentage": 41.1, "elapsed_time": "0:40:11", "remaining_time": "0:57:35", "throughput": 4245.86, "total_tokens": 10238952} {"current_steps": 15690, "total_steps": 38160, "loss": 0.4444, "lr": 0.0007329812924024732, "epoch": 8.223270440251572, "percentage": 41.12, "elapsed_time": "0:40:12", "remaining_time": "0:57:34", "throughput": 4246.03, "total_tokens": 10242664} {"current_steps": 15695, "total_steps": 38160, "loss": 0.5615, "lr": 0.0007327789259230468, "epoch": 8.225890985324948, "percentage": 41.13, "elapsed_time": "0:40:13", "remaining_time": "0:57:33", "throughput": 4246.21, "total_tokens": 10246536} {"current_steps": 15700, "total_steps": 38160, "loss": 0.4283, "lr": 0.0007325765107489249, "epoch": 8.228511530398324, "percentage": 41.14, "elapsed_time": "0:40:13", "remaining_time": "0:57:33", "throughput": 4246.17, "total_tokens": 10249160} {"current_steps": 15705, "total_steps": 38160, "loss": 0.3738, "lr": 0.0007323740469224505, "epoch": 8.231132075471699, "percentage": 41.16, "elapsed_time": "0:40:14", "remaining_time": "0:57:32", "throughput": 4246.21, "total_tokens": 10252328} {"current_steps": 15710, "total_steps": 38160, "loss": 0.5195, "lr": 0.0007321715344859763, "epoch": 8.233752620545074, "percentage": 41.17, "elapsed_time": "0:40:15", "remaining_time": "0:57:31", "throughput": 4246.48, "total_tokens": 10256584} {"current_steps": 15715, "total_steps": 38160, "loss": 0.3527, "lr": 0.000731968973481866, "epoch": 8.23637316561845, "percentage": 41.18, "elapsed_time": "0:40:15", "remaining_time": "0:57:30", "throughput": 4246.45, "total_tokens": 10259336} {"current_steps": 15720, "total_steps": 38160, "loss": 0.4696, "lr": 0.0007317663639524928, "epoch": 8.238993710691824, "percentage": 41.19, "elapsed_time": "0:40:16", "remaining_time": "0:57:29", "throughput": 4246.47, "total_tokens": 10262440} {"current_steps": 15725, "total_steps": 38160, "loss": 0.4077, "lr": 0.0007315637059402404, "epoch": 8.2416142557652, "percentage": 41.21, "elapsed_time": "0:40:17", "remaining_time": "0:57:28", "throughput": 4246.48, "total_tokens": 10265384} {"current_steps": 15730, "total_steps": 38160, "loss": 0.4782, "lr": 0.0007313609994875024, "epoch": 8.244234800838575, "percentage": 41.22, "elapsed_time": "0:40:18", "remaining_time": "0:57:28", "throughput": 4246.61, "total_tokens": 10268936} {"current_steps": 15735, "total_steps": 38160, "loss": 0.3288, "lr": 0.0007311582446366831, "epoch": 8.24685534591195, "percentage": 41.23, "elapsed_time": "0:40:18", "remaining_time": "0:57:27", "throughput": 4246.51, "total_tokens": 10271304} {"current_steps": 15740, "total_steps": 38160, "loss": 0.6439, "lr": 0.000730955441430196, "epoch": 8.249475890985325, "percentage": 41.25, "elapsed_time": "0:40:19", "remaining_time": "0:57:26", "throughput": 4246.56, "total_tokens": 10274536} {"current_steps": 15745, "total_steps": 38160, "loss": 0.294, "lr": 0.0007307525899104655, "epoch": 8.2520964360587, "percentage": 41.26, "elapsed_time": "0:40:20", "remaining_time": "0:57:25", "throughput": 4246.72, "total_tokens": 10278280} {"current_steps": 15750, "total_steps": 38160, "loss": 0.4055, "lr": 0.0007305496901199259, "epoch": 8.254716981132075, "percentage": 41.27, "elapsed_time": "0:40:20", "remaining_time": "0:57:24", "throughput": 4246.64, "total_tokens": 10280872} {"current_steps": 15755, "total_steps": 38160, "loss": 0.3126, "lr": 0.0007303467421010211, "epoch": 8.25733752620545, "percentage": 41.29, "elapsed_time": "0:40:21", "remaining_time": "0:57:23", "throughput": 4246.82, "total_tokens": 10284680} {"current_steps": 15760, "total_steps": 38160, "loss": 0.5077, "lr": 0.0007301437458962061, "epoch": 8.259958071278826, "percentage": 41.3, "elapsed_time": "0:40:22", "remaining_time": "0:57:23", "throughput": 4246.81, "total_tokens": 10287528} {"current_steps": 15765, "total_steps": 38160, "loss": 0.3121, "lr": 0.0007299407015479448, "epoch": 8.2625786163522, "percentage": 41.31, "elapsed_time": "0:40:23", "remaining_time": "0:57:22", "throughput": 4246.93, "total_tokens": 10291112} {"current_steps": 15770, "total_steps": 38160, "loss": 0.3278, "lr": 0.0007297376090987122, "epoch": 8.265199161425576, "percentage": 41.33, "elapsed_time": "0:40:23", "remaining_time": "0:57:21", "throughput": 4246.97, "total_tokens": 10294248} {"current_steps": 15775, "total_steps": 38160, "loss": 0.5824, "lr": 0.0007295344685909926, "epoch": 8.267819706498951, "percentage": 41.34, "elapsed_time": "0:40:24", "remaining_time": "0:57:20", "throughput": 4246.96, "total_tokens": 10297064} {"current_steps": 15780, "total_steps": 38160, "loss": 0.4577, "lr": 0.000729331280067281, "epoch": 8.270440251572326, "percentage": 41.35, "elapsed_time": "0:40:25", "remaining_time": "0:57:19", "throughput": 4247.17, "total_tokens": 10301000} {"current_steps": 15785, "total_steps": 38160, "loss": 0.4707, "lr": 0.0007291280435700819, "epoch": 8.273060796645701, "percentage": 41.37, "elapsed_time": "0:40:26", "remaining_time": "0:57:18", "throughput": 4247.14, "total_tokens": 10303816} {"current_steps": 15790, "total_steps": 38160, "loss": 0.379, "lr": 0.0007289247591419102, "epoch": 8.275681341719078, "percentage": 41.38, "elapsed_time": "0:40:26", "remaining_time": "0:57:17", "throughput": 4247.08, "total_tokens": 10306440} {"current_steps": 15795, "total_steps": 38160, "loss": 0.5128, "lr": 0.0007287214268252904, "epoch": 8.278301886792454, "percentage": 41.39, "elapsed_time": "0:40:27", "remaining_time": "0:57:17", "throughput": 4247.24, "total_tokens": 10310152} {"current_steps": 15800, "total_steps": 38160, "loss": 0.4132, "lr": 0.0007285180466627577, "epoch": 8.280922431865829, "percentage": 41.4, "elapsed_time": "0:40:28", "remaining_time": "0:57:16", "throughput": 4247.41, "total_tokens": 10313896} {"current_steps": 15805, "total_steps": 38160, "loss": 0.4093, "lr": 0.0007283146186968565, "epoch": 8.283542976939204, "percentage": 41.42, "elapsed_time": "0:40:29", "remaining_time": "0:57:15", "throughput": 4247.53, "total_tokens": 10317320} {"current_steps": 15810, "total_steps": 38160, "loss": 0.3491, "lr": 0.000728111142970142, "epoch": 8.286163522012579, "percentage": 41.43, "elapsed_time": "0:40:29", "remaining_time": "0:57:14", "throughput": 4247.59, "total_tokens": 10320456} {"current_steps": 15815, "total_steps": 38160, "loss": 0.5561, "lr": 0.0007279076195251788, "epoch": 8.288784067085954, "percentage": 41.44, "elapsed_time": "0:40:30", "remaining_time": "0:57:14", "throughput": 4247.93, "total_tokens": 10325224} {"current_steps": 15820, "total_steps": 38160, "loss": 0.4519, "lr": 0.0007277040484045416, "epoch": 8.29140461215933, "percentage": 41.46, "elapsed_time": "0:40:31", "remaining_time": "0:57:13", "throughput": 4247.96, "total_tokens": 10328296} {"current_steps": 15825, "total_steps": 38160, "loss": 0.4569, "lr": 0.0007275004296508154, "epoch": 8.294025157232705, "percentage": 41.47, "elapsed_time": "0:40:32", "remaining_time": "0:57:12", "throughput": 4247.97, "total_tokens": 10331240} {"current_steps": 15830, "total_steps": 38160, "loss": 0.5104, "lr": 0.0007272967633065947, "epoch": 8.29664570230608, "percentage": 41.48, "elapsed_time": "0:40:32", "remaining_time": "0:57:11", "throughput": 4248.1, "total_tokens": 10334824} {"current_steps": 15835, "total_steps": 38160, "loss": 0.4339, "lr": 0.0007270930494144843, "epoch": 8.299266247379455, "percentage": 41.5, "elapsed_time": "0:40:33", "remaining_time": "0:57:11", "throughput": 4248.21, "total_tokens": 10338472} {"current_steps": 15840, "total_steps": 38160, "loss": 0.3763, "lr": 0.0007268892880170988, "epoch": 8.30188679245283, "percentage": 41.51, "elapsed_time": "0:40:34", "remaining_time": "0:57:10", "throughput": 4248.36, "total_tokens": 10342184} {"current_steps": 15845, "total_steps": 38160, "loss": 0.7057, "lr": 0.0007266854791570625, "epoch": 8.304507337526205, "percentage": 41.52, "elapsed_time": "0:40:35", "remaining_time": "0:57:09", "throughput": 4248.37, "total_tokens": 10345128} {"current_steps": 15850, "total_steps": 38160, "loss": 0.5134, "lr": 0.0007264816228770103, "epoch": 8.30712788259958, "percentage": 41.54, "elapsed_time": "0:40:35", "remaining_time": "0:57:08", "throughput": 4248.4, "total_tokens": 10348168} {"current_steps": 15855, "total_steps": 38160, "loss": 0.5348, "lr": 0.0007262777192195866, "epoch": 8.309748427672956, "percentage": 41.55, "elapsed_time": "0:40:36", "remaining_time": "0:57:07", "throughput": 4248.35, "total_tokens": 10350824} {"current_steps": 15860, "total_steps": 38160, "loss": 0.3486, "lr": 0.0007260737682274452, "epoch": 8.31236897274633, "percentage": 41.56, "elapsed_time": "0:40:37", "remaining_time": "0:57:07", "throughput": 4248.68, "total_tokens": 10355464} {"current_steps": 15865, "total_steps": 38160, "loss": 0.4205, "lr": 0.0007258697699432511, "epoch": 8.314989517819706, "percentage": 41.57, "elapsed_time": "0:40:37", "remaining_time": "0:57:06", "throughput": 4248.62, "total_tokens": 10358088} {"current_steps": 15870, "total_steps": 38160, "loss": 0.4048, "lr": 0.0007256657244096775, "epoch": 8.317610062893081, "percentage": 41.59, "elapsed_time": "0:40:38", "remaining_time": "0:57:05", "throughput": 4248.59, "total_tokens": 10360808} {"current_steps": 15875, "total_steps": 38160, "loss": 0.474, "lr": 0.0007254616316694091, "epoch": 8.320230607966456, "percentage": 41.6, "elapsed_time": "0:40:39", "remaining_time": "0:57:04", "throughput": 4248.8, "total_tokens": 10364616} {"current_steps": 15880, "total_steps": 38160, "loss": 0.3674, "lr": 0.0007252574917651398, "epoch": 8.322851153039831, "percentage": 41.61, "elapsed_time": "0:40:40", "remaining_time": "0:57:03", "throughput": 4248.88, "total_tokens": 10368008} {"current_steps": 15885, "total_steps": 38160, "loss": 0.4329, "lr": 0.0007250533047395728, "epoch": 8.325471698113208, "percentage": 41.63, "elapsed_time": "0:40:40", "remaining_time": "0:57:02", "throughput": 4248.93, "total_tokens": 10371144} {"current_steps": 15890, "total_steps": 38160, "loss": 0.4677, "lr": 0.0007248490706354221, "epoch": 8.328092243186584, "percentage": 41.64, "elapsed_time": "0:40:41", "remaining_time": "0:57:02", "throughput": 4249.11, "total_tokens": 10374952} {"current_steps": 15895, "total_steps": 38160, "loss": 0.5339, "lr": 0.0007246447894954109, "epoch": 8.330712788259959, "percentage": 41.65, "elapsed_time": "0:40:42", "remaining_time": "0:57:01", "throughput": 4249.25, "total_tokens": 10378664} {"current_steps": 15900, "total_steps": 38160, "loss": 0.4704, "lr": 0.0007244404613622727, "epoch": 8.333333333333334, "percentage": 41.67, "elapsed_time": "0:40:43", "remaining_time": "0:57:00", "throughput": 4249.36, "total_tokens": 10382216} {"current_steps": 15905, "total_steps": 38160, "loss": 0.4688, "lr": 0.0007242360862787507, "epoch": 8.335953878406709, "percentage": 41.68, "elapsed_time": "0:40:43", "remaining_time": "0:56:59", "throughput": 4249.4, "total_tokens": 10385448} {"current_steps": 15910, "total_steps": 38160, "loss": 0.6443, "lr": 0.0007240316642875975, "epoch": 8.338574423480084, "percentage": 41.69, "elapsed_time": "0:40:44", "remaining_time": "0:56:58", "throughput": 4249.33, "total_tokens": 10388008} {"current_steps": 15915, "total_steps": 38160, "loss": 0.5531, "lr": 0.0007238271954315759, "epoch": 8.34119496855346, "percentage": 41.71, "elapsed_time": "0:40:45", "remaining_time": "0:56:58", "throughput": 4249.6, "total_tokens": 10392328} {"current_steps": 15920, "total_steps": 38160, "loss": 0.3277, "lr": 0.0007236226797534589, "epoch": 8.343815513626835, "percentage": 41.72, "elapsed_time": "0:40:46", "remaining_time": "0:56:57", "throughput": 4249.65, "total_tokens": 10395400} {"current_steps": 15925, "total_steps": 38160, "loss": 0.3593, "lr": 0.0007234181172960283, "epoch": 8.34643605870021, "percentage": 41.73, "elapsed_time": "0:40:46", "remaining_time": "0:56:56", "throughput": 4249.57, "total_tokens": 10397896} {"current_steps": 15930, "total_steps": 38160, "loss": 0.5167, "lr": 0.0007232135081020766, "epoch": 8.349056603773585, "percentage": 41.75, "elapsed_time": "0:40:47", "remaining_time": "0:56:55", "throughput": 4249.61, "total_tokens": 10401032} {"current_steps": 15935, "total_steps": 38160, "loss": 0.4508, "lr": 0.0007230088522144054, "epoch": 8.35167714884696, "percentage": 41.76, "elapsed_time": "0:40:48", "remaining_time": "0:56:54", "throughput": 4249.74, "total_tokens": 10404616} {"current_steps": 15940, "total_steps": 38160, "loss": 0.4143, "lr": 0.0007228041496758265, "epoch": 8.354297693920335, "percentage": 41.77, "elapsed_time": "0:40:48", "remaining_time": "0:56:53", "throughput": 4249.74, "total_tokens": 10407432} {"current_steps": 15945, "total_steps": 38160, "loss": 0.5091, "lr": 0.0007225994005291615, "epoch": 8.35691823899371, "percentage": 41.78, "elapsed_time": "0:40:49", "remaining_time": "0:56:53", "throughput": 4249.97, "total_tokens": 10411560} {"current_steps": 15950, "total_steps": 38160, "loss": 0.5546, "lr": 0.0007223946048172414, "epoch": 8.359538784067086, "percentage": 41.8, "elapsed_time": "0:40:50", "remaining_time": "0:56:52", "throughput": 4249.93, "total_tokens": 10414248} {"current_steps": 15955, "total_steps": 38160, "loss": 0.6098, "lr": 0.0007221897625829072, "epoch": 8.36215932914046, "percentage": 41.81, "elapsed_time": "0:40:51", "remaining_time": "0:56:51", "throughput": 4250.04, "total_tokens": 10417608} {"current_steps": 15960, "total_steps": 38160, "loss": 0.4056, "lr": 0.0007219848738690095, "epoch": 8.364779874213836, "percentage": 41.82, "elapsed_time": "0:40:51", "remaining_time": "0:56:50", "throughput": 4249.92, "total_tokens": 10419912} {"current_steps": 15965, "total_steps": 38160, "loss": 0.4066, "lr": 0.0007217799387184089, "epoch": 8.367400419287211, "percentage": 41.84, "elapsed_time": "0:40:52", "remaining_time": "0:56:49", "throughput": 4249.91, "total_tokens": 10422920} {"current_steps": 15970, "total_steps": 38160, "loss": 0.4588, "lr": 0.0007215749571739752, "epoch": 8.370020964360586, "percentage": 41.85, "elapsed_time": "0:40:53", "remaining_time": "0:56:48", "throughput": 4250.13, "total_tokens": 10426952} {"current_steps": 15975, "total_steps": 38160, "loss": 0.4139, "lr": 0.0007213699292785883, "epoch": 8.372641509433961, "percentage": 41.86, "elapsed_time": "0:40:54", "remaining_time": "0:56:48", "throughput": 4250.25, "total_tokens": 10430568} {"current_steps": 15980, "total_steps": 38160, "loss": 0.4454, "lr": 0.0007211648550751377, "epoch": 8.375262054507338, "percentage": 41.88, "elapsed_time": "0:40:54", "remaining_time": "0:56:47", "throughput": 4250.3, "total_tokens": 10433832} {"current_steps": 15985, "total_steps": 38160, "loss": 0.4467, "lr": 0.0007209597346065226, "epoch": 8.377882599580714, "percentage": 41.89, "elapsed_time": "0:40:55", "remaining_time": "0:56:46", "throughput": 4250.29, "total_tokens": 10436584} {"current_steps": 15990, "total_steps": 38160, "loss": 0.5331, "lr": 0.000720754567915652, "epoch": 8.380503144654089, "percentage": 41.9, "elapsed_time": "0:40:56", "remaining_time": "0:56:45", "throughput": 4250.35, "total_tokens": 10439816} {"current_steps": 15995, "total_steps": 38160, "loss": 0.4603, "lr": 0.000720549355045444, "epoch": 8.383123689727464, "percentage": 41.92, "elapsed_time": "0:40:56", "remaining_time": "0:56:44", "throughput": 4250.38, "total_tokens": 10442920} {"current_steps": 16000, "total_steps": 38160, "loss": 0.3178, "lr": 0.0007203440960388273, "epoch": 8.385744234800839, "percentage": 41.93, "elapsed_time": "0:40:57", "remaining_time": "0:56:43", "throughput": 4250.37, "total_tokens": 10445800} {"current_steps": 16005, "total_steps": 38160, "loss": 0.4725, "lr": 0.0007201387909387396, "epoch": 8.388364779874214, "percentage": 41.94, "elapsed_time": "0:40:58", "remaining_time": "0:56:42", "throughput": 4250.3, "total_tokens": 10448424} {"current_steps": 16010, "total_steps": 38160, "loss": 0.5509, "lr": 0.0007199334397881282, "epoch": 8.39098532494759, "percentage": 41.95, "elapsed_time": "0:40:59", "remaining_time": "0:56:42", "throughput": 4250.47, "total_tokens": 10452104} {"current_steps": 16015, "total_steps": 38160, "loss": 0.5387, "lr": 0.0007197280426299502, "epoch": 8.393605870020965, "percentage": 41.97, "elapsed_time": "0:40:59", "remaining_time": "0:56:41", "throughput": 4250.43, "total_tokens": 10454792} {"current_steps": 16020, "total_steps": 38160, "loss": 0.4741, "lr": 0.0007195225995071727, "epoch": 8.39622641509434, "percentage": 41.98, "elapsed_time": "0:41:00", "remaining_time": "0:56:40", "throughput": 4250.47, "total_tokens": 10457896} {"current_steps": 16025, "total_steps": 38160, "loss": 0.4448, "lr": 0.0007193171104627718, "epoch": 8.398846960167715, "percentage": 41.99, "elapsed_time": "0:41:01", "remaining_time": "0:56:39", "throughput": 4250.58, "total_tokens": 10461416} {"current_steps": 16030, "total_steps": 38160, "loss": 0.4888, "lr": 0.0007191115755397333, "epoch": 8.40146750524109, "percentage": 42.01, "elapsed_time": "0:41:01", "remaining_time": "0:56:38", "throughput": 4250.68, "total_tokens": 10464936} {"current_steps": 16035, "total_steps": 38160, "loss": 0.4346, "lr": 0.0007189059947810531, "epoch": 8.404088050314465, "percentage": 42.02, "elapsed_time": "0:41:02", "remaining_time": "0:56:38", "throughput": 4250.84, "total_tokens": 10468744} {"current_steps": 16040, "total_steps": 38160, "loss": 0.4692, "lr": 0.0007187003682297363, "epoch": 8.40670859538784, "percentage": 42.03, "elapsed_time": "0:41:03", "remaining_time": "0:56:37", "throughput": 4250.82, "total_tokens": 10471528} {"current_steps": 16045, "total_steps": 38160, "loss": 0.4902, "lr": 0.0007184946959287972, "epoch": 8.409329140461216, "percentage": 42.05, "elapsed_time": "0:41:04", "remaining_time": "0:56:36", "throughput": 4250.8, "total_tokens": 10474344} {"current_steps": 16050, "total_steps": 38160, "loss": 0.4365, "lr": 0.0007182889779212609, "epoch": 8.41194968553459, "percentage": 42.06, "elapsed_time": "0:41:04", "remaining_time": "0:56:35", "throughput": 4250.8, "total_tokens": 10477256} {"current_steps": 16055, "total_steps": 38160, "loss": 0.6122, "lr": 0.0007180832142501605, "epoch": 8.414570230607966, "percentage": 42.07, "elapsed_time": "0:41:05", "remaining_time": "0:56:34", "throughput": 4250.8, "total_tokens": 10480104} {"current_steps": 16060, "total_steps": 38160, "loss": 0.4917, "lr": 0.0007178774049585397, "epoch": 8.417190775681341, "percentage": 42.09, "elapsed_time": "0:41:06", "remaining_time": "0:56:33", "throughput": 4251.09, "total_tokens": 10484680} {"current_steps": 16065, "total_steps": 38160, "loss": 0.3988, "lr": 0.0007176715500894515, "epoch": 8.419811320754716, "percentage": 42.1, "elapsed_time": "0:41:07", "remaining_time": "0:56:33", "throughput": 4251.16, "total_tokens": 10488008} {"current_steps": 16070, "total_steps": 38160, "loss": 0.392, "lr": 0.0007174656496859584, "epoch": 8.422431865828091, "percentage": 42.11, "elapsed_time": "0:41:07", "remaining_time": "0:56:32", "throughput": 4251.14, "total_tokens": 10490792} {"current_steps": 16075, "total_steps": 38160, "loss": 0.45, "lr": 0.0007172597037911323, "epoch": 8.425052410901468, "percentage": 42.13, "elapsed_time": "0:41:08", "remaining_time": "0:56:31", "throughput": 4251.6, "total_tokens": 10496200} {"current_steps": 16080, "total_steps": 38160, "loss": 0.4253, "lr": 0.0007170537124480548, "epoch": 8.427672955974844, "percentage": 42.14, "elapsed_time": "0:41:09", "remaining_time": "0:56:30", "throughput": 4251.47, "total_tokens": 10498472} {"current_steps": 16085, "total_steps": 38160, "loss": 0.4889, "lr": 0.0007168476756998169, "epoch": 8.430293501048219, "percentage": 42.15, "elapsed_time": "0:41:10", "remaining_time": "0:56:29", "throughput": 4251.42, "total_tokens": 10501064} {"current_steps": 16090, "total_steps": 38160, "loss": 0.5078, "lr": 0.0007166415935895194, "epoch": 8.432914046121594, "percentage": 42.16, "elapsed_time": "0:41:10", "remaining_time": "0:56:29", "throughput": 4251.54, "total_tokens": 10504616} {"current_steps": 16095, "total_steps": 38160, "loss": 0.5802, "lr": 0.0007164354661602718, "epoch": 8.435534591194969, "percentage": 42.18, "elapsed_time": "0:41:11", "remaining_time": "0:56:28", "throughput": 4251.4, "total_tokens": 10506792} {"current_steps": 16100, "total_steps": 38160, "loss": 0.3515, "lr": 0.000716229293455194, "epoch": 8.438155136268344, "percentage": 42.19, "elapsed_time": "0:41:12", "remaining_time": "0:56:27", "throughput": 4251.34, "total_tokens": 10509384} {"current_steps": 16105, "total_steps": 38160, "loss": 0.4128, "lr": 0.000716023075517415, "epoch": 8.44077568134172, "percentage": 42.2, "elapsed_time": "0:41:12", "remaining_time": "0:56:26", "throughput": 4251.35, "total_tokens": 10512328} {"current_steps": 16110, "total_steps": 38160, "loss": 0.5808, "lr": 0.000715816812390073, "epoch": 8.443396226415095, "percentage": 42.22, "elapsed_time": "0:41:13", "remaining_time": "0:56:25", "throughput": 4251.51, "total_tokens": 10516136} {"current_steps": 16115, "total_steps": 38160, "loss": 0.5335, "lr": 0.0007156105041163161, "epoch": 8.44601677148847, "percentage": 42.23, "elapsed_time": "0:41:14", "remaining_time": "0:56:24", "throughput": 4251.7, "total_tokens": 10520040} {"current_steps": 16120, "total_steps": 38160, "loss": 0.5671, "lr": 0.0007154041507393015, "epoch": 8.448637316561845, "percentage": 42.24, "elapsed_time": "0:41:15", "remaining_time": "0:56:23", "throughput": 4251.74, "total_tokens": 10523144} {"current_steps": 16125, "total_steps": 38160, "loss": 0.4421, "lr": 0.000715197752302196, "epoch": 8.45125786163522, "percentage": 42.26, "elapsed_time": "0:41:15", "remaining_time": "0:56:23", "throughput": 4251.84, "total_tokens": 10526600} {"current_steps": 16130, "total_steps": 38160, "loss": 0.5237, "lr": 0.0007149913088481759, "epoch": 8.453878406708595, "percentage": 42.27, "elapsed_time": "0:41:16", "remaining_time": "0:56:22", "throughput": 4252.21, "total_tokens": 10531560} {"current_steps": 16135, "total_steps": 38160, "loss": 0.4237, "lr": 0.0007147848204204266, "epoch": 8.45649895178197, "percentage": 42.28, "elapsed_time": "0:41:17", "remaining_time": "0:56:21", "throughput": 4252.43, "total_tokens": 10535592} {"current_steps": 16140, "total_steps": 38160, "loss": 0.4198, "lr": 0.0007145782870621435, "epoch": 8.459119496855346, "percentage": 42.3, "elapsed_time": "0:41:18", "remaining_time": "0:56:20", "throughput": 4252.33, "total_tokens": 10537992} {"current_steps": 16145, "total_steps": 38160, "loss": 0.4349, "lr": 0.0007143717088165304, "epoch": 8.46174004192872, "percentage": 42.31, "elapsed_time": "0:41:19", "remaining_time": "0:56:20", "throughput": 4252.54, "total_tokens": 10542152} {"current_steps": 16150, "total_steps": 38160, "loss": 0.4189, "lr": 0.0007141650857268019, "epoch": 8.464360587002096, "percentage": 42.32, "elapsed_time": "0:41:19", "remaining_time": "0:56:19", "throughput": 4252.53, "total_tokens": 10545064} {"current_steps": 16155, "total_steps": 38160, "loss": 0.5031, "lr": 0.0007139584178361807, "epoch": 8.466981132075471, "percentage": 42.33, "elapsed_time": "0:41:20", "remaining_time": "0:56:18", "throughput": 4252.55, "total_tokens": 10548008} {"current_steps": 16160, "total_steps": 38160, "loss": 0.5159, "lr": 0.0007137517051878994, "epoch": 8.469601677148846, "percentage": 42.35, "elapsed_time": "0:41:21", "remaining_time": "0:56:17", "throughput": 4252.56, "total_tokens": 10551048} {"current_steps": 16165, "total_steps": 38160, "loss": 0.4605, "lr": 0.0007135449478251998, "epoch": 8.472222222222221, "percentage": 42.36, "elapsed_time": "0:41:21", "remaining_time": "0:56:16", "throughput": 4252.64, "total_tokens": 10554312} {"current_steps": 16170, "total_steps": 38160, "loss": 0.4649, "lr": 0.0007133381457913336, "epoch": 8.474842767295598, "percentage": 42.37, "elapsed_time": "0:41:22", "remaining_time": "0:56:15", "throughput": 4252.56, "total_tokens": 10556840} {"current_steps": 16175, "total_steps": 38160, "loss": 0.4221, "lr": 0.0007131312991295611, "epoch": 8.477463312368974, "percentage": 42.39, "elapsed_time": "0:41:23", "remaining_time": "0:56:15", "throughput": 4252.98, "total_tokens": 10562376} {"current_steps": 16180, "total_steps": 38160, "loss": 0.4798, "lr": 0.0007129244078831525, "epoch": 8.480083857442349, "percentage": 42.4, "elapsed_time": "0:41:24", "remaining_time": "0:56:14", "throughput": 4252.89, "total_tokens": 10564776} {"current_steps": 16185, "total_steps": 38160, "loss": 0.4264, "lr": 0.0007127174720953866, "epoch": 8.482704402515724, "percentage": 42.41, "elapsed_time": "0:41:24", "remaining_time": "0:56:13", "throughput": 4252.94, "total_tokens": 10567944} {"current_steps": 16190, "total_steps": 38160, "loss": 0.3159, "lr": 0.0007125104918095526, "epoch": 8.485324947589099, "percentage": 42.43, "elapsed_time": "0:41:25", "remaining_time": "0:56:12", "throughput": 4252.95, "total_tokens": 10570952} {"current_steps": 16195, "total_steps": 38160, "loss": 0.2921, "lr": 0.0007123034670689483, "epoch": 8.487945492662474, "percentage": 42.44, "elapsed_time": "0:41:26", "remaining_time": "0:56:11", "throughput": 4252.89, "total_tokens": 10573544} {"current_steps": 16200, "total_steps": 38160, "loss": 0.3643, "lr": 0.0007120963979168804, "epoch": 8.49056603773585, "percentage": 42.45, "elapsed_time": "0:41:27", "remaining_time": "0:56:11", "throughput": 4253.38, "total_tokens": 10579112} {"current_steps": 16205, "total_steps": 38160, "loss": 0.3262, "lr": 0.000711889284396666, "epoch": 8.493186582809225, "percentage": 42.47, "elapsed_time": "0:41:28", "remaining_time": "0:56:10", "throughput": 4253.58, "total_tokens": 10583080} {"current_steps": 16210, "total_steps": 38160, "loss": 0.3927, "lr": 0.0007116821265516307, "epoch": 8.4958071278826, "percentage": 42.48, "elapsed_time": "0:41:28", "remaining_time": "0:56:09", "throughput": 4253.57, "total_tokens": 10585960} {"current_steps": 16215, "total_steps": 38160, "loss": 0.3923, "lr": 0.0007114749244251094, "epoch": 8.498427672955975, "percentage": 42.49, "elapsed_time": "0:41:29", "remaining_time": "0:56:09", "throughput": 4253.53, "total_tokens": 10588584} {"current_steps": 16220, "total_steps": 38160, "loss": 0.3193, "lr": 0.0007112676780604468, "epoch": 8.50104821802935, "percentage": 42.51, "elapsed_time": "0:41:30", "remaining_time": "0:56:08", "throughput": 4253.57, "total_tokens": 10591720} {"current_steps": 16225, "total_steps": 38160, "loss": 0.4303, "lr": 0.000711060387500996, "epoch": 8.503668763102725, "percentage": 42.52, "elapsed_time": "0:41:30", "remaining_time": "0:56:07", "throughput": 4253.61, "total_tokens": 10594760} {"current_steps": 16230, "total_steps": 38160, "loss": 0.4872, "lr": 0.0007108530527901199, "epoch": 8.5062893081761, "percentage": 42.53, "elapsed_time": "0:41:31", "remaining_time": "0:56:06", "throughput": 4253.77, "total_tokens": 10598600} {"current_steps": 16235, "total_steps": 38160, "loss": 0.3659, "lr": 0.000710645673971191, "epoch": 8.508909853249476, "percentage": 42.54, "elapsed_time": "0:41:32", "remaining_time": "0:56:05", "throughput": 4253.84, "total_tokens": 10601864} {"current_steps": 16240, "total_steps": 38160, "loss": 0.3944, "lr": 0.00071043825108759, "epoch": 8.51153039832285, "percentage": 42.56, "elapsed_time": "0:41:32", "remaining_time": "0:56:04", "throughput": 4253.79, "total_tokens": 10604488} {"current_steps": 16245, "total_steps": 38160, "loss": 0.4488, "lr": 0.0007102307841827079, "epoch": 8.514150943396226, "percentage": 42.57, "elapsed_time": "0:41:33", "remaining_time": "0:56:03", "throughput": 4253.78, "total_tokens": 10607400} {"current_steps": 16250, "total_steps": 38160, "loss": 0.4575, "lr": 0.0007100232732999443, "epoch": 8.516771488469601, "percentage": 42.58, "elapsed_time": "0:41:34", "remaining_time": "0:56:03", "throughput": 4253.75, "total_tokens": 10610184} {"current_steps": 16255, "total_steps": 38160, "loss": 0.4986, "lr": 0.0007098157184827076, "epoch": 8.519392033542976, "percentage": 42.6, "elapsed_time": "0:41:34", "remaining_time": "0:56:02", "throughput": 4253.75, "total_tokens": 10613096} {"current_steps": 16260, "total_steps": 38160, "loss": 0.3648, "lr": 0.0007096081197744166, "epoch": 8.522012578616351, "percentage": 42.61, "elapsed_time": "0:41:35", "remaining_time": "0:56:01", "throughput": 4253.9, "total_tokens": 10616872} {"current_steps": 16265, "total_steps": 38160, "loss": 0.426, "lr": 0.0007094004772184981, "epoch": 8.524633123689728, "percentage": 42.62, "elapsed_time": "0:41:36", "remaining_time": "0:56:00", "throughput": 4253.95, "total_tokens": 10620104} {"current_steps": 16270, "total_steps": 38160, "loss": 0.3524, "lr": 0.0007091927908583889, "epoch": 8.527253668763104, "percentage": 42.64, "elapsed_time": "0:41:37", "remaining_time": "0:55:59", "throughput": 4254.02, "total_tokens": 10623400} {"current_steps": 16275, "total_steps": 38160, "loss": 0.4523, "lr": 0.0007089850607375343, "epoch": 8.529874213836479, "percentage": 42.65, "elapsed_time": "0:41:37", "remaining_time": "0:55:58", "throughput": 4254.02, "total_tokens": 10626344} {"current_steps": 16280, "total_steps": 38160, "loss": 0.5826, "lr": 0.0007087772868993894, "epoch": 8.532494758909854, "percentage": 42.66, "elapsed_time": "0:41:38", "remaining_time": "0:55:58", "throughput": 4254.03, "total_tokens": 10629256} {"current_steps": 16285, "total_steps": 38160, "loss": 0.5367, "lr": 0.0007085694693874178, "epoch": 8.535115303983229, "percentage": 42.68, "elapsed_time": "0:41:39", "remaining_time": "0:55:57", "throughput": 4253.93, "total_tokens": 10631624} {"current_steps": 16290, "total_steps": 38160, "loss": 0.5173, "lr": 0.0007083616082450928, "epoch": 8.537735849056604, "percentage": 42.69, "elapsed_time": "0:41:39", "remaining_time": "0:55:56", "throughput": 4253.79, "total_tokens": 10633928} {"current_steps": 16295, "total_steps": 38160, "loss": 0.5625, "lr": 0.0007081537035158962, "epoch": 8.54035639412998, "percentage": 42.7, "elapsed_time": "0:41:40", "remaining_time": "0:55:55", "throughput": 4253.99, "total_tokens": 10637800} {"current_steps": 16300, "total_steps": 38160, "loss": 0.4415, "lr": 0.0007079457552433198, "epoch": 8.542976939203355, "percentage": 42.71, "elapsed_time": "0:41:41", "remaining_time": "0:55:54", "throughput": 4254.05, "total_tokens": 10641096} {"current_steps": 16305, "total_steps": 38160, "loss": 0.4719, "lr": 0.0007077377634708637, "epoch": 8.54559748427673, "percentage": 42.73, "elapsed_time": "0:41:42", "remaining_time": "0:55:53", "throughput": 4254.03, "total_tokens": 10643848} {"current_steps": 16310, "total_steps": 38160, "loss": 0.423, "lr": 0.0007075297282420375, "epoch": 8.548218029350105, "percentage": 42.74, "elapsed_time": "0:41:42", "remaining_time": "0:55:52", "throughput": 4253.96, "total_tokens": 10646408} {"current_steps": 16315, "total_steps": 38160, "loss": 0.5563, "lr": 0.0007073216496003598, "epoch": 8.55083857442348, "percentage": 42.75, "elapsed_time": "0:41:43", "remaining_time": "0:55:52", "throughput": 4254.1, "total_tokens": 10650056} {"current_steps": 16320, "total_steps": 38160, "loss": 0.4976, "lr": 0.0007071135275893584, "epoch": 8.553459119496855, "percentage": 42.77, "elapsed_time": "0:41:44", "remaining_time": "0:55:51", "throughput": 4254.17, "total_tokens": 10653384} {"current_steps": 16325, "total_steps": 38160, "loss": 0.5123, "lr": 0.0007069053622525696, "epoch": 8.55607966457023, "percentage": 42.78, "elapsed_time": "0:41:44", "remaining_time": "0:55:50", "throughput": 4254.28, "total_tokens": 10656936} {"current_steps": 16330, "total_steps": 38160, "loss": 0.3755, "lr": 0.0007066971536335395, "epoch": 8.558700209643606, "percentage": 42.79, "elapsed_time": "0:41:45", "remaining_time": "0:55:49", "throughput": 4254.19, "total_tokens": 10659400} {"current_steps": 16335, "total_steps": 38160, "loss": 0.4376, "lr": 0.0007064889017758234, "epoch": 8.56132075471698, "percentage": 42.81, "elapsed_time": "0:41:46", "remaining_time": "0:55:48", "throughput": 4254.22, "total_tokens": 10662376} {"current_steps": 16340, "total_steps": 38160, "loss": 0.4062, "lr": 0.0007062806067229845, "epoch": 8.563941299790356, "percentage": 42.82, "elapsed_time": "0:41:46", "remaining_time": "0:55:47", "throughput": 4254.21, "total_tokens": 10665288} {"current_steps": 16345, "total_steps": 38160, "loss": 0.4501, "lr": 0.0007060722685185961, "epoch": 8.566561844863731, "percentage": 42.83, "elapsed_time": "0:41:47", "remaining_time": "0:55:47", "throughput": 4254.62, "total_tokens": 10670280} {"current_steps": 16350, "total_steps": 38160, "loss": 0.3068, "lr": 0.00070586388720624, "epoch": 8.569182389937106, "percentage": 42.85, "elapsed_time": "0:41:48", "remaining_time": "0:55:46", "throughput": 4254.55, "total_tokens": 10672872} {"current_steps": 16355, "total_steps": 38160, "loss": 0.4667, "lr": 0.0007056554628295076, "epoch": 8.571802935010481, "percentage": 42.86, "elapsed_time": "0:41:49", "remaining_time": "0:55:45", "throughput": 4254.64, "total_tokens": 10676232} {"current_steps": 16360, "total_steps": 38160, "loss": 0.5032, "lr": 0.0007054469954319984, "epoch": 8.574423480083858, "percentage": 42.87, "elapsed_time": "0:41:50", "remaining_time": "0:55:44", "throughput": 4254.68, "total_tokens": 10679336} {"current_steps": 16365, "total_steps": 38160, "loss": 0.3939, "lr": 0.0007052384850573217, "epoch": 8.577044025157234, "percentage": 42.89, "elapsed_time": "0:41:50", "remaining_time": "0:55:43", "throughput": 4254.63, "total_tokens": 10682024} {"current_steps": 16370, "total_steps": 38160, "loss": 0.4376, "lr": 0.0007050299317490952, "epoch": 8.579664570230609, "percentage": 42.9, "elapsed_time": "0:41:51", "remaining_time": "0:55:42", "throughput": 4254.76, "total_tokens": 10685608} {"current_steps": 16375, "total_steps": 38160, "loss": 0.3681, "lr": 0.0007048213355509463, "epoch": 8.582285115303984, "percentage": 42.91, "elapsed_time": "0:41:52", "remaining_time": "0:55:42", "throughput": 4254.8, "total_tokens": 10688744} {"current_steps": 16380, "total_steps": 38160, "loss": 0.4193, "lr": 0.0007046126965065107, "epoch": 8.584905660377359, "percentage": 42.92, "elapsed_time": "0:41:52", "remaining_time": "0:55:41", "throughput": 4254.88, "total_tokens": 10692104} {"current_steps": 16385, "total_steps": 38160, "loss": 0.4808, "lr": 0.0007044040146594332, "epoch": 8.587526205450734, "percentage": 42.94, "elapsed_time": "0:41:53", "remaining_time": "0:55:40", "throughput": 4254.97, "total_tokens": 10695400} {"current_steps": 16390, "total_steps": 38160, "loss": 0.3634, "lr": 0.0007041952900533681, "epoch": 8.59014675052411, "percentage": 42.95, "elapsed_time": "0:41:54", "remaining_time": "0:55:39", "throughput": 4255.03, "total_tokens": 10698632} {"current_steps": 16395, "total_steps": 38160, "loss": 0.4988, "lr": 0.0007039865227319777, "epoch": 8.592767295597485, "percentage": 42.96, "elapsed_time": "0:41:55", "remaining_time": "0:55:38", "throughput": 4255.04, "total_tokens": 10701672} {"current_steps": 16400, "total_steps": 38160, "loss": 0.4518, "lr": 0.0007037777127389339, "epoch": 8.59538784067086, "percentage": 42.98, "elapsed_time": "0:41:55", "remaining_time": "0:55:38", "throughput": 4255.11, "total_tokens": 10704936} {"current_steps": 16405, "total_steps": 38160, "loss": 0.6561, "lr": 0.0007035688601179177, "epoch": 8.598008385744235, "percentage": 42.99, "elapsed_time": "0:41:56", "remaining_time": "0:55:37", "throughput": 4255.09, "total_tokens": 10707720} {"current_steps": 16410, "total_steps": 38160, "loss": 0.6468, "lr": 0.000703359964912618, "epoch": 8.60062893081761, "percentage": 43.0, "elapsed_time": "0:41:57", "remaining_time": "0:55:36", "throughput": 4255.06, "total_tokens": 10710440} {"current_steps": 16415, "total_steps": 38160, "loss": 0.4958, "lr": 0.000703151027166734, "epoch": 8.603249475890985, "percentage": 43.02, "elapsed_time": "0:41:57", "remaining_time": "0:55:35", "throughput": 4255.16, "total_tokens": 10713896} {"current_steps": 16420, "total_steps": 38160, "loss": 0.4112, "lr": 0.0007029420469239726, "epoch": 8.60587002096436, "percentage": 43.03, "elapsed_time": "0:41:58", "remaining_time": "0:55:34", "throughput": 4255.22, "total_tokens": 10717032} {"current_steps": 16425, "total_steps": 38160, "loss": 0.4158, "lr": 0.0007027330242280503, "epoch": 8.608490566037736, "percentage": 43.04, "elapsed_time": "0:41:59", "remaining_time": "0:55:33", "throughput": 4255.2, "total_tokens": 10719784} {"current_steps": 16430, "total_steps": 38160, "loss": 0.4991, "lr": 0.0007025239591226923, "epoch": 8.61111111111111, "percentage": 43.06, "elapsed_time": "0:41:59", "remaining_time": "0:55:32", "throughput": 4255.1, "total_tokens": 10722216} {"current_steps": 16435, "total_steps": 38160, "loss": 0.4704, "lr": 0.0007023148516516326, "epoch": 8.613731656184486, "percentage": 43.07, "elapsed_time": "0:42:00", "remaining_time": "0:55:31", "throughput": 4255.1, "total_tokens": 10725160} {"current_steps": 16440, "total_steps": 38160, "loss": 0.4313, "lr": 0.0007021057018586139, "epoch": 8.616352201257861, "percentage": 43.08, "elapsed_time": "0:42:01", "remaining_time": "0:55:30", "throughput": 4255.1, "total_tokens": 10728136} {"current_steps": 16445, "total_steps": 38160, "loss": 0.4124, "lr": 0.0007018965097873883, "epoch": 8.618972746331236, "percentage": 43.09, "elapsed_time": "0:42:01", "remaining_time": "0:55:30", "throughput": 4255.05, "total_tokens": 10730920} {"current_steps": 16450, "total_steps": 38160, "loss": 0.5328, "lr": 0.0007016872754817161, "epoch": 8.621593291404611, "percentage": 43.11, "elapsed_time": "0:42:02", "remaining_time": "0:55:29", "throughput": 4255.05, "total_tokens": 10733896} {"current_steps": 16455, "total_steps": 38160, "loss": 0.5628, "lr": 0.0007014779989853668, "epoch": 8.624213836477988, "percentage": 43.12, "elapsed_time": "0:42:03", "remaining_time": "0:55:28", "throughput": 4255.01, "total_tokens": 10736616} {"current_steps": 16460, "total_steps": 38160, "loss": 0.3811, "lr": 0.0007012686803421189, "epoch": 8.626834381551364, "percentage": 43.13, "elapsed_time": "0:42:03", "remaining_time": "0:55:27", "throughput": 4255.01, "total_tokens": 10739560} {"current_steps": 16465, "total_steps": 38160, "loss": 0.437, "lr": 0.000701059319595759, "epoch": 8.629454926624739, "percentage": 43.15, "elapsed_time": "0:42:04", "remaining_time": "0:55:26", "throughput": 4255.01, "total_tokens": 10742472} {"current_steps": 16470, "total_steps": 38160, "loss": 0.5292, "lr": 0.0007008499167900833, "epoch": 8.632075471698114, "percentage": 43.16, "elapsed_time": "0:42:05", "remaining_time": "0:55:25", "throughput": 4255.16, "total_tokens": 10746120} {"current_steps": 16475, "total_steps": 38160, "loss": 0.4213, "lr": 0.0007006404719688966, "epoch": 8.634696016771489, "percentage": 43.17, "elapsed_time": "0:42:06", "remaining_time": "0:55:25", "throughput": 4255.25, "total_tokens": 10749608} {"current_steps": 16480, "total_steps": 38160, "loss": 0.6415, "lr": 0.000700430985176012, "epoch": 8.637316561844864, "percentage": 43.19, "elapsed_time": "0:42:07", "remaining_time": "0:55:24", "throughput": 4255.43, "total_tokens": 10753544} {"current_steps": 16485, "total_steps": 38160, "loss": 0.4962, "lr": 0.0007002214564552521, "epoch": 8.63993710691824, "percentage": 43.2, "elapsed_time": "0:42:07", "remaining_time": "0:55:23", "throughput": 4255.49, "total_tokens": 10756744} {"current_steps": 16490, "total_steps": 38160, "loss": 0.3003, "lr": 0.0007000118858504476, "epoch": 8.642557651991615, "percentage": 43.21, "elapsed_time": "0:42:08", "remaining_time": "0:55:22", "throughput": 4255.64, "total_tokens": 10760424} {"current_steps": 16495, "total_steps": 38160, "loss": 0.4722, "lr": 0.0006998022734054386, "epoch": 8.64517819706499, "percentage": 43.23, "elapsed_time": "0:42:09", "remaining_time": "0:55:21", "throughput": 4255.66, "total_tokens": 10763432} {"current_steps": 16500, "total_steps": 38160, "loss": 0.4912, "lr": 0.0006995926191640734, "epoch": 8.647798742138365, "percentage": 43.24, "elapsed_time": "0:42:09", "remaining_time": "0:55:21", "throughput": 4255.74, "total_tokens": 10766792} {"current_steps": 16505, "total_steps": 38160, "loss": 0.3889, "lr": 0.0006993829231702092, "epoch": 8.65041928721174, "percentage": 43.25, "elapsed_time": "0:42:10", "remaining_time": "0:55:20", "throughput": 4255.95, "total_tokens": 10770888} {"current_steps": 16510, "total_steps": 38160, "loss": 0.3888, "lr": 0.0006991731854677124, "epoch": 8.653039832285115, "percentage": 43.27, "elapsed_time": "0:42:11", "remaining_time": "0:55:19", "throughput": 4256.23, "total_tokens": 10775432} {"current_steps": 16515, "total_steps": 38160, "loss": 0.6009, "lr": 0.0006989634061004572, "epoch": 8.65566037735849, "percentage": 43.28, "elapsed_time": "0:42:12", "remaining_time": "0:55:18", "throughput": 4256.08, "total_tokens": 10777544} {"current_steps": 16520, "total_steps": 38160, "loss": 0.4929, "lr": 0.0006987535851123276, "epoch": 8.658280922431866, "percentage": 43.29, "elapsed_time": "0:42:13", "remaining_time": "0:55:18", "throughput": 4256.15, "total_tokens": 10780840} {"current_steps": 16525, "total_steps": 38160, "loss": 0.4366, "lr": 0.0006985437225472155, "epoch": 8.66090146750524, "percentage": 43.3, "elapsed_time": "0:42:14", "remaining_time": "0:55:17", "throughput": 4256.57, "total_tokens": 10786216} {"current_steps": 16530, "total_steps": 38160, "loss": 0.3113, "lr": 0.0006983338184490215, "epoch": 8.663522012578616, "percentage": 43.32, "elapsed_time": "0:42:14", "remaining_time": "0:55:16", "throughput": 4256.58, "total_tokens": 10789160} {"current_steps": 16535, "total_steps": 38160, "loss": 0.4066, "lr": 0.0006981238728616557, "epoch": 8.666142557651991, "percentage": 43.33, "elapsed_time": "0:42:15", "remaining_time": "0:55:16", "throughput": 4256.75, "total_tokens": 10793032} {"current_steps": 16540, "total_steps": 38160, "loss": 0.495, "lr": 0.0006979138858290358, "epoch": 8.668763102725366, "percentage": 43.34, "elapsed_time": "0:42:16", "remaining_time": "0:55:15", "throughput": 4256.77, "total_tokens": 10796008} {"current_steps": 16545, "total_steps": 38160, "loss": 0.4271, "lr": 0.0006977038573950889, "epoch": 8.671383647798741, "percentage": 43.36, "elapsed_time": "0:42:16", "remaining_time": "0:55:14", "throughput": 4256.79, "total_tokens": 10799016} {"current_steps": 16550, "total_steps": 38160, "loss": 0.6033, "lr": 0.0006974937876037508, "epoch": 8.674004192872118, "percentage": 43.37, "elapsed_time": "0:42:17", "remaining_time": "0:55:13", "throughput": 4256.8, "total_tokens": 10802120} {"current_steps": 16555, "total_steps": 38160, "loss": 0.4006, "lr": 0.0006972836764989652, "epoch": 8.676624737945493, "percentage": 43.38, "elapsed_time": "0:42:18", "remaining_time": "0:55:12", "throughput": 4256.93, "total_tokens": 10805832} {"current_steps": 16560, "total_steps": 38160, "loss": 0.3993, "lr": 0.0006970735241246853, "epoch": 8.679245283018869, "percentage": 43.4, "elapsed_time": "0:42:19", "remaining_time": "0:55:11", "throughput": 4256.95, "total_tokens": 10808744} {"current_steps": 16565, "total_steps": 38160, "loss": 0.3901, "lr": 0.0006968633305248724, "epoch": 8.681865828092244, "percentage": 43.41, "elapsed_time": "0:42:19", "remaining_time": "0:55:11", "throughput": 4257.01, "total_tokens": 10812072} {"current_steps": 16570, "total_steps": 38160, "loss": 0.6024, "lr": 0.0006966530957434968, "epoch": 8.684486373165619, "percentage": 43.42, "elapsed_time": "0:42:20", "remaining_time": "0:55:10", "throughput": 4256.9, "total_tokens": 10814440} {"current_steps": 16575, "total_steps": 38160, "loss": 0.462, "lr": 0.0006964428198245372, "epoch": 8.687106918238994, "percentage": 43.44, "elapsed_time": "0:42:21", "remaining_time": "0:55:09", "throughput": 4256.86, "total_tokens": 10817192} {"current_steps": 16580, "total_steps": 38160, "loss": 0.3784, "lr": 0.0006962325028119806, "epoch": 8.68972746331237, "percentage": 43.45, "elapsed_time": "0:42:21", "remaining_time": "0:55:08", "throughput": 4256.8, "total_tokens": 10819720} {"current_steps": 16585, "total_steps": 38160, "loss": 0.4141, "lr": 0.0006960221447498232, "epoch": 8.692348008385745, "percentage": 43.46, "elapsed_time": "0:42:22", "remaining_time": "0:55:07", "throughput": 4256.81, "total_tokens": 10822600} {"current_steps": 16590, "total_steps": 38160, "loss": 0.3727, "lr": 0.0006958117456820696, "epoch": 8.69496855345912, "percentage": 43.47, "elapsed_time": "0:42:23", "remaining_time": "0:55:06", "throughput": 4256.82, "total_tokens": 10825640} {"current_steps": 16595, "total_steps": 38160, "loss": 0.468, "lr": 0.0006956013056527326, "epoch": 8.697589098532495, "percentage": 43.49, "elapsed_time": "0:42:24", "remaining_time": "0:55:06", "throughput": 4257.46, "total_tokens": 10832648} {"current_steps": 16600, "total_steps": 38160, "loss": 0.4285, "lr": 0.0006953908247058341, "epoch": 8.70020964360587, "percentage": 43.5, "elapsed_time": "0:42:25", "remaining_time": "0:55:05", "throughput": 4257.49, "total_tokens": 10835816} {"current_steps": 16605, "total_steps": 38160, "loss": 0.5071, "lr": 0.0006951803028854041, "epoch": 8.702830188679245, "percentage": 43.51, "elapsed_time": "0:42:25", "remaining_time": "0:55:04", "throughput": 4257.65, "total_tokens": 10839496} {"current_steps": 16610, "total_steps": 38160, "loss": 0.4937, "lr": 0.0006949697402354816, "epoch": 8.70545073375262, "percentage": 43.53, "elapsed_time": "0:42:26", "remaining_time": "0:55:04", "throughput": 4257.84, "total_tokens": 10843432} {"current_steps": 16615, "total_steps": 38160, "loss": 0.3695, "lr": 0.0006947591368001138, "epoch": 8.708071278825996, "percentage": 43.54, "elapsed_time": "0:42:27", "remaining_time": "0:55:03", "throughput": 4257.8, "total_tokens": 10846152} {"current_steps": 16620, "total_steps": 38160, "loss": 0.4312, "lr": 0.0006945484926233563, "epoch": 8.71069182389937, "percentage": 43.55, "elapsed_time": "0:42:28", "remaining_time": "0:55:02", "throughput": 4257.97, "total_tokens": 10849896} {"current_steps": 16625, "total_steps": 38160, "loss": 0.4668, "lr": 0.0006943378077492737, "epoch": 8.713312368972746, "percentage": 43.57, "elapsed_time": "0:42:28", "remaining_time": "0:55:01", "throughput": 4258.0, "total_tokens": 10852904} {"current_steps": 16630, "total_steps": 38160, "loss": 0.4817, "lr": 0.000694127082221939, "epoch": 8.715932914046121, "percentage": 43.58, "elapsed_time": "0:42:29", "remaining_time": "0:55:00", "throughput": 4257.96, "total_tokens": 10855624} {"current_steps": 16635, "total_steps": 38160, "loss": 0.4121, "lr": 0.0006939163160854334, "epoch": 8.718553459119496, "percentage": 43.59, "elapsed_time": "0:42:30", "remaining_time": "0:54:59", "throughput": 4258.11, "total_tokens": 10859432} {"current_steps": 16640, "total_steps": 38160, "loss": 0.3515, "lr": 0.0006937055093838467, "epoch": 8.721174004192871, "percentage": 43.61, "elapsed_time": "0:42:30", "remaining_time": "0:54:59", "throughput": 4258.15, "total_tokens": 10862472} {"current_steps": 16645, "total_steps": 38160, "loss": 0.4401, "lr": 0.0006934946621612774, "epoch": 8.723794549266248, "percentage": 43.62, "elapsed_time": "0:42:31", "remaining_time": "0:54:58", "throughput": 4258.1, "total_tokens": 10865128} {"current_steps": 16650, "total_steps": 38160, "loss": 0.5261, "lr": 0.0006932837744618322, "epoch": 8.726415094339622, "percentage": 43.63, "elapsed_time": "0:42:32", "remaining_time": "0:54:57", "throughput": 4258.17, "total_tokens": 10868520} {"current_steps": 16655, "total_steps": 38160, "loss": 0.5376, "lr": 0.0006930728463296265, "epoch": 8.729035639412999, "percentage": 43.65, "elapsed_time": "0:42:33", "remaining_time": "0:54:56", "throughput": 4258.3, "total_tokens": 10872232} {"current_steps": 16660, "total_steps": 38160, "loss": 0.5506, "lr": 0.0006928618778087842, "epoch": 8.731656184486374, "percentage": 43.66, "elapsed_time": "0:42:34", "remaining_time": "0:54:56", "throughput": 4258.68, "total_tokens": 10877288} {"current_steps": 16665, "total_steps": 38160, "loss": 0.3492, "lr": 0.0006926508689434371, "epoch": 8.734276729559749, "percentage": 43.67, "elapsed_time": "0:42:34", "remaining_time": "0:54:55", "throughput": 4258.73, "total_tokens": 10880424} {"current_steps": 16670, "total_steps": 38160, "loss": 0.3497, "lr": 0.0006924398197777263, "epoch": 8.736897274633124, "percentage": 43.68, "elapsed_time": "0:42:35", "remaining_time": "0:54:54", "throughput": 4258.87, "total_tokens": 10884072} {"current_steps": 16675, "total_steps": 38160, "loss": 0.5118, "lr": 0.0006922287303558006, "epoch": 8.7395178197065, "percentage": 43.7, "elapsed_time": "0:42:36", "remaining_time": "0:54:53", "throughput": 4259.09, "total_tokens": 10888136} {"current_steps": 16680, "total_steps": 38160, "loss": 0.4123, "lr": 0.0006920176007218175, "epoch": 8.742138364779874, "percentage": 43.71, "elapsed_time": "0:42:37", "remaining_time": "0:54:52", "throughput": 4259.1, "total_tokens": 10891080} {"current_steps": 16685, "total_steps": 38160, "loss": 0.4515, "lr": 0.000691806430919943, "epoch": 8.74475890985325, "percentage": 43.72, "elapsed_time": "0:42:37", "remaining_time": "0:54:52", "throughput": 4259.11, "total_tokens": 10894056} {"current_steps": 16690, "total_steps": 38160, "loss": 0.4591, "lr": 0.0006915952209943514, "epoch": 8.747379454926625, "percentage": 43.74, "elapsed_time": "0:42:38", "remaining_time": "0:54:51", "throughput": 4259.19, "total_tokens": 10897416} {"current_steps": 16695, "total_steps": 38160, "loss": 0.5091, "lr": 0.0006913839709892256, "epoch": 8.75, "percentage": 43.75, "elapsed_time": "0:42:39", "remaining_time": "0:54:50", "throughput": 4259.25, "total_tokens": 10900712} {"current_steps": 16700, "total_steps": 38160, "loss": 0.5292, "lr": 0.0006911726809487561, "epoch": 8.752620545073375, "percentage": 43.76, "elapsed_time": "0:42:40", "remaining_time": "0:54:49", "throughput": 4259.33, "total_tokens": 10904200} {"current_steps": 16705, "total_steps": 38160, "loss": 0.6292, "lr": 0.0006909613509171431, "epoch": 8.75524109014675, "percentage": 43.78, "elapsed_time": "0:42:40", "remaining_time": "0:54:48", "throughput": 4259.35, "total_tokens": 10907176} {"current_steps": 16710, "total_steps": 38160, "loss": 0.5508, "lr": 0.0006907499809385941, "epoch": 8.757861635220126, "percentage": 43.79, "elapsed_time": "0:42:41", "remaining_time": "0:54:48", "throughput": 4259.58, "total_tokens": 10911400} {"current_steps": 16715, "total_steps": 38160, "loss": 0.3445, "lr": 0.0006905385710573252, "epoch": 8.7604821802935, "percentage": 43.8, "elapsed_time": "0:42:42", "remaining_time": "0:54:47", "throughput": 4259.67, "total_tokens": 10914792} {"current_steps": 16720, "total_steps": 38160, "loss": 0.3417, "lr": 0.000690327121317561, "epoch": 8.763102725366876, "percentage": 43.82, "elapsed_time": "0:42:43", "remaining_time": "0:54:46", "throughput": 4259.8, "total_tokens": 10918536} {"current_steps": 16725, "total_steps": 38160, "loss": 0.4895, "lr": 0.0006901156317635342, "epoch": 8.765723270440251, "percentage": 43.83, "elapsed_time": "0:42:43", "remaining_time": "0:54:45", "throughput": 4259.85, "total_tokens": 10921704} {"current_steps": 16730, "total_steps": 38160, "loss": 0.4132, "lr": 0.0006899041024394864, "epoch": 8.768343815513626, "percentage": 43.84, "elapsed_time": "0:42:44", "remaining_time": "0:54:44", "throughput": 4259.76, "total_tokens": 10924104} {"current_steps": 16735, "total_steps": 38160, "loss": 0.3756, "lr": 0.000689692533389667, "epoch": 8.770964360587001, "percentage": 43.85, "elapsed_time": "0:42:45", "remaining_time": "0:54:44", "throughput": 4259.83, "total_tokens": 10927368} {"current_steps": 16740, "total_steps": 38160, "loss": 0.4422, "lr": 0.0006894809246583334, "epoch": 8.773584905660378, "percentage": 43.87, "elapsed_time": "0:42:45", "remaining_time": "0:54:43", "throughput": 4259.84, "total_tokens": 10930280} {"current_steps": 16745, "total_steps": 38160, "loss": 0.4879, "lr": 0.0006892692762897523, "epoch": 8.776205450733752, "percentage": 43.88, "elapsed_time": "0:42:46", "remaining_time": "0:54:42", "throughput": 4259.86, "total_tokens": 10933256} {"current_steps": 16750, "total_steps": 38160, "loss": 0.5821, "lr": 0.000689057588328198, "epoch": 8.778825995807129, "percentage": 43.89, "elapsed_time": "0:42:47", "remaining_time": "0:54:41", "throughput": 4259.72, "total_tokens": 10935432} {"current_steps": 16755, "total_steps": 38160, "loss": 0.4426, "lr": 0.0006888458608179528, "epoch": 8.781446540880504, "percentage": 43.91, "elapsed_time": "0:42:47", "remaining_time": "0:54:40", "throughput": 4259.89, "total_tokens": 10939400} {"current_steps": 16760, "total_steps": 38160, "loss": 0.5576, "lr": 0.0006886340938033085, "epoch": 8.784067085953879, "percentage": 43.92, "elapsed_time": "0:42:48", "remaining_time": "0:54:39", "throughput": 4259.83, "total_tokens": 10941928} {"current_steps": 16765, "total_steps": 38160, "loss": 0.3986, "lr": 0.0006884222873285632, "epoch": 8.786687631027254, "percentage": 43.93, "elapsed_time": "0:42:49", "remaining_time": "0:54:38", "throughput": 4259.91, "total_tokens": 10945256} {"current_steps": 16770, "total_steps": 38160, "loss": 0.5403, "lr": 0.0006882104414380254, "epoch": 8.78930817610063, "percentage": 43.95, "elapsed_time": "0:42:50", "remaining_time": "0:54:38", "throughput": 4260.15, "total_tokens": 10949448} {"current_steps": 16775, "total_steps": 38160, "loss": 0.5198, "lr": 0.0006879985561760105, "epoch": 8.791928721174004, "percentage": 43.96, "elapsed_time": "0:42:50", "remaining_time": "0:54:37", "throughput": 4260.12, "total_tokens": 10952264} {"current_steps": 16780, "total_steps": 38160, "loss": 0.6528, "lr": 0.0006877866315868422, "epoch": 8.79454926624738, "percentage": 43.97, "elapsed_time": "0:42:51", "remaining_time": "0:54:36", "throughput": 4260.08, "total_tokens": 10954952} {"current_steps": 16785, "total_steps": 38160, "loss": 0.4562, "lr": 0.0006875746677148531, "epoch": 8.797169811320755, "percentage": 43.99, "elapsed_time": "0:42:52", "remaining_time": "0:54:35", "throughput": 4260.18, "total_tokens": 10958472} {"current_steps": 16790, "total_steps": 38160, "loss": 0.4821, "lr": 0.0006873626646043835, "epoch": 8.79979035639413, "percentage": 44.0, "elapsed_time": "0:42:52", "remaining_time": "0:54:34", "throughput": 4260.14, "total_tokens": 10961256} {"current_steps": 16795, "total_steps": 38160, "loss": 0.3967, "lr": 0.000687150622299782, "epoch": 8.802410901467505, "percentage": 44.01, "elapsed_time": "0:42:53", "remaining_time": "0:54:34", "throughput": 4260.19, "total_tokens": 10964488} {"current_steps": 16800, "total_steps": 38160, "loss": 0.4057, "lr": 0.0006869385408454056, "epoch": 8.80503144654088, "percentage": 44.03, "elapsed_time": "0:42:54", "remaining_time": "0:54:33", "throughput": 4260.16, "total_tokens": 10967272} {"current_steps": 16805, "total_steps": 38160, "loss": 0.4274, "lr": 0.0006867264202856188, "epoch": 8.807651991614255, "percentage": 44.04, "elapsed_time": "0:42:55", "remaining_time": "0:54:32", "throughput": 4260.23, "total_tokens": 10970472} {"current_steps": 16810, "total_steps": 38160, "loss": 0.4975, "lr": 0.0006865142606647954, "epoch": 8.81027253668763, "percentage": 44.05, "elapsed_time": "0:42:55", "remaining_time": "0:54:31", "throughput": 4260.17, "total_tokens": 10973032} {"current_steps": 16815, "total_steps": 38160, "loss": 0.4302, "lr": 0.0006863020620273166, "epoch": 8.812893081761006, "percentage": 44.06, "elapsed_time": "0:42:56", "remaining_time": "0:54:30", "throughput": 4260.21, "total_tokens": 10976136} {"current_steps": 16820, "total_steps": 38160, "loss": 0.3436, "lr": 0.0006860898244175716, "epoch": 8.815513626834381, "percentage": 44.08, "elapsed_time": "0:42:57", "remaining_time": "0:54:29", "throughput": 4260.21, "total_tokens": 10979176} {"current_steps": 16825, "total_steps": 38160, "loss": 0.3823, "lr": 0.0006858775478799586, "epoch": 8.818134171907756, "percentage": 44.09, "elapsed_time": "0:42:57", "remaining_time": "0:54:28", "throughput": 4260.37, "total_tokens": 10983016} {"current_steps": 16830, "total_steps": 38160, "loss": 0.4389, "lr": 0.0006856652324588831, "epoch": 8.820754716981131, "percentage": 44.1, "elapsed_time": "0:42:58", "remaining_time": "0:54:28", "throughput": 4260.33, "total_tokens": 10985704} {"current_steps": 16835, "total_steps": 38160, "loss": 0.4378, "lr": 0.000685452878198759, "epoch": 8.823375262054507, "percentage": 44.12, "elapsed_time": "0:42:59", "remaining_time": "0:54:27", "throughput": 4260.27, "total_tokens": 10988296} {"current_steps": 16840, "total_steps": 38160, "loss": 0.5459, "lr": 0.0006852404851440088, "epoch": 8.825995807127882, "percentage": 44.13, "elapsed_time": "0:43:00", "remaining_time": "0:54:26", "throughput": 4260.46, "total_tokens": 10992232} {"current_steps": 16845, "total_steps": 38160, "loss": 0.4203, "lr": 0.0006850280533390624, "epoch": 8.828616352201259, "percentage": 44.14, "elapsed_time": "0:43:01", "remaining_time": "0:54:26", "throughput": 4261.06, "total_tokens": 10998600} {"current_steps": 16850, "total_steps": 38160, "loss": 0.4427, "lr": 0.0006848155828283581, "epoch": 8.831236897274634, "percentage": 44.16, "elapsed_time": "0:43:02", "remaining_time": "0:54:25", "throughput": 4261.27, "total_tokens": 11002664} {"current_steps": 16855, "total_steps": 38160, "loss": 0.3531, "lr": 0.0006846030736563422, "epoch": 8.833857442348009, "percentage": 44.17, "elapsed_time": "0:43:02", "remaining_time": "0:54:24", "throughput": 4261.23, "total_tokens": 11005320} {"current_steps": 16860, "total_steps": 38160, "loss": 0.4678, "lr": 0.0006843905258674696, "epoch": 8.836477987421384, "percentage": 44.18, "elapsed_time": "0:43:03", "remaining_time": "0:54:23", "throughput": 4261.29, "total_tokens": 11008488} {"current_steps": 16865, "total_steps": 38160, "loss": 0.4479, "lr": 0.0006841779395062026, "epoch": 8.83909853249476, "percentage": 44.2, "elapsed_time": "0:43:04", "remaining_time": "0:54:22", "throughput": 4261.22, "total_tokens": 11011016} {"current_steps": 16870, "total_steps": 38160, "loss": 0.3472, "lr": 0.0006839653146170116, "epoch": 8.841719077568134, "percentage": 44.21, "elapsed_time": "0:43:04", "remaining_time": "0:54:22", "throughput": 4261.4, "total_tokens": 11015016} {"current_steps": 16875, "total_steps": 38160, "loss": 0.5101, "lr": 0.0006837526512443758, "epoch": 8.84433962264151, "percentage": 44.22, "elapsed_time": "0:43:05", "remaining_time": "0:54:21", "throughput": 4261.37, "total_tokens": 11017800} {"current_steps": 16880, "total_steps": 38160, "loss": 0.5476, "lr": 0.0006835399494327818, "epoch": 8.846960167714885, "percentage": 44.23, "elapsed_time": "0:43:06", "remaining_time": "0:54:20", "throughput": 4261.35, "total_tokens": 11020616} {"current_steps": 16885, "total_steps": 38160, "loss": 0.4343, "lr": 0.0006833272092267241, "epoch": 8.84958071278826, "percentage": 44.25, "elapsed_time": "0:43:06", "remaining_time": "0:54:19", "throughput": 4261.5, "total_tokens": 11024296} {"current_steps": 16890, "total_steps": 38160, "loss": 0.4877, "lr": 0.000683114430670706, "epoch": 8.852201257861635, "percentage": 44.26, "elapsed_time": "0:43:07", "remaining_time": "0:54:18", "throughput": 4261.56, "total_tokens": 11027624} {"current_steps": 16895, "total_steps": 38160, "loss": 0.4943, "lr": 0.0006829016138092378, "epoch": 8.85482180293501, "percentage": 44.27, "elapsed_time": "0:43:08", "remaining_time": "0:54:17", "throughput": 4261.52, "total_tokens": 11030472} {"current_steps": 16900, "total_steps": 38160, "loss": 0.5556, "lr": 0.0006826887586868388, "epoch": 8.857442348008385, "percentage": 44.29, "elapsed_time": "0:43:09", "remaining_time": "0:54:17", "throughput": 4261.62, "total_tokens": 11034024} {"current_steps": 16905, "total_steps": 38160, "loss": 0.377, "lr": 0.0006824758653480356, "epoch": 8.86006289308176, "percentage": 44.3, "elapsed_time": "0:43:10", "remaining_time": "0:54:16", "throughput": 4261.9, "total_tokens": 11038472} {"current_steps": 16910, "total_steps": 38160, "loss": 0.3839, "lr": 0.0006822629338373632, "epoch": 8.862683438155136, "percentage": 44.31, "elapsed_time": "0:43:10", "remaining_time": "0:54:15", "throughput": 4261.98, "total_tokens": 11041896} {"current_steps": 16915, "total_steps": 38160, "loss": 0.5108, "lr": 0.0006820499641993644, "epoch": 8.865303983228511, "percentage": 44.33, "elapsed_time": "0:43:11", "remaining_time": "0:54:14", "throughput": 4262.0, "total_tokens": 11044904} {"current_steps": 16920, "total_steps": 38160, "loss": 0.5021, "lr": 0.0006818369564785902, "epoch": 8.867924528301886, "percentage": 44.34, "elapsed_time": "0:43:12", "remaining_time": "0:54:14", "throughput": 4262.16, "total_tokens": 11048648} {"current_steps": 16925, "total_steps": 38160, "loss": 0.3844, "lr": 0.0006816239107195989, "epoch": 8.870545073375261, "percentage": 44.35, "elapsed_time": "0:43:13", "remaining_time": "0:54:13", "throughput": 4262.25, "total_tokens": 11052168} {"current_steps": 16930, "total_steps": 38160, "loss": 0.4307, "lr": 0.000681410826966958, "epoch": 8.873165618448636, "percentage": 44.37, "elapsed_time": "0:43:13", "remaining_time": "0:54:12", "throughput": 4262.33, "total_tokens": 11055496} {"current_steps": 16935, "total_steps": 38160, "loss": 0.4728, "lr": 0.0006811977052652414, "epoch": 8.875786163522012, "percentage": 44.38, "elapsed_time": "0:43:14", "remaining_time": "0:54:11", "throughput": 4262.53, "total_tokens": 11059432} {"current_steps": 16940, "total_steps": 38160, "loss": 0.4782, "lr": 0.000680984545659032, "epoch": 8.878406708595389, "percentage": 44.39, "elapsed_time": "0:43:15", "remaining_time": "0:54:10", "throughput": 4262.54, "total_tokens": 11062376} {"current_steps": 16945, "total_steps": 38160, "loss": 0.4679, "lr": 0.0006807713481929207, "epoch": 8.881027253668764, "percentage": 44.41, "elapsed_time": "0:43:16", "remaining_time": "0:54:10", "throughput": 4262.85, "total_tokens": 11066888} {"current_steps": 16950, "total_steps": 38160, "loss": 0.4651, "lr": 0.0006805581129115055, "epoch": 8.883647798742139, "percentage": 44.42, "elapsed_time": "0:43:16", "remaining_time": "0:54:09", "throughput": 4262.79, "total_tokens": 11069576} {"current_steps": 16955, "total_steps": 38160, "loss": 0.4363, "lr": 0.0006803448398593931, "epoch": 8.886268343815514, "percentage": 44.43, "elapsed_time": "0:43:17", "remaining_time": "0:54:08", "throughput": 4263.25, "total_tokens": 11075144} {"current_steps": 16960, "total_steps": 38160, "loss": 0.4528, "lr": 0.0006801315290811976, "epoch": 8.88888888888889, "percentage": 44.44, "elapsed_time": "0:43:18", "remaining_time": "0:54:08", "throughput": 4263.36, "total_tokens": 11078600} {"current_steps": 16965, "total_steps": 38160, "loss": 0.4264, "lr": 0.0006799181806215413, "epoch": 8.891509433962264, "percentage": 44.46, "elapsed_time": "0:43:19", "remaining_time": "0:54:07", "throughput": 4263.36, "total_tokens": 11081416} {"current_steps": 16970, "total_steps": 38160, "loss": 0.4863, "lr": 0.0006797047945250543, "epoch": 8.89412997903564, "percentage": 44.47, "elapsed_time": "0:43:19", "remaining_time": "0:54:06", "throughput": 4263.38, "total_tokens": 11084520} {"current_steps": 16975, "total_steps": 38160, "loss": 0.6495, "lr": 0.0006794913708363745, "epoch": 8.896750524109015, "percentage": 44.48, "elapsed_time": "0:43:20", "remaining_time": "0:54:05", "throughput": 4263.34, "total_tokens": 11087208} {"current_steps": 16980, "total_steps": 38160, "loss": 0.4883, "lr": 0.0006792779096001475, "epoch": 8.89937106918239, "percentage": 44.5, "elapsed_time": "0:43:21", "remaining_time": "0:54:04", "throughput": 4263.37, "total_tokens": 11090184} {"current_steps": 16985, "total_steps": 38160, "loss": 0.4533, "lr": 0.0006790644108610273, "epoch": 8.901991614255765, "percentage": 44.51, "elapsed_time": "0:43:21", "remaining_time": "0:54:03", "throughput": 4263.43, "total_tokens": 11093416} {"current_steps": 16990, "total_steps": 38160, "loss": 0.3837, "lr": 0.0006788508746636751, "epoch": 8.90461215932914, "percentage": 44.52, "elapsed_time": "0:43:22", "remaining_time": "0:54:03", "throughput": 4263.56, "total_tokens": 11097096} {"current_steps": 16995, "total_steps": 38160, "loss": 0.4101, "lr": 0.0006786373010527605, "epoch": 8.907232704402515, "percentage": 44.54, "elapsed_time": "0:43:23", "remaining_time": "0:54:02", "throughput": 4263.61, "total_tokens": 11100360} {"current_steps": 17000, "total_steps": 38160, "loss": 0.5602, "lr": 0.0006784236900729603, "epoch": 8.90985324947589, "percentage": 44.55, "elapsed_time": "0:43:24", "remaining_time": "0:54:01", "throughput": 4263.61, "total_tokens": 11103272} {"current_steps": 17005, "total_steps": 38160, "loss": 0.5303, "lr": 0.0006782100417689599, "epoch": 8.912473794549266, "percentage": 44.56, "elapsed_time": "0:43:24", "remaining_time": "0:54:00", "throughput": 4263.67, "total_tokens": 11106568} {"current_steps": 17010, "total_steps": 38160, "loss": 0.3559, "lr": 0.0006779963561854517, "epoch": 8.915094339622641, "percentage": 44.58, "elapsed_time": "0:43:25", "remaining_time": "0:53:59", "throughput": 4263.7, "total_tokens": 11109640} {"current_steps": 17015, "total_steps": 38160, "loss": 0.4314, "lr": 0.0006777826333671367, "epoch": 8.917714884696016, "percentage": 44.59, "elapsed_time": "0:43:26", "remaining_time": "0:53:58", "throughput": 4263.75, "total_tokens": 11112776} {"current_steps": 17020, "total_steps": 38160, "loss": 0.4182, "lr": 0.0006775688733587227, "epoch": 8.920335429769391, "percentage": 44.6, "elapsed_time": "0:43:27", "remaining_time": "0:53:58", "throughput": 4263.79, "total_tokens": 11115912} {"current_steps": 17025, "total_steps": 38160, "loss": 0.4316, "lr": 0.0006773550762049265, "epoch": 8.922955974842766, "percentage": 44.61, "elapsed_time": "0:43:27", "remaining_time": "0:53:57", "throughput": 4263.84, "total_tokens": 11119048} {"current_steps": 17030, "total_steps": 38160, "loss": 0.4838, "lr": 0.0006771412419504716, "epoch": 8.925576519916142, "percentage": 44.63, "elapsed_time": "0:43:28", "remaining_time": "0:53:56", "throughput": 4263.9, "total_tokens": 11122280} {"current_steps": 17035, "total_steps": 38160, "loss": 0.5712, "lr": 0.00067692737064009, "epoch": 8.928197064989519, "percentage": 44.64, "elapsed_time": "0:43:29", "remaining_time": "0:53:55", "throughput": 4263.98, "total_tokens": 11125576} {"current_steps": 17040, "total_steps": 38160, "loss": 0.3907, "lr": 0.0006767134623185208, "epoch": 8.930817610062894, "percentage": 44.65, "elapsed_time": "0:43:29", "remaining_time": "0:53:54", "throughput": 4264.08, "total_tokens": 11128904} {"current_steps": 17045, "total_steps": 38160, "loss": 0.6073, "lr": 0.0006764995170305114, "epoch": 8.933438155136269, "percentage": 44.67, "elapsed_time": "0:43:30", "remaining_time": "0:53:53", "throughput": 4264.11, "total_tokens": 11132008} {"current_steps": 17050, "total_steps": 38160, "loss": 0.5273, "lr": 0.0006762855348208166, "epoch": 8.936058700209644, "percentage": 44.68, "elapsed_time": "0:43:31", "remaining_time": "0:53:53", "throughput": 4264.25, "total_tokens": 11135624} {"current_steps": 17055, "total_steps": 38160, "loss": 0.4961, "lr": 0.0006760715157341991, "epoch": 8.93867924528302, "percentage": 44.69, "elapsed_time": "0:43:32", "remaining_time": "0:53:52", "throughput": 4264.27, "total_tokens": 11138728} {"current_steps": 17060, "total_steps": 38160, "loss": 0.5119, "lr": 0.0006758574598154292, "epoch": 8.941299790356394, "percentage": 44.71, "elapsed_time": "0:43:32", "remaining_time": "0:53:51", "throughput": 4264.36, "total_tokens": 11142216} {"current_steps": 17065, "total_steps": 38160, "loss": 0.4528, "lr": 0.0006756433671092852, "epoch": 8.94392033542977, "percentage": 44.72, "elapsed_time": "0:43:33", "remaining_time": "0:53:50", "throughput": 4264.3, "total_tokens": 11144776} {"current_steps": 17070, "total_steps": 38160, "loss": 0.3754, "lr": 0.0006754292376605524, "epoch": 8.946540880503145, "percentage": 44.73, "elapsed_time": "0:43:34", "remaining_time": "0:53:49", "throughput": 4264.3, "total_tokens": 11147688} {"current_steps": 17075, "total_steps": 38160, "loss": 0.4893, "lr": 0.0006752150715140247, "epoch": 8.94916142557652, "percentage": 44.75, "elapsed_time": "0:43:34", "remaining_time": "0:53:49", "throughput": 4264.41, "total_tokens": 11151304} {"current_steps": 17080, "total_steps": 38160, "loss": 0.4594, "lr": 0.0006750008687145028, "epoch": 8.951781970649895, "percentage": 44.76, "elapsed_time": "0:43:35", "remaining_time": "0:53:48", "throughput": 4264.39, "total_tokens": 11154248} {"current_steps": 17085, "total_steps": 38160, "loss": 0.4788, "lr": 0.0006747866293067958, "epoch": 8.95440251572327, "percentage": 44.77, "elapsed_time": "0:43:36", "remaining_time": "0:53:47", "throughput": 4264.41, "total_tokens": 11157192} {"current_steps": 17090, "total_steps": 38160, "loss": 0.3608, "lr": 0.00067457235333572, "epoch": 8.957023060796645, "percentage": 44.79, "elapsed_time": "0:43:37", "remaining_time": "0:53:46", "throughput": 4264.55, "total_tokens": 11160872} {"current_steps": 17095, "total_steps": 38160, "loss": 0.4624, "lr": 0.0006743580408460994, "epoch": 8.95964360587002, "percentage": 44.8, "elapsed_time": "0:43:37", "remaining_time": "0:53:45", "throughput": 4264.45, "total_tokens": 11163272} {"current_steps": 17100, "total_steps": 38160, "loss": 0.354, "lr": 0.0006741436918827659, "epoch": 8.962264150943396, "percentage": 44.81, "elapsed_time": "0:43:38", "remaining_time": "0:53:44", "throughput": 4264.59, "total_tokens": 11166888} {"current_steps": 17105, "total_steps": 38160, "loss": 0.4148, "lr": 0.0006739293064905589, "epoch": 8.964884696016771, "percentage": 44.82, "elapsed_time": "0:43:39", "remaining_time": "0:53:44", "throughput": 4264.85, "total_tokens": 11171272} {"current_steps": 17110, "total_steps": 38160, "loss": 0.4266, "lr": 0.0006737148847143251, "epoch": 8.967505241090146, "percentage": 44.84, "elapsed_time": "0:43:39", "remaining_time": "0:53:43", "throughput": 4264.74, "total_tokens": 11173608} {"current_steps": 17115, "total_steps": 38160, "loss": 0.5723, "lr": 0.0006735004265989195, "epoch": 8.970125786163521, "percentage": 44.85, "elapsed_time": "0:43:40", "remaining_time": "0:53:42", "throughput": 4264.94, "total_tokens": 11177608} {"current_steps": 17120, "total_steps": 38160, "loss": 0.4179, "lr": 0.0006732859321892038, "epoch": 8.972746331236896, "percentage": 44.86, "elapsed_time": "0:43:41", "remaining_time": "0:53:41", "throughput": 4265.21, "total_tokens": 11182088} {"current_steps": 17125, "total_steps": 38160, "loss": 0.423, "lr": 0.0006730714015300481, "epoch": 8.975366876310272, "percentage": 44.88, "elapsed_time": "0:43:42", "remaining_time": "0:53:41", "throughput": 4265.21, "total_tokens": 11185064} {"current_steps": 17130, "total_steps": 38160, "loss": 0.4626, "lr": 0.0006728568346663299, "epoch": 8.977987421383649, "percentage": 44.89, "elapsed_time": "0:43:43", "remaining_time": "0:53:40", "throughput": 4265.19, "total_tokens": 11187944} {"current_steps": 17135, "total_steps": 38160, "loss": 0.3626, "lr": 0.0006726422316429337, "epoch": 8.980607966457024, "percentage": 44.9, "elapsed_time": "0:43:43", "remaining_time": "0:53:39", "throughput": 4265.16, "total_tokens": 11190632} {"current_steps": 17140, "total_steps": 38160, "loss": 0.6272, "lr": 0.0006724275925047523, "epoch": 8.983228511530399, "percentage": 44.92, "elapsed_time": "0:43:44", "remaining_time": "0:53:38", "throughput": 4265.27, "total_tokens": 11194280} {"current_steps": 17145, "total_steps": 38160, "loss": 0.656, "lr": 0.0006722129172966858, "epoch": 8.985849056603774, "percentage": 44.93, "elapsed_time": "0:43:45", "remaining_time": "0:53:37", "throughput": 4265.32, "total_tokens": 11197416} {"current_steps": 17150, "total_steps": 38160, "loss": 0.5653, "lr": 0.0006719982060636416, "epoch": 8.98846960167715, "percentage": 44.94, "elapsed_time": "0:43:45", "remaining_time": "0:53:36", "throughput": 4265.3, "total_tokens": 11200328} {"current_steps": 17155, "total_steps": 38160, "loss": 0.4903, "lr": 0.000671783458850535, "epoch": 8.991090146750524, "percentage": 44.96, "elapsed_time": "0:43:46", "remaining_time": "0:53:36", "throughput": 4265.48, "total_tokens": 11204200} {"current_steps": 17160, "total_steps": 38160, "loss": 0.5199, "lr": 0.0006715686757022886, "epoch": 8.9937106918239, "percentage": 44.97, "elapsed_time": "0:43:47", "remaining_time": "0:53:35", "throughput": 4265.48, "total_tokens": 11207144} {"current_steps": 17165, "total_steps": 38160, "loss": 0.4077, "lr": 0.0006713538566638326, "epoch": 8.996331236897275, "percentage": 44.98, "elapsed_time": "0:43:48", "remaining_time": "0:53:34", "throughput": 4265.61, "total_tokens": 11210888} {"current_steps": 17170, "total_steps": 38160, "loss": 0.3771, "lr": 0.0006711390017801049, "epoch": 8.99895178197065, "percentage": 44.99, "elapsed_time": "0:43:48", "remaining_time": "0:53:33", "throughput": 4265.57, "total_tokens": 11213512} {"current_steps": 17172, "total_steps": 38160, "eval_loss": 0.48470157384872437, "epoch": 9.0, "percentage": 45.0, "elapsed_time": "0:44:02", "remaining_time": "0:53:50", "throughput": 4243.23, "total_tokens": 11214472} {"current_steps": 17175, "total_steps": 38160, "loss": 0.4193, "lr": 0.0006709241110960502, "epoch": 9.001572327044025, "percentage": 45.01, "elapsed_time": "0:44:04", "remaining_time": "0:53:51", "throughput": 4240.97, "total_tokens": 11217000} {"current_steps": 17180, "total_steps": 38160, "loss": 0.3626, "lr": 0.0006707091846566216, "epoch": 9.0041928721174, "percentage": 45.02, "elapsed_time": "0:44:05", "remaining_time": "0:53:50", "throughput": 4241.07, "total_tokens": 11220424} {"current_steps": 17185, "total_steps": 38160, "loss": 0.4578, "lr": 0.0006704942225067791, "epoch": 9.006813417190775, "percentage": 45.03, "elapsed_time": "0:44:06", "remaining_time": "0:53:49", "throughput": 4241.0, "total_tokens": 11222888} {"current_steps": 17190, "total_steps": 38160, "loss": 0.3387, "lr": 0.0006702792246914902, "epoch": 9.00943396226415, "percentage": 45.05, "elapsed_time": "0:44:06", "remaining_time": "0:53:48", "throughput": 4240.96, "total_tokens": 11225480} {"current_steps": 17195, "total_steps": 38160, "loss": 0.5879, "lr": 0.0006700641912557304, "epoch": 9.012054507337526, "percentage": 45.06, "elapsed_time": "0:44:07", "remaining_time": "0:53:48", "throughput": 4241.02, "total_tokens": 11228712} {"current_steps": 17200, "total_steps": 38160, "loss": 0.4227, "lr": 0.0006698491222444818, "epoch": 9.014675052410901, "percentage": 45.07, "elapsed_time": "0:44:08", "remaining_time": "0:53:47", "throughput": 4240.99, "total_tokens": 11231464} {"current_steps": 17205, "total_steps": 38160, "loss": 0.6398, "lr": 0.0006696340177027346, "epoch": 9.017295597484276, "percentage": 45.09, "elapsed_time": "0:44:09", "remaining_time": "0:53:46", "throughput": 4241.03, "total_tokens": 11234568} {"current_steps": 17210, "total_steps": 38160, "loss": 0.5371, "lr": 0.0006694188776754863, "epoch": 9.019916142557651, "percentage": 45.1, "elapsed_time": "0:44:09", "remaining_time": "0:53:45", "throughput": 4240.97, "total_tokens": 11237096} {"current_steps": 17215, "total_steps": 38160, "loss": 0.3618, "lr": 0.0006692037022077415, "epoch": 9.022536687631026, "percentage": 45.11, "elapsed_time": "0:44:10", "remaining_time": "0:53:44", "throughput": 4240.94, "total_tokens": 11239880} {"current_steps": 17220, "total_steps": 38160, "loss": 0.477, "lr": 0.0006689884913445126, "epoch": 9.025157232704403, "percentage": 45.13, "elapsed_time": "0:44:11", "remaining_time": "0:53:43", "throughput": 4241.09, "total_tokens": 11243656} {"current_steps": 17225, "total_steps": 38160, "loss": 0.4238, "lr": 0.0006687732451308193, "epoch": 9.027777777777779, "percentage": 45.14, "elapsed_time": "0:44:11", "remaining_time": "0:53:43", "throughput": 4241.15, "total_tokens": 11246888} {"current_steps": 17230, "total_steps": 38160, "loss": 0.4477, "lr": 0.0006685579636116886, "epoch": 9.030398322851154, "percentage": 45.15, "elapsed_time": "0:44:12", "remaining_time": "0:53:42", "throughput": 4241.12, "total_tokens": 11249608} {"current_steps": 17235, "total_steps": 38160, "loss": 0.3676, "lr": 0.0006683426468321547, "epoch": 9.033018867924529, "percentage": 45.17, "elapsed_time": "0:44:13", "remaining_time": "0:53:41", "throughput": 4241.1, "total_tokens": 11252360} {"current_steps": 17240, "total_steps": 38160, "loss": 0.4688, "lr": 0.0006681272948372598, "epoch": 9.035639412997904, "percentage": 45.18, "elapsed_time": "0:44:13", "remaining_time": "0:53:40", "throughput": 4241.05, "total_tokens": 11254952} {"current_steps": 17245, "total_steps": 38160, "loss": 0.4822, "lr": 0.000667911907672053, "epoch": 9.03825995807128, "percentage": 45.19, "elapsed_time": "0:44:14", "remaining_time": "0:53:39", "throughput": 4241.08, "total_tokens": 11257928} {"current_steps": 17250, "total_steps": 38160, "loss": 0.5538, "lr": 0.0006676964853815906, "epoch": 9.040880503144654, "percentage": 45.2, "elapsed_time": "0:44:15", "remaining_time": "0:53:38", "throughput": 4241.15, "total_tokens": 11261224} {"current_steps": 17255, "total_steps": 38160, "loss": 0.4114, "lr": 0.0006674810280109367, "epoch": 9.04350104821803, "percentage": 45.22, "elapsed_time": "0:44:15", "remaining_time": "0:53:37", "throughput": 4241.16, "total_tokens": 11264104} {"current_steps": 17260, "total_steps": 38160, "loss": 0.444, "lr": 0.0006672655356051625, "epoch": 9.046121593291405, "percentage": 45.23, "elapsed_time": "0:44:16", "remaining_time": "0:53:36", "throughput": 4241.29, "total_tokens": 11267752} {"current_steps": 17265, "total_steps": 38160, "loss": 0.3873, "lr": 0.0006670500082093465, "epoch": 9.04874213836478, "percentage": 45.24, "elapsed_time": "0:44:17", "remaining_time": "0:53:36", "throughput": 4241.42, "total_tokens": 11271304} {"current_steps": 17270, "total_steps": 38160, "loss": 0.4818, "lr": 0.0006668344458685745, "epoch": 9.051362683438155, "percentage": 45.26, "elapsed_time": "0:44:18", "remaining_time": "0:53:35", "throughput": 4241.61, "total_tokens": 11275272} {"current_steps": 17275, "total_steps": 38160, "loss": 0.3539, "lr": 0.00066661884862794, "epoch": 9.05398322851153, "percentage": 45.27, "elapsed_time": "0:44:18", "remaining_time": "0:53:34", "throughput": 4241.5, "total_tokens": 11277544} {"current_steps": 17280, "total_steps": 38160, "loss": 0.5871, "lr": 0.000666403216532543, "epoch": 9.056603773584905, "percentage": 45.28, "elapsed_time": "0:44:19", "remaining_time": "0:53:33", "throughput": 4241.71, "total_tokens": 11281608} {"current_steps": 17285, "total_steps": 38160, "loss": 0.5495, "lr": 0.0006661875496274916, "epoch": 9.05922431865828, "percentage": 45.3, "elapsed_time": "0:44:20", "remaining_time": "0:53:32", "throughput": 4241.69, "total_tokens": 11284328} {"current_steps": 17290, "total_steps": 38160, "loss": 0.5219, "lr": 0.0006659718479579008, "epoch": 9.061844863731656, "percentage": 45.31, "elapsed_time": "0:44:21", "remaining_time": "0:53:32", "throughput": 4241.74, "total_tokens": 11287464} {"current_steps": 17295, "total_steps": 38160, "loss": 0.4126, "lr": 0.0006657561115688929, "epoch": 9.064465408805031, "percentage": 45.32, "elapsed_time": "0:44:21", "remaining_time": "0:53:31", "throughput": 4241.77, "total_tokens": 11290536} {"current_steps": 17300, "total_steps": 38160, "loss": 0.3299, "lr": 0.0006655403405055977, "epoch": 9.067085953878406, "percentage": 45.34, "elapsed_time": "0:44:22", "remaining_time": "0:53:30", "throughput": 4242.24, "total_tokens": 11296520} {"current_steps": 17305, "total_steps": 38160, "loss": 0.3984, "lr": 0.0006653245348131517, "epoch": 9.069706498951781, "percentage": 45.35, "elapsed_time": "0:44:23", "remaining_time": "0:53:29", "throughput": 4242.2, "total_tokens": 11299144} {"current_steps": 17310, "total_steps": 38160, "loss": 0.5685, "lr": 0.0006651086945366991, "epoch": 9.072327044025156, "percentage": 45.36, "elapsed_time": "0:44:24", "remaining_time": "0:53:29", "throughput": 4242.36, "total_tokens": 11302856} {"current_steps": 17315, "total_steps": 38160, "loss": 0.4558, "lr": 0.0006648928197213914, "epoch": 9.074947589098532, "percentage": 45.37, "elapsed_time": "0:44:25", "remaining_time": "0:53:28", "throughput": 4242.57, "total_tokens": 11306824} {"current_steps": 17320, "total_steps": 38160, "loss": 0.5534, "lr": 0.0006646769104123868, "epoch": 9.077568134171909, "percentage": 45.39, "elapsed_time": "0:44:25", "remaining_time": "0:53:27", "throughput": 4242.55, "total_tokens": 11309672} {"current_steps": 17325, "total_steps": 38160, "loss": 0.3516, "lr": 0.0006644609666548513, "epoch": 9.080188679245284, "percentage": 45.4, "elapsed_time": "0:44:26", "remaining_time": "0:53:26", "throughput": 4242.61, "total_tokens": 11312776} {"current_steps": 17330, "total_steps": 38160, "loss": 0.3535, "lr": 0.000664244988493958, "epoch": 9.082809224318659, "percentage": 45.41, "elapsed_time": "0:44:27", "remaining_time": "0:53:26", "throughput": 4243.21, "total_tokens": 11319304} {"current_steps": 17335, "total_steps": 38160, "loss": 0.6658, "lr": 0.0006640289759748867, "epoch": 9.085429769392034, "percentage": 45.43, "elapsed_time": "0:44:28", "remaining_time": "0:53:25", "throughput": 4243.26, "total_tokens": 11322440} {"current_steps": 17340, "total_steps": 38160, "loss": 0.4236, "lr": 0.0006638129291428252, "epoch": 9.08805031446541, "percentage": 45.44, "elapsed_time": "0:44:29", "remaining_time": "0:53:24", "throughput": 4243.33, "total_tokens": 11325736} {"current_steps": 17345, "total_steps": 38160, "loss": 0.5434, "lr": 0.0006635968480429677, "epoch": 9.090670859538784, "percentage": 45.45, "elapsed_time": "0:44:29", "remaining_time": "0:53:23", "throughput": 4243.33, "total_tokens": 11328616} {"current_steps": 17350, "total_steps": 38160, "loss": 0.4844, "lr": 0.0006633807327205162, "epoch": 9.09329140461216, "percentage": 45.47, "elapsed_time": "0:44:30", "remaining_time": "0:53:23", "throughput": 4243.44, "total_tokens": 11332072} {"current_steps": 17355, "total_steps": 38160, "loss": 0.5462, "lr": 0.0006631645832206789, "epoch": 9.095911949685535, "percentage": 45.48, "elapsed_time": "0:44:31", "remaining_time": "0:53:22", "throughput": 4243.54, "total_tokens": 11335624} {"current_steps": 17360, "total_steps": 38160, "loss": 0.4338, "lr": 0.0006629483995886727, "epoch": 9.09853249475891, "percentage": 45.49, "elapsed_time": "0:44:31", "remaining_time": "0:53:21", "throughput": 4243.42, "total_tokens": 11337800} {"current_steps": 17365, "total_steps": 38160, "loss": 0.4747, "lr": 0.0006627321818697202, "epoch": 9.101153039832285, "percentage": 45.51, "elapsed_time": "0:44:32", "remaining_time": "0:53:20", "throughput": 4243.57, "total_tokens": 11341640} {"current_steps": 17370, "total_steps": 38160, "loss": 0.5508, "lr": 0.0006625159301090518, "epoch": 9.10377358490566, "percentage": 45.52, "elapsed_time": "0:44:33", "remaining_time": "0:53:19", "throughput": 4243.6, "total_tokens": 11344680} {"current_steps": 17375, "total_steps": 38160, "loss": 0.5198, "lr": 0.0006622996443519047, "epoch": 9.106394129979035, "percentage": 45.53, "elapsed_time": "0:44:34", "remaining_time": "0:53:18", "throughput": 4243.69, "total_tokens": 11348136} {"current_steps": 17380, "total_steps": 38160, "loss": 0.4049, "lr": 0.0006620833246435238, "epoch": 9.10901467505241, "percentage": 45.55, "elapsed_time": "0:44:34", "remaining_time": "0:53:18", "throughput": 4243.79, "total_tokens": 11351560} {"current_steps": 17385, "total_steps": 38160, "loss": 0.4735, "lr": 0.0006618669710291606, "epoch": 9.111635220125786, "percentage": 45.56, "elapsed_time": "0:44:35", "remaining_time": "0:53:17", "throughput": 4243.95, "total_tokens": 11355240} {"current_steps": 17390, "total_steps": 38160, "loss": 0.4631, "lr": 0.0006616505835540736, "epoch": 9.114255765199161, "percentage": 45.57, "elapsed_time": "0:44:36", "remaining_time": "0:53:16", "throughput": 4243.9, "total_tokens": 11357832} {"current_steps": 17395, "total_steps": 38160, "loss": 0.5145, "lr": 0.0006614341622635287, "epoch": 9.116876310272536, "percentage": 45.58, "elapsed_time": "0:44:37", "remaining_time": "0:53:15", "throughput": 4244.09, "total_tokens": 11361832} {"current_steps": 17400, "total_steps": 38160, "loss": 0.4187, "lr": 0.0006612177072027989, "epoch": 9.119496855345911, "percentage": 45.6, "elapsed_time": "0:44:37", "remaining_time": "0:53:14", "throughput": 4244.18, "total_tokens": 11365288} {"current_steps": 17405, "total_steps": 38160, "loss": 0.3482, "lr": 0.0006610012184171641, "epoch": 9.122117400419286, "percentage": 45.61, "elapsed_time": "0:44:38", "remaining_time": "0:53:14", "throughput": 4244.24, "total_tokens": 11368584} {"current_steps": 17410, "total_steps": 38160, "loss": 0.3071, "lr": 0.0006607846959519109, "epoch": 9.124737945492662, "percentage": 45.62, "elapsed_time": "0:44:39", "remaining_time": "0:53:13", "throughput": 4244.27, "total_tokens": 11371560} {"current_steps": 17415, "total_steps": 38160, "loss": 0.3273, "lr": 0.0006605681398523339, "epoch": 9.127358490566039, "percentage": 45.64, "elapsed_time": "0:44:39", "remaining_time": "0:53:12", "throughput": 4244.24, "total_tokens": 11374280} {"current_steps": 17420, "total_steps": 38160, "loss": 0.493, "lr": 0.0006603515501637338, "epoch": 9.129979035639414, "percentage": 45.65, "elapsed_time": "0:44:40", "remaining_time": "0:53:11", "throughput": 4244.27, "total_tokens": 11377320} {"current_steps": 17425, "total_steps": 38160, "loss": 0.4885, "lr": 0.0006601349269314187, "epoch": 9.132599580712789, "percentage": 45.66, "elapsed_time": "0:44:41", "remaining_time": "0:53:10", "throughput": 4244.31, "total_tokens": 11380424} {"current_steps": 17430, "total_steps": 38160, "loss": 0.3168, "lr": 0.0006599182702007042, "epoch": 9.135220125786164, "percentage": 45.68, "elapsed_time": "0:44:42", "remaining_time": "0:53:09", "throughput": 4244.36, "total_tokens": 11383560} {"current_steps": 17435, "total_steps": 38160, "loss": 0.4303, "lr": 0.0006597015800169116, "epoch": 9.13784067085954, "percentage": 45.69, "elapsed_time": "0:44:42", "remaining_time": "0:53:09", "throughput": 4244.4, "total_tokens": 11386760} {"current_steps": 17440, "total_steps": 38160, "loss": 0.4555, "lr": 0.0006594848564253705, "epoch": 9.140461215932914, "percentage": 45.7, "elapsed_time": "0:44:43", "remaining_time": "0:53:08", "throughput": 4244.35, "total_tokens": 11389352} {"current_steps": 17445, "total_steps": 38160, "loss": 0.5289, "lr": 0.0006592680994714171, "epoch": 9.14308176100629, "percentage": 45.72, "elapsed_time": "0:44:44", "remaining_time": "0:53:07", "throughput": 4244.41, "total_tokens": 11392584} {"current_steps": 17450, "total_steps": 38160, "loss": 0.4557, "lr": 0.0006590513092003943, "epoch": 9.145702306079665, "percentage": 45.73, "elapsed_time": "0:44:44", "remaining_time": "0:53:06", "throughput": 4244.45, "total_tokens": 11395688} {"current_steps": 17455, "total_steps": 38160, "loss": 0.4043, "lr": 0.0006588344856576521, "epoch": 9.14832285115304, "percentage": 45.74, "elapsed_time": "0:44:45", "remaining_time": "0:53:05", "throughput": 4244.46, "total_tokens": 11398696} {"current_steps": 17460, "total_steps": 38160, "loss": 0.5093, "lr": 0.0006586176288885475, "epoch": 9.150943396226415, "percentage": 45.75, "elapsed_time": "0:44:46", "remaining_time": "0:53:04", "throughput": 4244.63, "total_tokens": 11402536} {"current_steps": 17465, "total_steps": 38160, "loss": 0.4833, "lr": 0.0006584007389384446, "epoch": 9.15356394129979, "percentage": 45.77, "elapsed_time": "0:44:47", "remaining_time": "0:53:04", "throughput": 4244.68, "total_tokens": 11405704} {"current_steps": 17470, "total_steps": 38160, "loss": 0.5133, "lr": 0.0006581838158527144, "epoch": 9.156184486373165, "percentage": 45.78, "elapsed_time": "0:44:47", "remaining_time": "0:53:03", "throughput": 4244.67, "total_tokens": 11408648} {"current_steps": 17475, "total_steps": 38160, "loss": 0.4746, "lr": 0.0006579668596767343, "epoch": 9.15880503144654, "percentage": 45.79, "elapsed_time": "0:44:48", "remaining_time": "0:53:02", "throughput": 4244.73, "total_tokens": 11411816} {"current_steps": 17480, "total_steps": 38160, "loss": 0.3955, "lr": 0.0006577498704558894, "epoch": 9.161425576519916, "percentage": 45.81, "elapsed_time": "0:44:49", "remaining_time": "0:53:01", "throughput": 4244.78, "total_tokens": 11414952} {"current_steps": 17485, "total_steps": 38160, "loss": 0.4437, "lr": 0.0006575328482355715, "epoch": 9.164046121593291, "percentage": 45.82, "elapsed_time": "0:44:49", "remaining_time": "0:53:00", "throughput": 4244.87, "total_tokens": 11418344} {"current_steps": 17490, "total_steps": 38160, "loss": 0.5206, "lr": 0.0006573157930611788, "epoch": 9.166666666666666, "percentage": 45.83, "elapsed_time": "0:44:50", "remaining_time": "0:52:59", "throughput": 4244.86, "total_tokens": 11421128} {"current_steps": 17495, "total_steps": 38160, "loss": 0.3981, "lr": 0.000657098704978117, "epoch": 9.169287211740041, "percentage": 45.85, "elapsed_time": "0:44:51", "remaining_time": "0:52:58", "throughput": 4244.87, "total_tokens": 11424072} {"current_steps": 17500, "total_steps": 38160, "loss": 0.5026, "lr": 0.0006568815840317984, "epoch": 9.171907756813416, "percentage": 45.86, "elapsed_time": "0:44:51", "remaining_time": "0:52:58", "throughput": 4244.88, "total_tokens": 11426952} {"current_steps": 17505, "total_steps": 38160, "loss": 0.3259, "lr": 0.0006566644302676422, "epoch": 9.174528301886792, "percentage": 45.87, "elapsed_time": "0:44:52", "remaining_time": "0:52:57", "throughput": 4245.08, "total_tokens": 11430984} {"current_steps": 17510, "total_steps": 38160, "loss": 0.2978, "lr": 0.0006564472437310746, "epoch": 9.177148846960169, "percentage": 45.89, "elapsed_time": "0:44:53", "remaining_time": "0:52:56", "throughput": 4245.13, "total_tokens": 11434184} {"current_steps": 17515, "total_steps": 38160, "loss": 0.638, "lr": 0.0006562300244675283, "epoch": 9.179769392033544, "percentage": 45.9, "elapsed_time": "0:44:54", "remaining_time": "0:52:55", "throughput": 4245.07, "total_tokens": 11436680} {"current_steps": 17520, "total_steps": 38160, "loss": 0.4052, "lr": 0.0006560127725224432, "epoch": 9.182389937106919, "percentage": 45.91, "elapsed_time": "0:44:54", "remaining_time": "0:52:54", "throughput": 4245.11, "total_tokens": 11439784} {"current_steps": 17525, "total_steps": 38160, "loss": 0.502, "lr": 0.0006557954879412662, "epoch": 9.185010482180294, "percentage": 45.93, "elapsed_time": "0:44:55", "remaining_time": "0:52:53", "throughput": 4245.07, "total_tokens": 11442440} {"current_steps": 17530, "total_steps": 38160, "loss": 0.4366, "lr": 0.0006555781707694506, "epoch": 9.18763102725367, "percentage": 45.94, "elapsed_time": "0:44:56", "remaining_time": "0:52:52", "throughput": 4245.05, "total_tokens": 11445096} {"current_steps": 17535, "total_steps": 38160, "loss": 0.5466, "lr": 0.0006553608210524564, "epoch": 9.190251572327044, "percentage": 45.95, "elapsed_time": "0:44:56", "remaining_time": "0:52:52", "throughput": 4245.18, "total_tokens": 11448712} {"current_steps": 17540, "total_steps": 38160, "loss": 0.4238, "lr": 0.0006551434388357509, "epoch": 9.19287211740042, "percentage": 45.96, "elapsed_time": "0:44:57", "remaining_time": "0:52:51", "throughput": 4245.1, "total_tokens": 11451080} {"current_steps": 17545, "total_steps": 38160, "loss": 0.3315, "lr": 0.000654926024164808, "epoch": 9.195492662473795, "percentage": 45.98, "elapsed_time": "0:44:58", "remaining_time": "0:52:50", "throughput": 4245.13, "total_tokens": 11454120} {"current_steps": 17550, "total_steps": 38160, "loss": 0.4316, "lr": 0.0006547085770851084, "epoch": 9.19811320754717, "percentage": 45.99, "elapsed_time": "0:44:58", "remaining_time": "0:52:49", "throughput": 4245.22, "total_tokens": 11457544} {"current_steps": 17555, "total_steps": 38160, "loss": 0.3645, "lr": 0.0006544910976421395, "epoch": 9.200733752620545, "percentage": 46.0, "elapsed_time": "0:44:59", "remaining_time": "0:52:48", "throughput": 4245.4, "total_tokens": 11461384} {"current_steps": 17560, "total_steps": 38160, "loss": 0.4506, "lr": 0.0006542735858813953, "epoch": 9.20335429769392, "percentage": 46.02, "elapsed_time": "0:45:00", "remaining_time": "0:52:47", "throughput": 4245.4, "total_tokens": 11464328} {"current_steps": 17565, "total_steps": 38160, "loss": 0.4507, "lr": 0.0006540560418483771, "epoch": 9.205974842767295, "percentage": 46.03, "elapsed_time": "0:45:01", "remaining_time": "0:52:47", "throughput": 4245.41, "total_tokens": 11467176} {"current_steps": 17570, "total_steps": 38160, "loss": 0.4381, "lr": 0.0006538384655885925, "epoch": 9.20859538784067, "percentage": 46.04, "elapsed_time": "0:45:01", "remaining_time": "0:52:46", "throughput": 4245.38, "total_tokens": 11469832} {"current_steps": 17575, "total_steps": 38160, "loss": 0.3683, "lr": 0.000653620857147556, "epoch": 9.211215932914046, "percentage": 46.06, "elapsed_time": "0:45:02", "remaining_time": "0:52:45", "throughput": 4245.38, "total_tokens": 11472680} {"current_steps": 17580, "total_steps": 38160, "loss": 0.4458, "lr": 0.0006534032165707887, "epoch": 9.213836477987421, "percentage": 46.07, "elapsed_time": "0:45:03", "remaining_time": "0:52:44", "throughput": 4245.4, "total_tokens": 11475656} {"current_steps": 17585, "total_steps": 38160, "loss": 0.4916, "lr": 0.0006531855439038187, "epoch": 9.216457023060796, "percentage": 46.08, "elapsed_time": "0:45:04", "remaining_time": "0:52:43", "throughput": 4245.74, "total_tokens": 11480488} {"current_steps": 17590, "total_steps": 38160, "loss": 0.3878, "lr": 0.0006529678391921805, "epoch": 9.219077568134171, "percentage": 46.1, "elapsed_time": "0:45:04", "remaining_time": "0:52:43", "throughput": 4245.88, "total_tokens": 11484232} {"current_steps": 17595, "total_steps": 38160, "loss": 0.4571, "lr": 0.0006527501024814155, "epoch": 9.221698113207546, "percentage": 46.11, "elapsed_time": "0:45:05", "remaining_time": "0:52:42", "throughput": 4245.85, "total_tokens": 11486984} {"current_steps": 17600, "total_steps": 38160, "loss": 0.3651, "lr": 0.0006525323338170718, "epoch": 9.224318658280922, "percentage": 46.12, "elapsed_time": "0:45:06", "remaining_time": "0:52:41", "throughput": 4245.88, "total_tokens": 11489992} {"current_steps": 17605, "total_steps": 38160, "loss": 0.4767, "lr": 0.000652314533244704, "epoch": 9.226939203354299, "percentage": 46.13, "elapsed_time": "0:45:06", "remaining_time": "0:52:40", "throughput": 4246.07, "total_tokens": 11493960} {"current_steps": 17610, "total_steps": 38160, "loss": 0.5906, "lr": 0.0006520967008098735, "epoch": 9.229559748427674, "percentage": 46.15, "elapsed_time": "0:45:07", "remaining_time": "0:52:39", "throughput": 4246.17, "total_tokens": 11497416} {"current_steps": 17615, "total_steps": 38160, "loss": 0.3957, "lr": 0.0006518788365581485, "epoch": 9.232180293501049, "percentage": 46.16, "elapsed_time": "0:45:08", "remaining_time": "0:52:39", "throughput": 4246.36, "total_tokens": 11501384} {"current_steps": 17620, "total_steps": 38160, "loss": 0.3521, "lr": 0.0006516609405351034, "epoch": 9.234800838574424, "percentage": 46.17, "elapsed_time": "0:45:09", "remaining_time": "0:52:38", "throughput": 4246.45, "total_tokens": 11504744} {"current_steps": 17625, "total_steps": 38160, "loss": 0.4977, "lr": 0.00065144301278632, "epoch": 9.2374213836478, "percentage": 46.19, "elapsed_time": "0:45:09", "remaining_time": "0:52:37", "throughput": 4246.45, "total_tokens": 11507592} {"current_steps": 17630, "total_steps": 38160, "loss": 0.4413, "lr": 0.0006512250533573862, "epoch": 9.240041928721174, "percentage": 46.2, "elapsed_time": "0:45:10", "remaining_time": "0:52:36", "throughput": 4246.47, "total_tokens": 11510568} {"current_steps": 17635, "total_steps": 38160, "loss": 0.5459, "lr": 0.0006510070622938962, "epoch": 9.24266247379455, "percentage": 46.21, "elapsed_time": "0:45:11", "remaining_time": "0:52:35", "throughput": 4246.38, "total_tokens": 11512968} {"current_steps": 17640, "total_steps": 38160, "loss": 0.3915, "lr": 0.0006507890396414516, "epoch": 9.245283018867925, "percentage": 46.23, "elapsed_time": "0:45:11", "remaining_time": "0:52:34", "throughput": 4246.35, "total_tokens": 11515560} {"current_steps": 17645, "total_steps": 38160, "loss": 0.3795, "lr": 0.0006505709854456602, "epoch": 9.2479035639413, "percentage": 46.24, "elapsed_time": "0:45:12", "remaining_time": "0:52:33", "throughput": 4246.54, "total_tokens": 11519560} {"current_steps": 17650, "total_steps": 38160, "loss": 0.406, "lr": 0.0006503528997521365, "epoch": 9.250524109014675, "percentage": 46.25, "elapsed_time": "0:45:13", "remaining_time": "0:52:33", "throughput": 4246.57, "total_tokens": 11522568} {"current_steps": 17655, "total_steps": 38160, "loss": 0.4921, "lr": 0.0006501347826065017, "epoch": 9.25314465408805, "percentage": 46.27, "elapsed_time": "0:45:14", "remaining_time": "0:52:32", "throughput": 4246.72, "total_tokens": 11526408} {"current_steps": 17660, "total_steps": 38160, "loss": 0.4187, "lr": 0.000649916634054383, "epoch": 9.255765199161425, "percentage": 46.28, "elapsed_time": "0:45:14", "remaining_time": "0:52:31", "throughput": 4246.79, "total_tokens": 11529672} {"current_steps": 17665, "total_steps": 38160, "loss": 0.4594, "lr": 0.0006496984541414147, "epoch": 9.2583857442348, "percentage": 46.29, "elapsed_time": "0:45:15", "remaining_time": "0:52:30", "throughput": 4246.89, "total_tokens": 11533128} {"current_steps": 17670, "total_steps": 38160, "loss": 0.5512, "lr": 0.0006494802429132378, "epoch": 9.261006289308176, "percentage": 46.31, "elapsed_time": "0:45:16", "remaining_time": "0:52:29", "throughput": 4246.81, "total_tokens": 11535496} {"current_steps": 17675, "total_steps": 38160, "loss": 0.5087, "lr": 0.0006492620004154993, "epoch": 9.26362683438155, "percentage": 46.32, "elapsed_time": "0:45:16", "remaining_time": "0:52:28", "throughput": 4246.8, "total_tokens": 11538280} {"current_steps": 17680, "total_steps": 38160, "loss": 0.4077, "lr": 0.0006490437266938534, "epoch": 9.266247379454926, "percentage": 46.33, "elapsed_time": "0:45:17", "remaining_time": "0:52:28", "throughput": 4247.13, "total_tokens": 11543080} {"current_steps": 17685, "total_steps": 38160, "loss": 0.4955, "lr": 0.0006488254217939601, "epoch": 9.268867924528301, "percentage": 46.34, "elapsed_time": "0:45:18", "remaining_time": "0:52:27", "throughput": 4247.18, "total_tokens": 11546248} {"current_steps": 17690, "total_steps": 38160, "loss": 0.5238, "lr": 0.0006486070857614863, "epoch": 9.271488469601676, "percentage": 46.36, "elapsed_time": "0:45:19", "remaining_time": "0:52:26", "throughput": 4247.21, "total_tokens": 11549352} {"current_steps": 17695, "total_steps": 38160, "loss": 0.4462, "lr": 0.0006483887186421059, "epoch": 9.274109014675052, "percentage": 46.37, "elapsed_time": "0:45:19", "remaining_time": "0:52:25", "throughput": 4247.28, "total_tokens": 11552552} {"current_steps": 17700, "total_steps": 38160, "loss": 0.4579, "lr": 0.0006481703204814982, "epoch": 9.276729559748428, "percentage": 46.38, "elapsed_time": "0:45:20", "remaining_time": "0:52:24", "throughput": 4247.2, "total_tokens": 11554920} {"current_steps": 17705, "total_steps": 38160, "loss": 0.4701, "lr": 0.00064795189132535, "epoch": 9.279350104821804, "percentage": 46.4, "elapsed_time": "0:45:21", "remaining_time": "0:52:23", "throughput": 4247.2, "total_tokens": 11557800} {"current_steps": 17710, "total_steps": 38160, "loss": 0.5354, "lr": 0.000647733431219354, "epoch": 9.281970649895179, "percentage": 46.41, "elapsed_time": "0:45:21", "remaining_time": "0:52:23", "throughput": 4247.19, "total_tokens": 11560616} {"current_steps": 17715, "total_steps": 38160, "loss": 0.4934, "lr": 0.0006475149402092097, "epoch": 9.284591194968554, "percentage": 46.42, "elapsed_time": "0:45:22", "remaining_time": "0:52:22", "throughput": 4247.38, "total_tokens": 11564552} {"current_steps": 17720, "total_steps": 38160, "loss": 0.3841, "lr": 0.0006472964183406229, "epoch": 9.28721174004193, "percentage": 46.44, "elapsed_time": "0:45:23", "remaining_time": "0:52:21", "throughput": 4247.45, "total_tokens": 11567976} {"current_steps": 17725, "total_steps": 38160, "loss": 0.6287, "lr": 0.0006470778656593055, "epoch": 9.289832285115304, "percentage": 46.45, "elapsed_time": "0:45:24", "remaining_time": "0:52:20", "throughput": 4247.5, "total_tokens": 11571144} {"current_steps": 17730, "total_steps": 38160, "loss": 0.4433, "lr": 0.0006468592822109769, "epoch": 9.29245283018868, "percentage": 46.46, "elapsed_time": "0:45:24", "remaining_time": "0:52:19", "throughput": 4247.62, "total_tokens": 11574664} {"current_steps": 17735, "total_steps": 38160, "loss": 0.4228, "lr": 0.0006466406680413619, "epoch": 9.295073375262055, "percentage": 46.48, "elapsed_time": "0:45:25", "remaining_time": "0:52:19", "throughput": 4247.7, "total_tokens": 11577896} {"current_steps": 17740, "total_steps": 38160, "loss": 0.4995, "lr": 0.000646422023196192, "epoch": 9.29769392033543, "percentage": 46.49, "elapsed_time": "0:45:26", "remaining_time": "0:52:18", "throughput": 4247.86, "total_tokens": 11581608} {"current_steps": 17745, "total_steps": 38160, "loss": 0.303, "lr": 0.0006462033477212054, "epoch": 9.300314465408805, "percentage": 46.5, "elapsed_time": "0:45:27", "remaining_time": "0:52:17", "throughput": 4247.94, "total_tokens": 11584936} {"current_steps": 17750, "total_steps": 38160, "loss": 0.4762, "lr": 0.0006459846416621462, "epoch": 9.30293501048218, "percentage": 46.51, "elapsed_time": "0:45:27", "remaining_time": "0:52:16", "throughput": 4248.04, "total_tokens": 11588360} {"current_steps": 17755, "total_steps": 38160, "loss": 0.3546, "lr": 0.0006457659050647657, "epoch": 9.305555555555555, "percentage": 46.53, "elapsed_time": "0:45:28", "remaining_time": "0:52:15", "throughput": 4247.95, "total_tokens": 11590760} {"current_steps": 17760, "total_steps": 38160, "loss": 0.5726, "lr": 0.0006455471379748208, "epoch": 9.30817610062893, "percentage": 46.54, "elapsed_time": "0:45:29", "remaining_time": "0:52:14", "throughput": 4247.97, "total_tokens": 11593736} {"current_steps": 17765, "total_steps": 38160, "loss": 0.4373, "lr": 0.000645328340438075, "epoch": 9.310796645702306, "percentage": 46.55, "elapsed_time": "0:45:29", "remaining_time": "0:52:14", "throughput": 4248.06, "total_tokens": 11597192} {"current_steps": 17770, "total_steps": 38160, "loss": 0.4365, "lr": 0.0006451095125002985, "epoch": 9.31341719077568, "percentage": 46.57, "elapsed_time": "0:45:30", "remaining_time": "0:52:13", "throughput": 4248.2, "total_tokens": 11601000} {"current_steps": 17775, "total_steps": 38160, "loss": 0.5281, "lr": 0.0006448906542072674, "epoch": 9.316037735849056, "percentage": 46.58, "elapsed_time": "0:45:31", "remaining_time": "0:52:12", "throughput": 4248.17, "total_tokens": 11603624} {"current_steps": 17780, "total_steps": 38160, "loss": 0.4558, "lr": 0.0006446717656047645, "epoch": 9.318658280922431, "percentage": 46.59, "elapsed_time": "0:45:32", "remaining_time": "0:52:11", "throughput": 4248.37, "total_tokens": 11607656} {"current_steps": 17785, "total_steps": 38160, "loss": 0.5315, "lr": 0.0006444528467385789, "epoch": 9.321278825995806, "percentage": 46.61, "elapsed_time": "0:45:33", "remaining_time": "0:52:11", "throughput": 4248.66, "total_tokens": 11612168} {"current_steps": 17790, "total_steps": 38160, "loss": 0.4434, "lr": 0.0006442338976545054, "epoch": 9.323899371069182, "percentage": 46.62, "elapsed_time": "0:45:33", "remaining_time": "0:52:10", "throughput": 4248.65, "total_tokens": 11614984} {"current_steps": 17795, "total_steps": 38160, "loss": 0.5199, "lr": 0.0006440149183983461, "epoch": 9.326519916142558, "percentage": 46.63, "elapsed_time": "0:45:34", "remaining_time": "0:52:09", "throughput": 4248.67, "total_tokens": 11618056} {"current_steps": 17800, "total_steps": 38160, "loss": 0.3645, "lr": 0.0006437959090159093, "epoch": 9.329140461215934, "percentage": 46.65, "elapsed_time": "0:45:35", "remaining_time": "0:52:08", "throughput": 4248.63, "total_tokens": 11620616} {"current_steps": 17805, "total_steps": 38160, "loss": 0.3747, "lr": 0.0006435768695530085, "epoch": 9.331761006289309, "percentage": 46.66, "elapsed_time": "0:45:35", "remaining_time": "0:52:07", "throughput": 4248.76, "total_tokens": 11624264} {"current_steps": 17810, "total_steps": 38160, "loss": 0.4476, "lr": 0.0006433578000554645, "epoch": 9.334381551362684, "percentage": 46.67, "elapsed_time": "0:45:36", "remaining_time": "0:52:06", "throughput": 4248.67, "total_tokens": 11626600} {"current_steps": 17815, "total_steps": 38160, "loss": 0.3806, "lr": 0.0006431387005691045, "epoch": 9.33700209643606, "percentage": 46.69, "elapsed_time": "0:45:37", "remaining_time": "0:52:05", "throughput": 4248.67, "total_tokens": 11629416} {"current_steps": 17820, "total_steps": 38160, "loss": 0.3288, "lr": 0.0006429195711397611, "epoch": 9.339622641509434, "percentage": 46.7, "elapsed_time": "0:45:38", "remaining_time": "0:52:05", "throughput": 4248.92, "total_tokens": 11633800} {"current_steps": 17825, "total_steps": 38160, "loss": 0.5756, "lr": 0.0006427004118132742, "epoch": 9.34224318658281, "percentage": 46.71, "elapsed_time": "0:45:38", "remaining_time": "0:52:04", "throughput": 4249.14, "total_tokens": 11637896} {"current_steps": 17830, "total_steps": 38160, "loss": 0.364, "lr": 0.0006424812226354889, "epoch": 9.344863731656185, "percentage": 46.72, "elapsed_time": "0:45:39", "remaining_time": "0:52:03", "throughput": 4249.15, "total_tokens": 11640904} {"current_steps": 17835, "total_steps": 38160, "loss": 0.5777, "lr": 0.0006422620036522574, "epoch": 9.34748427672956, "percentage": 46.74, "elapsed_time": "0:45:40", "remaining_time": "0:52:02", "throughput": 4249.32, "total_tokens": 11644744} {"current_steps": 17840, "total_steps": 38160, "loss": 0.3922, "lr": 0.000642042754909438, "epoch": 9.350104821802935, "percentage": 46.75, "elapsed_time": "0:45:41", "remaining_time": "0:52:02", "throughput": 4249.44, "total_tokens": 11648264} {"current_steps": 17845, "total_steps": 38160, "loss": 0.4071, "lr": 0.0006418234764528945, "epoch": 9.35272536687631, "percentage": 46.76, "elapsed_time": "0:45:41", "remaining_time": "0:52:01", "throughput": 4249.56, "total_tokens": 11651784} {"current_steps": 17850, "total_steps": 38160, "loss": 0.4658, "lr": 0.0006416041683284978, "epoch": 9.355345911949685, "percentage": 46.78, "elapsed_time": "0:45:42", "remaining_time": "0:52:00", "throughput": 4249.7, "total_tokens": 11655400} {"current_steps": 17855, "total_steps": 38160, "loss": 0.33, "lr": 0.0006413848305821246, "epoch": 9.35796645702306, "percentage": 46.79, "elapsed_time": "0:45:43", "remaining_time": "0:51:59", "throughput": 4249.74, "total_tokens": 11658568} {"current_steps": 17860, "total_steps": 38160, "loss": 0.4764, "lr": 0.0006411654632596578, "epoch": 9.360587002096436, "percentage": 46.8, "elapsed_time": "0:45:44", "remaining_time": "0:51:58", "throughput": 4249.74, "total_tokens": 11661448} {"current_steps": 17865, "total_steps": 38160, "loss": 0.4628, "lr": 0.0006409460664069867, "epoch": 9.36320754716981, "percentage": 46.82, "elapsed_time": "0:45:44", "remaining_time": "0:51:58", "throughput": 4249.76, "total_tokens": 11664520} {"current_steps": 17870, "total_steps": 38160, "loss": 0.4264, "lr": 0.0006407266400700064, "epoch": 9.365828092243186, "percentage": 46.83, "elapsed_time": "0:45:45", "remaining_time": "0:51:57", "throughput": 4249.81, "total_tokens": 11667816} {"current_steps": 17875, "total_steps": 38160, "loss": 0.4307, "lr": 0.0006405071842946185, "epoch": 9.368448637316561, "percentage": 46.84, "elapsed_time": "0:45:46", "remaining_time": "0:51:56", "throughput": 4249.79, "total_tokens": 11670632} {"current_steps": 17880, "total_steps": 38160, "loss": 0.3389, "lr": 0.0006402876991267308, "epoch": 9.371069182389936, "percentage": 46.86, "elapsed_time": "0:45:46", "remaining_time": "0:51:55", "throughput": 4249.83, "total_tokens": 11673800} {"current_steps": 17885, "total_steps": 38160, "loss": 0.4842, "lr": 0.0006400681846122568, "epoch": 9.373689727463312, "percentage": 46.87, "elapsed_time": "0:45:47", "remaining_time": "0:51:54", "throughput": 4249.92, "total_tokens": 11677224} {"current_steps": 17890, "total_steps": 38160, "loss": 0.4135, "lr": 0.0006398486407971166, "epoch": 9.376310272536688, "percentage": 46.88, "elapsed_time": "0:45:48", "remaining_time": "0:51:54", "throughput": 4250.01, "total_tokens": 11680648} {"current_steps": 17895, "total_steps": 38160, "loss": 0.3986, "lr": 0.0006396290677272361, "epoch": 9.378930817610064, "percentage": 46.89, "elapsed_time": "0:45:49", "remaining_time": "0:51:53", "throughput": 4250.19, "total_tokens": 11684616} {"current_steps": 17900, "total_steps": 38160, "loss": 0.3688, "lr": 0.0006394094654485477, "epoch": 9.381551362683439, "percentage": 46.91, "elapsed_time": "0:45:49", "remaining_time": "0:51:52", "throughput": 4250.33, "total_tokens": 11688296} {"current_steps": 17905, "total_steps": 38160, "loss": 0.3959, "lr": 0.0006391898340069896, "epoch": 9.384171907756814, "percentage": 46.92, "elapsed_time": "0:45:50", "remaining_time": "0:51:51", "throughput": 4250.34, "total_tokens": 11691240} {"current_steps": 17910, "total_steps": 38160, "loss": 0.3738, "lr": 0.0006389701734485061, "epoch": 9.38679245283019, "percentage": 46.93, "elapsed_time": "0:45:51", "remaining_time": "0:51:50", "throughput": 4250.28, "total_tokens": 11693704} {"current_steps": 17915, "total_steps": 38160, "loss": 0.4102, "lr": 0.0006387504838190479, "epoch": 9.389412997903564, "percentage": 46.95, "elapsed_time": "0:45:51", "remaining_time": "0:51:49", "throughput": 4250.3, "total_tokens": 11696776} {"current_steps": 17920, "total_steps": 38160, "loss": 0.3734, "lr": 0.0006385307651645715, "epoch": 9.39203354297694, "percentage": 46.96, "elapsed_time": "0:45:52", "remaining_time": "0:51:49", "throughput": 4250.28, "total_tokens": 11699496} {"current_steps": 17925, "total_steps": 38160, "loss": 0.4025, "lr": 0.0006383110175310393, "epoch": 9.394654088050315, "percentage": 46.97, "elapsed_time": "0:45:53", "remaining_time": "0:51:48", "throughput": 4250.43, "total_tokens": 11703176} {"current_steps": 17930, "total_steps": 38160, "loss": 0.4878, "lr": 0.0006380912409644202, "epoch": 9.39727463312369, "percentage": 46.99, "elapsed_time": "0:45:54", "remaining_time": "0:51:47", "throughput": 4250.55, "total_tokens": 11706728} {"current_steps": 17935, "total_steps": 38160, "loss": 0.3987, "lr": 0.000637871435510689, "epoch": 9.399895178197065, "percentage": 47.0, "elapsed_time": "0:45:54", "remaining_time": "0:51:46", "throughput": 4250.59, "total_tokens": 11709864} {"current_steps": 17940, "total_steps": 38160, "loss": 0.476, "lr": 0.0006376516012158262, "epoch": 9.40251572327044, "percentage": 47.01, "elapsed_time": "0:45:55", "remaining_time": "0:51:45", "throughput": 4250.84, "total_tokens": 11714152} {"current_steps": 17945, "total_steps": 38160, "loss": 0.4998, "lr": 0.000637431738125819, "epoch": 9.405136268343815, "percentage": 47.03, "elapsed_time": "0:45:56", "remaining_time": "0:51:45", "throughput": 4251.08, "total_tokens": 11718504} {"current_steps": 17950, "total_steps": 38160, "loss": 0.3785, "lr": 0.00063721184628666, "epoch": 9.40775681341719, "percentage": 47.04, "elapsed_time": "0:45:57", "remaining_time": "0:51:44", "throughput": 4251.11, "total_tokens": 11721640} {"current_steps": 17955, "total_steps": 38160, "loss": 0.3954, "lr": 0.0006369919257443484, "epoch": 9.410377358490566, "percentage": 47.05, "elapsed_time": "0:45:58", "remaining_time": "0:51:43", "throughput": 4251.25, "total_tokens": 11725352} {"current_steps": 17960, "total_steps": 38160, "loss": 0.5032, "lr": 0.0006367719765448886, "epoch": 9.41299790356394, "percentage": 47.06, "elapsed_time": "0:45:58", "remaining_time": "0:51:42", "throughput": 4251.24, "total_tokens": 11728168} {"current_steps": 17965, "total_steps": 38160, "loss": 0.5263, "lr": 0.0006365519987342916, "epoch": 9.415618448637316, "percentage": 47.08, "elapsed_time": "0:45:59", "remaining_time": "0:51:41", "throughput": 4251.22, "total_tokens": 11730920} {"current_steps": 17970, "total_steps": 38160, "loss": 0.4328, "lr": 0.0006363319923585746, "epoch": 9.418238993710691, "percentage": 47.09, "elapsed_time": "0:46:00", "remaining_time": "0:51:41", "throughput": 4251.18, "total_tokens": 11733576} {"current_steps": 17975, "total_steps": 38160, "loss": 0.3616, "lr": 0.0006361119574637599, "epoch": 9.420859538784066, "percentage": 47.1, "elapsed_time": "0:46:00", "remaining_time": "0:51:40", "throughput": 4251.29, "total_tokens": 11737096} {"current_steps": 17980, "total_steps": 38160, "loss": 0.512, "lr": 0.0006358918940958767, "epoch": 9.423480083857442, "percentage": 47.12, "elapsed_time": "0:46:01", "remaining_time": "0:51:39", "throughput": 4251.57, "total_tokens": 11741608} {"current_steps": 17985, "total_steps": 38160, "loss": 0.5684, "lr": 0.0006356718023009597, "epoch": 9.426100628930818, "percentage": 47.13, "elapsed_time": "0:46:02", "remaining_time": "0:51:38", "throughput": 4251.61, "total_tokens": 11744776} {"current_steps": 17990, "total_steps": 38160, "loss": 0.4247, "lr": 0.0006354516821250492, "epoch": 9.428721174004194, "percentage": 47.14, "elapsed_time": "0:46:03", "remaining_time": "0:51:37", "throughput": 4251.57, "total_tokens": 11747432} {"current_steps": 17995, "total_steps": 38160, "loss": 0.4206, "lr": 0.0006352315336141923, "epoch": 9.431341719077569, "percentage": 47.16, "elapsed_time": "0:46:03", "remaining_time": "0:51:36", "throughput": 4251.54, "total_tokens": 11750088} {"current_steps": 18000, "total_steps": 38160, "loss": 0.2861, "lr": 0.0006350113568144414, "epoch": 9.433962264150944, "percentage": 47.17, "elapsed_time": "0:46:04", "remaining_time": "0:51:36", "throughput": 4251.61, "total_tokens": 11753480} {"current_steps": 18005, "total_steps": 38160, "loss": 0.3948, "lr": 0.0006347911517718547, "epoch": 9.43658280922432, "percentage": 47.18, "elapsed_time": "0:46:05", "remaining_time": "0:51:35", "throughput": 4251.58, "total_tokens": 11756168} {"current_steps": 18010, "total_steps": 38160, "loss": 0.5451, "lr": 0.0006345709185324972, "epoch": 9.439203354297694, "percentage": 47.2, "elapsed_time": "0:46:06", "remaining_time": "0:51:34", "throughput": 4251.92, "total_tokens": 11761032} {"current_steps": 18015, "total_steps": 38160, "loss": 0.4909, "lr": 0.0006343506571424386, "epoch": 9.44182389937107, "percentage": 47.21, "elapsed_time": "0:46:06", "remaining_time": "0:51:33", "throughput": 4252.0, "total_tokens": 11764392} {"current_steps": 18020, "total_steps": 38160, "loss": 0.4525, "lr": 0.0006341303676477552, "epoch": 9.444444444444445, "percentage": 47.22, "elapsed_time": "0:46:07", "remaining_time": "0:51:33", "throughput": 4252.0, "total_tokens": 11767272} {"current_steps": 18025, "total_steps": 38160, "loss": 0.6169, "lr": 0.0006339100500945293, "epoch": 9.44706498951782, "percentage": 47.24, "elapsed_time": "0:46:08", "remaining_time": "0:51:32", "throughput": 4252.02, "total_tokens": 11770248} {"current_steps": 18030, "total_steps": 38160, "loss": 0.4218, "lr": 0.0006336897045288486, "epoch": 9.449685534591195, "percentage": 47.25, "elapsed_time": "0:46:08", "remaining_time": "0:51:31", "throughput": 4252.1, "total_tokens": 11773704} {"current_steps": 18035, "total_steps": 38160, "loss": 0.3642, "lr": 0.0006334693309968068, "epoch": 9.45230607966457, "percentage": 47.26, "elapsed_time": "0:46:09", "remaining_time": "0:51:30", "throughput": 4252.07, "total_tokens": 11776328} {"current_steps": 18040, "total_steps": 38160, "loss": 0.4545, "lr": 0.0006332489295445038, "epoch": 9.454926624737945, "percentage": 47.27, "elapsed_time": "0:46:10", "remaining_time": "0:51:29", "throughput": 4252.1, "total_tokens": 11779400} {"current_steps": 18045, "total_steps": 38160, "loss": 0.3624, "lr": 0.0006330285002180448, "epoch": 9.45754716981132, "percentage": 47.29, "elapsed_time": "0:46:10", "remaining_time": "0:51:28", "throughput": 4252.0, "total_tokens": 11781672} {"current_steps": 18050, "total_steps": 38160, "loss": 0.5188, "lr": 0.0006328080430635412, "epoch": 9.460167714884696, "percentage": 47.3, "elapsed_time": "0:46:11", "remaining_time": "0:51:27", "throughput": 4251.99, "total_tokens": 11784552} {"current_steps": 18055, "total_steps": 38160, "loss": 0.5165, "lr": 0.0006325875581271103, "epoch": 9.46278825995807, "percentage": 47.31, "elapsed_time": "0:46:12", "remaining_time": "0:51:27", "throughput": 4252.03, "total_tokens": 11787624} {"current_steps": 18060, "total_steps": 38160, "loss": 0.5417, "lr": 0.0006323670454548749, "epoch": 9.465408805031446, "percentage": 47.33, "elapsed_time": "0:46:13", "remaining_time": "0:51:26", "throughput": 4252.22, "total_tokens": 11791784} {"current_steps": 18065, "total_steps": 38160, "loss": 0.382, "lr": 0.0006321465050929635, "epoch": 9.468029350104821, "percentage": 47.34, "elapsed_time": "0:46:13", "remaining_time": "0:51:25", "throughput": 4252.26, "total_tokens": 11794824} {"current_steps": 18070, "total_steps": 38160, "loss": 0.4133, "lr": 0.000631925937087511, "epoch": 9.470649895178196, "percentage": 47.35, "elapsed_time": "0:46:15", "remaining_time": "0:51:25", "throughput": 4253.1, "total_tokens": 11803304} {"current_steps": 18075, "total_steps": 38160, "loss": 0.4393, "lr": 0.0006317053414846576, "epoch": 9.473270440251572, "percentage": 47.37, "elapsed_time": "0:46:16", "remaining_time": "0:51:24", "throughput": 4253.3, "total_tokens": 11807304} {"current_steps": 18080, "total_steps": 38160, "loss": 0.4642, "lr": 0.0006314847183305492, "epoch": 9.475890985324948, "percentage": 47.38, "elapsed_time": "0:46:16", "remaining_time": "0:51:23", "throughput": 4253.31, "total_tokens": 11810376} {"current_steps": 18085, "total_steps": 38160, "loss": 0.3905, "lr": 0.0006312640676713378, "epoch": 9.478511530398324, "percentage": 47.39, "elapsed_time": "0:46:17", "remaining_time": "0:51:23", "throughput": 4253.33, "total_tokens": 11813352} {"current_steps": 18090, "total_steps": 38160, "loss": 0.4199, "lr": 0.0006310433895531811, "epoch": 9.481132075471699, "percentage": 47.41, "elapsed_time": "0:46:18", "remaining_time": "0:51:22", "throughput": 4253.36, "total_tokens": 11816392} {"current_steps": 18095, "total_steps": 38160, "loss": 0.4911, "lr": 0.0006308226840222422, "epoch": 9.483752620545074, "percentage": 47.42, "elapsed_time": "0:46:18", "remaining_time": "0:51:21", "throughput": 4253.46, "total_tokens": 11819816} {"current_steps": 18100, "total_steps": 38160, "loss": 0.4251, "lr": 0.0006306019511246905, "epoch": 9.48637316561845, "percentage": 47.43, "elapsed_time": "0:46:19", "remaining_time": "0:51:20", "throughput": 4253.62, "total_tokens": 11823752} {"current_steps": 18105, "total_steps": 38160, "loss": 0.4492, "lr": 0.0006303811909067003, "epoch": 9.488993710691824, "percentage": 47.44, "elapsed_time": "0:46:20", "remaining_time": "0:51:19", "throughput": 4253.57, "total_tokens": 11826248} {"current_steps": 18110, "total_steps": 38160, "loss": 0.3951, "lr": 0.0006301604034144527, "epoch": 9.4916142557652, "percentage": 47.46, "elapsed_time": "0:46:21", "remaining_time": "0:51:19", "throughput": 4253.79, "total_tokens": 11830504} {"current_steps": 18115, "total_steps": 38160, "loss": 0.4382, "lr": 0.0006299395886941336, "epoch": 9.494234800838575, "percentage": 47.47, "elapsed_time": "0:46:21", "remaining_time": "0:51:18", "throughput": 4253.7, "total_tokens": 11832872} {"current_steps": 18120, "total_steps": 38160, "loss": 0.5824, "lr": 0.0006297187467919347, "epoch": 9.49685534591195, "percentage": 47.48, "elapsed_time": "0:46:22", "remaining_time": "0:51:17", "throughput": 4253.71, "total_tokens": 11835688} {"current_steps": 18125, "total_steps": 38160, "loss": 0.4658, "lr": 0.0006294978777540542, "epoch": 9.499475890985325, "percentage": 47.5, "elapsed_time": "0:46:23", "remaining_time": "0:51:16", "throughput": 4253.91, "total_tokens": 11839720} {"current_steps": 18130, "total_steps": 38160, "loss": 0.4428, "lr": 0.000629276981626695, "epoch": 9.5020964360587, "percentage": 47.51, "elapsed_time": "0:46:23", "remaining_time": "0:51:15", "throughput": 4253.94, "total_tokens": 11842856} {"current_steps": 18135, "total_steps": 38160, "loss": 0.4442, "lr": 0.0006290560584560661, "epoch": 9.504716981132075, "percentage": 47.52, "elapsed_time": "0:46:24", "remaining_time": "0:51:14", "throughput": 4254.01, "total_tokens": 11846216} {"current_steps": 18140, "total_steps": 38160, "loss": 0.4021, "lr": 0.0006288351082883822, "epoch": 9.50733752620545, "percentage": 47.54, "elapsed_time": "0:46:25", "remaining_time": "0:51:14", "throughput": 4253.95, "total_tokens": 11848776} {"current_steps": 18145, "total_steps": 38160, "loss": 0.4998, "lr": 0.0006286141311698633, "epoch": 9.509958071278826, "percentage": 47.55, "elapsed_time": "0:46:26", "remaining_time": "0:51:13", "throughput": 4254.09, "total_tokens": 11852424} {"current_steps": 18150, "total_steps": 38160, "loss": 0.691, "lr": 0.0006283931271467355, "epoch": 9.5125786163522, "percentage": 47.56, "elapsed_time": "0:46:27", "remaining_time": "0:51:12", "throughput": 4254.35, "total_tokens": 11857064} {"current_steps": 18155, "total_steps": 38160, "loss": 0.3738, "lr": 0.0006281720962652305, "epoch": 9.515199161425576, "percentage": 47.58, "elapsed_time": "0:46:27", "remaining_time": "0:51:11", "throughput": 4254.37, "total_tokens": 11860040} {"current_steps": 18160, "total_steps": 38160, "loss": 0.3913, "lr": 0.0006279510385715849, "epoch": 9.517819706498951, "percentage": 47.59, "elapsed_time": "0:46:28", "remaining_time": "0:51:11", "throughput": 4254.48, "total_tokens": 11863688} {"current_steps": 18165, "total_steps": 38160, "loss": 0.319, "lr": 0.0006277299541120419, "epoch": 9.520440251572326, "percentage": 47.6, "elapsed_time": "0:46:29", "remaining_time": "0:51:10", "throughput": 4254.74, "total_tokens": 11868136} {"current_steps": 18170, "total_steps": 38160, "loss": 0.5036, "lr": 0.0006275088429328499, "epoch": 9.523060796645701, "percentage": 47.62, "elapsed_time": "0:46:30", "remaining_time": "0:51:09", "throughput": 4254.75, "total_tokens": 11871176} {"current_steps": 18175, "total_steps": 38160, "loss": 0.393, "lr": 0.0006272877050802623, "epoch": 9.525681341719078, "percentage": 47.63, "elapsed_time": "0:46:30", "remaining_time": "0:51:08", "throughput": 4254.84, "total_tokens": 11874536} {"current_steps": 18180, "total_steps": 38160, "loss": 0.4441, "lr": 0.0006270665406005393, "epoch": 9.528301886792454, "percentage": 47.64, "elapsed_time": "0:46:31", "remaining_time": "0:51:07", "throughput": 4254.92, "total_tokens": 11877992} {"current_steps": 18185, "total_steps": 38160, "loss": 0.385, "lr": 0.0006268453495399455, "epoch": 9.530922431865829, "percentage": 47.65, "elapsed_time": "0:46:32", "remaining_time": "0:51:07", "throughput": 4254.86, "total_tokens": 11880584} {"current_steps": 18190, "total_steps": 38160, "loss": 0.7339, "lr": 0.0006266241319447517, "epoch": 9.533542976939204, "percentage": 47.67, "elapsed_time": "0:46:33", "remaining_time": "0:51:06", "throughput": 4254.98, "total_tokens": 11884200} {"current_steps": 18195, "total_steps": 38160, "loss": 0.4273, "lr": 0.0006264028878612343, "epoch": 9.536163522012579, "percentage": 47.68, "elapsed_time": "0:46:33", "remaining_time": "0:51:05", "throughput": 4254.93, "total_tokens": 11886760} {"current_steps": 18200, "total_steps": 38160, "loss": 0.4377, "lr": 0.0006261816173356746, "epoch": 9.538784067085954, "percentage": 47.69, "elapsed_time": "0:46:34", "remaining_time": "0:51:04", "throughput": 4254.9, "total_tokens": 11889512} {"current_steps": 18205, "total_steps": 38160, "loss": 0.4996, "lr": 0.0006259603204143602, "epoch": 9.54140461215933, "percentage": 47.71, "elapsed_time": "0:46:35", "remaining_time": "0:51:03", "throughput": 4254.96, "total_tokens": 11892776} {"current_steps": 18210, "total_steps": 38160, "loss": 0.3639, "lr": 0.0006257389971435839, "epoch": 9.544025157232705, "percentage": 47.72, "elapsed_time": "0:46:35", "remaining_time": "0:51:02", "throughput": 4254.92, "total_tokens": 11895432} {"current_steps": 18215, "total_steps": 38160, "loss": 0.4117, "lr": 0.0006255176475696437, "epoch": 9.54664570230608, "percentage": 47.73, "elapsed_time": "0:46:36", "remaining_time": "0:51:02", "throughput": 4255.06, "total_tokens": 11899112} {"current_steps": 18220, "total_steps": 38160, "loss": 0.4383, "lr": 0.0006252962717388438, "epoch": 9.549266247379455, "percentage": 47.75, "elapsed_time": "0:46:37", "remaining_time": "0:51:01", "throughput": 4255.04, "total_tokens": 11901928} {"current_steps": 18225, "total_steps": 38160, "loss": 0.6031, "lr": 0.0006250748696974932, "epoch": 9.55188679245283, "percentage": 47.76, "elapsed_time": "0:46:37", "remaining_time": "0:51:00", "throughput": 4255.22, "total_tokens": 11905928} {"current_steps": 18230, "total_steps": 38160, "loss": 0.6252, "lr": 0.0006248534414919067, "epoch": 9.554507337526205, "percentage": 47.77, "elapsed_time": "0:46:38", "remaining_time": "0:50:59", "throughput": 4255.31, "total_tokens": 11909416} {"current_steps": 18235, "total_steps": 38160, "loss": 0.4365, "lr": 0.0006246319871684047, "epoch": 9.55712788259958, "percentage": 47.79, "elapsed_time": "0:46:39", "remaining_time": "0:50:58", "throughput": 4255.41, "total_tokens": 11912840} {"current_steps": 18240, "total_steps": 38160, "loss": 0.635, "lr": 0.000624410506773313, "epoch": 9.559748427672956, "percentage": 47.8, "elapsed_time": "0:46:40", "remaining_time": "0:50:58", "throughput": 4255.57, "total_tokens": 11916648} {"current_steps": 18245, "total_steps": 38160, "loss": 0.5066, "lr": 0.0006241890003529626, "epoch": 9.56236897274633, "percentage": 47.81, "elapsed_time": "0:46:40", "remaining_time": "0:50:57", "throughput": 4255.65, "total_tokens": 11920040} {"current_steps": 18250, "total_steps": 38160, "loss": 0.4709, "lr": 0.00062396746795369, "epoch": 9.564989517819706, "percentage": 47.82, "elapsed_time": "0:46:41", "remaining_time": "0:50:56", "throughput": 4255.67, "total_tokens": 11923048} {"current_steps": 18255, "total_steps": 38160, "loss": 0.4208, "lr": 0.0006237459096218375, "epoch": 9.567610062893081, "percentage": 47.84, "elapsed_time": "0:46:42", "remaining_time": "0:50:55", "throughput": 4255.79, "total_tokens": 11926792} {"current_steps": 18260, "total_steps": 38160, "loss": 0.4249, "lr": 0.0006235243254037525, "epoch": 9.570230607966456, "percentage": 47.85, "elapsed_time": "0:46:43", "remaining_time": "0:50:54", "throughput": 4255.85, "total_tokens": 11930056} {"current_steps": 18265, "total_steps": 38160, "loss": 0.5018, "lr": 0.0006233027153457878, "epoch": 9.572851153039831, "percentage": 47.86, "elapsed_time": "0:46:43", "remaining_time": "0:50:54", "throughput": 4255.85, "total_tokens": 11933096} {"current_steps": 18270, "total_steps": 38160, "loss": 0.3967, "lr": 0.0006230810794943017, "epoch": 9.575471698113208, "percentage": 47.88, "elapsed_time": "0:46:44", "remaining_time": "0:50:53", "throughput": 4255.85, "total_tokens": 11936072} {"current_steps": 18275, "total_steps": 38160, "loss": 0.3885, "lr": 0.0006228594178956581, "epoch": 9.578092243186584, "percentage": 47.89, "elapsed_time": "0:46:45", "remaining_time": "0:50:52", "throughput": 4255.82, "total_tokens": 11938824} {"current_steps": 18280, "total_steps": 38160, "loss": 0.5573, "lr": 0.0006226377305962259, "epoch": 9.580712788259959, "percentage": 47.9, "elapsed_time": "0:46:45", "remaining_time": "0:50:51", "throughput": 4255.74, "total_tokens": 11941224} {"current_steps": 18285, "total_steps": 38160, "loss": 0.5211, "lr": 0.0006224160176423796, "epoch": 9.583333333333334, "percentage": 47.92, "elapsed_time": "0:46:46", "remaining_time": "0:50:50", "throughput": 4255.77, "total_tokens": 11944264} {"current_steps": 18290, "total_steps": 38160, "loss": 0.4249, "lr": 0.0006221942790804989, "epoch": 9.585953878406709, "percentage": 47.93, "elapsed_time": "0:46:47", "remaining_time": "0:50:49", "throughput": 4255.74, "total_tokens": 11946984} {"current_steps": 18295, "total_steps": 38160, "loss": 0.5168, "lr": 0.0006219725149569691, "epoch": 9.588574423480084, "percentage": 47.94, "elapsed_time": "0:46:47", "remaining_time": "0:50:48", "throughput": 4255.74, "total_tokens": 11949864} {"current_steps": 18300, "total_steps": 38160, "loss": 0.4745, "lr": 0.0006217507253181809, "epoch": 9.59119496855346, "percentage": 47.96, "elapsed_time": "0:46:48", "remaining_time": "0:50:48", "throughput": 4255.8, "total_tokens": 11953096} {"current_steps": 18305, "total_steps": 38160, "loss": 0.5258, "lr": 0.0006215289102105297, "epoch": 9.593815513626835, "percentage": 47.97, "elapsed_time": "0:46:49", "remaining_time": "0:50:47", "throughput": 4256.12, "total_tokens": 11958024} {"current_steps": 18310, "total_steps": 38160, "loss": 0.3679, "lr": 0.0006213070696804171, "epoch": 9.59643605870021, "percentage": 47.98, "elapsed_time": "0:46:50", "remaining_time": "0:50:46", "throughput": 4256.28, "total_tokens": 11961960} {"current_steps": 18315, "total_steps": 38160, "loss": 0.5197, "lr": 0.0006210852037742495, "epoch": 9.599056603773585, "percentage": 48.0, "elapsed_time": "0:46:51", "remaining_time": "0:50:46", "throughput": 4256.47, "total_tokens": 11966120} {"current_steps": 18320, "total_steps": 38160, "loss": 0.6778, "lr": 0.0006208633125384385, "epoch": 9.60167714884696, "percentage": 48.01, "elapsed_time": "0:46:52", "remaining_time": "0:50:45", "throughput": 4256.5, "total_tokens": 11969288} {"current_steps": 18325, "total_steps": 38160, "loss": 0.5076, "lr": 0.0006206413960194017, "epoch": 9.604297693920335, "percentage": 48.02, "elapsed_time": "0:46:52", "remaining_time": "0:50:44", "throughput": 4256.45, "total_tokens": 11971880} {"current_steps": 18330, "total_steps": 38160, "loss": 0.4584, "lr": 0.000620419454263561, "epoch": 9.60691823899371, "percentage": 48.03, "elapsed_time": "0:46:53", "remaining_time": "0:50:43", "throughput": 4256.53, "total_tokens": 11975240} {"current_steps": 18335, "total_steps": 38160, "loss": 0.4546, "lr": 0.0006201974873173443, "epoch": 9.609538784067086, "percentage": 48.05, "elapsed_time": "0:46:54", "remaining_time": "0:50:42", "throughput": 4256.74, "total_tokens": 11979432} {"current_steps": 18340, "total_steps": 38160, "loss": 0.4902, "lr": 0.0006199754952271847, "epoch": 9.61215932914046, "percentage": 48.06, "elapsed_time": "0:46:55", "remaining_time": "0:50:42", "throughput": 4256.95, "total_tokens": 11983496} {"current_steps": 18345, "total_steps": 38160, "loss": 0.4562, "lr": 0.00061975347803952, "epoch": 9.614779874213836, "percentage": 48.07, "elapsed_time": "0:46:55", "remaining_time": "0:50:41", "throughput": 4257.08, "total_tokens": 11987208} {"current_steps": 18350, "total_steps": 38160, "loss": 0.3811, "lr": 0.000619531435800794, "epoch": 9.617400419287211, "percentage": 48.09, "elapsed_time": "0:46:56", "remaining_time": "0:50:40", "throughput": 4257.14, "total_tokens": 11990408} {"current_steps": 18355, "total_steps": 38160, "loss": 0.4883, "lr": 0.0006193093685574553, "epoch": 9.620020964360586, "percentage": 48.1, "elapsed_time": "0:46:57", "remaining_time": "0:50:39", "throughput": 4257.12, "total_tokens": 11993192} {"current_steps": 18360, "total_steps": 38160, "loss": 0.5568, "lr": 0.0006190872763559578, "epoch": 9.622641509433961, "percentage": 48.11, "elapsed_time": "0:46:57", "remaining_time": "0:50:38", "throughput": 4257.26, "total_tokens": 11996872} {"current_steps": 18365, "total_steps": 38160, "loss": 0.4163, "lr": 0.0006188651592427609, "epoch": 9.625262054507338, "percentage": 48.13, "elapsed_time": "0:46:58", "remaining_time": "0:50:38", "throughput": 4257.42, "total_tokens": 12000776} {"current_steps": 18370, "total_steps": 38160, "loss": 0.3179, "lr": 0.0006186430172643287, "epoch": 9.627882599580714, "percentage": 48.14, "elapsed_time": "0:46:59", "remaining_time": "0:50:37", "throughput": 4257.53, "total_tokens": 12004200} {"current_steps": 18375, "total_steps": 38160, "loss": 0.3222, "lr": 0.0006184208504671307, "epoch": 9.630503144654089, "percentage": 48.15, "elapsed_time": "0:47:00", "remaining_time": "0:50:36", "throughput": 4257.51, "total_tokens": 12006952} {"current_steps": 18380, "total_steps": 38160, "loss": 0.3982, "lr": 0.000618198658897642, "epoch": 9.633123689727464, "percentage": 48.17, "elapsed_time": "0:47:00", "remaining_time": "0:50:35", "throughput": 4257.48, "total_tokens": 12009640} {"current_steps": 18385, "total_steps": 38160, "loss": 0.4846, "lr": 0.0006179764426023422, "epoch": 9.635744234800839, "percentage": 48.18, "elapsed_time": "0:47:01", "remaining_time": "0:50:34", "throughput": 4257.51, "total_tokens": 12012680} {"current_steps": 18390, "total_steps": 38160, "loss": 0.436, "lr": 0.0006177542016277167, "epoch": 9.638364779874214, "percentage": 48.19, "elapsed_time": "0:47:02", "remaining_time": "0:50:34", "throughput": 4257.6, "total_tokens": 12016168} {"current_steps": 18395, "total_steps": 38160, "loss": 0.4551, "lr": 0.0006175319360202556, "epoch": 9.64098532494759, "percentage": 48.2, "elapsed_time": "0:47:02", "remaining_time": "0:50:33", "throughput": 4257.53, "total_tokens": 12018664} {"current_steps": 18400, "total_steps": 38160, "loss": 0.489, "lr": 0.0006173096458264542, "epoch": 9.643605870020965, "percentage": 48.22, "elapsed_time": "0:47:03", "remaining_time": "0:50:32", "throughput": 4257.64, "total_tokens": 12022280} {"current_steps": 18405, "total_steps": 38160, "loss": 0.3749, "lr": 0.0006170873310928133, "epoch": 9.64622641509434, "percentage": 48.23, "elapsed_time": "0:47:04", "remaining_time": "0:50:31", "throughput": 4257.71, "total_tokens": 12025512} {"current_steps": 18410, "total_steps": 38160, "loss": 0.5443, "lr": 0.0006168649918658387, "epoch": 9.648846960167715, "percentage": 48.24, "elapsed_time": "0:47:05", "remaining_time": "0:50:30", "throughput": 4257.65, "total_tokens": 12027976} {"current_steps": 18415, "total_steps": 38160, "loss": 0.5422, "lr": 0.0006166426281920407, "epoch": 9.65146750524109, "percentage": 48.26, "elapsed_time": "0:47:05", "remaining_time": "0:50:29", "throughput": 4257.73, "total_tokens": 12031400} {"current_steps": 18420, "total_steps": 38160, "loss": 0.4779, "lr": 0.000616420240117936, "epoch": 9.654088050314465, "percentage": 48.27, "elapsed_time": "0:47:06", "remaining_time": "0:50:29", "throughput": 4257.75, "total_tokens": 12034344} {"current_steps": 18425, "total_steps": 38160, "loss": 0.5029, "lr": 0.000616197827690045, "epoch": 9.65670859538784, "percentage": 48.28, "elapsed_time": "0:47:07", "remaining_time": "0:50:28", "throughput": 4258.07, "total_tokens": 12039368} {"current_steps": 18430, "total_steps": 38160, "loss": 0.299, "lr": 0.0006159753909548943, "epoch": 9.659329140461216, "percentage": 48.3, "elapsed_time": "0:47:08", "remaining_time": "0:50:27", "throughput": 4258.17, "total_tokens": 12042760} {"current_steps": 18435, "total_steps": 38160, "loss": 0.3736, "lr": 0.0006157529299590148, "epoch": 9.66194968553459, "percentage": 48.31, "elapsed_time": "0:47:08", "remaining_time": "0:50:26", "throughput": 4258.2, "total_tokens": 12045800} {"current_steps": 18440, "total_steps": 38160, "loss": 0.3984, "lr": 0.000615530444748943, "epoch": 9.664570230607966, "percentage": 48.32, "elapsed_time": "0:47:09", "remaining_time": "0:50:26", "throughput": 4258.33, "total_tokens": 12049544} {"current_steps": 18445, "total_steps": 38160, "loss": 0.4704, "lr": 0.0006153079353712201, "epoch": 9.667190775681341, "percentage": 48.34, "elapsed_time": "0:47:10", "remaining_time": "0:50:25", "throughput": 4258.31, "total_tokens": 12052296} {"current_steps": 18450, "total_steps": 38160, "loss": 0.4943, "lr": 0.0006150854018723926, "epoch": 9.669811320754716, "percentage": 48.35, "elapsed_time": "0:47:10", "remaining_time": "0:50:24", "throughput": 4258.32, "total_tokens": 12055208} {"current_steps": 18455, "total_steps": 38160, "loss": 0.5035, "lr": 0.0006148628442990122, "epoch": 9.672431865828091, "percentage": 48.36, "elapsed_time": "0:47:11", "remaining_time": "0:50:23", "throughput": 4258.57, "total_tokens": 12059624} {"current_steps": 18460, "total_steps": 38160, "loss": 0.425, "lr": 0.0006146402626976351, "epoch": 9.675052410901468, "percentage": 48.38, "elapsed_time": "0:47:12", "remaining_time": "0:50:22", "throughput": 4258.57, "total_tokens": 12062504} {"current_steps": 18465, "total_steps": 38160, "loss": 0.3654, "lr": 0.0006144176571148228, "epoch": 9.677672955974844, "percentage": 48.39, "elapsed_time": "0:47:13", "remaining_time": "0:50:22", "throughput": 4258.67, "total_tokens": 12066024} {"current_steps": 18470, "total_steps": 38160, "loss": 0.3102, "lr": 0.0006141950275971422, "epoch": 9.680293501048219, "percentage": 48.4, "elapsed_time": "0:47:13", "remaining_time": "0:50:21", "throughput": 4258.69, "total_tokens": 12069000} {"current_steps": 18475, "total_steps": 38160, "loss": 0.4834, "lr": 0.0006139723741911644, "epoch": 9.682914046121594, "percentage": 48.41, "elapsed_time": "0:47:14", "remaining_time": "0:50:20", "throughput": 4258.9, "total_tokens": 12073160} {"current_steps": 18480, "total_steps": 38160, "loss": 0.5581, "lr": 0.0006137496969434664, "epoch": 9.685534591194969, "percentage": 48.43, "elapsed_time": "0:47:15", "remaining_time": "0:50:19", "throughput": 4258.98, "total_tokens": 12076552} {"current_steps": 18485, "total_steps": 38160, "loss": 0.4406, "lr": 0.0006135269959006294, "epoch": 9.688155136268344, "percentage": 48.44, "elapsed_time": "0:47:16", "remaining_time": "0:50:18", "throughput": 4259.01, "total_tokens": 12079592} {"current_steps": 18490, "total_steps": 38160, "loss": 0.4899, "lr": 0.00061330427110924, "epoch": 9.69077568134172, "percentage": 48.45, "elapsed_time": "0:47:16", "remaining_time": "0:50:17", "throughput": 4258.98, "total_tokens": 12082376} {"current_steps": 18495, "total_steps": 38160, "loss": 0.4785, "lr": 0.0006130815226158899, "epoch": 9.693396226415095, "percentage": 48.47, "elapsed_time": "0:47:17", "remaining_time": "0:50:17", "throughput": 4258.99, "total_tokens": 12085224} {"current_steps": 18500, "total_steps": 38160, "loss": 0.4471, "lr": 0.0006128587504671753, "epoch": 9.69601677148847, "percentage": 48.48, "elapsed_time": "0:47:18", "remaining_time": "0:50:16", "throughput": 4258.96, "total_tokens": 12087976} {"current_steps": 18505, "total_steps": 38160, "loss": 0.4444, "lr": 0.0006126359547096974, "epoch": 9.698637316561845, "percentage": 48.49, "elapsed_time": "0:47:18", "remaining_time": "0:50:15", "throughput": 4258.91, "total_tokens": 12090696} {"current_steps": 18510, "total_steps": 38160, "loss": 0.4268, "lr": 0.0006124131353900632, "epoch": 9.70125786163522, "percentage": 48.51, "elapsed_time": "0:47:19", "remaining_time": "0:50:14", "throughput": 4259.02, "total_tokens": 12094312} {"current_steps": 18515, "total_steps": 38160, "loss": 0.5107, "lr": 0.0006121902925548833, "epoch": 9.703878406708595, "percentage": 48.52, "elapsed_time": "0:47:20", "remaining_time": "0:50:13", "throughput": 4259.14, "total_tokens": 12097928} {"current_steps": 18520, "total_steps": 38160, "loss": 0.5502, "lr": 0.0006119674262507743, "epoch": 9.70649895178197, "percentage": 48.53, "elapsed_time": "0:47:21", "remaining_time": "0:50:13", "throughput": 4259.27, "total_tokens": 12101576} {"current_steps": 18525, "total_steps": 38160, "loss": 0.4241, "lr": 0.0006117445365243571, "epoch": 9.709119496855346, "percentage": 48.55, "elapsed_time": "0:47:21", "remaining_time": "0:50:12", "throughput": 4259.23, "total_tokens": 12104200} {"current_steps": 18530, "total_steps": 38160, "loss": 0.3376, "lr": 0.0006115216234222575, "epoch": 9.71174004192872, "percentage": 48.56, "elapsed_time": "0:47:22", "remaining_time": "0:50:11", "throughput": 4259.4, "total_tokens": 12108008} {"current_steps": 18535, "total_steps": 38160, "loss": 0.4373, "lr": 0.0006112986869911068, "epoch": 9.714360587002096, "percentage": 48.57, "elapsed_time": "0:47:23", "remaining_time": "0:50:10", "throughput": 4259.46, "total_tokens": 12111240} {"current_steps": 18540, "total_steps": 38160, "loss": 0.3933, "lr": 0.0006110757272775405, "epoch": 9.716981132075471, "percentage": 48.58, "elapsed_time": "0:47:24", "remaining_time": "0:50:09", "throughput": 4259.48, "total_tokens": 12114216} {"current_steps": 18545, "total_steps": 38160, "loss": 0.4875, "lr": 0.0006108527443281992, "epoch": 9.719601677148846, "percentage": 48.6, "elapsed_time": "0:47:24", "remaining_time": "0:50:08", "throughput": 4259.38, "total_tokens": 12116520} {"current_steps": 18550, "total_steps": 38160, "loss": 0.4898, "lr": 0.0006106297381897284, "epoch": 9.722222222222221, "percentage": 48.61, "elapsed_time": "0:47:25", "remaining_time": "0:50:07", "throughput": 4259.34, "total_tokens": 12119208} {"current_steps": 18555, "total_steps": 38160, "loss": 0.4682, "lr": 0.0006104067089087787, "epoch": 9.724842767295598, "percentage": 48.62, "elapsed_time": "0:47:26", "remaining_time": "0:50:07", "throughput": 4259.37, "total_tokens": 12122248} {"current_steps": 18560, "total_steps": 38160, "loss": 0.4062, "lr": 0.0006101836565320049, "epoch": 9.727463312368974, "percentage": 48.64, "elapsed_time": "0:47:26", "remaining_time": "0:50:06", "throughput": 4259.48, "total_tokens": 12125800} {"current_steps": 18565, "total_steps": 38160, "loss": 0.5318, "lr": 0.0006099605811060673, "epoch": 9.730083857442349, "percentage": 48.65, "elapsed_time": "0:47:27", "remaining_time": "0:50:05", "throughput": 4259.42, "total_tokens": 12128328} {"current_steps": 18570, "total_steps": 38160, "loss": 0.4216, "lr": 0.0006097374826776307, "epoch": 9.732704402515724, "percentage": 48.66, "elapsed_time": "0:47:28", "remaining_time": "0:50:04", "throughput": 4259.48, "total_tokens": 12131560} {"current_steps": 18575, "total_steps": 38160, "loss": 0.4385, "lr": 0.0006095143612933646, "epoch": 9.735324947589099, "percentage": 48.68, "elapsed_time": "0:47:28", "remaining_time": "0:50:03", "throughput": 4259.42, "total_tokens": 12134024} {"current_steps": 18580, "total_steps": 38160, "loss": 0.5623, "lr": 0.0006092912169999435, "epoch": 9.737945492662474, "percentage": 48.69, "elapsed_time": "0:47:29", "remaining_time": "0:50:02", "throughput": 4259.39, "total_tokens": 12136808} {"current_steps": 18585, "total_steps": 38160, "loss": 0.4756, "lr": 0.0006090680498440465, "epoch": 9.74056603773585, "percentage": 48.7, "elapsed_time": "0:47:30", "remaining_time": "0:50:02", "throughput": 4259.53, "total_tokens": 12140488} {"current_steps": 18590, "total_steps": 38160, "loss": 0.3293, "lr": 0.0006088448598723581, "epoch": 9.743186582809225, "percentage": 48.72, "elapsed_time": "0:47:30", "remaining_time": "0:50:01", "throughput": 4259.65, "total_tokens": 12144104} {"current_steps": 18595, "total_steps": 38160, "loss": 0.4631, "lr": 0.0006086216471315666, "epoch": 9.7458071278826, "percentage": 48.73, "elapsed_time": "0:47:31", "remaining_time": "0:50:00", "throughput": 4259.72, "total_tokens": 12147464} {"current_steps": 18600, "total_steps": 38160, "loss": 0.3998, "lr": 0.0006083984116683659, "epoch": 9.748427672955975, "percentage": 48.74, "elapsed_time": "0:47:32", "remaining_time": "0:49:59", "throughput": 4259.79, "total_tokens": 12150760} {"current_steps": 18605, "total_steps": 38160, "loss": 0.5643, "lr": 0.0006081751535294539, "epoch": 9.75104821802935, "percentage": 48.76, "elapsed_time": "0:47:33", "remaining_time": "0:49:58", "throughput": 4259.83, "total_tokens": 12153896} {"current_steps": 18610, "total_steps": 38160, "loss": 0.3765, "lr": 0.0006079518727615341, "epoch": 9.753668763102725, "percentage": 48.77, "elapsed_time": "0:47:33", "remaining_time": "0:49:57", "throughput": 4259.81, "total_tokens": 12156584} {"current_steps": 18615, "total_steps": 38160, "loss": 0.3757, "lr": 0.0006077285694113141, "epoch": 9.7562893081761, "percentage": 48.78, "elapsed_time": "0:47:34", "remaining_time": "0:49:57", "throughput": 4260.02, "total_tokens": 12160648} {"current_steps": 18620, "total_steps": 38160, "loss": 0.4625, "lr": 0.0006075052435255062, "epoch": 9.758909853249476, "percentage": 48.79, "elapsed_time": "0:47:35", "remaining_time": "0:49:56", "throughput": 4260.02, "total_tokens": 12163496} {"current_steps": 18625, "total_steps": 38160, "loss": 0.6049, "lr": 0.000607281895150828, "epoch": 9.76153039832285, "percentage": 48.81, "elapsed_time": "0:47:35", "remaining_time": "0:49:55", "throughput": 4259.92, "total_tokens": 12165800} {"current_steps": 18630, "total_steps": 38160, "loss": 0.5575, "lr": 0.0006070585243340013, "epoch": 9.764150943396226, "percentage": 48.82, "elapsed_time": "0:47:36", "remaining_time": "0:49:54", "throughput": 4259.97, "total_tokens": 12169064} {"current_steps": 18635, "total_steps": 38160, "loss": 0.4776, "lr": 0.0006068351311217526, "epoch": 9.766771488469601, "percentage": 48.83, "elapsed_time": "0:47:37", "remaining_time": "0:49:53", "throughput": 4259.94, "total_tokens": 12171816} {"current_steps": 18640, "total_steps": 38160, "loss": 0.4154, "lr": 0.0006066117155608135, "epoch": 9.769392033542976, "percentage": 48.85, "elapsed_time": "0:47:38", "remaining_time": "0:49:52", "throughput": 4260.03, "total_tokens": 12175368} {"current_steps": 18645, "total_steps": 38160, "loss": 0.535, "lr": 0.0006063882776979196, "epoch": 9.772012578616351, "percentage": 48.86, "elapsed_time": "0:47:38", "remaining_time": "0:49:52", "throughput": 4260.27, "total_tokens": 12179752} {"current_steps": 18650, "total_steps": 38160, "loss": 0.4757, "lr": 0.0006061648175798117, "epoch": 9.774633123689728, "percentage": 48.87, "elapsed_time": "0:47:39", "remaining_time": "0:49:51", "throughput": 4260.3, "total_tokens": 12182888} {"current_steps": 18655, "total_steps": 38160, "loss": 0.3703, "lr": 0.0006059413352532355, "epoch": 9.777253668763104, "percentage": 48.89, "elapsed_time": "0:47:40", "remaining_time": "0:49:50", "throughput": 4260.35, "total_tokens": 12186024} {"current_steps": 18660, "total_steps": 38160, "loss": 0.3969, "lr": 0.0006057178307649402, "epoch": 9.779874213836479, "percentage": 48.9, "elapsed_time": "0:47:40", "remaining_time": "0:49:49", "throughput": 4260.3, "total_tokens": 12188680} {"current_steps": 18665, "total_steps": 38160, "loss": 0.4739, "lr": 0.000605494304161681, "epoch": 9.782494758909854, "percentage": 48.91, "elapsed_time": "0:47:41", "remaining_time": "0:49:48", "throughput": 4260.38, "total_tokens": 12192040} {"current_steps": 18670, "total_steps": 38160, "loss": 0.5169, "lr": 0.0006052707554902169, "epoch": 9.785115303983229, "percentage": 48.93, "elapsed_time": "0:47:42", "remaining_time": "0:49:48", "throughput": 4260.46, "total_tokens": 12195400} {"current_steps": 18675, "total_steps": 38160, "loss": 0.4593, "lr": 0.0006050471847973117, "epoch": 9.787735849056604, "percentage": 48.94, "elapsed_time": "0:47:43", "remaining_time": "0:49:47", "throughput": 4260.55, "total_tokens": 12198888} {"current_steps": 18680, "total_steps": 38160, "loss": 0.5208, "lr": 0.000604823592129734, "epoch": 9.79035639412998, "percentage": 48.95, "elapsed_time": "0:47:43", "remaining_time": "0:49:46", "throughput": 4260.56, "total_tokens": 12201800} {"current_steps": 18685, "total_steps": 38160, "loss": 0.3877, "lr": 0.0006045999775342566, "epoch": 9.792976939203355, "percentage": 48.96, "elapsed_time": "0:47:44", "remaining_time": "0:49:45", "throughput": 4260.5, "total_tokens": 12204328} {"current_steps": 18690, "total_steps": 38160, "loss": 0.3828, "lr": 0.0006043763410576572, "epoch": 9.79559748427673, "percentage": 48.98, "elapsed_time": "0:47:45", "remaining_time": "0:49:44", "throughput": 4260.52, "total_tokens": 12207432} {"current_steps": 18695, "total_steps": 38160, "loss": 0.3415, "lr": 0.0006041526827467182, "epoch": 9.798218029350105, "percentage": 48.99, "elapsed_time": "0:47:45", "remaining_time": "0:49:43", "throughput": 4260.44, "total_tokens": 12209832} {"current_steps": 18700, "total_steps": 38160, "loss": 0.4573, "lr": 0.000603929002648226, "epoch": 9.80083857442348, "percentage": 49.0, "elapsed_time": "0:47:46", "remaining_time": "0:49:43", "throughput": 4260.43, "total_tokens": 12212648} {"current_steps": 18705, "total_steps": 38160, "loss": 0.2992, "lr": 0.0006037053008089723, "epoch": 9.803459119496855, "percentage": 49.02, "elapsed_time": "0:47:47", "remaining_time": "0:49:42", "throughput": 4260.61, "total_tokens": 12216648} {"current_steps": 18710, "total_steps": 38160, "loss": 0.4698, "lr": 0.0006034815772757528, "epoch": 9.80607966457023, "percentage": 49.03, "elapsed_time": "0:47:48", "remaining_time": "0:49:41", "throughput": 4260.66, "total_tokens": 12219816} {"current_steps": 18715, "total_steps": 38160, "loss": 0.4687, "lr": 0.0006032578320953678, "epoch": 9.808700209643606, "percentage": 49.04, "elapsed_time": "0:47:48", "remaining_time": "0:49:40", "throughput": 4260.87, "total_tokens": 12224040} {"current_steps": 18720, "total_steps": 38160, "loss": 0.4876, "lr": 0.0006030340653146224, "epoch": 9.81132075471698, "percentage": 49.06, "elapsed_time": "0:47:49", "remaining_time": "0:49:40", "throughput": 4261.12, "total_tokens": 12228392} {"current_steps": 18725, "total_steps": 38160, "loss": 0.5814, "lr": 0.0006028102769803261, "epoch": 9.813941299790356, "percentage": 49.07, "elapsed_time": "0:47:50", "remaining_time": "0:49:39", "throughput": 4261.1, "total_tokens": 12231144} {"current_steps": 18730, "total_steps": 38160, "loss": 0.5176, "lr": 0.0006025864671392925, "epoch": 9.816561844863731, "percentage": 49.08, "elapsed_time": "0:47:51", "remaining_time": "0:49:38", "throughput": 4261.29, "total_tokens": 12235176} {"current_steps": 18735, "total_steps": 38160, "loss": 0.5061, "lr": 0.0006023626358383406, "epoch": 9.819182389937106, "percentage": 49.1, "elapsed_time": "0:47:51", "remaining_time": "0:49:37", "throughput": 4261.33, "total_tokens": 12238312} {"current_steps": 18740, "total_steps": 38160, "loss": 0.7069, "lr": 0.0006021387831242932, "epoch": 9.821802935010481, "percentage": 49.11, "elapsed_time": "0:47:52", "remaining_time": "0:49:36", "throughput": 4261.27, "total_tokens": 12240872} {"current_steps": 18745, "total_steps": 38160, "loss": 0.4121, "lr": 0.0006019149090439774, "epoch": 9.824423480083858, "percentage": 49.12, "elapsed_time": "0:47:53", "remaining_time": "0:49:35", "throughput": 4261.32, "total_tokens": 12244008} {"current_steps": 18750, "total_steps": 38160, "loss": 0.6491, "lr": 0.0006016910136442254, "epoch": 9.827044025157234, "percentage": 49.14, "elapsed_time": "0:47:53", "remaining_time": "0:49:35", "throughput": 4261.34, "total_tokens": 12247048} {"current_steps": 18755, "total_steps": 38160, "loss": 0.36, "lr": 0.0006014670969718735, "epoch": 9.829664570230609, "percentage": 49.15, "elapsed_time": "0:47:54", "remaining_time": "0:49:34", "throughput": 4261.36, "total_tokens": 12250056} {"current_steps": 18760, "total_steps": 38160, "loss": 0.3429, "lr": 0.0006012431590737625, "epoch": 9.832285115303984, "percentage": 49.16, "elapsed_time": "0:47:55", "remaining_time": "0:49:33", "throughput": 4261.33, "total_tokens": 12252744} {"current_steps": 18765, "total_steps": 38160, "loss": 0.3385, "lr": 0.0006010191999967378, "epoch": 9.834905660377359, "percentage": 49.17, "elapsed_time": "0:47:55", "remaining_time": "0:49:32", "throughput": 4261.29, "total_tokens": 12255368} {"current_steps": 18770, "total_steps": 38160, "loss": 0.3716, "lr": 0.0006007952197876487, "epoch": 9.837526205450734, "percentage": 49.19, "elapsed_time": "0:47:56", "remaining_time": "0:49:31", "throughput": 4261.45, "total_tokens": 12259304} {"current_steps": 18775, "total_steps": 38160, "loss": 0.4013, "lr": 0.0006005712184933498, "epoch": 9.84014675052411, "percentage": 49.2, "elapsed_time": "0:47:57", "remaining_time": "0:49:30", "throughput": 4261.47, "total_tokens": 12262376} {"current_steps": 18780, "total_steps": 38160, "loss": 0.3318, "lr": 0.0006003471961606992, "epoch": 9.842767295597485, "percentage": 49.21, "elapsed_time": "0:47:58", "remaining_time": "0:49:30", "throughput": 4261.55, "total_tokens": 12265672} {"current_steps": 18785, "total_steps": 38160, "loss": 0.5076, "lr": 0.0006001231528365601, "epoch": 9.84538784067086, "percentage": 49.23, "elapsed_time": "0:47:58", "remaining_time": "0:49:29", "throughput": 4261.59, "total_tokens": 12268904} {"current_steps": 18790, "total_steps": 38160, "loss": 0.4756, "lr": 0.0005998990885677996, "epoch": 9.848008385744235, "percentage": 49.24, "elapsed_time": "0:47:59", "remaining_time": "0:49:28", "throughput": 4261.68, "total_tokens": 12272264} {"current_steps": 18795, "total_steps": 38160, "loss": 0.4144, "lr": 0.0005996750034012895, "epoch": 9.85062893081761, "percentage": 49.25, "elapsed_time": "0:48:00", "remaining_time": "0:49:27", "throughput": 4261.79, "total_tokens": 12275720} {"current_steps": 18800, "total_steps": 38160, "loss": 0.4095, "lr": 0.0005994508973839058, "epoch": 9.853249475890985, "percentage": 49.27, "elapsed_time": "0:48:01", "remaining_time": "0:49:26", "throughput": 4261.77, "total_tokens": 12278440} {"current_steps": 18805, "total_steps": 38160, "loss": 0.4427, "lr": 0.0005992267705625289, "epoch": 9.85587002096436, "percentage": 49.28, "elapsed_time": "0:48:01", "remaining_time": "0:49:25", "throughput": 4261.68, "total_tokens": 12280776} {"current_steps": 18810, "total_steps": 38160, "loss": 0.5527, "lr": 0.0005990026229840439, "epoch": 9.858490566037736, "percentage": 49.29, "elapsed_time": "0:48:02", "remaining_time": "0:49:25", "throughput": 4261.74, "total_tokens": 12284104} {"current_steps": 18815, "total_steps": 38160, "loss": 0.3789, "lr": 0.0005987784546953394, "epoch": 9.86111111111111, "percentage": 49.31, "elapsed_time": "0:48:03", "remaining_time": "0:49:24", "throughput": 4261.85, "total_tokens": 12287848} {"current_steps": 18820, "total_steps": 38160, "loss": 0.4727, "lr": 0.0005985542657433091, "epoch": 9.863731656184486, "percentage": 49.32, "elapsed_time": "0:48:03", "remaining_time": "0:49:23", "throughput": 4261.84, "total_tokens": 12290664} {"current_steps": 18825, "total_steps": 38160, "loss": 0.4057, "lr": 0.000598330056174851, "epoch": 9.866352201257861, "percentage": 49.33, "elapsed_time": "0:48:04", "remaining_time": "0:49:22", "throughput": 4261.87, "total_tokens": 12293928} {"current_steps": 18830, "total_steps": 38160, "loss": 0.3537, "lr": 0.0005981058260368668, "epoch": 9.868972746331236, "percentage": 49.34, "elapsed_time": "0:48:05", "remaining_time": "0:49:21", "throughput": 4261.8, "total_tokens": 12296488} {"current_steps": 18835, "total_steps": 38160, "loss": 0.4914, "lr": 0.0005978815753762632, "epoch": 9.871593291404611, "percentage": 49.36, "elapsed_time": "0:48:06", "remaining_time": "0:49:21", "throughput": 4261.92, "total_tokens": 12300008} {"current_steps": 18840, "total_steps": 38160, "loss": 0.3619, "lr": 0.0005976573042399505, "epoch": 9.874213836477988, "percentage": 49.37, "elapsed_time": "0:48:06", "remaining_time": "0:49:20", "throughput": 4261.98, "total_tokens": 12303240} {"current_steps": 18845, "total_steps": 38160, "loss": 0.477, "lr": 0.000597433012674844, "epoch": 9.876834381551364, "percentage": 49.38, "elapsed_time": "0:48:07", "remaining_time": "0:49:19", "throughput": 4262.01, "total_tokens": 12306312} {"current_steps": 18850, "total_steps": 38160, "loss": 0.39, "lr": 0.0005972087007278628, "epoch": 9.879454926624739, "percentage": 49.4, "elapsed_time": "0:48:08", "remaining_time": "0:49:18", "throughput": 4261.97, "total_tokens": 12309000} {"current_steps": 18855, "total_steps": 38160, "loss": 0.4153, "lr": 0.0005969843684459305, "epoch": 9.882075471698114, "percentage": 49.41, "elapsed_time": "0:48:08", "remaining_time": "0:49:17", "throughput": 4262.13, "total_tokens": 12312904} {"current_steps": 18860, "total_steps": 38160, "loss": 0.3903, "lr": 0.0005967600158759746, "epoch": 9.884696016771489, "percentage": 49.42, "elapsed_time": "0:48:09", "remaining_time": "0:49:16", "throughput": 4262.11, "total_tokens": 12315624} {"current_steps": 18865, "total_steps": 38160, "loss": 0.4963, "lr": 0.0005965356430649276, "epoch": 9.887316561844864, "percentage": 49.44, "elapsed_time": "0:48:10", "remaining_time": "0:49:16", "throughput": 4262.23, "total_tokens": 12319336} {"current_steps": 18870, "total_steps": 38160, "loss": 0.6399, "lr": 0.0005963112500597251, "epoch": 9.88993710691824, "percentage": 49.45, "elapsed_time": "0:48:11", "remaining_time": "0:49:15", "throughput": 4262.19, "total_tokens": 12322088} {"current_steps": 18875, "total_steps": 38160, "loss": 0.4581, "lr": 0.0005960868369073079, "epoch": 9.892557651991615, "percentage": 49.46, "elapsed_time": "0:48:11", "remaining_time": "0:49:14", "throughput": 4262.13, "total_tokens": 12324648} {"current_steps": 18880, "total_steps": 38160, "loss": 0.4291, "lr": 0.0005958624036546208, "epoch": 9.89517819706499, "percentage": 49.48, "elapsed_time": "0:48:12", "remaining_time": "0:49:13", "throughput": 4262.27, "total_tokens": 12328392} {"current_steps": 18885, "total_steps": 38160, "loss": 0.3235, "lr": 0.0005956379503486123, "epoch": 9.897798742138365, "percentage": 49.49, "elapsed_time": "0:48:13", "remaining_time": "0:49:12", "throughput": 4262.41, "total_tokens": 12332200} {"current_steps": 18890, "total_steps": 38160, "loss": 0.3401, "lr": 0.0005954134770362359, "epoch": 9.90041928721174, "percentage": 49.5, "elapsed_time": "0:48:13", "remaining_time": "0:49:12", "throughput": 4262.44, "total_tokens": 12335304} {"current_steps": 18895, "total_steps": 38160, "loss": 0.3496, "lr": 0.0005951889837644486, "epoch": 9.903039832285115, "percentage": 49.52, "elapsed_time": "0:48:14", "remaining_time": "0:49:11", "throughput": 4262.47, "total_tokens": 12338440} {"current_steps": 18900, "total_steps": 38160, "loss": 0.4681, "lr": 0.0005949644705802116, "epoch": 9.90566037735849, "percentage": 49.53, "elapsed_time": "0:48:15", "remaining_time": "0:49:11", "throughput": 4262.99, "total_tokens": 12345192} {"current_steps": 18905, "total_steps": 38160, "loss": 0.4352, "lr": 0.0005947399375304909, "epoch": 9.908280922431866, "percentage": 49.54, "elapsed_time": "0:48:16", "remaining_time": "0:49:10", "throughput": 4263.12, "total_tokens": 12349000} {"current_steps": 18910, "total_steps": 38160, "loss": 0.4082, "lr": 0.0005945153846622563, "epoch": 9.91090146750524, "percentage": 49.55, "elapsed_time": "0:48:17", "remaining_time": "0:49:09", "throughput": 4263.12, "total_tokens": 12351880} {"current_steps": 18915, "total_steps": 38160, "loss": 0.587, "lr": 0.0005942908120224815, "epoch": 9.913522012578616, "percentage": 49.57, "elapsed_time": "0:48:18", "remaining_time": "0:49:08", "throughput": 4263.09, "total_tokens": 12354600} {"current_steps": 18920, "total_steps": 38160, "loss": 0.3585, "lr": 0.0005940662196581443, "epoch": 9.916142557651991, "percentage": 49.58, "elapsed_time": "0:48:18", "remaining_time": "0:49:07", "throughput": 4263.08, "total_tokens": 12357416} {"current_steps": 18925, "total_steps": 38160, "loss": 0.5251, "lr": 0.0005938416076162273, "epoch": 9.918763102725366, "percentage": 49.59, "elapsed_time": "0:48:19", "remaining_time": "0:49:06", "throughput": 4263.14, "total_tokens": 12360616} {"current_steps": 18930, "total_steps": 38160, "loss": 0.4579, "lr": 0.0005936169759437165, "epoch": 9.921383647798741, "percentage": 49.61, "elapsed_time": "0:48:20", "remaining_time": "0:49:06", "throughput": 4263.08, "total_tokens": 12363144} {"current_steps": 18935, "total_steps": 38160, "loss": 0.3993, "lr": 0.0005933923246876024, "epoch": 9.924004192872118, "percentage": 49.62, "elapsed_time": "0:48:20", "remaining_time": "0:49:05", "throughput": 4263.22, "total_tokens": 12366856} {"current_steps": 18940, "total_steps": 38160, "loss": 0.5501, "lr": 0.0005931676538948795, "epoch": 9.926624737945493, "percentage": 49.63, "elapsed_time": "0:48:21", "remaining_time": "0:49:04", "throughput": 4263.38, "total_tokens": 12370824} {"current_steps": 18945, "total_steps": 38160, "loss": 0.4601, "lr": 0.0005929429636125463, "epoch": 9.929245283018869, "percentage": 49.65, "elapsed_time": "0:48:22", "remaining_time": "0:49:03", "throughput": 4263.52, "total_tokens": 12374568} {"current_steps": 18950, "total_steps": 38160, "loss": 0.6144, "lr": 0.0005927182538876055, "epoch": 9.931865828092244, "percentage": 49.66, "elapsed_time": "0:48:23", "remaining_time": "0:49:02", "throughput": 4263.46, "total_tokens": 12377096} {"current_steps": 18955, "total_steps": 38160, "loss": 0.4336, "lr": 0.0005924935247670637, "epoch": 9.934486373165619, "percentage": 49.67, "elapsed_time": "0:48:23", "remaining_time": "0:49:02", "throughput": 4263.48, "total_tokens": 12380072} {"current_steps": 18960, "total_steps": 38160, "loss": 0.3917, "lr": 0.0005922687762979317, "epoch": 9.937106918238994, "percentage": 49.69, "elapsed_time": "0:48:24", "remaining_time": "0:49:01", "throughput": 4263.51, "total_tokens": 12383240} {"current_steps": 18965, "total_steps": 38160, "loss": 0.4668, "lr": 0.0005920440085272245, "epoch": 9.93972746331237, "percentage": 49.7, "elapsed_time": "0:48:25", "remaining_time": "0:49:00", "throughput": 4263.71, "total_tokens": 12387368} {"current_steps": 18970, "total_steps": 38160, "loss": 0.4693, "lr": 0.0005918192215019608, "epoch": 9.942348008385745, "percentage": 49.71, "elapsed_time": "0:48:25", "remaining_time": "0:48:59", "throughput": 4263.71, "total_tokens": 12390280} {"current_steps": 18975, "total_steps": 38160, "loss": 0.3611, "lr": 0.0005915944152691633, "epoch": 9.94496855345912, "percentage": 49.72, "elapsed_time": "0:48:27", "remaining_time": "0:48:59", "throughput": 4264.17, "total_tokens": 12396232} {"current_steps": 18980, "total_steps": 38160, "loss": 0.4405, "lr": 0.0005913695898758593, "epoch": 9.947589098532495, "percentage": 49.74, "elapsed_time": "0:48:27", "remaining_time": "0:48:58", "throughput": 4264.1, "total_tokens": 12398760} {"current_steps": 18985, "total_steps": 38160, "loss": 0.4877, "lr": 0.0005911447453690793, "epoch": 9.95020964360587, "percentage": 49.75, "elapsed_time": "0:48:28", "remaining_time": "0:48:57", "throughput": 4264.2, "total_tokens": 12402184} {"current_steps": 18990, "total_steps": 38160, "loss": 0.5124, "lr": 0.0005909198817958585, "epoch": 9.952830188679245, "percentage": 49.76, "elapsed_time": "0:48:29", "remaining_time": "0:48:56", "throughput": 4264.19, "total_tokens": 12405064} {"current_steps": 18995, "total_steps": 38160, "loss": 0.5467, "lr": 0.0005906949992032359, "epoch": 9.95545073375262, "percentage": 49.78, "elapsed_time": "0:48:29", "remaining_time": "0:48:55", "throughput": 4264.18, "total_tokens": 12407976} {"current_steps": 19000, "total_steps": 38160, "loss": 0.5232, "lr": 0.0005904700976382539, "epoch": 9.958071278825996, "percentage": 49.79, "elapsed_time": "0:48:30", "remaining_time": "0:48:55", "throughput": 4264.35, "total_tokens": 12411976} {"current_steps": 19005, "total_steps": 38160, "loss": 0.5234, "lr": 0.0005902451771479596, "epoch": 9.96069182389937, "percentage": 49.8, "elapsed_time": "0:48:31", "remaining_time": "0:48:54", "throughput": 4264.55, "total_tokens": 12416136} {"current_steps": 19010, "total_steps": 38160, "loss": 0.459, "lr": 0.000590020237779404, "epoch": 9.963312368972746, "percentage": 49.82, "elapsed_time": "0:48:32", "remaining_time": "0:48:53", "throughput": 4264.54, "total_tokens": 12418952} {"current_steps": 19015, "total_steps": 38160, "loss": 0.3963, "lr": 0.0005897952795796415, "epoch": 9.965932914046121, "percentage": 49.83, "elapsed_time": "0:48:32", "remaining_time": "0:48:52", "throughput": 4264.53, "total_tokens": 12421768} {"current_steps": 19020, "total_steps": 38160, "loss": 0.5123, "lr": 0.0005895703025957311, "epoch": 9.968553459119496, "percentage": 49.84, "elapsed_time": "0:48:33", "remaining_time": "0:48:51", "throughput": 4264.65, "total_tokens": 12425416} {"current_steps": 19025, "total_steps": 38160, "loss": 0.4713, "lr": 0.0005893453068747352, "epoch": 9.971174004192871, "percentage": 49.86, "elapsed_time": "0:48:34", "remaining_time": "0:48:51", "throughput": 4264.57, "total_tokens": 12427848} {"current_steps": 19030, "total_steps": 38160, "loss": 0.3528, "lr": 0.0005891202924637202, "epoch": 9.973794549266248, "percentage": 49.87, "elapsed_time": "0:48:34", "remaining_time": "0:48:50", "throughput": 4264.67, "total_tokens": 12431464} {"current_steps": 19035, "total_steps": 38160, "loss": 0.3947, "lr": 0.0005888952594097572, "epoch": 9.976415094339622, "percentage": 49.88, "elapsed_time": "0:48:35", "remaining_time": "0:48:49", "throughput": 4264.74, "total_tokens": 12434792} {"current_steps": 19040, "total_steps": 38160, "loss": 0.5323, "lr": 0.0005886702077599197, "epoch": 9.979035639412999, "percentage": 49.9, "elapsed_time": "0:48:36", "remaining_time": "0:48:48", "throughput": 4264.78, "total_tokens": 12437928} {"current_steps": 19045, "total_steps": 38160, "loss": 0.4135, "lr": 0.0005884451375612865, "epoch": 9.981656184486374, "percentage": 49.91, "elapsed_time": "0:48:37", "remaining_time": "0:48:47", "throughput": 4264.83, "total_tokens": 12441160} {"current_steps": 19050, "total_steps": 38160, "loss": 0.5346, "lr": 0.0005882200488609396, "epoch": 9.984276729559749, "percentage": 49.92, "elapsed_time": "0:48:37", "remaining_time": "0:48:47", "throughput": 4264.94, "total_tokens": 12444712} {"current_steps": 19055, "total_steps": 38160, "loss": 0.4806, "lr": 0.0005879949417059649, "epoch": 9.986897274633124, "percentage": 49.93, "elapsed_time": "0:48:38", "remaining_time": "0:48:46", "throughput": 4264.95, "total_tokens": 12447688} {"current_steps": 19060, "total_steps": 38160, "loss": 0.4668, "lr": 0.0005877698161434522, "epoch": 9.9895178197065, "percentage": 49.95, "elapsed_time": "0:48:39", "remaining_time": "0:48:45", "throughput": 4265.01, "total_tokens": 12450984} {"current_steps": 19065, "total_steps": 38160, "loss": 0.5517, "lr": 0.0005875446722204955, "epoch": 9.992138364779874, "percentage": 49.96, "elapsed_time": "0:48:40", "remaining_time": "0:48:44", "throughput": 4265.22, "total_tokens": 12455176} {"current_steps": 19070, "total_steps": 38160, "loss": 0.4319, "lr": 0.0005873195099841919, "epoch": 9.99475890985325, "percentage": 49.97, "elapsed_time": "0:48:40", "remaining_time": "0:48:43", "throughput": 4265.26, "total_tokens": 12458376} {"current_steps": 19075, "total_steps": 38160, "loss": 0.4432, "lr": 0.0005870943294816431, "epoch": 9.997379454926625, "percentage": 49.99, "elapsed_time": "0:48:41", "remaining_time": "0:48:43", "throughput": 4265.21, "total_tokens": 12460968} {"current_steps": 19080, "total_steps": 38160, "loss": 0.3931, "lr": 0.0005868691307599543, "epoch": 10.0, "percentage": 50.0, "elapsed_time": "0:48:42", "remaining_time": "0:48:42", "throughput": 4264.97, "total_tokens": 12463312} {"current_steps": 19080, "total_steps": 38160, "eval_loss": 0.4845305383205414, "epoch": 10.0, "percentage": 50.0, "elapsed_time": "0:48:55", "remaining_time": "0:48:55", "throughput": 4245.03, "total_tokens": 12463312} {"current_steps": 19085, "total_steps": 38160, "loss": 0.3677, "lr": 0.0005866439138662343, "epoch": 10.002620545073375, "percentage": 50.01, "elapsed_time": "0:48:58", "remaining_time": "0:48:56", "throughput": 4242.78, "total_tokens": 12466928} {"current_steps": 19090, "total_steps": 38160, "loss": 0.4061, "lr": 0.000586418678847596, "epoch": 10.00524109014675, "percentage": 50.03, "elapsed_time": "0:48:59", "remaining_time": "0:48:55", "throughput": 4242.78, "total_tokens": 12469776} {"current_steps": 19095, "total_steps": 38160, "loss": 0.4473, "lr": 0.000586193425751156, "epoch": 10.007861635220126, "percentage": 50.04, "elapsed_time": "0:48:59", "remaining_time": "0:48:55", "throughput": 4242.74, "total_tokens": 12472528} {"current_steps": 19100, "total_steps": 38160, "loss": 0.383, "lr": 0.0005859681546240348, "epoch": 10.0104821802935, "percentage": 50.05, "elapsed_time": "0:49:00", "remaining_time": "0:48:54", "throughput": 4242.8, "total_tokens": 12475760} {"current_steps": 19105, "total_steps": 38160, "loss": 0.4966, "lr": 0.0005857428655133562, "epoch": 10.013102725366876, "percentage": 50.07, "elapsed_time": "0:49:01", "remaining_time": "0:48:53", "throughput": 4242.86, "total_tokens": 12479056} {"current_steps": 19110, "total_steps": 38160, "loss": 0.4916, "lr": 0.0005855175584662485, "epoch": 10.015723270440251, "percentage": 50.08, "elapsed_time": "0:49:01", "remaining_time": "0:48:52", "throughput": 4242.9, "total_tokens": 12482224} {"current_steps": 19115, "total_steps": 38160, "loss": 0.374, "lr": 0.0005852922335298433, "epoch": 10.018343815513626, "percentage": 50.09, "elapsed_time": "0:49:02", "remaining_time": "0:48:51", "throughput": 4242.94, "total_tokens": 12485360} {"current_steps": 19120, "total_steps": 38160, "loss": 0.4176, "lr": 0.0005850668907512757, "epoch": 10.020964360587001, "percentage": 50.1, "elapsed_time": "0:49:03", "remaining_time": "0:48:50", "throughput": 4242.89, "total_tokens": 12487920} {"current_steps": 19125, "total_steps": 38160, "loss": 0.5133, "lr": 0.0005848415301776852, "epoch": 10.023584905660377, "percentage": 50.12, "elapsed_time": "0:49:03", "remaining_time": "0:48:50", "throughput": 4242.92, "total_tokens": 12491024} {"current_steps": 19130, "total_steps": 38160, "loss": 0.4717, "lr": 0.0005846161518562144, "epoch": 10.026205450733753, "percentage": 50.13, "elapsed_time": "0:49:04", "remaining_time": "0:48:49", "throughput": 4242.9, "total_tokens": 12493744} {"current_steps": 19135, "total_steps": 38160, "loss": 0.3639, "lr": 0.00058439075583401, "epoch": 10.028825995807129, "percentage": 50.14, "elapsed_time": "0:49:05", "remaining_time": "0:48:48", "throughput": 4242.9, "total_tokens": 12496592} {"current_steps": 19140, "total_steps": 38160, "loss": 0.6352, "lr": 0.0005841653421582223, "epoch": 10.031446540880504, "percentage": 50.16, "elapsed_time": "0:49:06", "remaining_time": "0:48:47", "throughput": 4242.95, "total_tokens": 12499728} {"current_steps": 19145, "total_steps": 38160, "loss": 0.5339, "lr": 0.0005839399108760052, "epoch": 10.034067085953879, "percentage": 50.17, "elapsed_time": "0:49:06", "remaining_time": "0:48:46", "throughput": 4243.04, "total_tokens": 12503248} {"current_steps": 19150, "total_steps": 38160, "loss": 0.4013, "lr": 0.0005837144620345165, "epoch": 10.036687631027254, "percentage": 50.18, "elapsed_time": "0:49:07", "remaining_time": "0:48:45", "throughput": 4243.11, "total_tokens": 12506544} {"current_steps": 19155, "total_steps": 38160, "loss": 0.4015, "lr": 0.0005834889956809173, "epoch": 10.03930817610063, "percentage": 50.2, "elapsed_time": "0:49:08", "remaining_time": "0:48:45", "throughput": 4243.3, "total_tokens": 12510512} {"current_steps": 19160, "total_steps": 38160, "loss": 0.4528, "lr": 0.0005832635118623726, "epoch": 10.041928721174004, "percentage": 50.21, "elapsed_time": "0:49:09", "remaining_time": "0:48:44", "throughput": 4243.41, "total_tokens": 12514096} {"current_steps": 19165, "total_steps": 38160, "loss": 0.399, "lr": 0.0005830380106260513, "epoch": 10.04454926624738, "percentage": 50.22, "elapsed_time": "0:49:09", "remaining_time": "0:48:43", "throughput": 4243.6, "total_tokens": 12518352} {"current_steps": 19170, "total_steps": 38160, "loss": 0.5255, "lr": 0.0005828124920191255, "epoch": 10.047169811320755, "percentage": 50.24, "elapsed_time": "0:49:10", "remaining_time": "0:48:43", "throughput": 4243.83, "total_tokens": 12522736} {"current_steps": 19175, "total_steps": 38160, "loss": 0.5269, "lr": 0.000582586956088771, "epoch": 10.04979035639413, "percentage": 50.25, "elapsed_time": "0:49:11", "remaining_time": "0:48:42", "throughput": 4243.76, "total_tokens": 12525296} {"current_steps": 19180, "total_steps": 38160, "loss": 0.5192, "lr": 0.0005823614028821677, "epoch": 10.052410901467505, "percentage": 50.26, "elapsed_time": "0:49:12", "remaining_time": "0:48:41", "throughput": 4243.98, "total_tokens": 12529616} {"current_steps": 19185, "total_steps": 38160, "loss": 0.4433, "lr": 0.0005821358324464985, "epoch": 10.05503144654088, "percentage": 50.28, "elapsed_time": "0:49:13", "remaining_time": "0:48:40", "throughput": 4244.2, "total_tokens": 12534000} {"current_steps": 19190, "total_steps": 38160, "loss": 0.3564, "lr": 0.0005819102448289501, "epoch": 10.057651991614255, "percentage": 50.29, "elapsed_time": "0:49:13", "remaining_time": "0:48:40", "throughput": 4244.19, "total_tokens": 12536848} {"current_steps": 19195, "total_steps": 38160, "loss": 0.4324, "lr": 0.000581684640076713, "epoch": 10.06027253668763, "percentage": 50.3, "elapsed_time": "0:49:14", "remaining_time": "0:48:39", "throughput": 4244.16, "total_tokens": 12539632} {"current_steps": 19200, "total_steps": 38160, "loss": 0.4131, "lr": 0.0005814590182369811, "epoch": 10.062893081761006, "percentage": 50.31, "elapsed_time": "0:49:15", "remaining_time": "0:48:38", "throughput": 4244.26, "total_tokens": 12543024} {"current_steps": 19205, "total_steps": 38160, "loss": 0.4111, "lr": 0.000581233379356952, "epoch": 10.065513626834381, "percentage": 50.33, "elapsed_time": "0:49:15", "remaining_time": "0:48:37", "throughput": 4244.15, "total_tokens": 12545264} {"current_steps": 19210, "total_steps": 38160, "loss": 0.5067, "lr": 0.0005810077234838267, "epoch": 10.068134171907756, "percentage": 50.34, "elapsed_time": "0:49:16", "remaining_time": "0:48:36", "throughput": 4244.32, "total_tokens": 12549264} {"current_steps": 19215, "total_steps": 38160, "loss": 0.4603, "lr": 0.0005807820506648097, "epoch": 10.070754716981131, "percentage": 50.35, "elapsed_time": "0:49:17", "remaining_time": "0:48:36", "throughput": 4244.74, "total_tokens": 12554864} {"current_steps": 19220, "total_steps": 38160, "loss": 0.5452, "lr": 0.0005805563609471095, "epoch": 10.073375262054507, "percentage": 50.37, "elapsed_time": "0:49:18", "remaining_time": "0:48:35", "throughput": 4244.78, "total_tokens": 12558032} {"current_steps": 19225, "total_steps": 38160, "loss": 0.4291, "lr": 0.0005803306543779375, "epoch": 10.075995807127883, "percentage": 50.38, "elapsed_time": "0:49:19", "remaining_time": "0:48:34", "throughput": 4244.72, "total_tokens": 12560528} {"current_steps": 19230, "total_steps": 38160, "loss": 0.4569, "lr": 0.000580104931004509, "epoch": 10.078616352201259, "percentage": 50.39, "elapsed_time": "0:49:19", "remaining_time": "0:48:33", "throughput": 4244.67, "total_tokens": 12563056} {"current_steps": 19235, "total_steps": 38160, "loss": 0.3162, "lr": 0.000579879190874043, "epoch": 10.081236897274634, "percentage": 50.41, "elapsed_time": "0:49:20", "remaining_time": "0:48:32", "throughput": 4244.81, "total_tokens": 12566896} {"current_steps": 19240, "total_steps": 38160, "loss": 0.5287, "lr": 0.0005796534340337614, "epoch": 10.083857442348009, "percentage": 50.42, "elapsed_time": "0:49:21", "remaining_time": "0:48:32", "throughput": 4244.92, "total_tokens": 12570480} {"current_steps": 19245, "total_steps": 38160, "loss": 0.4823, "lr": 0.0005794276605308902, "epoch": 10.086477987421384, "percentage": 50.43, "elapsed_time": "0:49:22", "remaining_time": "0:48:31", "throughput": 4245.0, "total_tokens": 12573808} {"current_steps": 19250, "total_steps": 38160, "loss": 0.3554, "lr": 0.0005792018704126586, "epoch": 10.08909853249476, "percentage": 50.45, "elapsed_time": "0:49:22", "remaining_time": "0:48:30", "throughput": 4245.04, "total_tokens": 12577072} {"current_steps": 19255, "total_steps": 38160, "loss": 0.5132, "lr": 0.0005789760637262992, "epoch": 10.091719077568134, "percentage": 50.46, "elapsed_time": "0:49:23", "remaining_time": "0:48:29", "throughput": 4245.08, "total_tokens": 12580176} {"current_steps": 19260, "total_steps": 38160, "loss": 0.4005, "lr": 0.0005787502405190483, "epoch": 10.09433962264151, "percentage": 50.47, "elapsed_time": "0:49:24", "remaining_time": "0:48:28", "throughput": 4245.31, "total_tokens": 12584528} {"current_steps": 19265, "total_steps": 38160, "loss": 0.5541, "lr": 0.0005785244008381456, "epoch": 10.096960167714885, "percentage": 50.48, "elapsed_time": "0:49:25", "remaining_time": "0:48:28", "throughput": 4245.3, "total_tokens": 12587376} {"current_steps": 19270, "total_steps": 38160, "loss": 0.383, "lr": 0.0005782985447308341, "epoch": 10.09958071278826, "percentage": 50.5, "elapsed_time": "0:49:25", "remaining_time": "0:48:27", "throughput": 4245.3, "total_tokens": 12590256} {"current_steps": 19275, "total_steps": 38160, "loss": 0.3983, "lr": 0.0005780726722443602, "epoch": 10.102201257861635, "percentage": 50.51, "elapsed_time": "0:49:26", "remaining_time": "0:48:26", "throughput": 4245.25, "total_tokens": 12592848} {"current_steps": 19280, "total_steps": 38160, "loss": 0.3901, "lr": 0.0005778467834259741, "epoch": 10.10482180293501, "percentage": 50.52, "elapsed_time": "0:49:27", "remaining_time": "0:48:25", "throughput": 4245.34, "total_tokens": 12596272} {"current_steps": 19285, "total_steps": 38160, "loss": 0.5293, "lr": 0.000577620878322929, "epoch": 10.107442348008385, "percentage": 50.54, "elapsed_time": "0:49:27", "remaining_time": "0:48:24", "throughput": 4245.53, "total_tokens": 12600464} {"current_steps": 19290, "total_steps": 38160, "loss": 0.4911, "lr": 0.0005773949569824816, "epoch": 10.11006289308176, "percentage": 50.55, "elapsed_time": "0:49:28", "remaining_time": "0:48:24", "throughput": 4245.62, "total_tokens": 12603952} {"current_steps": 19295, "total_steps": 38160, "loss": 0.3695, "lr": 0.0005771690194518922, "epoch": 10.112683438155136, "percentage": 50.56, "elapsed_time": "0:49:29", "remaining_time": "0:48:23", "throughput": 4245.55, "total_tokens": 12606480} {"current_steps": 19300, "total_steps": 38160, "loss": 0.3208, "lr": 0.0005769430657784245, "epoch": 10.115303983228511, "percentage": 50.58, "elapsed_time": "0:49:29", "remaining_time": "0:48:22", "throughput": 4245.46, "total_tokens": 12608784} {"current_steps": 19305, "total_steps": 38160, "loss": 0.4928, "lr": 0.0005767170960093449, "epoch": 10.117924528301886, "percentage": 50.59, "elapsed_time": "0:49:30", "remaining_time": "0:48:21", "throughput": 4245.68, "total_tokens": 12613232} {"current_steps": 19310, "total_steps": 38160, "loss": 0.5742, "lr": 0.0005764911101919244, "epoch": 10.120545073375261, "percentage": 50.6, "elapsed_time": "0:49:31", "remaining_time": "0:48:20", "throughput": 4245.8, "total_tokens": 12616816} {"current_steps": 19315, "total_steps": 38160, "loss": 0.3693, "lr": 0.0005762651083734363, "epoch": 10.123165618448636, "percentage": 50.62, "elapsed_time": "0:49:32", "remaining_time": "0:48:20", "throughput": 4245.95, "total_tokens": 12620624} {"current_steps": 19320, "total_steps": 38160, "loss": 0.4821, "lr": 0.0005760390906011574, "epoch": 10.125786163522013, "percentage": 50.63, "elapsed_time": "0:49:33", "remaining_time": "0:48:19", "throughput": 4246.05, "total_tokens": 12624176} {"current_steps": 19325, "total_steps": 38160, "loss": 0.3706, "lr": 0.0005758130569223684, "epoch": 10.128406708595389, "percentage": 50.64, "elapsed_time": "0:49:33", "remaining_time": "0:48:18", "throughput": 4246.1, "total_tokens": 12627472} {"current_steps": 19330, "total_steps": 38160, "loss": 0.4268, "lr": 0.0005755870073843527, "epoch": 10.131027253668764, "percentage": 50.66, "elapsed_time": "0:49:34", "remaining_time": "0:48:17", "throughput": 4246.22, "total_tokens": 12631152} {"current_steps": 19335, "total_steps": 38160, "loss": 0.4812, "lr": 0.0005753609420343973, "epoch": 10.133647798742139, "percentage": 50.67, "elapsed_time": "0:49:35", "remaining_time": "0:48:17", "throughput": 4246.41, "total_tokens": 12635216} {"current_steps": 19340, "total_steps": 38160, "loss": 0.5045, "lr": 0.0005751348609197929, "epoch": 10.136268343815514, "percentage": 50.68, "elapsed_time": "0:49:36", "remaining_time": "0:48:16", "throughput": 4246.58, "total_tokens": 12639120} {"current_steps": 19345, "total_steps": 38160, "loss": 0.4864, "lr": 0.0005749087640878325, "epoch": 10.13888888888889, "percentage": 50.69, "elapsed_time": "0:49:36", "remaining_time": "0:48:15", "throughput": 4246.58, "total_tokens": 12642064} {"current_steps": 19350, "total_steps": 38160, "loss": 0.3291, "lr": 0.0005746826515858135, "epoch": 10.141509433962264, "percentage": 50.71, "elapsed_time": "0:49:37", "remaining_time": "0:48:14", "throughput": 4246.57, "total_tokens": 12644848} {"current_steps": 19355, "total_steps": 38160, "loss": 0.4273, "lr": 0.0005744565234610356, "epoch": 10.14412997903564, "percentage": 50.72, "elapsed_time": "0:49:38", "remaining_time": "0:48:13", "throughput": 4246.64, "total_tokens": 12648112} {"current_steps": 19360, "total_steps": 38160, "loss": 0.3645, "lr": 0.0005742303797608023, "epoch": 10.146750524109015, "percentage": 50.73, "elapsed_time": "0:49:39", "remaining_time": "0:48:12", "throughput": 4246.65, "total_tokens": 12650992} {"current_steps": 19365, "total_steps": 38160, "loss": 0.5099, "lr": 0.0005740042205324208, "epoch": 10.14937106918239, "percentage": 50.75, "elapsed_time": "0:49:39", "remaining_time": "0:48:12", "throughput": 4246.66, "total_tokens": 12654000} {"current_steps": 19370, "total_steps": 38160, "loss": 0.4003, "lr": 0.0005737780458232004, "epoch": 10.151991614255765, "percentage": 50.76, "elapsed_time": "0:49:40", "remaining_time": "0:48:11", "throughput": 4246.67, "total_tokens": 12657008} {"current_steps": 19375, "total_steps": 38160, "loss": 0.4637, "lr": 0.0005735518556804546, "epoch": 10.15461215932914, "percentage": 50.77, "elapsed_time": "0:49:41", "remaining_time": "0:48:10", "throughput": 4246.63, "total_tokens": 12659696} {"current_steps": 19380, "total_steps": 38160, "loss": 0.381, "lr": 0.0005733256501514999, "epoch": 10.157232704402515, "percentage": 50.79, "elapsed_time": "0:49:41", "remaining_time": "0:48:09", "throughput": 4246.71, "total_tokens": 12663024} {"current_steps": 19385, "total_steps": 38160, "loss": 0.4443, "lr": 0.0005730994292836555, "epoch": 10.15985324947589, "percentage": 50.8, "elapsed_time": "0:49:42", "remaining_time": "0:48:08", "throughput": 4246.75, "total_tokens": 12666160} {"current_steps": 19390, "total_steps": 38160, "loss": 0.4733, "lr": 0.0005728731931242445, "epoch": 10.162473794549266, "percentage": 50.81, "elapsed_time": "0:49:43", "remaining_time": "0:48:07", "throughput": 4246.69, "total_tokens": 12668656} {"current_steps": 19395, "total_steps": 38160, "loss": 0.3991, "lr": 0.0005726469417205928, "epoch": 10.165094339622641, "percentage": 50.83, "elapsed_time": "0:49:43", "remaining_time": "0:48:06", "throughput": 4246.72, "total_tokens": 12671792} {"current_steps": 19400, "total_steps": 38160, "loss": 0.3721, "lr": 0.0005724206751200297, "epoch": 10.167714884696016, "percentage": 50.84, "elapsed_time": "0:49:44", "remaining_time": "0:48:06", "throughput": 4246.65, "total_tokens": 12674192} {"current_steps": 19405, "total_steps": 38160, "loss": 0.3647, "lr": 0.0005721943933698879, "epoch": 10.170335429769391, "percentage": 50.85, "elapsed_time": "0:49:45", "remaining_time": "0:48:05", "throughput": 4246.72, "total_tokens": 12677456} {"current_steps": 19410, "total_steps": 38160, "loss": 0.3516, "lr": 0.0005719680965175023, "epoch": 10.172955974842766, "percentage": 50.86, "elapsed_time": "0:49:46", "remaining_time": "0:48:04", "throughput": 4246.98, "total_tokens": 12681968} {"current_steps": 19415, "total_steps": 38160, "loss": 0.4107, "lr": 0.000571741784610212, "epoch": 10.175576519916143, "percentage": 50.88, "elapsed_time": "0:49:46", "remaining_time": "0:48:03", "throughput": 4246.93, "total_tokens": 12684560} {"current_steps": 19420, "total_steps": 38160, "loss": 0.6615, "lr": 0.0005715154576953589, "epoch": 10.178197064989519, "percentage": 50.89, "elapsed_time": "0:49:47", "remaining_time": "0:48:02", "throughput": 4246.99, "total_tokens": 12687824} {"current_steps": 19425, "total_steps": 38160, "loss": 0.4601, "lr": 0.0005712891158202879, "epoch": 10.180817610062894, "percentage": 50.9, "elapsed_time": "0:49:48", "remaining_time": "0:48:01", "throughput": 4246.9, "total_tokens": 12690160} {"current_steps": 19430, "total_steps": 38160, "loss": 0.5673, "lr": 0.0005710627590323473, "epoch": 10.183438155136269, "percentage": 50.92, "elapsed_time": "0:49:48", "remaining_time": "0:48:01", "throughput": 4247.02, "total_tokens": 12693840} {"current_steps": 19435, "total_steps": 38160, "loss": 0.491, "lr": 0.0005708363873788882, "epoch": 10.186058700209644, "percentage": 50.93, "elapsed_time": "0:49:49", "remaining_time": "0:48:00", "throughput": 4247.01, "total_tokens": 12696688} {"current_steps": 19440, "total_steps": 38160, "loss": 0.4675, "lr": 0.0005706100009072649, "epoch": 10.18867924528302, "percentage": 50.94, "elapsed_time": "0:49:50", "remaining_time": "0:47:59", "throughput": 4247.0, "total_tokens": 12699472} {"current_steps": 19445, "total_steps": 38160, "loss": 0.4301, "lr": 0.000570383599664835, "epoch": 10.191299790356394, "percentage": 50.96, "elapsed_time": "0:49:50", "remaining_time": "0:47:58", "throughput": 4247.07, "total_tokens": 12702768} {"current_steps": 19450, "total_steps": 38160, "loss": 0.3295, "lr": 0.0005701571836989591, "epoch": 10.19392033542977, "percentage": 50.97, "elapsed_time": "0:49:51", "remaining_time": "0:47:57", "throughput": 4247.15, "total_tokens": 12706096} {"current_steps": 19455, "total_steps": 38160, "loss": 0.545, "lr": 0.0005699307530570008, "epoch": 10.196540880503145, "percentage": 50.98, "elapsed_time": "0:49:52", "remaining_time": "0:47:57", "throughput": 4247.24, "total_tokens": 12709648} {"current_steps": 19460, "total_steps": 38160, "loss": 0.37, "lr": 0.0005697043077863267, "epoch": 10.19916142557652, "percentage": 51.0, "elapsed_time": "0:49:53", "remaining_time": "0:47:56", "throughput": 4247.27, "total_tokens": 12712784} {"current_steps": 19465, "total_steps": 38160, "loss": 0.4111, "lr": 0.0005694778479343065, "epoch": 10.201781970649895, "percentage": 51.01, "elapsed_time": "0:49:53", "remaining_time": "0:47:55", "throughput": 4247.32, "total_tokens": 12715920} {"current_steps": 19470, "total_steps": 38160, "loss": 0.3636, "lr": 0.0005692513735483134, "epoch": 10.20440251572327, "percentage": 51.02, "elapsed_time": "0:49:54", "remaining_time": "0:47:54", "throughput": 4247.32, "total_tokens": 12718832} {"current_steps": 19475, "total_steps": 38160, "loss": 0.5676, "lr": 0.0005690248846757228, "epoch": 10.207023060796645, "percentage": 51.04, "elapsed_time": "0:49:55", "remaining_time": "0:47:53", "throughput": 4247.43, "total_tokens": 12722448} {"current_steps": 19480, "total_steps": 38160, "loss": 0.5224, "lr": 0.0005687983813639139, "epoch": 10.20964360587002, "percentage": 51.05, "elapsed_time": "0:49:56", "remaining_time": "0:47:53", "throughput": 4247.55, "total_tokens": 12726096} {"current_steps": 19485, "total_steps": 38160, "loss": 0.4398, "lr": 0.0005685718636602685, "epoch": 10.212264150943396, "percentage": 51.06, "elapsed_time": "0:49:56", "remaining_time": "0:47:52", "throughput": 4247.53, "total_tokens": 12728976} {"current_steps": 19490, "total_steps": 38160, "loss": 0.3228, "lr": 0.0005683453316121716, "epoch": 10.214884696016771, "percentage": 51.07, "elapsed_time": "0:49:57", "remaining_time": "0:47:51", "throughput": 4247.62, "total_tokens": 12732432} {"current_steps": 19495, "total_steps": 38160, "loss": 0.3986, "lr": 0.0005681187852670111, "epoch": 10.217505241090146, "percentage": 51.09, "elapsed_time": "0:49:58", "remaining_time": "0:47:50", "throughput": 4248.03, "total_tokens": 12738288} {"current_steps": 19500, "total_steps": 38160, "loss": 0.5051, "lr": 0.0005678922246721777, "epoch": 10.220125786163521, "percentage": 51.1, "elapsed_time": "0:49:59", "remaining_time": "0:47:50", "throughput": 4248.02, "total_tokens": 12741168} {"current_steps": 19505, "total_steps": 38160, "loss": 0.3426, "lr": 0.0005676656498750656, "epoch": 10.222746331236896, "percentage": 51.11, "elapsed_time": "0:50:00", "remaining_time": "0:47:49", "throughput": 4248.23, "total_tokens": 12745456} {"current_steps": 19510, "total_steps": 38160, "loss": 0.4275, "lr": 0.0005674390609230715, "epoch": 10.225366876310272, "percentage": 51.13, "elapsed_time": "0:50:00", "remaining_time": "0:47:48", "throughput": 4248.23, "total_tokens": 12748336} {"current_steps": 19515, "total_steps": 38160, "loss": 0.443, "lr": 0.0005672124578635951, "epoch": 10.227987421383649, "percentage": 51.14, "elapsed_time": "0:50:01", "remaining_time": "0:47:47", "throughput": 4248.24, "total_tokens": 12751344} {"current_steps": 19520, "total_steps": 38160, "loss": 0.3581, "lr": 0.0005669858407440394, "epoch": 10.230607966457024, "percentage": 51.15, "elapsed_time": "0:50:02", "remaining_time": "0:47:46", "throughput": 4248.25, "total_tokens": 12754256} {"current_steps": 19525, "total_steps": 38160, "loss": 0.3859, "lr": 0.00056675920961181, "epoch": 10.233228511530399, "percentage": 51.17, "elapsed_time": "0:50:03", "remaining_time": "0:47:46", "throughput": 4248.36, "total_tokens": 12757840} {"current_steps": 19530, "total_steps": 38160, "loss": 0.4938, "lr": 0.0005665325645143155, "epoch": 10.235849056603774, "percentage": 51.18, "elapsed_time": "0:50:03", "remaining_time": "0:47:45", "throughput": 4248.4, "total_tokens": 12760944} {"current_steps": 19535, "total_steps": 38160, "loss": 0.4353, "lr": 0.0005663059054989679, "epoch": 10.23846960167715, "percentage": 51.19, "elapsed_time": "0:50:04", "remaining_time": "0:47:44", "throughput": 4248.55, "total_tokens": 12764880} {"current_steps": 19540, "total_steps": 38160, "loss": 0.4503, "lr": 0.0005660792326131809, "epoch": 10.241090146750524, "percentage": 51.21, "elapsed_time": "0:50:05", "remaining_time": "0:47:43", "throughput": 4248.57, "total_tokens": 12767920} {"current_steps": 19545, "total_steps": 38160, "loss": 0.4877, "lr": 0.0005658525459043725, "epoch": 10.2437106918239, "percentage": 51.22, "elapsed_time": "0:50:05", "remaining_time": "0:47:42", "throughput": 4248.53, "total_tokens": 12770416} {"current_steps": 19550, "total_steps": 38160, "loss": 0.4211, "lr": 0.000565625845419963, "epoch": 10.246331236897275, "percentage": 51.23, "elapsed_time": "0:50:06", "remaining_time": "0:47:42", "throughput": 4248.62, "total_tokens": 12773936} {"current_steps": 19555, "total_steps": 38160, "loss": 0.3837, "lr": 0.000565399131207375, "epoch": 10.24895178197065, "percentage": 51.24, "elapsed_time": "0:50:07", "remaining_time": "0:47:41", "throughput": 4248.77, "total_tokens": 12777776} {"current_steps": 19560, "total_steps": 38160, "loss": 0.5813, "lr": 0.000565172403314035, "epoch": 10.251572327044025, "percentage": 51.26, "elapsed_time": "0:50:08", "remaining_time": "0:47:40", "throughput": 4248.81, "total_tokens": 12780912} {"current_steps": 19565, "total_steps": 38160, "loss": 0.3061, "lr": 0.0005649456617873717, "epoch": 10.2541928721174, "percentage": 51.27, "elapsed_time": "0:50:08", "remaining_time": "0:47:39", "throughput": 4248.88, "total_tokens": 12784272} {"current_steps": 19570, "total_steps": 38160, "loss": 0.5443, "lr": 0.0005647189066748169, "epoch": 10.256813417190775, "percentage": 51.28, "elapsed_time": "0:50:09", "remaining_time": "0:47:38", "throughput": 4248.99, "total_tokens": 12787888} {"current_steps": 19575, "total_steps": 38160, "loss": 0.4403, "lr": 0.0005644921380238052, "epoch": 10.25943396226415, "percentage": 51.3, "elapsed_time": "0:50:10", "remaining_time": "0:47:38", "throughput": 4249.1, "total_tokens": 12791472} {"current_steps": 19580, "total_steps": 38160, "loss": 0.4055, "lr": 0.000564265355881774, "epoch": 10.262054507337526, "percentage": 51.31, "elapsed_time": "0:50:11", "remaining_time": "0:47:37", "throughput": 4249.17, "total_tokens": 12794800} {"current_steps": 19585, "total_steps": 38160, "loss": 0.4333, "lr": 0.0005640385602961634, "epoch": 10.264675052410901, "percentage": 51.32, "elapsed_time": "0:50:11", "remaining_time": "0:47:36", "throughput": 4249.41, "total_tokens": 12799184} {"current_steps": 19590, "total_steps": 38160, "loss": 0.4481, "lr": 0.0005638117513144168, "epoch": 10.267295597484276, "percentage": 51.34, "elapsed_time": "0:50:12", "remaining_time": "0:47:35", "throughput": 4249.49, "total_tokens": 12802576} {"current_steps": 19595, "total_steps": 38160, "loss": 0.4476, "lr": 0.0005635849289839797, "epoch": 10.269916142557651, "percentage": 51.35, "elapsed_time": "0:50:13", "remaining_time": "0:47:35", "throughput": 4249.5, "total_tokens": 12805488} {"current_steps": 19600, "total_steps": 38160, "loss": 0.4024, "lr": 0.000563358093352301, "epoch": 10.272536687631026, "percentage": 51.36, "elapsed_time": "0:50:14", "remaining_time": "0:47:34", "throughput": 4249.65, "total_tokens": 12809328} {"current_steps": 19605, "total_steps": 38160, "loss": 0.4913, "lr": 0.0005631312444668318, "epoch": 10.275157232704402, "percentage": 51.38, "elapsed_time": "0:50:14", "remaining_time": "0:47:33", "throughput": 4249.72, "total_tokens": 12812752} {"current_steps": 19610, "total_steps": 38160, "loss": 0.4081, "lr": 0.0005629043823750266, "epoch": 10.277777777777779, "percentage": 51.39, "elapsed_time": "0:50:15", "remaining_time": "0:47:32", "throughput": 4249.68, "total_tokens": 12815312} {"current_steps": 19615, "total_steps": 38160, "loss": 0.4293, "lr": 0.0005626775071243423, "epoch": 10.280398322851154, "percentage": 51.4, "elapsed_time": "0:50:16", "remaining_time": "0:47:31", "throughput": 4249.64, "total_tokens": 12817936} {"current_steps": 19620, "total_steps": 38160, "loss": 0.5904, "lr": 0.0005624506187622384, "epoch": 10.283018867924529, "percentage": 51.42, "elapsed_time": "0:50:16", "remaining_time": "0:47:30", "throughput": 4249.7, "total_tokens": 12821200} {"current_steps": 19625, "total_steps": 38160, "loss": 0.4076, "lr": 0.0005622237173361777, "epoch": 10.285639412997904, "percentage": 51.43, "elapsed_time": "0:50:17", "remaining_time": "0:47:30", "throughput": 4249.73, "total_tokens": 12824304} {"current_steps": 19630, "total_steps": 38160, "loss": 0.5153, "lr": 0.0005619968028936252, "epoch": 10.28825995807128, "percentage": 51.44, "elapsed_time": "0:50:18", "remaining_time": "0:47:29", "throughput": 4249.74, "total_tokens": 12827184} {"current_steps": 19635, "total_steps": 38160, "loss": 0.6161, "lr": 0.0005617698754820489, "epoch": 10.290880503144654, "percentage": 51.45, "elapsed_time": "0:50:19", "remaining_time": "0:47:28", "throughput": 4249.9, "total_tokens": 12831088} {"current_steps": 19640, "total_steps": 38160, "loss": 0.5387, "lr": 0.0005615429351489192, "epoch": 10.29350104821803, "percentage": 51.47, "elapsed_time": "0:50:19", "remaining_time": "0:47:27", "throughput": 4249.91, "total_tokens": 12834032} {"current_steps": 19645, "total_steps": 38160, "loss": 0.5118, "lr": 0.0005613159819417095, "epoch": 10.296121593291405, "percentage": 51.48, "elapsed_time": "0:50:20", "remaining_time": "0:47:26", "throughput": 4249.91, "total_tokens": 12836880} {"current_steps": 19650, "total_steps": 38160, "loss": 0.4559, "lr": 0.0005610890159078961, "epoch": 10.29874213836478, "percentage": 51.49, "elapsed_time": "0:50:21", "remaining_time": "0:47:25", "throughput": 4249.91, "total_tokens": 12839792} {"current_steps": 19655, "total_steps": 38160, "loss": 0.3683, "lr": 0.0005608620370949575, "epoch": 10.301362683438155, "percentage": 51.51, "elapsed_time": "0:50:21", "remaining_time": "0:47:25", "throughput": 4249.84, "total_tokens": 12842192} {"current_steps": 19660, "total_steps": 38160, "loss": 0.4397, "lr": 0.000560635045550375, "epoch": 10.30398322851153, "percentage": 51.52, "elapsed_time": "0:50:22", "remaining_time": "0:47:24", "throughput": 4249.9, "total_tokens": 12845488} {"current_steps": 19665, "total_steps": 38160, "loss": 0.5247, "lr": 0.0005604080413216328, "epoch": 10.306603773584905, "percentage": 51.53, "elapsed_time": "0:50:23", "remaining_time": "0:47:23", "throughput": 4250.4, "total_tokens": 12852240} {"current_steps": 19670, "total_steps": 38160, "loss": 0.4092, "lr": 0.0005601810244562175, "epoch": 10.30922431865828, "percentage": 51.55, "elapsed_time": "0:50:24", "remaining_time": "0:47:22", "throughput": 4250.37, "total_tokens": 12854928} {"current_steps": 19675, "total_steps": 38160, "loss": 0.3453, "lr": 0.0005599539950016184, "epoch": 10.311844863731656, "percentage": 51.56, "elapsed_time": "0:50:25", "remaining_time": "0:47:22", "throughput": 4250.43, "total_tokens": 12858256} {"current_steps": 19680, "total_steps": 38160, "loss": 0.4727, "lr": 0.0005597269530053277, "epoch": 10.314465408805031, "percentage": 51.57, "elapsed_time": "0:50:26", "remaining_time": "0:47:21", "throughput": 4250.64, "total_tokens": 12862640} {"current_steps": 19685, "total_steps": 38160, "loss": 0.3958, "lr": 0.0005594998985148398, "epoch": 10.317085953878406, "percentage": 51.59, "elapsed_time": "0:50:26", "remaining_time": "0:47:20", "throughput": 4250.6, "total_tokens": 12865200} {"current_steps": 19690, "total_steps": 38160, "loss": 0.4691, "lr": 0.0005592728315776519, "epoch": 10.319706498951781, "percentage": 51.6, "elapsed_time": "0:50:27", "remaining_time": "0:47:19", "throughput": 4250.75, "total_tokens": 12869040} {"current_steps": 19695, "total_steps": 38160, "loss": 0.5661, "lr": 0.0005590457522412638, "epoch": 10.322327044025156, "percentage": 51.61, "elapsed_time": "0:50:28", "remaining_time": "0:47:19", "throughput": 4250.8, "total_tokens": 12872304} {"current_steps": 19700, "total_steps": 38160, "loss": 0.3819, "lr": 0.000558818660553178, "epoch": 10.324947589098532, "percentage": 51.62, "elapsed_time": "0:50:28", "remaining_time": "0:47:18", "throughput": 4250.74, "total_tokens": 12874896} {"current_steps": 19705, "total_steps": 38160, "loss": 0.6151, "lr": 0.0005585915565608995, "epoch": 10.327568134171909, "percentage": 51.64, "elapsed_time": "0:50:29", "remaining_time": "0:47:17", "throughput": 4250.79, "total_tokens": 12878160} {"current_steps": 19710, "total_steps": 38160, "loss": 0.4732, "lr": 0.0005583644403119357, "epoch": 10.330188679245284, "percentage": 51.65, "elapsed_time": "0:50:30", "remaining_time": "0:47:16", "throughput": 4250.83, "total_tokens": 12881328} {"current_steps": 19715, "total_steps": 38160, "loss": 0.2881, "lr": 0.0005581373118537969, "epoch": 10.332809224318659, "percentage": 51.66, "elapsed_time": "0:50:30", "remaining_time": "0:47:15", "throughput": 4250.82, "total_tokens": 12884144} {"current_steps": 19720, "total_steps": 38160, "loss": 0.5831, "lr": 0.0005579101712339957, "epoch": 10.335429769392034, "percentage": 51.68, "elapsed_time": "0:50:31", "remaining_time": "0:47:14", "throughput": 4250.89, "total_tokens": 12887440} {"current_steps": 19725, "total_steps": 38160, "loss": 0.4991, "lr": 0.0005576830185000474, "epoch": 10.33805031446541, "percentage": 51.69, "elapsed_time": "0:50:32", "remaining_time": "0:47:14", "throughput": 4251.01, "total_tokens": 12891088} {"current_steps": 19730, "total_steps": 38160, "loss": 0.4076, "lr": 0.0005574558536994698, "epoch": 10.340670859538784, "percentage": 51.7, "elapsed_time": "0:50:33", "remaining_time": "0:47:13", "throughput": 4251.23, "total_tokens": 12895632} {"current_steps": 19735, "total_steps": 38160, "loss": 0.3647, "lr": 0.0005572286768797829, "epoch": 10.34329140461216, "percentage": 51.72, "elapsed_time": "0:50:34", "remaining_time": "0:47:12", "throughput": 4251.23, "total_tokens": 12898544} {"current_steps": 19740, "total_steps": 38160, "loss": 0.4443, "lr": 0.0005570014880885098, "epoch": 10.345911949685535, "percentage": 51.73, "elapsed_time": "0:50:34", "remaining_time": "0:47:11", "throughput": 4251.18, "total_tokens": 12901136} {"current_steps": 19745, "total_steps": 38160, "loss": 0.4431, "lr": 0.0005567742873731757, "epoch": 10.34853249475891, "percentage": 51.74, "elapsed_time": "0:50:35", "remaining_time": "0:47:11", "throughput": 4251.28, "total_tokens": 12904656} {"current_steps": 19750, "total_steps": 38160, "loss": 0.4902, "lr": 0.0005565470747813085, "epoch": 10.351153039832285, "percentage": 51.76, "elapsed_time": "0:50:36", "remaining_time": "0:47:10", "throughput": 4251.29, "total_tokens": 12907696} {"current_steps": 19755, "total_steps": 38160, "loss": 0.5156, "lr": 0.0005563198503604382, "epoch": 10.35377358490566, "percentage": 51.77, "elapsed_time": "0:50:36", "remaining_time": "0:47:09", "throughput": 4251.22, "total_tokens": 12910064} {"current_steps": 19760, "total_steps": 38160, "loss": 0.3556, "lr": 0.0005560926141580978, "epoch": 10.356394129979035, "percentage": 51.78, "elapsed_time": "0:50:37", "remaining_time": "0:47:08", "throughput": 4251.22, "total_tokens": 12912944} {"current_steps": 19765, "total_steps": 38160, "loss": 0.3614, "lr": 0.0005558653662218225, "epoch": 10.35901467505241, "percentage": 51.8, "elapsed_time": "0:50:38", "remaining_time": "0:47:07", "throughput": 4251.14, "total_tokens": 12915248} {"current_steps": 19770, "total_steps": 38160, "loss": 0.3736, "lr": 0.00055563810659915, "epoch": 10.361635220125786, "percentage": 51.81, "elapsed_time": "0:50:38", "remaining_time": "0:47:06", "throughput": 4251.1, "total_tokens": 12917808} {"current_steps": 19775, "total_steps": 38160, "loss": 0.4223, "lr": 0.0005554108353376201, "epoch": 10.364255765199161, "percentage": 51.82, "elapsed_time": "0:50:39", "remaining_time": "0:47:05", "throughput": 4251.28, "total_tokens": 12921808} {"current_steps": 19780, "total_steps": 38160, "loss": 0.5793, "lr": 0.0005551835524847757, "epoch": 10.366876310272536, "percentage": 51.83, "elapsed_time": "0:50:40", "remaining_time": "0:47:05", "throughput": 4251.37, "total_tokens": 12925264} {"current_steps": 19785, "total_steps": 38160, "loss": 0.4567, "lr": 0.0005549562580881618, "epoch": 10.369496855345911, "percentage": 51.85, "elapsed_time": "0:50:41", "remaining_time": "0:47:04", "throughput": 4251.49, "total_tokens": 12928848} {"current_steps": 19790, "total_steps": 38160, "loss": 0.3765, "lr": 0.0005547289521953257, "epoch": 10.372117400419286, "percentage": 51.86, "elapsed_time": "0:50:41", "remaining_time": "0:47:03", "throughput": 4251.56, "total_tokens": 12932144} {"current_steps": 19795, "total_steps": 38160, "loss": 0.5962, "lr": 0.000554501634853817, "epoch": 10.374737945492662, "percentage": 51.87, "elapsed_time": "0:50:42", "remaining_time": "0:47:02", "throughput": 4251.64, "total_tokens": 12935536} {"current_steps": 19800, "total_steps": 38160, "loss": 0.5452, "lr": 0.0005542743061111883, "epoch": 10.377358490566039, "percentage": 51.89, "elapsed_time": "0:50:43", "remaining_time": "0:47:01", "throughput": 4251.67, "total_tokens": 12938736} {"current_steps": 19805, "total_steps": 38160, "loss": 0.3442, "lr": 0.0005540469660149938, "epoch": 10.379979035639414, "percentage": 51.9, "elapsed_time": "0:50:43", "remaining_time": "0:47:01", "throughput": 4251.78, "total_tokens": 12942288} {"current_steps": 19810, "total_steps": 38160, "loss": 0.4371, "lr": 0.0005538196146127907, "epoch": 10.382599580712789, "percentage": 51.91, "elapsed_time": "0:50:44", "remaining_time": "0:47:00", "throughput": 4251.84, "total_tokens": 12945520} {"current_steps": 19815, "total_steps": 38160, "loss": 0.3844, "lr": 0.0005535922519521381, "epoch": 10.385220125786164, "percentage": 51.93, "elapsed_time": "0:50:45", "remaining_time": "0:46:59", "throughput": 4251.81, "total_tokens": 12948240} {"current_steps": 19820, "total_steps": 38160, "loss": 0.428, "lr": 0.0005533648780805979, "epoch": 10.38784067085954, "percentage": 51.94, "elapsed_time": "0:50:46", "remaining_time": "0:46:58", "throughput": 4251.82, "total_tokens": 12951184} {"current_steps": 19825, "total_steps": 38160, "loss": 0.359, "lr": 0.000553137493045734, "epoch": 10.390461215932914, "percentage": 51.95, "elapsed_time": "0:50:46", "remaining_time": "0:46:57", "throughput": 4251.8, "total_tokens": 12953968} {"current_steps": 19830, "total_steps": 38160, "loss": 0.5585, "lr": 0.0005529100968951127, "epoch": 10.39308176100629, "percentage": 51.97, "elapsed_time": "0:50:47", "remaining_time": "0:46:56", "throughput": 4251.8, "total_tokens": 12956784} {"current_steps": 19835, "total_steps": 38160, "loss": 0.4218, "lr": 0.0005526826896763029, "epoch": 10.395702306079665, "percentage": 51.98, "elapsed_time": "0:50:48", "remaining_time": "0:46:55", "throughput": 4251.76, "total_tokens": 12959408} {"current_steps": 19840, "total_steps": 38160, "loss": 0.5889, "lr": 0.0005524552714368753, "epoch": 10.39832285115304, "percentage": 51.99, "elapsed_time": "0:50:48", "remaining_time": "0:46:55", "throughput": 4251.8, "total_tokens": 12962544} {"current_steps": 19845, "total_steps": 38160, "loss": 0.5135, "lr": 0.0005522278422244035, "epoch": 10.400943396226415, "percentage": 52.0, "elapsed_time": "0:50:49", "remaining_time": "0:46:54", "throughput": 4251.76, "total_tokens": 12965200} {"current_steps": 19850, "total_steps": 38160, "loss": 0.4568, "lr": 0.0005520004020864631, "epoch": 10.40356394129979, "percentage": 52.02, "elapsed_time": "0:50:50", "remaining_time": "0:46:53", "throughput": 4251.87, "total_tokens": 12968816} {"current_steps": 19855, "total_steps": 38160, "loss": 0.4683, "lr": 0.0005517729510706315, "epoch": 10.406184486373165, "percentage": 52.03, "elapsed_time": "0:50:50", "remaining_time": "0:46:52", "throughput": 4251.87, "total_tokens": 12971632} {"current_steps": 19860, "total_steps": 38160, "loss": 0.4327, "lr": 0.0005515454892244892, "epoch": 10.40880503144654, "percentage": 52.04, "elapsed_time": "0:50:51", "remaining_time": "0:46:51", "throughput": 4251.95, "total_tokens": 12975120} {"current_steps": 19865, "total_steps": 38160, "loss": 0.6483, "lr": 0.0005513180165956189, "epoch": 10.411425576519916, "percentage": 52.06, "elapsed_time": "0:50:52", "remaining_time": "0:46:51", "throughput": 4252.11, "total_tokens": 12979088} {"current_steps": 19870, "total_steps": 38160, "loss": 0.4933, "lr": 0.0005510905332316049, "epoch": 10.414046121593291, "percentage": 52.07, "elapsed_time": "0:50:53", "remaining_time": "0:46:50", "throughput": 4252.15, "total_tokens": 12982224} {"current_steps": 19875, "total_steps": 38160, "loss": 0.4859, "lr": 0.0005508630391800341, "epoch": 10.416666666666666, "percentage": 52.08, "elapsed_time": "0:50:53", "remaining_time": "0:46:49", "throughput": 4252.08, "total_tokens": 12984720} {"current_steps": 19880, "total_steps": 38160, "loss": 0.481, "lr": 0.0005506355344884959, "epoch": 10.419287211740041, "percentage": 52.1, "elapsed_time": "0:50:54", "remaining_time": "0:46:48", "throughput": 4252.07, "total_tokens": 12987472} {"current_steps": 19885, "total_steps": 38160, "loss": 0.3951, "lr": 0.0005504080192045813, "epoch": 10.421907756813416, "percentage": 52.11, "elapsed_time": "0:50:55", "remaining_time": "0:46:47", "throughput": 4252.07, "total_tokens": 12990352} {"current_steps": 19890, "total_steps": 38160, "loss": 0.3891, "lr": 0.0005501804933758846, "epoch": 10.424528301886792, "percentage": 52.12, "elapsed_time": "0:50:55", "remaining_time": "0:46:46", "throughput": 4252.12, "total_tokens": 12993616} {"current_steps": 19895, "total_steps": 38160, "loss": 0.484, "lr": 0.0005499529570500009, "epoch": 10.427148846960169, "percentage": 52.14, "elapsed_time": "0:50:56", "remaining_time": "0:46:46", "throughput": 4252.12, "total_tokens": 12996432} {"current_steps": 19900, "total_steps": 38160, "loss": 0.4182, "lr": 0.0005497254102745285, "epoch": 10.429769392033544, "percentage": 52.15, "elapsed_time": "0:50:57", "remaining_time": "0:46:45", "throughput": 4252.29, "total_tokens": 13000560} {"current_steps": 19905, "total_steps": 38160, "loss": 0.5014, "lr": 0.0005494978530970676, "epoch": 10.432389937106919, "percentage": 52.16, "elapsed_time": "0:50:58", "remaining_time": "0:46:44", "throughput": 4252.33, "total_tokens": 13003664} {"current_steps": 19910, "total_steps": 38160, "loss": 0.4477, "lr": 0.0005492702855652206, "epoch": 10.435010482180294, "percentage": 52.18, "elapsed_time": "0:50:58", "remaining_time": "0:46:43", "throughput": 4252.47, "total_tokens": 13007536} {"current_steps": 19915, "total_steps": 38160, "loss": 0.4445, "lr": 0.000549042707726592, "epoch": 10.43763102725367, "percentage": 52.19, "elapsed_time": "0:50:59", "remaining_time": "0:46:42", "throughput": 4252.56, "total_tokens": 13010960} {"current_steps": 19920, "total_steps": 38160, "loss": 0.3981, "lr": 0.0005488151196287882, "epoch": 10.440251572327044, "percentage": 52.2, "elapsed_time": "0:51:00", "remaining_time": "0:46:42", "throughput": 4252.71, "total_tokens": 13014896} {"current_steps": 19925, "total_steps": 38160, "loss": 0.3344, "lr": 0.0005485875213194184, "epoch": 10.44287211740042, "percentage": 52.21, "elapsed_time": "0:51:01", "remaining_time": "0:46:41", "throughput": 4252.7, "total_tokens": 13017808} {"current_steps": 19930, "total_steps": 38160, "loss": 0.3522, "lr": 0.0005483599128460935, "epoch": 10.445492662473795, "percentage": 52.23, "elapsed_time": "0:51:01", "remaining_time": "0:46:40", "throughput": 4252.69, "total_tokens": 13020592} {"current_steps": 19935, "total_steps": 38160, "loss": 0.3941, "lr": 0.0005481322942564266, "epoch": 10.44811320754717, "percentage": 52.24, "elapsed_time": "0:51:02", "remaining_time": "0:46:39", "throughput": 4252.75, "total_tokens": 13024016} {"current_steps": 19940, "total_steps": 38160, "loss": 0.5303, "lr": 0.0005479046655980327, "epoch": 10.450733752620545, "percentage": 52.25, "elapsed_time": "0:51:03", "remaining_time": "0:46:38", "throughput": 4252.68, "total_tokens": 13026416} {"current_steps": 19945, "total_steps": 38160, "loss": 0.409, "lr": 0.0005476770269185295, "epoch": 10.45335429769392, "percentage": 52.27, "elapsed_time": "0:51:03", "remaining_time": "0:46:38", "throughput": 4252.65, "total_tokens": 13029168} {"current_steps": 19950, "total_steps": 38160, "loss": 0.4936, "lr": 0.0005474493782655361, "epoch": 10.455974842767295, "percentage": 52.28, "elapsed_time": "0:51:04", "remaining_time": "0:46:37", "throughput": 4252.68, "total_tokens": 13032240} {"current_steps": 19955, "total_steps": 38160, "loss": 0.4757, "lr": 0.0005472217196866742, "epoch": 10.45859538784067, "percentage": 52.29, "elapsed_time": "0:51:05", "remaining_time": "0:46:36", "throughput": 4252.69, "total_tokens": 13035120} {"current_steps": 19960, "total_steps": 38160, "loss": 0.3282, "lr": 0.0005469940512295671, "epoch": 10.461215932914046, "percentage": 52.31, "elapsed_time": "0:51:05", "remaining_time": "0:46:35", "throughput": 4252.86, "total_tokens": 13039088} {"current_steps": 19965, "total_steps": 38160, "loss": 0.4455, "lr": 0.0005467663729418406, "epoch": 10.463836477987421, "percentage": 52.32, "elapsed_time": "0:51:06", "remaining_time": "0:46:34", "throughput": 4252.91, "total_tokens": 13042320} {"current_steps": 19970, "total_steps": 38160, "loss": 0.4273, "lr": 0.0005465386848711225, "epoch": 10.466457023060796, "percentage": 52.33, "elapsed_time": "0:51:07", "remaining_time": "0:46:34", "throughput": 4253.06, "total_tokens": 13046160} {"current_steps": 19975, "total_steps": 38160, "loss": 0.4169, "lr": 0.0005463109870650426, "epoch": 10.469077568134171, "percentage": 52.35, "elapsed_time": "0:51:08", "remaining_time": "0:46:33", "throughput": 4253.05, "total_tokens": 13048944} {"current_steps": 19980, "total_steps": 38160, "loss": 0.4675, "lr": 0.0005460832795712323, "epoch": 10.471698113207546, "percentage": 52.36, "elapsed_time": "0:51:08", "remaining_time": "0:46:32", "throughput": 4253.19, "total_tokens": 13052816} {"current_steps": 19985, "total_steps": 38160, "loss": 0.4106, "lr": 0.0005458555624373258, "epoch": 10.474318658280922, "percentage": 52.37, "elapsed_time": "0:51:09", "remaining_time": "0:46:31", "throughput": 4253.32, "total_tokens": 13056592} {"current_steps": 19990, "total_steps": 38160, "loss": 0.3207, "lr": 0.0005456278357109589, "epoch": 10.476939203354299, "percentage": 52.38, "elapsed_time": "0:51:10", "remaining_time": "0:46:30", "throughput": 4253.34, "total_tokens": 13059632} {"current_steps": 19995, "total_steps": 38160, "loss": 0.4737, "lr": 0.0005454000994397691, "epoch": 10.479559748427674, "percentage": 52.4, "elapsed_time": "0:51:11", "remaining_time": "0:46:30", "throughput": 4253.37, "total_tokens": 13062864} {"current_steps": 20000, "total_steps": 38160, "loss": 0.3965, "lr": 0.0005451723536713965, "epoch": 10.482180293501049, "percentage": 52.41, "elapsed_time": "0:51:12", "remaining_time": "0:46:29", "throughput": 4253.56, "total_tokens": 13067152} {"current_steps": 20005, "total_steps": 38160, "loss": 0.5018, "lr": 0.0005449445984534828, "epoch": 10.484800838574424, "percentage": 52.42, "elapsed_time": "0:51:12", "remaining_time": "0:46:28", "throughput": 4253.75, "total_tokens": 13071440} {"current_steps": 20010, "total_steps": 38160, "loss": 0.4489, "lr": 0.0005447168338336721, "epoch": 10.4874213836478, "percentage": 52.44, "elapsed_time": "0:51:13", "remaining_time": "0:46:28", "throughput": 4253.87, "total_tokens": 13075248} {"current_steps": 20015, "total_steps": 38160, "loss": 0.4899, "lr": 0.0005444890598596098, "epoch": 10.490041928721174, "percentage": 52.45, "elapsed_time": "0:51:14", "remaining_time": "0:46:27", "throughput": 4253.87, "total_tokens": 13078128} {"current_steps": 20020, "total_steps": 38160, "loss": 0.4697, "lr": 0.0005442612765789437, "epoch": 10.49266247379455, "percentage": 52.46, "elapsed_time": "0:51:15", "remaining_time": "0:46:26", "throughput": 4254.02, "total_tokens": 13082000} {"current_steps": 20025, "total_steps": 38160, "loss": 0.4132, "lr": 0.0005440334840393235, "epoch": 10.495283018867925, "percentage": 52.48, "elapsed_time": "0:51:15", "remaining_time": "0:46:25", "throughput": 4254.15, "total_tokens": 13085680} {"current_steps": 20030, "total_steps": 38160, "loss": 0.5332, "lr": 0.0005438056822884007, "epoch": 10.4979035639413, "percentage": 52.49, "elapsed_time": "0:51:16", "remaining_time": "0:46:24", "throughput": 4254.3, "total_tokens": 13089520} {"current_steps": 20035, "total_steps": 38160, "loss": 0.4888, "lr": 0.0005435778713738292, "epoch": 10.500524109014675, "percentage": 52.5, "elapsed_time": "0:51:17", "remaining_time": "0:46:24", "throughput": 4254.29, "total_tokens": 13092368} {"current_steps": 20040, "total_steps": 38160, "loss": 0.362, "lr": 0.0005433500513432639, "epoch": 10.50314465408805, "percentage": 52.52, "elapsed_time": "0:51:18", "remaining_time": "0:46:23", "throughput": 4254.28, "total_tokens": 13095216} {"current_steps": 20045, "total_steps": 38160, "loss": 0.4815, "lr": 0.0005431222222443626, "epoch": 10.505765199161425, "percentage": 52.53, "elapsed_time": "0:51:18", "remaining_time": "0:46:22", "throughput": 4254.23, "total_tokens": 13097840} {"current_steps": 20050, "total_steps": 38160, "loss": 0.3794, "lr": 0.0005428943841247843, "epoch": 10.5083857442348, "percentage": 52.54, "elapsed_time": "0:51:19", "remaining_time": "0:46:21", "throughput": 4254.24, "total_tokens": 13100784} {"current_steps": 20055, "total_steps": 38160, "loss": 0.3982, "lr": 0.0005426665370321901, "epoch": 10.511006289308176, "percentage": 52.56, "elapsed_time": "0:51:20", "remaining_time": "0:46:20", "throughput": 4254.4, "total_tokens": 13104720} {"current_steps": 20060, "total_steps": 38160, "loss": 0.4194, "lr": 0.0005424386810142433, "epoch": 10.51362683438155, "percentage": 52.57, "elapsed_time": "0:51:21", "remaining_time": "0:46:20", "throughput": 4254.61, "total_tokens": 13109040} {"current_steps": 20065, "total_steps": 38160, "loss": 0.4345, "lr": 0.0005422108161186086, "epoch": 10.516247379454926, "percentage": 52.58, "elapsed_time": "0:51:21", "remaining_time": "0:46:19", "throughput": 4254.59, "total_tokens": 13111888} {"current_steps": 20070, "total_steps": 38160, "loss": 0.4528, "lr": 0.0005419829423929525, "epoch": 10.518867924528301, "percentage": 52.59, "elapsed_time": "0:51:22", "remaining_time": "0:46:18", "throughput": 4254.71, "total_tokens": 13115504} {"current_steps": 20075, "total_steps": 38160, "loss": 0.4994, "lr": 0.0005417550598849441, "epoch": 10.521488469601676, "percentage": 52.61, "elapsed_time": "0:51:23", "remaining_time": "0:46:17", "throughput": 4254.81, "total_tokens": 13119056} {"current_steps": 20080, "total_steps": 38160, "loss": 0.5323, "lr": 0.0005415271686422534, "epoch": 10.524109014675052, "percentage": 52.62, "elapsed_time": "0:51:23", "remaining_time": "0:46:16", "throughput": 4254.75, "total_tokens": 13121552} {"current_steps": 20085, "total_steps": 38160, "loss": 0.3765, "lr": 0.0005412992687125527, "epoch": 10.526729559748428, "percentage": 52.63, "elapsed_time": "0:51:24", "remaining_time": "0:46:16", "throughput": 4254.97, "total_tokens": 13125872} {"current_steps": 20090, "total_steps": 38160, "loss": 0.4729, "lr": 0.0005410713601435164, "epoch": 10.529350104821804, "percentage": 52.65, "elapsed_time": "0:51:25", "remaining_time": "0:46:15", "throughput": 4254.94, "total_tokens": 13128592} {"current_steps": 20095, "total_steps": 38160, "loss": 0.4978, "lr": 0.0005408434429828199, "epoch": 10.531970649895179, "percentage": 52.66, "elapsed_time": "0:51:26", "remaining_time": "0:46:14", "throughput": 4254.88, "total_tokens": 13131216} {"current_steps": 20100, "total_steps": 38160, "loss": 0.539, "lr": 0.0005406155172781412, "epoch": 10.534591194968554, "percentage": 52.67, "elapsed_time": "0:51:26", "remaining_time": "0:46:13", "throughput": 4254.89, "total_tokens": 13134192} {"current_steps": 20105, "total_steps": 38160, "loss": 0.475, "lr": 0.0005403875830771596, "epoch": 10.53721174004193, "percentage": 52.69, "elapsed_time": "0:51:27", "remaining_time": "0:46:12", "throughput": 4254.91, "total_tokens": 13137232} {"current_steps": 20110, "total_steps": 38160, "loss": 0.4517, "lr": 0.0005401596404275564, "epoch": 10.539832285115304, "percentage": 52.7, "elapsed_time": "0:51:28", "remaining_time": "0:46:11", "throughput": 4255.03, "total_tokens": 13140880} {"current_steps": 20115, "total_steps": 38160, "loss": 0.4932, "lr": 0.0005399316893770147, "epoch": 10.54245283018868, "percentage": 52.71, "elapsed_time": "0:51:29", "remaining_time": "0:46:11", "throughput": 4255.14, "total_tokens": 13144464} {"current_steps": 20120, "total_steps": 38160, "loss": 0.5768, "lr": 0.0005397037299732189, "epoch": 10.545073375262055, "percentage": 52.73, "elapsed_time": "0:51:29", "remaining_time": "0:46:10", "throughput": 4255.14, "total_tokens": 13147504} {"current_steps": 20125, "total_steps": 38160, "loss": 0.6034, "lr": 0.000539475762263856, "epoch": 10.54769392033543, "percentage": 52.74, "elapsed_time": "0:51:30", "remaining_time": "0:46:09", "throughput": 4255.11, "total_tokens": 13150288} {"current_steps": 20130, "total_steps": 38160, "loss": 0.3551, "lr": 0.0005392477862966138, "epoch": 10.550314465408805, "percentage": 52.75, "elapsed_time": "0:51:31", "remaining_time": "0:46:08", "throughput": 4255.18, "total_tokens": 13153616} {"current_steps": 20135, "total_steps": 38160, "loss": 0.3868, "lr": 0.0005390198021191827, "epoch": 10.55293501048218, "percentage": 52.76, "elapsed_time": "0:51:31", "remaining_time": "0:46:07", "throughput": 4255.12, "total_tokens": 13156080} {"current_steps": 20140, "total_steps": 38160, "loss": 0.4499, "lr": 0.000538791809779254, "epoch": 10.555555555555555, "percentage": 52.78, "elapsed_time": "0:51:32", "remaining_time": "0:46:07", "throughput": 4255.25, "total_tokens": 13159792} {"current_steps": 20145, "total_steps": 38160, "loss": 0.5525, "lr": 0.0005385638093245213, "epoch": 10.55817610062893, "percentage": 52.79, "elapsed_time": "0:51:33", "remaining_time": "0:46:06", "throughput": 4255.32, "total_tokens": 13163120} {"current_steps": 20150, "total_steps": 38160, "loss": 0.3426, "lr": 0.0005383358008026795, "epoch": 10.560796645702306, "percentage": 52.8, "elapsed_time": "0:51:34", "remaining_time": "0:46:05", "throughput": 4255.35, "total_tokens": 13166192} {"current_steps": 20155, "total_steps": 38160, "loss": 0.4488, "lr": 0.0005381077842614257, "epoch": 10.56341719077568, "percentage": 52.82, "elapsed_time": "0:51:34", "remaining_time": "0:46:04", "throughput": 4255.33, "total_tokens": 13168944} {"current_steps": 20160, "total_steps": 38160, "loss": 0.4775, "lr": 0.0005378797597484582, "epoch": 10.566037735849056, "percentage": 52.83, "elapsed_time": "0:51:35", "remaining_time": "0:46:03", "throughput": 4255.36, "total_tokens": 13172080} {"current_steps": 20165, "total_steps": 38160, "loss": 0.3141, "lr": 0.0005376517273114771, "epoch": 10.568658280922431, "percentage": 52.84, "elapsed_time": "0:51:36", "remaining_time": "0:46:02", "throughput": 4255.32, "total_tokens": 13174704} {"current_steps": 20170, "total_steps": 38160, "loss": 0.4197, "lr": 0.0005374236869981841, "epoch": 10.571278825995806, "percentage": 52.86, "elapsed_time": "0:51:36", "remaining_time": "0:46:02", "throughput": 4255.34, "total_tokens": 13177648} {"current_steps": 20175, "total_steps": 38160, "loss": 0.5175, "lr": 0.0005371956388562827, "epoch": 10.573899371069182, "percentage": 52.87, "elapsed_time": "0:51:37", "remaining_time": "0:46:01", "throughput": 4255.34, "total_tokens": 13180592} {"current_steps": 20180, "total_steps": 38160, "loss": 0.5428, "lr": 0.0005369675829334782, "epoch": 10.576519916142558, "percentage": 52.88, "elapsed_time": "0:51:38", "remaining_time": "0:46:00", "throughput": 4255.33, "total_tokens": 13183408} {"current_steps": 20185, "total_steps": 38160, "loss": 0.4368, "lr": 0.0005367395192774769, "epoch": 10.579140461215934, "percentage": 52.9, "elapsed_time": "0:51:38", "remaining_time": "0:45:59", "throughput": 4255.47, "total_tokens": 13187280} {"current_steps": 20190, "total_steps": 38160, "loss": 0.4069, "lr": 0.0005365114479359875, "epoch": 10.581761006289309, "percentage": 52.91, "elapsed_time": "0:51:39", "remaining_time": "0:45:58", "throughput": 4255.48, "total_tokens": 13190288} {"current_steps": 20195, "total_steps": 38160, "loss": 0.3305, "lr": 0.0005362833689567197, "epoch": 10.584381551362684, "percentage": 52.92, "elapsed_time": "0:51:40", "remaining_time": "0:45:57", "throughput": 4255.49, "total_tokens": 13193328} {"current_steps": 20200, "total_steps": 38160, "loss": 0.3844, "lr": 0.0005360552823873849, "epoch": 10.58700209643606, "percentage": 52.94, "elapsed_time": "0:51:40", "remaining_time": "0:45:57", "throughput": 4255.44, "total_tokens": 13195888} {"current_steps": 20205, "total_steps": 38160, "loss": 0.6025, "lr": 0.0005358271882756966, "epoch": 10.589622641509434, "percentage": 52.95, "elapsed_time": "0:51:41", "remaining_time": "0:45:56", "throughput": 4255.39, "total_tokens": 13198512} {"current_steps": 20210, "total_steps": 38160, "loss": 0.3611, "lr": 0.0005355990866693689, "epoch": 10.59224318658281, "percentage": 52.96, "elapsed_time": "0:51:42", "remaining_time": "0:45:55", "throughput": 4255.36, "total_tokens": 13201168} {"current_steps": 20215, "total_steps": 38160, "loss": 0.4117, "lr": 0.0005353709776161187, "epoch": 10.594863731656185, "percentage": 52.97, "elapsed_time": "0:51:42", "remaining_time": "0:45:54", "throughput": 4255.41, "total_tokens": 13204432} {"current_steps": 20220, "total_steps": 38160, "loss": 0.4991, "lr": 0.0005351428611636636, "epoch": 10.59748427672956, "percentage": 52.99, "elapsed_time": "0:51:43", "remaining_time": "0:45:53", "throughput": 4255.5, "total_tokens": 13207920} {"current_steps": 20225, "total_steps": 38160, "loss": 0.4114, "lr": 0.0005349147373597226, "epoch": 10.600104821802935, "percentage": 53.0, "elapsed_time": "0:51:44", "remaining_time": "0:45:52", "throughput": 4255.44, "total_tokens": 13210384} {"current_steps": 20230, "total_steps": 38160, "loss": 0.6321, "lr": 0.000534686606252017, "epoch": 10.60272536687631, "percentage": 53.01, "elapsed_time": "0:51:45", "remaining_time": "0:45:52", "throughput": 4255.44, "total_tokens": 13213360} {"current_steps": 20235, "total_steps": 38160, "loss": 0.5773, "lr": 0.0005344584678882692, "epoch": 10.605345911949685, "percentage": 53.03, "elapsed_time": "0:51:45", "remaining_time": "0:45:51", "throughput": 4255.49, "total_tokens": 13216560} {"current_steps": 20240, "total_steps": 38160, "loss": 0.4279, "lr": 0.0005342303223162027, "epoch": 10.60796645702306, "percentage": 53.04, "elapsed_time": "0:51:46", "remaining_time": "0:45:50", "throughput": 4255.55, "total_tokens": 13219920} {"current_steps": 20245, "total_steps": 38160, "loss": 0.5053, "lr": 0.0005340021695835437, "epoch": 10.610587002096436, "percentage": 53.05, "elapsed_time": "0:51:47", "remaining_time": "0:45:49", "throughput": 4255.65, "total_tokens": 13223536} {"current_steps": 20250, "total_steps": 38160, "loss": 0.392, "lr": 0.0005337740097380184, "epoch": 10.61320754716981, "percentage": 53.07, "elapsed_time": "0:51:48", "remaining_time": "0:45:48", "throughput": 4255.74, "total_tokens": 13226992} {"current_steps": 20255, "total_steps": 38160, "loss": 0.3978, "lr": 0.0005335458428273557, "epoch": 10.615828092243186, "percentage": 53.08, "elapsed_time": "0:51:48", "remaining_time": "0:45:48", "throughput": 4255.77, "total_tokens": 13230000} {"current_steps": 20260, "total_steps": 38160, "loss": 0.491, "lr": 0.0005333176688992855, "epoch": 10.618448637316561, "percentage": 53.09, "elapsed_time": "0:51:49", "remaining_time": "0:45:47", "throughput": 4255.75, "total_tokens": 13232912} {"current_steps": 20265, "total_steps": 38160, "loss": 0.5413, "lr": 0.000533089488001539, "epoch": 10.621069182389936, "percentage": 53.11, "elapsed_time": "0:51:50", "remaining_time": "0:45:46", "throughput": 4255.89, "total_tokens": 13236720} {"current_steps": 20270, "total_steps": 38160, "loss": 0.4457, "lr": 0.0005328613001818492, "epoch": 10.623689727463312, "percentage": 53.12, "elapsed_time": "0:51:50", "remaining_time": "0:45:45", "throughput": 4255.9, "total_tokens": 13239600} {"current_steps": 20275, "total_steps": 38160, "loss": 0.5259, "lr": 0.0005326331054879502, "epoch": 10.626310272536688, "percentage": 53.13, "elapsed_time": "0:51:51", "remaining_time": "0:45:44", "throughput": 4255.82, "total_tokens": 13242000} {"current_steps": 20280, "total_steps": 38160, "loss": 0.433, "lr": 0.0005324049039675778, "epoch": 10.628930817610064, "percentage": 53.14, "elapsed_time": "0:51:52", "remaining_time": "0:45:43", "throughput": 4255.83, "total_tokens": 13244880} {"current_steps": 20285, "total_steps": 38160, "loss": 0.5755, "lr": 0.0005321766956684693, "epoch": 10.631551362683439, "percentage": 53.16, "elapsed_time": "0:51:52", "remaining_time": "0:45:43", "throughput": 4255.91, "total_tokens": 13248368} {"current_steps": 20290, "total_steps": 38160, "loss": 0.4564, "lr": 0.0005319484806383631, "epoch": 10.634171907756814, "percentage": 53.17, "elapsed_time": "0:51:53", "remaining_time": "0:45:42", "throughput": 4256.13, "total_tokens": 13252720} {"current_steps": 20295, "total_steps": 38160, "loss": 0.3142, "lr": 0.0005317202589249991, "epoch": 10.63679245283019, "percentage": 53.18, "elapsed_time": "0:51:54", "remaining_time": "0:45:41", "throughput": 4256.17, "total_tokens": 13255824} {"current_steps": 20300, "total_steps": 38160, "loss": 0.2988, "lr": 0.0005314920305761191, "epoch": 10.639412997903564, "percentage": 53.2, "elapsed_time": "0:51:55", "remaining_time": "0:45:40", "throughput": 4256.1, "total_tokens": 13258192} {"current_steps": 20305, "total_steps": 38160, "loss": 0.508, "lr": 0.0005312637956394654, "epoch": 10.64203354297694, "percentage": 53.21, "elapsed_time": "0:51:55", "remaining_time": "0:45:39", "throughput": 4256.16, "total_tokens": 13261456} {"current_steps": 20310, "total_steps": 38160, "loss": 0.3395, "lr": 0.0005310355541627824, "epoch": 10.644654088050315, "percentage": 53.22, "elapsed_time": "0:51:56", "remaining_time": "0:45:39", "throughput": 4256.19, "total_tokens": 13264656} {"current_steps": 20315, "total_steps": 38160, "loss": 0.3922, "lr": 0.0005308073061938153, "epoch": 10.64727463312369, "percentage": 53.24, "elapsed_time": "0:51:57", "remaining_time": "0:45:38", "throughput": 4256.14, "total_tokens": 13267184} {"current_steps": 20320, "total_steps": 38160, "loss": 0.5448, "lr": 0.0005305790517803115, "epoch": 10.649895178197065, "percentage": 53.25, "elapsed_time": "0:51:57", "remaining_time": "0:45:37", "throughput": 4256.24, "total_tokens": 13270768} {"current_steps": 20325, "total_steps": 38160, "loss": 0.5752, "lr": 0.0005303507909700189, "epoch": 10.65251572327044, "percentage": 53.26, "elapsed_time": "0:51:58", "remaining_time": "0:45:36", "throughput": 4256.19, "total_tokens": 13273296} {"current_steps": 20330, "total_steps": 38160, "loss": 0.4722, "lr": 0.000530122523810687, "epoch": 10.655136268343815, "percentage": 53.28, "elapsed_time": "0:51:59", "remaining_time": "0:45:35", "throughput": 4256.5, "total_tokens": 13278448} {"current_steps": 20335, "total_steps": 38160, "loss": 0.499, "lr": 0.0005298942503500668, "epoch": 10.65775681341719, "percentage": 53.29, "elapsed_time": "0:52:00", "remaining_time": "0:45:35", "throughput": 4256.52, "total_tokens": 13281520} {"current_steps": 20340, "total_steps": 38160, "loss": 0.4121, "lr": 0.0005296659706359105, "epoch": 10.660377358490566, "percentage": 53.3, "elapsed_time": "0:52:00", "remaining_time": "0:45:34", "throughput": 4256.54, "total_tokens": 13284496} {"current_steps": 20345, "total_steps": 38160, "loss": 0.4349, "lr": 0.0005294376847159716, "epoch": 10.66299790356394, "percentage": 53.31, "elapsed_time": "0:52:01", "remaining_time": "0:45:33", "throughput": 4256.57, "total_tokens": 13287760} {"current_steps": 20350, "total_steps": 38160, "loss": 0.4805, "lr": 0.0005292093926380049, "epoch": 10.665618448637316, "percentage": 53.33, "elapsed_time": "0:52:02", "remaining_time": "0:45:32", "throughput": 4256.54, "total_tokens": 13290384} {"current_steps": 20355, "total_steps": 38160, "loss": 0.4758, "lr": 0.0005289810944497663, "epoch": 10.668238993710691, "percentage": 53.34, "elapsed_time": "0:52:03", "remaining_time": "0:45:31", "throughput": 4256.69, "total_tokens": 13294448} {"current_steps": 20360, "total_steps": 38160, "loss": 0.5801, "lr": 0.0005287527901990137, "epoch": 10.670859538784066, "percentage": 53.35, "elapsed_time": "0:52:04", "remaining_time": "0:45:31", "throughput": 4256.86, "total_tokens": 13298480} {"current_steps": 20365, "total_steps": 38160, "loss": 0.4048, "lr": 0.0005285244799335053, "epoch": 10.673480083857442, "percentage": 53.37, "elapsed_time": "0:52:04", "remaining_time": "0:45:30", "throughput": 4256.96, "total_tokens": 13302096} {"current_steps": 20370, "total_steps": 38160, "loss": 0.4465, "lr": 0.0005282961637010009, "epoch": 10.676100628930818, "percentage": 53.38, "elapsed_time": "0:52:05", "remaining_time": "0:45:29", "throughput": 4256.98, "total_tokens": 13305136} {"current_steps": 20375, "total_steps": 38160, "loss": 0.3954, "lr": 0.0005280678415492621, "epoch": 10.678721174004194, "percentage": 53.39, "elapsed_time": "0:52:06", "remaining_time": "0:45:28", "throughput": 4257.05, "total_tokens": 13308464} {"current_steps": 20380, "total_steps": 38160, "loss": 0.4417, "lr": 0.0005278395135260512, "epoch": 10.681341719077569, "percentage": 53.41, "elapsed_time": "0:52:07", "remaining_time": "0:45:28", "throughput": 4257.37, "total_tokens": 13313392} {"current_steps": 20385, "total_steps": 38160, "loss": 0.3728, "lr": 0.0005276111796791314, "epoch": 10.683962264150944, "percentage": 53.42, "elapsed_time": "0:52:07", "remaining_time": "0:45:27", "throughput": 4257.41, "total_tokens": 13316624} {"current_steps": 20390, "total_steps": 38160, "loss": 0.5815, "lr": 0.000527382840056268, "epoch": 10.68658280922432, "percentage": 53.43, "elapsed_time": "0:52:08", "remaining_time": "0:45:26", "throughput": 4257.51, "total_tokens": 13320176} {"current_steps": 20395, "total_steps": 38160, "loss": 0.3871, "lr": 0.0005271544947052267, "epoch": 10.689203354297694, "percentage": 53.45, "elapsed_time": "0:52:09", "remaining_time": "0:45:25", "throughput": 4257.52, "total_tokens": 13323024} {"current_steps": 20400, "total_steps": 38160, "loss": 0.5057, "lr": 0.000526926143673775, "epoch": 10.69182389937107, "percentage": 53.46, "elapsed_time": "0:52:10", "remaining_time": "0:45:24", "throughput": 4257.6, "total_tokens": 13326544} {"current_steps": 20405, "total_steps": 38160, "loss": 0.3308, "lr": 0.0005266977870096813, "epoch": 10.694444444444445, "percentage": 53.47, "elapsed_time": "0:52:10", "remaining_time": "0:45:24", "throughput": 4257.73, "total_tokens": 13330352} {"current_steps": 20410, "total_steps": 38160, "loss": 0.4348, "lr": 0.000526469424760715, "epoch": 10.69706498951782, "percentage": 53.49, "elapsed_time": "0:52:11", "remaining_time": "0:45:23", "throughput": 4257.73, "total_tokens": 13333264} {"current_steps": 20415, "total_steps": 38160, "loss": 0.4265, "lr": 0.0005262410569746471, "epoch": 10.699685534591195, "percentage": 53.5, "elapsed_time": "0:52:12", "remaining_time": "0:45:22", "throughput": 4257.68, "total_tokens": 13335792} {"current_steps": 20420, "total_steps": 38160, "loss": 0.4946, "lr": 0.0005260126836992495, "epoch": 10.70230607966457, "percentage": 53.51, "elapsed_time": "0:52:12", "remaining_time": "0:45:21", "throughput": 4257.6, "total_tokens": 13338256} {"current_steps": 20425, "total_steps": 38160, "loss": 0.4352, "lr": 0.000525784304982295, "epoch": 10.704926624737945, "percentage": 53.52, "elapsed_time": "0:52:13", "remaining_time": "0:45:20", "throughput": 4257.61, "total_tokens": 13341136} {"current_steps": 20430, "total_steps": 38160, "loss": 0.4512, "lr": 0.0005255559208715585, "epoch": 10.70754716981132, "percentage": 53.54, "elapsed_time": "0:52:14", "remaining_time": "0:45:19", "throughput": 4257.6, "total_tokens": 13343984} {"current_steps": 20435, "total_steps": 38160, "loss": 0.4176, "lr": 0.0005253275314148145, "epoch": 10.710167714884696, "percentage": 53.55, "elapsed_time": "0:52:14", "remaining_time": "0:45:19", "throughput": 4257.55, "total_tokens": 13346544} {"current_steps": 20440, "total_steps": 38160, "loss": 0.5049, "lr": 0.0005250991366598401, "epoch": 10.71278825995807, "percentage": 53.56, "elapsed_time": "0:52:15", "remaining_time": "0:45:18", "throughput": 4257.54, "total_tokens": 13349392} {"current_steps": 20445, "total_steps": 38160, "loss": 0.3509, "lr": 0.0005248707366544126, "epoch": 10.715408805031446, "percentage": 53.58, "elapsed_time": "0:52:16", "remaining_time": "0:45:17", "throughput": 4257.65, "total_tokens": 13353040} {"current_steps": 20450, "total_steps": 38160, "loss": 0.4199, "lr": 0.0005246423314463106, "epoch": 10.718029350104821, "percentage": 53.59, "elapsed_time": "0:52:17", "remaining_time": "0:45:16", "throughput": 4257.8, "total_tokens": 13356912} {"current_steps": 20455, "total_steps": 38160, "loss": 0.5075, "lr": 0.000524413921083314, "epoch": 10.720649895178196, "percentage": 53.6, "elapsed_time": "0:52:17", "remaining_time": "0:45:16", "throughput": 4258.01, "total_tokens": 13361328} {"current_steps": 20460, "total_steps": 38160, "loss": 0.4515, "lr": 0.0005241855056132039, "epoch": 10.723270440251572, "percentage": 53.62, "elapsed_time": "0:52:18", "remaining_time": "0:45:15", "throughput": 4258.29, "total_tokens": 13366032} {"current_steps": 20465, "total_steps": 38160, "loss": 0.4378, "lr": 0.0005239570850837617, "epoch": 10.725890985324948, "percentage": 53.63, "elapsed_time": "0:52:19", "remaining_time": "0:45:14", "throughput": 4258.27, "total_tokens": 13368784} {"current_steps": 20470, "total_steps": 38160, "loss": 0.4065, "lr": 0.0005237286595427709, "epoch": 10.728511530398324, "percentage": 53.64, "elapsed_time": "0:52:20", "remaining_time": "0:45:13", "throughput": 4258.43, "total_tokens": 13372816} {"current_steps": 20475, "total_steps": 38160, "loss": 0.6014, "lr": 0.000523500229038015, "epoch": 10.731132075471699, "percentage": 53.66, "elapsed_time": "0:52:21", "remaining_time": "0:45:13", "throughput": 4258.48, "total_tokens": 13376048} {"current_steps": 20480, "total_steps": 38160, "loss": 0.4125, "lr": 0.0005232717936172794, "epoch": 10.733752620545074, "percentage": 53.67, "elapsed_time": "0:52:21", "remaining_time": "0:45:12", "throughput": 4258.48, "total_tokens": 13378896} {"current_steps": 20485, "total_steps": 38160, "loss": 0.3317, "lr": 0.0005230433533283498, "epoch": 10.73637316561845, "percentage": 53.68, "elapsed_time": "0:52:22", "remaining_time": "0:45:11", "throughput": 4258.59, "total_tokens": 13382512} {"current_steps": 20490, "total_steps": 38160, "loss": 0.4575, "lr": 0.0005228149082190139, "epoch": 10.738993710691824, "percentage": 53.69, "elapsed_time": "0:52:23", "remaining_time": "0:45:10", "throughput": 4258.65, "total_tokens": 13385776} {"current_steps": 20495, "total_steps": 38160, "loss": 0.4121, "lr": 0.0005225864583370594, "epoch": 10.7416142557652, "percentage": 53.71, "elapsed_time": "0:52:24", "remaining_time": "0:45:09", "throughput": 4258.8, "total_tokens": 13389680} {"current_steps": 20500, "total_steps": 38160, "loss": 0.384, "lr": 0.0005223580037302754, "epoch": 10.744234800838575, "percentage": 53.72, "elapsed_time": "0:52:24", "remaining_time": "0:45:09", "throughput": 4258.97, "total_tokens": 13393776} {"current_steps": 20505, "total_steps": 38160, "loss": 0.4659, "lr": 0.0005221295444464522, "epoch": 10.74685534591195, "percentage": 53.73, "elapsed_time": "0:52:25", "remaining_time": "0:45:08", "throughput": 4259.0, "total_tokens": 13396880} {"current_steps": 20510, "total_steps": 38160, "loss": 0.4577, "lr": 0.0005219010805333807, "epoch": 10.749475890985325, "percentage": 53.75, "elapsed_time": "0:52:26", "remaining_time": "0:45:07", "throughput": 4259.06, "total_tokens": 13400176} {"current_steps": 20515, "total_steps": 38160, "loss": 0.5616, "lr": 0.000521672612038853, "epoch": 10.7520964360587, "percentage": 53.76, "elapsed_time": "0:52:26", "remaining_time": "0:45:06", "throughput": 4259.04, "total_tokens": 13402896} {"current_steps": 20520, "total_steps": 38160, "loss": 0.4511, "lr": 0.0005214441390106624, "epoch": 10.754716981132075, "percentage": 53.77, "elapsed_time": "0:52:27", "remaining_time": "0:45:05", "throughput": 4259.17, "total_tokens": 13406672} {"current_steps": 20525, "total_steps": 38160, "loss": 0.5191, "lr": 0.0005212156614966022, "epoch": 10.75733752620545, "percentage": 53.79, "elapsed_time": "0:52:28", "remaining_time": "0:45:05", "throughput": 4259.15, "total_tokens": 13409456} {"current_steps": 20530, "total_steps": 38160, "loss": 0.396, "lr": 0.0005209871795444678, "epoch": 10.759958071278826, "percentage": 53.8, "elapsed_time": "0:52:29", "remaining_time": "0:45:04", "throughput": 4259.26, "total_tokens": 13413104} {"current_steps": 20535, "total_steps": 38160, "loss": 0.3768, "lr": 0.000520758693202055, "epoch": 10.7625786163522, "percentage": 53.81, "elapsed_time": "0:52:30", "remaining_time": "0:45:03", "throughput": 4259.74, "total_tokens": 13419888} {"current_steps": 20540, "total_steps": 38160, "loss": 0.3902, "lr": 0.0005205302025171601, "epoch": 10.765199161425576, "percentage": 53.83, "elapsed_time": "0:52:31", "remaining_time": "0:45:03", "throughput": 4259.81, "total_tokens": 13423248} {"current_steps": 20545, "total_steps": 38160, "loss": 0.5861, "lr": 0.0005203017075375812, "epoch": 10.767819706498951, "percentage": 53.84, "elapsed_time": "0:52:31", "remaining_time": "0:45:02", "throughput": 4259.78, "total_tokens": 13425968} {"current_steps": 20550, "total_steps": 38160, "loss": 0.4273, "lr": 0.0005200732083111169, "epoch": 10.770440251572326, "percentage": 53.85, "elapsed_time": "0:52:32", "remaining_time": "0:45:01", "throughput": 4259.86, "total_tokens": 13429488} {"current_steps": 20555, "total_steps": 38160, "loss": 0.4567, "lr": 0.000519844704885566, "epoch": 10.773060796645701, "percentage": 53.87, "elapsed_time": "0:52:33", "remaining_time": "0:45:00", "throughput": 4260.01, "total_tokens": 13433424} {"current_steps": 20560, "total_steps": 38160, "loss": 0.4964, "lr": 0.0005196161973087297, "epoch": 10.775681341719078, "percentage": 53.88, "elapsed_time": "0:52:34", "remaining_time": "0:45:00", "throughput": 4260.11, "total_tokens": 13436944} {"current_steps": 20565, "total_steps": 38160, "loss": 0.3348, "lr": 0.0005193876856284084, "epoch": 10.778301886792454, "percentage": 53.89, "elapsed_time": "0:52:34", "remaining_time": "0:44:59", "throughput": 4260.15, "total_tokens": 13440080} {"current_steps": 20570, "total_steps": 38160, "loss": 0.4089, "lr": 0.0005191591698924046, "epoch": 10.780922431865829, "percentage": 53.9, "elapsed_time": "0:52:35", "remaining_time": "0:44:58", "throughput": 4260.14, "total_tokens": 13442896} {"current_steps": 20575, "total_steps": 38160, "loss": 0.4451, "lr": 0.0005189306501485211, "epoch": 10.783542976939204, "percentage": 53.92, "elapsed_time": "0:52:36", "remaining_time": "0:44:57", "throughput": 4260.14, "total_tokens": 13445808} {"current_steps": 20580, "total_steps": 38160, "loss": 0.501, "lr": 0.0005187021264445613, "epoch": 10.786163522012579, "percentage": 53.93, "elapsed_time": "0:52:36", "remaining_time": "0:44:56", "throughput": 4260.13, "total_tokens": 13448720} {"current_steps": 20585, "total_steps": 38160, "loss": 0.4168, "lr": 0.0005184735988283302, "epoch": 10.788784067085954, "percentage": 53.94, "elapsed_time": "0:52:37", "remaining_time": "0:44:55", "throughput": 4260.24, "total_tokens": 13452400} {"current_steps": 20590, "total_steps": 38160, "loss": 0.4948, "lr": 0.000518245067347633, "epoch": 10.79140461215933, "percentage": 53.96, "elapsed_time": "0:52:38", "remaining_time": "0:44:55", "throughput": 4260.33, "total_tokens": 13455888} {"current_steps": 20595, "total_steps": 38160, "loss": 0.4615, "lr": 0.0005180165320502756, "epoch": 10.794025157232705, "percentage": 53.97, "elapsed_time": "0:52:39", "remaining_time": "0:44:54", "throughput": 4260.41, "total_tokens": 13459248} {"current_steps": 20600, "total_steps": 38160, "loss": 0.4415, "lr": 0.0005177879929840655, "epoch": 10.79664570230608, "percentage": 53.98, "elapsed_time": "0:52:39", "remaining_time": "0:44:53", "throughput": 4260.5, "total_tokens": 13462832} {"current_steps": 20605, "total_steps": 38160, "loss": 0.4621, "lr": 0.0005175594501968103, "epoch": 10.799266247379455, "percentage": 54.0, "elapsed_time": "0:52:40", "remaining_time": "0:44:52", "throughput": 4260.65, "total_tokens": 13466704} {"current_steps": 20610, "total_steps": 38160, "loss": 0.4288, "lr": 0.0005173309037363182, "epoch": 10.80188679245283, "percentage": 54.01, "elapsed_time": "0:52:41", "remaining_time": "0:44:52", "throughput": 4260.72, "total_tokens": 13470096} {"current_steps": 20615, "total_steps": 38160, "loss": 0.3798, "lr": 0.0005171023536503991, "epoch": 10.804507337526205, "percentage": 54.02, "elapsed_time": "0:52:42", "remaining_time": "0:44:51", "throughput": 4260.86, "total_tokens": 13473904} {"current_steps": 20620, "total_steps": 38160, "loss": 0.3287, "lr": 0.0005168737999868624, "epoch": 10.80712788259958, "percentage": 54.04, "elapsed_time": "0:52:42", "remaining_time": "0:44:50", "throughput": 4260.86, "total_tokens": 13476752} {"current_steps": 20625, "total_steps": 38160, "loss": 0.451, "lr": 0.0005166452427935193, "epoch": 10.809748427672956, "percentage": 54.05, "elapsed_time": "0:52:43", "remaining_time": "0:44:49", "throughput": 4260.94, "total_tokens": 13480208} {"current_steps": 20630, "total_steps": 38160, "loss": 0.4273, "lr": 0.0005164166821181814, "epoch": 10.81236897274633, "percentage": 54.06, "elapsed_time": "0:52:44", "remaining_time": "0:44:48", "throughput": 4260.92, "total_tokens": 13482832} {"current_steps": 20635, "total_steps": 38160, "loss": 0.3749, "lr": 0.0005161881180086607, "epoch": 10.814989517819706, "percentage": 54.07, "elapsed_time": "0:52:44", "remaining_time": "0:44:47", "throughput": 4260.9, "total_tokens": 13485744} {"current_steps": 20640, "total_steps": 38160, "loss": 0.3995, "lr": 0.0005159595505127705, "epoch": 10.817610062893081, "percentage": 54.09, "elapsed_time": "0:52:45", "remaining_time": "0:44:47", "throughput": 4260.9, "total_tokens": 13488656} {"current_steps": 20645, "total_steps": 38160, "loss": 0.3997, "lr": 0.0005157309796783246, "epoch": 10.820230607966456, "percentage": 54.1, "elapsed_time": "0:52:46", "remaining_time": "0:44:46", "throughput": 4260.89, "total_tokens": 13491408} {"current_steps": 20650, "total_steps": 38160, "loss": 0.5128, "lr": 0.000515502405553137, "epoch": 10.822851153039831, "percentage": 54.11, "elapsed_time": "0:52:47", "remaining_time": "0:44:45", "throughput": 4260.99, "total_tokens": 13495056} {"current_steps": 20655, "total_steps": 38160, "loss": 0.4278, "lr": 0.0005152738281850231, "epoch": 10.825471698113208, "percentage": 54.13, "elapsed_time": "0:52:47", "remaining_time": "0:44:44", "throughput": 4261.07, "total_tokens": 13498512} {"current_steps": 20660, "total_steps": 38160, "loss": 0.5601, "lr": 0.0005150452476217986, "epoch": 10.828092243186584, "percentage": 54.14, "elapsed_time": "0:52:48", "remaining_time": "0:44:43", "throughput": 4261.08, "total_tokens": 13501392} {"current_steps": 20665, "total_steps": 38160, "loss": 0.4794, "lr": 0.0005148166639112799, "epoch": 10.830712788259959, "percentage": 54.15, "elapsed_time": "0:52:49", "remaining_time": "0:44:43", "throughput": 4261.09, "total_tokens": 13504464} {"current_steps": 20670, "total_steps": 38160, "loss": 0.4653, "lr": 0.0005145880771012842, "epoch": 10.833333333333334, "percentage": 54.17, "elapsed_time": "0:52:49", "remaining_time": "0:44:42", "throughput": 4261.11, "total_tokens": 13507472} {"current_steps": 20675, "total_steps": 38160, "loss": 0.4028, "lr": 0.0005143594872396291, "epoch": 10.835953878406709, "percentage": 54.18, "elapsed_time": "0:52:50", "remaining_time": "0:44:41", "throughput": 4261.1, "total_tokens": 13510224} {"current_steps": 20680, "total_steps": 38160, "loss": 0.4696, "lr": 0.0005141308943741333, "epoch": 10.838574423480084, "percentage": 54.19, "elapsed_time": "0:52:51", "remaining_time": "0:44:40", "throughput": 4261.08, "total_tokens": 13512944} {"current_steps": 20685, "total_steps": 38160, "loss": 0.396, "lr": 0.0005139022985526154, "epoch": 10.84119496855346, "percentage": 54.21, "elapsed_time": "0:52:52", "remaining_time": "0:44:39", "throughput": 4261.24, "total_tokens": 13516976} {"current_steps": 20690, "total_steps": 38160, "loss": 0.4443, "lr": 0.0005136736998228952, "epoch": 10.843815513626835, "percentage": 54.22, "elapsed_time": "0:52:52", "remaining_time": "0:44:39", "throughput": 4261.37, "total_tokens": 13520816} {"current_steps": 20695, "total_steps": 38160, "loss": 0.3919, "lr": 0.0005134450982327933, "epoch": 10.84643605870021, "percentage": 54.23, "elapsed_time": "0:52:53", "remaining_time": "0:44:38", "throughput": 4261.41, "total_tokens": 13523888} {"current_steps": 20700, "total_steps": 38160, "loss": 0.333, "lr": 0.0005132164938301299, "epoch": 10.849056603773585, "percentage": 54.25, "elapsed_time": "0:52:54", "remaining_time": "0:44:37", "throughput": 4261.36, "total_tokens": 13526384} {"current_steps": 20705, "total_steps": 38160, "loss": 0.579, "lr": 0.0005129878866627271, "epoch": 10.85167714884696, "percentage": 54.26, "elapsed_time": "0:52:54", "remaining_time": "0:44:36", "throughput": 4261.31, "total_tokens": 13529008} {"current_steps": 20710, "total_steps": 38160, "loss": 0.4566, "lr": 0.0005127592767784063, "epoch": 10.854297693920335, "percentage": 54.27, "elapsed_time": "0:52:55", "remaining_time": "0:44:35", "throughput": 4261.33, "total_tokens": 13532080} {"current_steps": 20715, "total_steps": 38160, "loss": 0.5129, "lr": 0.0005125306642249905, "epoch": 10.85691823899371, "percentage": 54.28, "elapsed_time": "0:52:56", "remaining_time": "0:44:34", "throughput": 4261.4, "total_tokens": 13535504} {"current_steps": 20720, "total_steps": 38160, "loss": 0.4218, "lr": 0.0005123020490503027, "epoch": 10.859538784067086, "percentage": 54.3, "elapsed_time": "0:52:56", "remaining_time": "0:44:34", "throughput": 4261.38, "total_tokens": 13538256} {"current_steps": 20725, "total_steps": 38160, "loss": 0.5939, "lr": 0.0005120734313021665, "epoch": 10.86215932914046, "percentage": 54.31, "elapsed_time": "0:52:57", "remaining_time": "0:44:33", "throughput": 4261.43, "total_tokens": 13541456} {"current_steps": 20730, "total_steps": 38160, "loss": 0.4001, "lr": 0.0005118448110284063, "epoch": 10.864779874213836, "percentage": 54.32, "elapsed_time": "0:52:58", "remaining_time": "0:44:32", "throughput": 4261.5, "total_tokens": 13544720} {"current_steps": 20735, "total_steps": 38160, "loss": 0.4976, "lr": 0.0005116161882768469, "epoch": 10.867400419287211, "percentage": 54.34, "elapsed_time": "0:52:59", "remaining_time": "0:44:31", "throughput": 4261.47, "total_tokens": 13547504} {"current_steps": 20740, "total_steps": 38160, "loss": 0.397, "lr": 0.0005113875630953131, "epoch": 10.870020964360586, "percentage": 54.35, "elapsed_time": "0:52:59", "remaining_time": "0:44:30", "throughput": 4261.55, "total_tokens": 13551056} {"current_steps": 20745, "total_steps": 38160, "loss": 0.4481, "lr": 0.0005111589355316314, "epoch": 10.872641509433961, "percentage": 54.36, "elapsed_time": "0:53:00", "remaining_time": "0:44:30", "throughput": 4261.63, "total_tokens": 13554608} {"current_steps": 20750, "total_steps": 38160, "loss": 0.4909, "lr": 0.0005109303056336274, "epoch": 10.875262054507338, "percentage": 54.38, "elapsed_time": "0:53:01", "remaining_time": "0:44:29", "throughput": 4261.82, "total_tokens": 13558736} {"current_steps": 20755, "total_steps": 38160, "loss": 0.4435, "lr": 0.0005107016734491281, "epoch": 10.877882599580714, "percentage": 54.39, "elapsed_time": "0:53:02", "remaining_time": "0:44:28", "throughput": 4261.9, "total_tokens": 13562224} {"current_steps": 20760, "total_steps": 38160, "loss": 0.4733, "lr": 0.0005104730390259611, "epoch": 10.880503144654089, "percentage": 54.4, "elapsed_time": "0:53:02", "remaining_time": "0:44:27", "throughput": 4261.88, "total_tokens": 13565040} {"current_steps": 20765, "total_steps": 38160, "loss": 0.4185, "lr": 0.0005102444024119537, "epoch": 10.883123689727464, "percentage": 54.42, "elapsed_time": "0:53:03", "remaining_time": "0:44:26", "throughput": 4261.82, "total_tokens": 13567568} {"current_steps": 20770, "total_steps": 38160, "loss": 0.4028, "lr": 0.0005100157636549342, "epoch": 10.885744234800839, "percentage": 54.43, "elapsed_time": "0:53:04", "remaining_time": "0:44:25", "throughput": 4261.8, "total_tokens": 13570256} {"current_steps": 20775, "total_steps": 38160, "loss": 0.461, "lr": 0.0005097871228027312, "epoch": 10.888364779874214, "percentage": 54.44, "elapsed_time": "0:53:04", "remaining_time": "0:44:25", "throughput": 4261.9, "total_tokens": 13574000} {"current_steps": 20780, "total_steps": 38160, "loss": 0.459, "lr": 0.0005095584799031736, "epoch": 10.89098532494759, "percentage": 54.45, "elapsed_time": "0:53:05", "remaining_time": "0:44:24", "throughput": 4262.1, "total_tokens": 13578128} {"current_steps": 20785, "total_steps": 38160, "loss": 0.4183, "lr": 0.0005093298350040912, "epoch": 10.893605870020965, "percentage": 54.47, "elapsed_time": "0:53:06", "remaining_time": "0:44:23", "throughput": 4262.28, "total_tokens": 13582192} {"current_steps": 20790, "total_steps": 38160, "loss": 0.4762, "lr": 0.0005091011881533139, "epoch": 10.89622641509434, "percentage": 54.48, "elapsed_time": "0:53:07", "remaining_time": "0:44:22", "throughput": 4262.28, "total_tokens": 13585040} {"current_steps": 20795, "total_steps": 38160, "loss": 0.4029, "lr": 0.0005088725393986716, "epoch": 10.898846960167715, "percentage": 54.49, "elapsed_time": "0:53:07", "remaining_time": "0:44:22", "throughput": 4262.26, "total_tokens": 13587792} {"current_steps": 20800, "total_steps": 38160, "loss": 0.342, "lr": 0.0005086438887879955, "epoch": 10.90146750524109, "percentage": 54.51, "elapsed_time": "0:53:08", "remaining_time": "0:44:21", "throughput": 4262.42, "total_tokens": 13591760} {"current_steps": 20805, "total_steps": 38160, "loss": 0.4672, "lr": 0.0005084152363691164, "epoch": 10.904088050314465, "percentage": 54.52, "elapsed_time": "0:53:09", "remaining_time": "0:44:20", "throughput": 4262.33, "total_tokens": 13594096} {"current_steps": 20810, "total_steps": 38160, "loss": 0.4353, "lr": 0.0005081865821898658, "epoch": 10.90670859538784, "percentage": 54.53, "elapsed_time": "0:53:10", "remaining_time": "0:44:19", "throughput": 4262.32, "total_tokens": 13596944} {"current_steps": 20815, "total_steps": 38160, "loss": 0.4551, "lr": 0.0005079579262980756, "epoch": 10.909329140461216, "percentage": 54.55, "elapsed_time": "0:53:10", "remaining_time": "0:44:18", "throughput": 4262.27, "total_tokens": 13599504} {"current_steps": 20820, "total_steps": 38160, "loss": 0.5768, "lr": 0.0005077292687415781, "epoch": 10.91194968553459, "percentage": 54.56, "elapsed_time": "0:53:11", "remaining_time": "0:44:18", "throughput": 4262.44, "total_tokens": 13603632} {"current_steps": 20825, "total_steps": 38160, "loss": 0.3211, "lr": 0.0005075006095682056, "epoch": 10.914570230607966, "percentage": 54.57, "elapsed_time": "0:53:12", "remaining_time": "0:44:17", "throughput": 4262.43, "total_tokens": 13606480} {"current_steps": 20830, "total_steps": 38160, "loss": 0.4339, "lr": 0.0005072719488257914, "epoch": 10.917190775681341, "percentage": 54.59, "elapsed_time": "0:53:12", "remaining_time": "0:44:16", "throughput": 4262.41, "total_tokens": 13609168} {"current_steps": 20835, "total_steps": 38160, "loss": 0.4505, "lr": 0.0005070432865621683, "epoch": 10.919811320754716, "percentage": 54.6, "elapsed_time": "0:53:13", "remaining_time": "0:44:15", "throughput": 4262.4, "total_tokens": 13612080} {"current_steps": 20840, "total_steps": 38160, "loss": 0.5031, "lr": 0.00050681462282517, "epoch": 10.922431865828091, "percentage": 54.61, "elapsed_time": "0:53:14", "remaining_time": "0:44:14", "throughput": 4262.49, "total_tokens": 13615536} {"current_steps": 20845, "total_steps": 38160, "loss": 0.377, "lr": 0.0005065859576626304, "epoch": 10.925052410901468, "percentage": 54.63, "elapsed_time": "0:53:14", "remaining_time": "0:44:13", "throughput": 4262.52, "total_tokens": 13618672} {"current_steps": 20850, "total_steps": 38160, "loss": 0.5228, "lr": 0.0005063572911223836, "epoch": 10.927672955974844, "percentage": 54.64, "elapsed_time": "0:53:15", "remaining_time": "0:44:13", "throughput": 4262.46, "total_tokens": 13621072} {"current_steps": 20855, "total_steps": 38160, "loss": 0.4719, "lr": 0.0005061286232522639, "epoch": 10.930293501048219, "percentage": 54.65, "elapsed_time": "0:53:16", "remaining_time": "0:44:12", "throughput": 4262.52, "total_tokens": 13624400} {"current_steps": 20860, "total_steps": 38160, "loss": 0.5205, "lr": 0.0005058999541001064, "epoch": 10.932914046121594, "percentage": 54.66, "elapsed_time": "0:53:16", "remaining_time": "0:44:11", "throughput": 4262.4, "total_tokens": 13626544} {"current_steps": 20865, "total_steps": 38160, "loss": 0.3858, "lr": 0.0005056712837137456, "epoch": 10.935534591194969, "percentage": 54.68, "elapsed_time": "0:53:17", "remaining_time": "0:44:10", "throughput": 4262.45, "total_tokens": 13629840} {"current_steps": 20870, "total_steps": 38160, "loss": 0.3769, "lr": 0.000505442612141017, "epoch": 10.938155136268344, "percentage": 54.69, "elapsed_time": "0:53:18", "remaining_time": "0:44:09", "throughput": 4262.45, "total_tokens": 13632784} {"current_steps": 20875, "total_steps": 38160, "loss": 0.4221, "lr": 0.000505213939429756, "epoch": 10.94077568134172, "percentage": 54.7, "elapsed_time": "0:53:19", "remaining_time": "0:44:08", "throughput": 4262.44, "total_tokens": 13635600} {"current_steps": 20880, "total_steps": 38160, "loss": 0.4533, "lr": 0.0005049852656277984, "epoch": 10.943396226415095, "percentage": 54.72, "elapsed_time": "0:53:19", "remaining_time": "0:44:08", "throughput": 4262.51, "total_tokens": 13638992} {"current_steps": 20885, "total_steps": 38160, "loss": 0.4026, "lr": 0.0005047565907829801, "epoch": 10.94601677148847, "percentage": 54.73, "elapsed_time": "0:53:20", "remaining_time": "0:44:07", "throughput": 4262.48, "total_tokens": 13641616} {"current_steps": 20890, "total_steps": 38160, "loss": 0.4339, "lr": 0.0005045279149431374, "epoch": 10.948637316561845, "percentage": 54.74, "elapsed_time": "0:53:21", "remaining_time": "0:44:06", "throughput": 4262.45, "total_tokens": 13644240} {"current_steps": 20895, "total_steps": 38160, "loss": 0.5143, "lr": 0.0005042992381561063, "epoch": 10.95125786163522, "percentage": 54.76, "elapsed_time": "0:53:21", "remaining_time": "0:44:05", "throughput": 4262.49, "total_tokens": 13647408} {"current_steps": 20900, "total_steps": 38160, "loss": 0.4705, "lr": 0.0005040705604697238, "epoch": 10.953878406708595, "percentage": 54.77, "elapsed_time": "0:53:22", "remaining_time": "0:44:04", "throughput": 4262.45, "total_tokens": 13650064} {"current_steps": 20905, "total_steps": 38160, "loss": 0.4631, "lr": 0.0005038418819318265, "epoch": 10.95649895178197, "percentage": 54.78, "elapsed_time": "0:53:23", "remaining_time": "0:44:03", "throughput": 4262.66, "total_tokens": 13654416} {"current_steps": 20910, "total_steps": 38160, "loss": 0.398, "lr": 0.0005036132025902511, "epoch": 10.959119496855346, "percentage": 54.8, "elapsed_time": "0:53:23", "remaining_time": "0:44:03", "throughput": 4262.7, "total_tokens": 13657616} {"current_steps": 20915, "total_steps": 38160, "loss": 0.3827, "lr": 0.0005033845224928352, "epoch": 10.96174004192872, "percentage": 54.81, "elapsed_time": "0:53:24", "remaining_time": "0:44:02", "throughput": 4262.83, "total_tokens": 13661424} {"current_steps": 20920, "total_steps": 38160, "loss": 0.5081, "lr": 0.0005031558416874156, "epoch": 10.964360587002096, "percentage": 54.82, "elapsed_time": "0:53:25", "remaining_time": "0:44:01", "throughput": 4262.8, "total_tokens": 13664112} {"current_steps": 20925, "total_steps": 38160, "loss": 0.5222, "lr": 0.0005029271602218301, "epoch": 10.966981132075471, "percentage": 54.83, "elapsed_time": "0:53:26", "remaining_time": "0:44:00", "throughput": 4262.8, "total_tokens": 13667024} {"current_steps": 20930, "total_steps": 38160, "loss": 0.4127, "lr": 0.0005026984781439162, "epoch": 10.969601677148846, "percentage": 54.85, "elapsed_time": "0:53:26", "remaining_time": "0:43:59", "throughput": 4262.81, "total_tokens": 13670032} {"current_steps": 20935, "total_steps": 38160, "loss": 0.5023, "lr": 0.0005024697955015112, "epoch": 10.972222222222221, "percentage": 54.86, "elapsed_time": "0:53:27", "remaining_time": "0:43:59", "throughput": 4262.92, "total_tokens": 13673584} {"current_steps": 20940, "total_steps": 38160, "loss": 0.3711, "lr": 0.0005022411123424532, "epoch": 10.974842767295598, "percentage": 54.87, "elapsed_time": "0:53:28", "remaining_time": "0:43:58", "throughput": 4262.98, "total_tokens": 13676880} {"current_steps": 20945, "total_steps": 38160, "loss": 0.5742, "lr": 0.00050201242871458, "epoch": 10.977463312368974, "percentage": 54.89, "elapsed_time": "0:53:29", "remaining_time": "0:43:57", "throughput": 4263.08, "total_tokens": 13680400} {"current_steps": 20950, "total_steps": 38160, "loss": 0.5404, "lr": 0.0005017837446657298, "epoch": 10.980083857442349, "percentage": 54.9, "elapsed_time": "0:53:29", "remaining_time": "0:43:56", "throughput": 4263.06, "total_tokens": 13683248} {"current_steps": 20955, "total_steps": 38160, "loss": 0.4543, "lr": 0.0005015550602437405, "epoch": 10.982704402515724, "percentage": 54.91, "elapsed_time": "0:53:30", "remaining_time": "0:43:55", "throughput": 4263.05, "total_tokens": 13686128} {"current_steps": 20960, "total_steps": 38160, "loss": 0.3641, "lr": 0.0005013263754964504, "epoch": 10.985324947589099, "percentage": 54.93, "elapsed_time": "0:53:31", "remaining_time": "0:43:55", "throughput": 4263.12, "total_tokens": 13689360} {"current_steps": 20965, "total_steps": 38160, "loss": 0.3287, "lr": 0.0005010976904716977, "epoch": 10.987945492662474, "percentage": 54.94, "elapsed_time": "0:53:31", "remaining_time": "0:43:54", "throughput": 4263.07, "total_tokens": 13691952} {"current_steps": 20970, "total_steps": 38160, "loss": 0.4792, "lr": 0.0005008690052173206, "epoch": 10.99056603773585, "percentage": 54.95, "elapsed_time": "0:53:32", "remaining_time": "0:43:53", "throughput": 4263.04, "total_tokens": 13694544} {"current_steps": 20975, "total_steps": 38160, "loss": 0.4382, "lr": 0.0005006403197811575, "epoch": 10.993186582809225, "percentage": 54.97, "elapsed_time": "0:53:33", "remaining_time": "0:43:52", "throughput": 4263.47, "total_tokens": 13700912} {"current_steps": 20980, "total_steps": 38160, "loss": 0.4924, "lr": 0.0005004116342110469, "epoch": 10.9958071278826, "percentage": 54.98, "elapsed_time": "0:53:34", "remaining_time": "0:43:52", "throughput": 4263.53, "total_tokens": 13704272} {"current_steps": 20985, "total_steps": 38160, "loss": 0.5228, "lr": 0.0005001829485548272, "epoch": 10.998427672955975, "percentage": 54.99, "elapsed_time": "0:53:35", "remaining_time": "0:43:51", "throughput": 4263.55, "total_tokens": 13707344} {"current_steps": 20988, "total_steps": 38160, "eval_loss": 0.4845702648162842, "epoch": 11.0, "percentage": 55.0, "elapsed_time": "0:53:49", "remaining_time": "0:44:02", "throughput": 4245.22, "total_tokens": 13708664} {"current_steps": 20990, "total_steps": 38160, "loss": 0.3973, "lr": 0.0004999542628603364, "epoch": 11.00104821802935, "percentage": 55.01, "elapsed_time": "0:53:51", "remaining_time": "0:44:03", "throughput": 4243.0, "total_tokens": 13709848} {"current_steps": 20995, "total_steps": 38160, "loss": 0.476, "lr": 0.0004997255771754136, "epoch": 11.003668763102725, "percentage": 55.02, "elapsed_time": "0:53:51", "remaining_time": "0:44:02", "throughput": 4242.98, "total_tokens": 13712536} {"current_steps": 21000, "total_steps": 38160, "loss": 0.4542, "lr": 0.0004994968915478969, "epoch": 11.0062893081761, "percentage": 55.03, "elapsed_time": "0:53:52", "remaining_time": "0:44:01", "throughput": 4243.04, "total_tokens": 13715960} {"current_steps": 21005, "total_steps": 38160, "loss": 0.4002, "lr": 0.0004992682060256246, "epoch": 11.008909853249476, "percentage": 55.04, "elapsed_time": "0:53:53", "remaining_time": "0:44:00", "throughput": 4243.14, "total_tokens": 13719704} {"current_steps": 21010, "total_steps": 38160, "loss": 0.453, "lr": 0.0004990395206564353, "epoch": 11.01153039832285, "percentage": 55.06, "elapsed_time": "0:53:54", "remaining_time": "0:43:59", "throughput": 4243.19, "total_tokens": 13723096} {"current_steps": 21015, "total_steps": 38160, "loss": 0.3573, "lr": 0.0004988108354881674, "epoch": 11.014150943396226, "percentage": 55.07, "elapsed_time": "0:53:54", "remaining_time": "0:43:59", "throughput": 4243.24, "total_tokens": 13726360} {"current_steps": 21020, "total_steps": 38160, "loss": 0.3389, "lr": 0.0004985821505686591, "epoch": 11.016771488469601, "percentage": 55.08, "elapsed_time": "0:53:55", "remaining_time": "0:43:58", "throughput": 4243.51, "total_tokens": 13731128} {"current_steps": 21025, "total_steps": 38160, "loss": 0.339, "lr": 0.0004983534659457489, "epoch": 11.019392033542976, "percentage": 55.1, "elapsed_time": "0:53:56", "remaining_time": "0:43:57", "throughput": 4243.46, "total_tokens": 13733688} {"current_steps": 21030, "total_steps": 38160, "loss": 0.4468, "lr": 0.0004981247816672745, "epoch": 11.022012578616351, "percentage": 55.11, "elapsed_time": "0:53:57", "remaining_time": "0:43:56", "throughput": 4243.52, "total_tokens": 13736920} {"current_steps": 21035, "total_steps": 38160, "loss": 0.5387, "lr": 0.0004978960977810746, "epoch": 11.024633123689727, "percentage": 55.12, "elapsed_time": "0:53:57", "remaining_time": "0:43:55", "throughput": 4243.51, "total_tokens": 13739800} {"current_steps": 21040, "total_steps": 38160, "loss": 0.4458, "lr": 0.0004976674143349869, "epoch": 11.027253668763104, "percentage": 55.14, "elapsed_time": "0:53:58", "remaining_time": "0:43:55", "throughput": 4243.59, "total_tokens": 13743192} {"current_steps": 21045, "total_steps": 38160, "loss": 0.4832, "lr": 0.0004974387313768497, "epoch": 11.029874213836479, "percentage": 55.15, "elapsed_time": "0:53:59", "remaining_time": "0:43:54", "throughput": 4243.6, "total_tokens": 13746136} {"current_steps": 21050, "total_steps": 38160, "loss": 0.4386, "lr": 0.0004972100489545007, "epoch": 11.032494758909854, "percentage": 55.16, "elapsed_time": "0:53:59", "remaining_time": "0:43:53", "throughput": 4243.61, "total_tokens": 13749048} {"current_steps": 21055, "total_steps": 38160, "loss": 0.4222, "lr": 0.0004969813671157774, "epoch": 11.035115303983229, "percentage": 55.18, "elapsed_time": "0:54:00", "remaining_time": "0:43:52", "throughput": 4243.69, "total_tokens": 13752536} {"current_steps": 21060, "total_steps": 38160, "loss": 0.5974, "lr": 0.0004967526859085177, "epoch": 11.037735849056604, "percentage": 55.19, "elapsed_time": "0:54:01", "remaining_time": "0:43:51", "throughput": 4243.73, "total_tokens": 13755768} {"current_steps": 21065, "total_steps": 38160, "loss": 0.5323, "lr": 0.0004965240053805591, "epoch": 11.04035639412998, "percentage": 55.2, "elapsed_time": "0:54:02", "remaining_time": "0:43:51", "throughput": 4243.81, "total_tokens": 13759256} {"current_steps": 21070, "total_steps": 38160, "loss": 0.3017, "lr": 0.000496295325579739, "epoch": 11.042976939203355, "percentage": 55.21, "elapsed_time": "0:54:02", "remaining_time": "0:43:50", "throughput": 4243.83, "total_tokens": 13762296} {"current_steps": 21075, "total_steps": 38160, "loss": 0.4728, "lr": 0.0004960666465538945, "epoch": 11.04559748427673, "percentage": 55.23, "elapsed_time": "0:54:03", "remaining_time": "0:43:49", "throughput": 4243.87, "total_tokens": 13765432} {"current_steps": 21080, "total_steps": 38160, "loss": 0.4382, "lr": 0.0004958379683508627, "epoch": 11.048218029350105, "percentage": 55.24, "elapsed_time": "0:54:04", "remaining_time": "0:43:48", "throughput": 4243.83, "total_tokens": 13768088} {"current_steps": 21085, "total_steps": 38160, "loss": 0.4164, "lr": 0.0004956092910184803, "epoch": 11.05083857442348, "percentage": 55.25, "elapsed_time": "0:54:04", "remaining_time": "0:43:47", "throughput": 4243.86, "total_tokens": 13771160} {"current_steps": 21090, "total_steps": 38160, "loss": 0.3684, "lr": 0.0004953806146045843, "epoch": 11.053459119496855, "percentage": 55.27, "elapsed_time": "0:54:05", "remaining_time": "0:43:47", "throughput": 4244.05, "total_tokens": 13775256} {"current_steps": 21095, "total_steps": 38160, "loss": 0.4292, "lr": 0.0004951519391570108, "epoch": 11.05607966457023, "percentage": 55.28, "elapsed_time": "0:54:06", "remaining_time": "0:43:46", "throughput": 4244.1, "total_tokens": 13778488} {"current_steps": 21100, "total_steps": 38160, "loss": 0.4141, "lr": 0.0004949232647235964, "epoch": 11.058700209643606, "percentage": 55.29, "elapsed_time": "0:54:07", "remaining_time": "0:43:45", "throughput": 4244.24, "total_tokens": 13782328} {"current_steps": 21105, "total_steps": 38160, "loss": 0.3561, "lr": 0.0004946945913521771, "epoch": 11.06132075471698, "percentage": 55.31, "elapsed_time": "0:54:07", "remaining_time": "0:43:44", "throughput": 4244.23, "total_tokens": 13785144} {"current_steps": 21110, "total_steps": 38160, "loss": 0.3966, "lr": 0.0004944659190905889, "epoch": 11.063941299790356, "percentage": 55.32, "elapsed_time": "0:54:08", "remaining_time": "0:43:43", "throughput": 4244.25, "total_tokens": 13788184} {"current_steps": 21115, "total_steps": 38160, "loss": 0.4344, "lr": 0.0004942372479866674, "epoch": 11.066561844863731, "percentage": 55.33, "elapsed_time": "0:54:09", "remaining_time": "0:43:43", "throughput": 4244.47, "total_tokens": 13792600} {"current_steps": 21120, "total_steps": 38160, "loss": 0.5491, "lr": 0.0004940085780882475, "epoch": 11.069182389937106, "percentage": 55.35, "elapsed_time": "0:54:10", "remaining_time": "0:43:42", "throughput": 4244.55, "total_tokens": 13796024} {"current_steps": 21125, "total_steps": 38160, "loss": 0.4484, "lr": 0.0004937799094431649, "epoch": 11.071802935010481, "percentage": 55.36, "elapsed_time": "0:54:10", "remaining_time": "0:43:41", "throughput": 4244.56, "total_tokens": 13799000} {"current_steps": 21130, "total_steps": 38160, "loss": 0.5241, "lr": 0.0004935512420992542, "epoch": 11.074423480083857, "percentage": 55.37, "elapsed_time": "0:54:11", "remaining_time": "0:43:40", "throughput": 4244.52, "total_tokens": 13801688} {"current_steps": 21135, "total_steps": 38160, "loss": 0.3979, "lr": 0.0004933225761043502, "epoch": 11.077044025157234, "percentage": 55.39, "elapsed_time": "0:54:12", "remaining_time": "0:43:39", "throughput": 4244.56, "total_tokens": 13804920} {"current_steps": 21140, "total_steps": 38160, "loss": 0.3786, "lr": 0.0004930939115062872, "epoch": 11.079664570230609, "percentage": 55.4, "elapsed_time": "0:54:13", "remaining_time": "0:43:39", "throughput": 4244.65, "total_tokens": 13808472} {"current_steps": 21145, "total_steps": 38160, "loss": 0.2823, "lr": 0.0004928652483528989, "epoch": 11.082285115303984, "percentage": 55.41, "elapsed_time": "0:54:13", "remaining_time": "0:43:38", "throughput": 4244.62, "total_tokens": 13811192} {"current_steps": 21150, "total_steps": 38160, "loss": 0.4602, "lr": 0.0004926365866920193, "epoch": 11.084905660377359, "percentage": 55.42, "elapsed_time": "0:54:14", "remaining_time": "0:43:37", "throughput": 4244.63, "total_tokens": 13814104} {"current_steps": 21155, "total_steps": 38160, "loss": 0.4445, "lr": 0.0004924079265714817, "epoch": 11.087526205450734, "percentage": 55.44, "elapsed_time": "0:54:15", "remaining_time": "0:43:36", "throughput": 4244.64, "total_tokens": 13817144} {"current_steps": 21160, "total_steps": 38160, "loss": 0.3798, "lr": 0.0004921792680391193, "epoch": 11.09014675052411, "percentage": 55.45, "elapsed_time": "0:54:16", "remaining_time": "0:43:35", "throughput": 4244.83, "total_tokens": 13821464} {"current_steps": 21165, "total_steps": 38160, "loss": 0.4024, "lr": 0.0004919506111427649, "epoch": 11.092767295597485, "percentage": 55.46, "elapsed_time": "0:54:16", "remaining_time": "0:43:35", "throughput": 4244.88, "total_tokens": 13824696} {"current_steps": 21170, "total_steps": 38160, "loss": 0.3864, "lr": 0.0004917219559302507, "epoch": 11.09538784067086, "percentage": 55.48, "elapsed_time": "0:54:17", "remaining_time": "0:43:34", "throughput": 4244.98, "total_tokens": 13828248} {"current_steps": 21175, "total_steps": 38160, "loss": 0.4285, "lr": 0.0004914933024494089, "epoch": 11.098008385744235, "percentage": 55.49, "elapsed_time": "0:54:18", "remaining_time": "0:43:33", "throughput": 4245.03, "total_tokens": 13831448} {"current_steps": 21180, "total_steps": 38160, "loss": 0.4452, "lr": 0.0004912646507480713, "epoch": 11.10062893081761, "percentage": 55.5, "elapsed_time": "0:54:18", "remaining_time": "0:43:32", "throughput": 4244.99, "total_tokens": 13834072} {"current_steps": 21185, "total_steps": 38160, "loss": 0.5282, "lr": 0.0004910360008740689, "epoch": 11.103249475890985, "percentage": 55.52, "elapsed_time": "0:54:19", "remaining_time": "0:43:31", "throughput": 4245.03, "total_tokens": 13837208} {"current_steps": 21190, "total_steps": 38160, "loss": 0.386, "lr": 0.0004908073528752329, "epoch": 11.10587002096436, "percentage": 55.53, "elapsed_time": "0:54:20", "remaining_time": "0:43:31", "throughput": 4245.05, "total_tokens": 13840248} {"current_steps": 21195, "total_steps": 38160, "loss": 0.4836, "lr": 0.0004905787067993941, "epoch": 11.108490566037736, "percentage": 55.54, "elapsed_time": "0:54:21", "remaining_time": "0:43:30", "throughput": 4245.21, "total_tokens": 13844440} {"current_steps": 21200, "total_steps": 38160, "loss": 0.468, "lr": 0.000490350062694382, "epoch": 11.11111111111111, "percentage": 55.56, "elapsed_time": "0:54:21", "remaining_time": "0:43:29", "throughput": 4245.24, "total_tokens": 13847608} {"current_steps": 21205, "total_steps": 38160, "loss": 0.4978, "lr": 0.0004901214206080269, "epoch": 11.113731656184486, "percentage": 55.57, "elapsed_time": "0:54:22", "remaining_time": "0:43:28", "throughput": 4245.33, "total_tokens": 13851096} {"current_steps": 21210, "total_steps": 38160, "loss": 0.2982, "lr": 0.0004898927805881577, "epoch": 11.116352201257861, "percentage": 55.58, "elapsed_time": "0:54:23", "remaining_time": "0:43:27", "throughput": 4245.37, "total_tokens": 13854392} {"current_steps": 21215, "total_steps": 38160, "loss": 0.4575, "lr": 0.0004896641426826036, "epoch": 11.118972746331236, "percentage": 55.59, "elapsed_time": "0:54:24", "remaining_time": "0:43:27", "throughput": 4245.4, "total_tokens": 13857400} {"current_steps": 21220, "total_steps": 38160, "loss": 0.4752, "lr": 0.0004894355069391931, "epoch": 11.121593291404611, "percentage": 55.61, "elapsed_time": "0:54:24", "remaining_time": "0:43:26", "throughput": 4245.35, "total_tokens": 13860056} {"current_steps": 21225, "total_steps": 38160, "loss": 0.4509, "lr": 0.0004892068734057538, "epoch": 11.124213836477987, "percentage": 55.62, "elapsed_time": "0:54:25", "remaining_time": "0:43:25", "throughput": 4245.43, "total_tokens": 13863448} {"current_steps": 21230, "total_steps": 38160, "loss": 0.3799, "lr": 0.0004889782421301134, "epoch": 11.126834381551364, "percentage": 55.63, "elapsed_time": "0:54:26", "remaining_time": "0:43:24", "throughput": 4245.39, "total_tokens": 13866040} {"current_steps": 21235, "total_steps": 38160, "loss": 0.4804, "lr": 0.0004887496131600991, "epoch": 11.129454926624739, "percentage": 55.65, "elapsed_time": "0:54:26", "remaining_time": "0:43:23", "throughput": 4245.42, "total_tokens": 13869176} {"current_steps": 21240, "total_steps": 38160, "loss": 0.4647, "lr": 0.0004885209865435373, "epoch": 11.132075471698114, "percentage": 55.66, "elapsed_time": "0:54:27", "remaining_time": "0:43:23", "throughput": 4245.64, "total_tokens": 13873688} {"current_steps": 21245, "total_steps": 38160, "loss": 0.3997, "lr": 0.0004882923623282543, "epoch": 11.134696016771489, "percentage": 55.67, "elapsed_time": "0:54:28", "remaining_time": "0:43:22", "throughput": 4245.66, "total_tokens": 13876760} {"current_steps": 21250, "total_steps": 38160, "loss": 0.4816, "lr": 0.0004880637405620756, "epoch": 11.137316561844864, "percentage": 55.69, "elapsed_time": "0:54:29", "remaining_time": "0:43:21", "throughput": 4245.61, "total_tokens": 13879224} {"current_steps": 21255, "total_steps": 38160, "loss": 0.4838, "lr": 0.00048783512129282604, "epoch": 11.13993710691824, "percentage": 55.7, "elapsed_time": "0:54:29", "remaining_time": "0:43:20", "throughput": 4245.51, "total_tokens": 13881432} {"current_steps": 21260, "total_steps": 38160, "loss": 0.3425, "lr": 0.00048760650456833033, "epoch": 11.142557651991615, "percentage": 55.71, "elapsed_time": "0:54:30", "remaining_time": "0:43:19", "throughput": 4245.66, "total_tokens": 13885432} {"current_steps": 21265, "total_steps": 38160, "loss": 0.4788, "lr": 0.0004873778904364125, "epoch": 11.14517819706499, "percentage": 55.73, "elapsed_time": "0:54:31", "remaining_time": "0:43:18", "throughput": 4245.62, "total_tokens": 13888056} {"current_steps": 21270, "total_steps": 38160, "loss": 0.5274, "lr": 0.00048714927894489597, "epoch": 11.147798742138365, "percentage": 55.74, "elapsed_time": "0:54:31", "remaining_time": "0:43:18", "throughput": 4245.59, "total_tokens": 13890776} {"current_steps": 21275, "total_steps": 38160, "loss": 0.5243, "lr": 0.00048692067014160357, "epoch": 11.15041928721174, "percentage": 55.75, "elapsed_time": "0:54:32", "remaining_time": "0:43:17", "throughput": 4245.64, "total_tokens": 13894008} {"current_steps": 21280, "total_steps": 38160, "loss": 0.4205, "lr": 0.00048669206407435806, "epoch": 11.153039832285115, "percentage": 55.77, "elapsed_time": "0:54:33", "remaining_time": "0:43:16", "throughput": 4245.67, "total_tokens": 13897144} {"current_steps": 21285, "total_steps": 38160, "loss": 0.448, "lr": 0.00048646346079098075, "epoch": 11.15566037735849, "percentage": 55.78, "elapsed_time": "0:54:33", "remaining_time": "0:43:15", "throughput": 4245.71, "total_tokens": 13900312} {"current_steps": 21290, "total_steps": 38160, "loss": 0.4826, "lr": 0.0004862348603392929, "epoch": 11.158280922431866, "percentage": 55.79, "elapsed_time": "0:54:34", "remaining_time": "0:43:14", "throughput": 4245.74, "total_tokens": 13903448} {"current_steps": 21295, "total_steps": 38160, "loss": 0.3941, "lr": 0.0004860062627671154, "epoch": 11.16090146750524, "percentage": 55.8, "elapsed_time": "0:54:35", "remaining_time": "0:43:14", "throughput": 4245.8, "total_tokens": 13906808} {"current_steps": 21300, "total_steps": 38160, "loss": 0.4684, "lr": 0.0004857776681222679, "epoch": 11.163522012578616, "percentage": 55.82, "elapsed_time": "0:54:36", "remaining_time": "0:43:13", "throughput": 4245.81, "total_tokens": 13909720} {"current_steps": 21305, "total_steps": 38160, "loss": 0.4273, "lr": 0.00048554907645257024, "epoch": 11.166142557651991, "percentage": 55.83, "elapsed_time": "0:54:36", "remaining_time": "0:43:12", "throughput": 4245.96, "total_tokens": 13913688} {"current_steps": 21310, "total_steps": 38160, "loss": 0.5117, "lr": 0.0004853204878058407, "epoch": 11.168763102725366, "percentage": 55.84, "elapsed_time": "0:54:37", "remaining_time": "0:43:11", "throughput": 4245.96, "total_tokens": 13916568} {"current_steps": 21315, "total_steps": 38160, "loss": 0.4505, "lr": 0.0004850919022298977, "epoch": 11.171383647798741, "percentage": 55.86, "elapsed_time": "0:54:38", "remaining_time": "0:43:10", "throughput": 4245.91, "total_tokens": 13919160} {"current_steps": 21320, "total_steps": 38160, "loss": 0.3797, "lr": 0.0004848633197725586, "epoch": 11.174004192872117, "percentage": 55.87, "elapsed_time": "0:54:38", "remaining_time": "0:43:09", "throughput": 4245.92, "total_tokens": 13922072} {"current_steps": 21325, "total_steps": 38160, "loss": 0.5046, "lr": 0.0004846347404816404, "epoch": 11.176624737945493, "percentage": 55.88, "elapsed_time": "0:54:39", "remaining_time": "0:43:09", "throughput": 4246.01, "total_tokens": 13925688} {"current_steps": 21330, "total_steps": 38160, "loss": 0.5043, "lr": 0.0004844061644049591, "epoch": 11.179245283018869, "percentage": 55.9, "elapsed_time": "0:54:40", "remaining_time": "0:43:08", "throughput": 4245.98, "total_tokens": 13928408} {"current_steps": 21335, "total_steps": 38160, "loss": 0.5092, "lr": 0.0004841775915903305, "epoch": 11.181865828092244, "percentage": 55.91, "elapsed_time": "0:54:41", "remaining_time": "0:43:07", "throughput": 4246.1, "total_tokens": 13932152} {"current_steps": 21340, "total_steps": 38160, "loss": 0.3755, "lr": 0.00048394902208556917, "epoch": 11.184486373165619, "percentage": 55.92, "elapsed_time": "0:54:41", "remaining_time": "0:43:06", "throughput": 4246.23, "total_tokens": 13935864} {"current_steps": 21345, "total_steps": 38160, "loss": 0.438, "lr": 0.0004837204559384892, "epoch": 11.187106918238994, "percentage": 55.94, "elapsed_time": "0:54:42", "remaining_time": "0:43:05", "throughput": 4246.13, "total_tokens": 13938200} {"current_steps": 21350, "total_steps": 38160, "loss": 0.4792, "lr": 0.0004834918931969042, "epoch": 11.18972746331237, "percentage": 55.95, "elapsed_time": "0:54:43", "remaining_time": "0:43:05", "throughput": 4246.1, "total_tokens": 13940824} {"current_steps": 21355, "total_steps": 38160, "loss": 0.411, "lr": 0.0004832633339086267, "epoch": 11.192348008385745, "percentage": 55.96, "elapsed_time": "0:54:43", "remaining_time": "0:43:04", "throughput": 4246.09, "total_tokens": 13943704} {"current_steps": 21360, "total_steps": 38160, "loss": 0.3874, "lr": 0.0004830347781214689, "epoch": 11.19496855345912, "percentage": 55.97, "elapsed_time": "0:54:44", "remaining_time": "0:43:03", "throughput": 4246.12, "total_tokens": 13946808} {"current_steps": 21365, "total_steps": 38160, "loss": 0.4592, "lr": 0.0004828062258832421, "epoch": 11.197589098532495, "percentage": 55.99, "elapsed_time": "0:54:45", "remaining_time": "0:43:02", "throughput": 4246.15, "total_tokens": 13949880} {"current_steps": 21370, "total_steps": 38160, "loss": 0.3949, "lr": 0.0004825776772417564, "epoch": 11.20020964360587, "percentage": 56.0, "elapsed_time": "0:54:45", "remaining_time": "0:43:01", "throughput": 4246.14, "total_tokens": 13952728} {"current_steps": 21375, "total_steps": 38160, "loss": 0.5028, "lr": 0.00048234913224482205, "epoch": 11.202830188679245, "percentage": 56.01, "elapsed_time": "0:54:46", "remaining_time": "0:43:00", "throughput": 4246.1, "total_tokens": 13955320} {"current_steps": 21380, "total_steps": 38160, "loss": 0.3765, "lr": 0.00048212059094024774, "epoch": 11.20545073375262, "percentage": 56.03, "elapsed_time": "0:54:47", "remaining_time": "0:43:00", "throughput": 4246.18, "total_tokens": 13958712} {"current_steps": 21385, "total_steps": 38160, "loss": 0.5194, "lr": 0.0004818920533758418, "epoch": 11.208071278825996, "percentage": 56.04, "elapsed_time": "0:54:48", "remaining_time": "0:42:59", "throughput": 4246.22, "total_tokens": 13961912} {"current_steps": 21390, "total_steps": 38160, "loss": 0.4073, "lr": 0.00048166351959941185, "epoch": 11.21069182389937, "percentage": 56.05, "elapsed_time": "0:54:48", "remaining_time": "0:42:58", "throughput": 4246.37, "total_tokens": 13965784} {"current_steps": 21395, "total_steps": 38160, "loss": 0.4477, "lr": 0.0004814349896587645, "epoch": 11.213312368972746, "percentage": 56.07, "elapsed_time": "0:54:49", "remaining_time": "0:42:57", "throughput": 4246.28, "total_tokens": 13968088} {"current_steps": 21400, "total_steps": 38160, "loss": 0.3502, "lr": 0.0004812064636017053, "epoch": 11.215932914046121, "percentage": 56.08, "elapsed_time": "0:54:50", "remaining_time": "0:42:56", "throughput": 4246.29, "total_tokens": 13971000} {"current_steps": 21405, "total_steps": 38160, "loss": 0.3831, "lr": 0.0004809779414760396, "epoch": 11.218553459119496, "percentage": 56.09, "elapsed_time": "0:54:50", "remaining_time": "0:42:55", "throughput": 4246.3, "total_tokens": 13973944} {"current_steps": 21410, "total_steps": 38160, "loss": 0.5359, "lr": 0.00048074942332957136, "epoch": 11.221174004192871, "percentage": 56.11, "elapsed_time": "0:54:51", "remaining_time": "0:42:55", "throughput": 4246.36, "total_tokens": 13977272} {"current_steps": 21415, "total_steps": 38160, "loss": 0.5765, "lr": 0.00048052090921010435, "epoch": 11.223794549266247, "percentage": 56.12, "elapsed_time": "0:54:52", "remaining_time": "0:42:54", "throughput": 4246.41, "total_tokens": 13980536} {"current_steps": 21420, "total_steps": 38160, "loss": 0.4659, "lr": 0.00048029239916544094, "epoch": 11.226415094339623, "percentage": 56.13, "elapsed_time": "0:54:52", "remaining_time": "0:42:53", "throughput": 4246.42, "total_tokens": 13983416} {"current_steps": 21425, "total_steps": 38160, "loss": 0.4141, "lr": 0.0004800638932433826, "epoch": 11.229035639412999, "percentage": 56.15, "elapsed_time": "0:54:53", "remaining_time": "0:42:52", "throughput": 4246.61, "total_tokens": 13987640} {"current_steps": 21430, "total_steps": 38160, "loss": 0.4276, "lr": 0.00047983539149173043, "epoch": 11.231656184486374, "percentage": 56.16, "elapsed_time": "0:54:54", "remaining_time": "0:42:51", "throughput": 4246.53, "total_tokens": 13989944} {"current_steps": 21435, "total_steps": 38160, "loss": 0.5276, "lr": 0.0004796068939582843, "epoch": 11.234276729559749, "percentage": 56.17, "elapsed_time": "0:54:55", "remaining_time": "0:42:51", "throughput": 4246.75, "total_tokens": 13994552} {"current_steps": 21440, "total_steps": 38160, "loss": 0.4743, "lr": 0.00047937840069084333, "epoch": 11.236897274633124, "percentage": 56.18, "elapsed_time": "0:54:56", "remaining_time": "0:42:50", "throughput": 4246.71, "total_tokens": 13997176} {"current_steps": 21445, "total_steps": 38160, "loss": 0.4341, "lr": 0.0004791499117372056, "epoch": 11.2395178197065, "percentage": 56.2, "elapsed_time": "0:54:56", "remaining_time": "0:42:49", "throughput": 4246.71, "total_tokens": 14000056} {"current_steps": 21450, "total_steps": 38160, "loss": 0.5407, "lr": 0.0004789214271451686, "epoch": 11.242138364779874, "percentage": 56.21, "elapsed_time": "0:54:57", "remaining_time": "0:42:48", "throughput": 4246.7, "total_tokens": 14002840} {"current_steps": 21455, "total_steps": 38160, "loss": 0.354, "lr": 0.00047869294696252854, "epoch": 11.24475890985325, "percentage": 56.22, "elapsed_time": "0:54:58", "remaining_time": "0:42:47", "throughput": 4246.72, "total_tokens": 14005880} {"current_steps": 21460, "total_steps": 38160, "loss": 0.523, "lr": 0.0004784644712370807, "epoch": 11.247379454926625, "percentage": 56.24, "elapsed_time": "0:54:58", "remaining_time": "0:42:47", "throughput": 4246.78, "total_tokens": 14009176} {"current_steps": 21465, "total_steps": 38160, "loss": 0.3119, "lr": 0.00047823600001661984, "epoch": 11.25, "percentage": 56.25, "elapsed_time": "0:54:59", "remaining_time": "0:42:46", "throughput": 4246.87, "total_tokens": 14012728} {"current_steps": 21470, "total_steps": 38160, "loss": 0.4855, "lr": 0.0004780075333489396, "epoch": 11.252620545073375, "percentage": 56.26, "elapsed_time": "0:55:00", "remaining_time": "0:42:45", "throughput": 4247.14, "total_tokens": 14017560} {"current_steps": 21475, "total_steps": 38160, "loss": 0.4907, "lr": 0.00047777907128183233, "epoch": 11.25524109014675, "percentage": 56.28, "elapsed_time": "0:55:01", "remaining_time": "0:42:44", "throughput": 4247.19, "total_tokens": 14020824} {"current_steps": 21480, "total_steps": 38160, "loss": 0.4871, "lr": 0.0004775506138630901, "epoch": 11.257861635220126, "percentage": 56.29, "elapsed_time": "0:55:02", "remaining_time": "0:42:44", "throughput": 4247.35, "total_tokens": 14024920} {"current_steps": 21485, "total_steps": 38160, "loss": 0.3786, "lr": 0.0004773221611405032, "epoch": 11.2604821802935, "percentage": 56.3, "elapsed_time": "0:55:02", "remaining_time": "0:42:43", "throughput": 4247.35, "total_tokens": 14027864} {"current_steps": 21490, "total_steps": 38160, "loss": 0.4066, "lr": 0.0004770937131618614, "epoch": 11.263102725366876, "percentage": 56.32, "elapsed_time": "0:55:03", "remaining_time": "0:42:42", "throughput": 4247.32, "total_tokens": 14030456} {"current_steps": 21495, "total_steps": 38160, "loss": 0.4644, "lr": 0.0004768652699749535, "epoch": 11.265723270440251, "percentage": 56.33, "elapsed_time": "0:55:04", "remaining_time": "0:42:41", "throughput": 4247.43, "total_tokens": 14034104} {"current_steps": 21500, "total_steps": 38160, "loss": 0.4191, "lr": 0.00047663683162756717, "epoch": 11.268343815513626, "percentage": 56.34, "elapsed_time": "0:55:05", "remaining_time": "0:42:41", "throughput": 4247.78, "total_tokens": 14039640} {"current_steps": 21505, "total_steps": 38160, "loss": 0.5782, "lr": 0.00047640839816748926, "epoch": 11.270964360587001, "percentage": 56.35, "elapsed_time": "0:55:05", "remaining_time": "0:42:40", "throughput": 4247.77, "total_tokens": 14042520} {"current_steps": 21510, "total_steps": 38160, "loss": 0.4601, "lr": 0.00047617996964250525, "epoch": 11.273584905660377, "percentage": 56.37, "elapsed_time": "0:55:06", "remaining_time": "0:42:39", "throughput": 4247.8, "total_tokens": 14045688} {"current_steps": 21515, "total_steps": 38160, "loss": 0.4375, "lr": 0.0004759515461003997, "epoch": 11.276205450733753, "percentage": 56.38, "elapsed_time": "0:55:07", "remaining_time": "0:42:38", "throughput": 4247.82, "total_tokens": 14048728} {"current_steps": 21520, "total_steps": 38160, "loss": 0.45, "lr": 0.00047572312758895654, "epoch": 11.278825995807129, "percentage": 56.39, "elapsed_time": "0:55:07", "remaining_time": "0:42:37", "throughput": 4247.78, "total_tokens": 14051288} {"current_steps": 21525, "total_steps": 38160, "loss": 0.5557, "lr": 0.0004754947141559579, "epoch": 11.281446540880504, "percentage": 56.41, "elapsed_time": "0:55:08", "remaining_time": "0:42:37", "throughput": 4247.82, "total_tokens": 14054616} {"current_steps": 21530, "total_steps": 38160, "loss": 0.4505, "lr": 0.0004752663058491856, "epoch": 11.284067085953879, "percentage": 56.42, "elapsed_time": "0:55:09", "remaining_time": "0:42:36", "throughput": 4247.82, "total_tokens": 14057496} {"current_steps": 21535, "total_steps": 38160, "loss": 0.3673, "lr": 0.0004750379027164201, "epoch": 11.286687631027254, "percentage": 56.43, "elapsed_time": "0:55:09", "remaining_time": "0:42:35", "throughput": 4247.77, "total_tokens": 14060024} {"current_steps": 21540, "total_steps": 38160, "loss": 0.3441, "lr": 0.00047480950480544037, "epoch": 11.28930817610063, "percentage": 56.45, "elapsed_time": "0:55:10", "remaining_time": "0:42:34", "throughput": 4247.82, "total_tokens": 14063288} {"current_steps": 21545, "total_steps": 38160, "loss": 0.6174, "lr": 0.00047458111216402483, "epoch": 11.291928721174004, "percentage": 56.46, "elapsed_time": "0:55:11", "remaining_time": "0:42:33", "throughput": 4247.91, "total_tokens": 14066840} {"current_steps": 21550, "total_steps": 38160, "loss": 0.3772, "lr": 0.00047435272483995074, "epoch": 11.29454926624738, "percentage": 56.47, "elapsed_time": "0:55:12", "remaining_time": "0:42:32", "throughput": 4247.94, "total_tokens": 14069912} {"current_steps": 21555, "total_steps": 38160, "loss": 0.4785, "lr": 0.00047412434288099386, "epoch": 11.297169811320755, "percentage": 56.49, "elapsed_time": "0:55:12", "remaining_time": "0:42:32", "throughput": 4247.98, "total_tokens": 14073112} {"current_steps": 21560, "total_steps": 38160, "loss": 0.4032, "lr": 0.0004738959663349294, "epoch": 11.29979035639413, "percentage": 56.5, "elapsed_time": "0:55:13", "remaining_time": "0:42:31", "throughput": 4248.04, "total_tokens": 14076504} {"current_steps": 21565, "total_steps": 38160, "loss": 0.4263, "lr": 0.0004736675952495311, "epoch": 11.302410901467505, "percentage": 56.51, "elapsed_time": "0:55:14", "remaining_time": "0:42:30", "throughput": 4248.17, "total_tokens": 14080344} {"current_steps": 21570, "total_steps": 38160, "loss": 0.4134, "lr": 0.0004734392296725712, "epoch": 11.30503144654088, "percentage": 56.53, "elapsed_time": "0:55:15", "remaining_time": "0:42:29", "throughput": 4248.19, "total_tokens": 14083416} {"current_steps": 21575, "total_steps": 38160, "loss": 0.4711, "lr": 0.00047321086965182153, "epoch": 11.307651991614255, "percentage": 56.54, "elapsed_time": "0:55:15", "remaining_time": "0:42:29", "throughput": 4248.29, "total_tokens": 14087032} {"current_steps": 21580, "total_steps": 38160, "loss": 0.4078, "lr": 0.0004729825152350522, "epoch": 11.31027253668763, "percentage": 56.55, "elapsed_time": "0:55:16", "remaining_time": "0:42:28", "throughput": 4248.43, "total_tokens": 14090936} {"current_steps": 21585, "total_steps": 38160, "loss": 0.3948, "lr": 0.00047275416647003256, "epoch": 11.312893081761006, "percentage": 56.56, "elapsed_time": "0:55:17", "remaining_time": "0:42:27", "throughput": 4248.42, "total_tokens": 14093688} {"current_steps": 21590, "total_steps": 38160, "loss": 0.4668, "lr": 0.0004725258234045306, "epoch": 11.315513626834381, "percentage": 56.58, "elapsed_time": "0:55:18", "remaining_time": "0:42:26", "throughput": 4248.51, "total_tokens": 14097336} {"current_steps": 21595, "total_steps": 38160, "loss": 0.4025, "lr": 0.0004722974860863127, "epoch": 11.318134171907756, "percentage": 56.59, "elapsed_time": "0:55:18", "remaining_time": "0:42:25", "throughput": 4248.61, "total_tokens": 14100984} {"current_steps": 21600, "total_steps": 38160, "loss": 0.4526, "lr": 0.00047206915456314476, "epoch": 11.320754716981131, "percentage": 56.6, "elapsed_time": "0:55:19", "remaining_time": "0:42:25", "throughput": 4248.58, "total_tokens": 14103672} {"current_steps": 21605, "total_steps": 38160, "loss": 0.4947, "lr": 0.00047184082888279097, "epoch": 11.323375262054507, "percentage": 56.62, "elapsed_time": "0:55:20", "remaining_time": "0:42:24", "throughput": 4248.63, "total_tokens": 14106872} {"current_steps": 21610, "total_steps": 38160, "loss": 0.4002, "lr": 0.00047161250909301454, "epoch": 11.325995807127883, "percentage": 56.63, "elapsed_time": "0:55:21", "remaining_time": "0:42:23", "throughput": 4248.62, "total_tokens": 14109720} {"current_steps": 21615, "total_steps": 38160, "loss": 0.4039, "lr": 0.00047138419524157734, "epoch": 11.328616352201259, "percentage": 56.64, "elapsed_time": "0:55:21", "remaining_time": "0:42:22", "throughput": 4248.7, "total_tokens": 14113112} {"current_steps": 21620, "total_steps": 38160, "loss": 0.4924, "lr": 0.0004711558873762402, "epoch": 11.331236897274634, "percentage": 56.66, "elapsed_time": "0:55:22", "remaining_time": "0:42:21", "throughput": 4248.74, "total_tokens": 14116440} {"current_steps": 21625, "total_steps": 38160, "loss": 0.6045, "lr": 0.0004709275855447621, "epoch": 11.333857442348009, "percentage": 56.67, "elapsed_time": "0:55:23", "remaining_time": "0:42:20", "throughput": 4248.75, "total_tokens": 14119384} {"current_steps": 21630, "total_steps": 38160, "loss": 0.5217, "lr": 0.0004706992897949016, "epoch": 11.336477987421384, "percentage": 56.68, "elapsed_time": "0:55:23", "remaining_time": "0:42:20", "throughput": 4248.71, "total_tokens": 14122008} {"current_steps": 21635, "total_steps": 38160, "loss": 0.4293, "lr": 0.00047047100017441525, "epoch": 11.33909853249476, "percentage": 56.7, "elapsed_time": "0:55:24", "remaining_time": "0:42:19", "throughput": 4248.82, "total_tokens": 14125688} {"current_steps": 21640, "total_steps": 38160, "loss": 0.3212, "lr": 0.0004702427167310589, "epoch": 11.341719077568134, "percentage": 56.71, "elapsed_time": "0:55:25", "remaining_time": "0:42:18", "throughput": 4248.9, "total_tokens": 14129144} {"current_steps": 21645, "total_steps": 38160, "loss": 0.3962, "lr": 0.0004700144395125866, "epoch": 11.34433962264151, "percentage": 56.72, "elapsed_time": "0:55:26", "remaining_time": "0:42:17", "throughput": 4248.9, "total_tokens": 14131960} {"current_steps": 21650, "total_steps": 38160, "loss": 0.5033, "lr": 0.00046978616856675173, "epoch": 11.346960167714885, "percentage": 56.73, "elapsed_time": "0:55:26", "remaining_time": "0:42:17", "throughput": 4249.11, "total_tokens": 14136312} {"current_steps": 21655, "total_steps": 38160, "loss": 0.4153, "lr": 0.0004695579039413055, "epoch": 11.34958071278826, "percentage": 56.75, "elapsed_time": "0:55:27", "remaining_time": "0:42:16", "throughput": 4249.12, "total_tokens": 14139416} {"current_steps": 21660, "total_steps": 38160, "loss": 0.405, "lr": 0.0004693296456839984, "epoch": 11.352201257861635, "percentage": 56.76, "elapsed_time": "0:55:28", "remaining_time": "0:42:15", "throughput": 4249.19, "total_tokens": 14142904} {"current_steps": 21665, "total_steps": 38160, "loss": 0.4336, "lr": 0.0004691013938425796, "epoch": 11.35482180293501, "percentage": 56.77, "elapsed_time": "0:55:29", "remaining_time": "0:42:14", "throughput": 4249.26, "total_tokens": 14146328} {"current_steps": 21670, "total_steps": 38160, "loss": 0.3592, "lr": 0.00046887314846479663, "epoch": 11.357442348008385, "percentage": 56.79, "elapsed_time": "0:55:29", "remaining_time": "0:42:13", "throughput": 4249.28, "total_tokens": 14149368} {"current_steps": 21675, "total_steps": 38160, "loss": 0.3373, "lr": 0.000468644909598396, "epoch": 11.36006289308176, "percentage": 56.8, "elapsed_time": "0:55:30", "remaining_time": "0:42:13", "throughput": 4249.45, "total_tokens": 14153400} {"current_steps": 21680, "total_steps": 38160, "loss": 0.4414, "lr": 0.00046841667729112264, "epoch": 11.362683438155136, "percentage": 56.81, "elapsed_time": "0:55:31", "remaining_time": "0:42:12", "throughput": 4249.36, "total_tokens": 14155704} {"current_steps": 21685, "total_steps": 38160, "loss": 0.3895, "lr": 0.00046818845159071987, "epoch": 11.365303983228511, "percentage": 56.83, "elapsed_time": "0:55:31", "remaining_time": "0:42:11", "throughput": 4249.37, "total_tokens": 14158584} {"current_steps": 21690, "total_steps": 38160, "loss": 0.3074, "lr": 0.0004679602325449302, "epoch": 11.367924528301886, "percentage": 56.84, "elapsed_time": "0:55:32", "remaining_time": "0:42:10", "throughput": 4249.44, "total_tokens": 14162040} {"current_steps": 21695, "total_steps": 38160, "loss": 0.3353, "lr": 0.00046773202020149423, "epoch": 11.370545073375261, "percentage": 56.85, "elapsed_time": "0:55:33", "remaining_time": "0:42:09", "throughput": 4249.59, "total_tokens": 14166008} {"current_steps": 21700, "total_steps": 38160, "loss": 0.4715, "lr": 0.0004675038146081516, "epoch": 11.373165618448636, "percentage": 56.87, "elapsed_time": "0:55:34", "remaining_time": "0:42:09", "throughput": 4249.74, "total_tokens": 14170040} {"current_steps": 21705, "total_steps": 38160, "loss": 0.4233, "lr": 0.0004672756158126403, "epoch": 11.375786163522013, "percentage": 56.88, "elapsed_time": "0:55:35", "remaining_time": "0:42:08", "throughput": 4249.76, "total_tokens": 14173016} {"current_steps": 21710, "total_steps": 38160, "loss": 0.2968, "lr": 0.0004670474238626968, "epoch": 11.378406708595389, "percentage": 56.89, "elapsed_time": "0:55:35", "remaining_time": "0:42:07", "throughput": 4249.8, "total_tokens": 14176152} {"current_steps": 21715, "total_steps": 38160, "loss": 0.392, "lr": 0.00046681923880605614, "epoch": 11.381027253668764, "percentage": 56.91, "elapsed_time": "0:55:36", "remaining_time": "0:42:06", "throughput": 4249.9, "total_tokens": 14179736} {"current_steps": 21720, "total_steps": 38160, "loss": 0.3312, "lr": 0.0004665910606904523, "epoch": 11.383647798742139, "percentage": 56.92, "elapsed_time": "0:55:37", "remaining_time": "0:42:05", "throughput": 4249.99, "total_tokens": 14183224} {"current_steps": 21725, "total_steps": 38160, "loss": 0.4685, "lr": 0.0004663628895636173, "epoch": 11.386268343815514, "percentage": 56.93, "elapsed_time": "0:55:37", "remaining_time": "0:42:05", "throughput": 4250.0, "total_tokens": 14186200} {"current_steps": 21730, "total_steps": 38160, "loss": 0.4192, "lr": 0.0004661347254732822, "epoch": 11.38888888888889, "percentage": 56.94, "elapsed_time": "0:55:38", "remaining_time": "0:42:04", "throughput": 4250.1, "total_tokens": 14189848} {"current_steps": 21735, "total_steps": 38160, "loss": 0.4106, "lr": 0.0004659065684671762, "epoch": 11.391509433962264, "percentage": 56.96, "elapsed_time": "0:55:39", "remaining_time": "0:42:03", "throughput": 4250.19, "total_tokens": 14193400} {"current_steps": 21740, "total_steps": 38160, "loss": 0.3713, "lr": 0.00046567841859302696, "epoch": 11.39412997903564, "percentage": 56.97, "elapsed_time": "0:55:40", "remaining_time": "0:42:02", "throughput": 4250.15, "total_tokens": 14195960} {"current_steps": 21745, "total_steps": 38160, "loss": 0.4262, "lr": 0.0004654502758985611, "epoch": 11.396750524109015, "percentage": 56.98, "elapsed_time": "0:55:40", "remaining_time": "0:42:01", "throughput": 4250.1, "total_tokens": 14198520} {"current_steps": 21750, "total_steps": 38160, "loss": 0.425, "lr": 0.00046522214043150323, "epoch": 11.39937106918239, "percentage": 57.0, "elapsed_time": "0:55:41", "remaining_time": "0:42:01", "throughput": 4250.15, "total_tokens": 14201816} {"current_steps": 21755, "total_steps": 38160, "loss": 0.5202, "lr": 0.00046499401223957696, "epoch": 11.401991614255765, "percentage": 57.01, "elapsed_time": "0:55:42", "remaining_time": "0:42:00", "throughput": 4250.2, "total_tokens": 14205048} {"current_steps": 21760, "total_steps": 38160, "loss": 0.4189, "lr": 0.0004647658913705038, "epoch": 11.40461215932914, "percentage": 57.02, "elapsed_time": "0:55:42", "remaining_time": "0:41:59", "throughput": 4250.15, "total_tokens": 14207544} {"current_steps": 21765, "total_steps": 38160, "loss": 0.472, "lr": 0.00046453777787200444, "epoch": 11.407232704402515, "percentage": 57.04, "elapsed_time": "0:55:43", "remaining_time": "0:41:58", "throughput": 4250.25, "total_tokens": 14211128} {"current_steps": 21770, "total_steps": 38160, "loss": 0.4466, "lr": 0.0004643096717917973, "epoch": 11.40985324947589, "percentage": 57.05, "elapsed_time": "0:55:44", "remaining_time": "0:41:57", "throughput": 4250.3, "total_tokens": 14214328} {"current_steps": 21775, "total_steps": 38160, "loss": 0.354, "lr": 0.0004640815731775995, "epoch": 11.412473794549266, "percentage": 57.06, "elapsed_time": "0:55:45", "remaining_time": "0:41:57", "throughput": 4250.53, "total_tokens": 14218904} {"current_steps": 21780, "total_steps": 38160, "loss": 0.4531, "lr": 0.0004638534820771267, "epoch": 11.415094339622641, "percentage": 57.08, "elapsed_time": "0:55:45", "remaining_time": "0:41:56", "throughput": 4250.62, "total_tokens": 14222392} {"current_steps": 21785, "total_steps": 38160, "loss": 0.4865, "lr": 0.0004636253985380934, "epoch": 11.417714884696016, "percentage": 57.09, "elapsed_time": "0:55:46", "remaining_time": "0:41:55", "throughput": 4250.55, "total_tokens": 14224792} {"current_steps": 21790, "total_steps": 38160, "loss": 0.5699, "lr": 0.00046339732260821173, "epoch": 11.420335429769391, "percentage": 57.1, "elapsed_time": "0:55:47", "remaining_time": "0:41:54", "throughput": 4250.62, "total_tokens": 14228248} {"current_steps": 21795, "total_steps": 38160, "loss": 0.4504, "lr": 0.0004631692543351924, "epoch": 11.422955974842766, "percentage": 57.11, "elapsed_time": "0:55:48", "remaining_time": "0:41:53", "throughput": 4250.74, "total_tokens": 14232088} {"current_steps": 21800, "total_steps": 38160, "loss": 0.4191, "lr": 0.00046294119376674486, "epoch": 11.425576519916142, "percentage": 57.13, "elapsed_time": "0:55:48", "remaining_time": "0:41:53", "throughput": 4250.85, "total_tokens": 14235640} {"current_steps": 21805, "total_steps": 38160, "loss": 0.3893, "lr": 0.0004627131409505768, "epoch": 11.428197064989519, "percentage": 57.14, "elapsed_time": "0:55:49", "remaining_time": "0:41:52", "throughput": 4250.9, "total_tokens": 14238904} {"current_steps": 21810, "total_steps": 38160, "loss": 0.4724, "lr": 0.0004624850959343944, "epoch": 11.430817610062894, "percentage": 57.15, "elapsed_time": "0:55:50", "remaining_time": "0:41:51", "throughput": 4251.12, "total_tokens": 14243288} {"current_steps": 21815, "total_steps": 38160, "loss": 0.4187, "lr": 0.00046225705876590175, "epoch": 11.433438155136269, "percentage": 57.17, "elapsed_time": "0:55:51", "remaining_time": "0:41:50", "throughput": 4251.12, "total_tokens": 14246200} {"current_steps": 21820, "total_steps": 38160, "loss": 0.597, "lr": 0.00046202902949280206, "epoch": 11.436058700209644, "percentage": 57.18, "elapsed_time": "0:55:51", "remaining_time": "0:41:50", "throughput": 4251.19, "total_tokens": 14249656} {"current_steps": 21825, "total_steps": 38160, "loss": 0.4054, "lr": 0.00046180100816279614, "epoch": 11.43867924528302, "percentage": 57.19, "elapsed_time": "0:55:52", "remaining_time": "0:41:49", "throughput": 4251.24, "total_tokens": 14252920} {"current_steps": 21830, "total_steps": 38160, "loss": 0.3543, "lr": 0.0004615729948235833, "epoch": 11.441299790356394, "percentage": 57.21, "elapsed_time": "0:55:53", "remaining_time": "0:41:48", "throughput": 4251.31, "total_tokens": 14256152} {"current_steps": 21835, "total_steps": 38160, "loss": 0.3679, "lr": 0.00046134498952286174, "epoch": 11.44392033542977, "percentage": 57.22, "elapsed_time": "0:55:54", "remaining_time": "0:41:47", "throughput": 4251.32, "total_tokens": 14259224} {"current_steps": 21840, "total_steps": 38160, "loss": 0.4603, "lr": 0.00046111699230832727, "epoch": 11.446540880503145, "percentage": 57.23, "elapsed_time": "0:55:54", "remaining_time": "0:41:46", "throughput": 4251.33, "total_tokens": 14262232} {"current_steps": 21845, "total_steps": 38160, "loss": 0.4674, "lr": 0.00046088900322767434, "epoch": 11.44916142557652, "percentage": 57.25, "elapsed_time": "0:55:55", "remaining_time": "0:41:46", "throughput": 4251.42, "total_tokens": 14265752} {"current_steps": 21850, "total_steps": 38160, "loss": 0.4302, "lr": 0.0004606610223285961, "epoch": 11.451781970649895, "percentage": 57.26, "elapsed_time": "0:55:56", "remaining_time": "0:41:45", "throughput": 4251.45, "total_tokens": 14268888} {"current_steps": 21855, "total_steps": 38160, "loss": 0.3379, "lr": 0.00046043304965878284, "epoch": 11.45440251572327, "percentage": 57.27, "elapsed_time": "0:55:56", "remaining_time": "0:41:44", "throughput": 4251.49, "total_tokens": 14272024} {"current_steps": 21860, "total_steps": 38160, "loss": 0.5228, "lr": 0.00046020508526592425, "epoch": 11.457023060796645, "percentage": 57.29, "elapsed_time": "0:55:57", "remaining_time": "0:41:43", "throughput": 4251.51, "total_tokens": 14275128} {"current_steps": 21865, "total_steps": 38160, "loss": 0.5936, "lr": 0.0004599771291977079, "epoch": 11.45964360587002, "percentage": 57.3, "elapsed_time": "0:55:58", "remaining_time": "0:41:42", "throughput": 4251.64, "total_tokens": 14278936} {"current_steps": 21870, "total_steps": 38160, "loss": 0.5038, "lr": 0.0004597491815018194, "epoch": 11.462264150943396, "percentage": 57.31, "elapsed_time": "0:55:59", "remaining_time": "0:41:42", "throughput": 4251.68, "total_tokens": 14282040} {"current_steps": 21875, "total_steps": 38160, "loss": 0.2976, "lr": 0.0004595212422259431, "epoch": 11.464884696016771, "percentage": 57.32, "elapsed_time": "0:55:59", "remaining_time": "0:41:41", "throughput": 4251.78, "total_tokens": 14285688} {"current_steps": 21880, "total_steps": 38160, "loss": 0.3702, "lr": 0.00045929331141776104, "epoch": 11.467505241090146, "percentage": 57.34, "elapsed_time": "0:56:00", "remaining_time": "0:41:40", "throughput": 4251.93, "total_tokens": 14289688} {"current_steps": 21885, "total_steps": 38160, "loss": 0.4181, "lr": 0.0004590653891249537, "epoch": 11.470125786163521, "percentage": 57.35, "elapsed_time": "0:56:01", "remaining_time": "0:41:39", "throughput": 4251.91, "total_tokens": 14292440} {"current_steps": 21890, "total_steps": 38160, "loss": 0.503, "lr": 0.0004588374753952001, "epoch": 11.472746331236896, "percentage": 57.36, "elapsed_time": "0:56:02", "remaining_time": "0:41:39", "throughput": 4252.08, "total_tokens": 14296568} {"current_steps": 21895, "total_steps": 38160, "loss": 0.5568, "lr": 0.0004586095702761769, "epoch": 11.475366876310272, "percentage": 57.38, "elapsed_time": "0:56:02", "remaining_time": "0:41:38", "throughput": 4252.09, "total_tokens": 14299512} {"current_steps": 21900, "total_steps": 38160, "loss": 0.5114, "lr": 0.0004583816738155595, "epoch": 11.477987421383649, "percentage": 57.39, "elapsed_time": "0:56:03", "remaining_time": "0:41:37", "throughput": 4252.24, "total_tokens": 14303512} {"current_steps": 21905, "total_steps": 38160, "loss": 0.3615, "lr": 0.0004581537860610213, "epoch": 11.480607966457024, "percentage": 57.4, "elapsed_time": "0:56:04", "remaining_time": "0:41:36", "throughput": 4252.28, "total_tokens": 14306712} {"current_steps": 21910, "total_steps": 38160, "loss": 0.5254, "lr": 0.0004579259070602333, "epoch": 11.483228511530399, "percentage": 57.42, "elapsed_time": "0:56:05", "remaining_time": "0:41:35", "throughput": 4252.31, "total_tokens": 14309784} {"current_steps": 21915, "total_steps": 38160, "loss": 0.4215, "lr": 0.0004576980368608658, "epoch": 11.485849056603774, "percentage": 57.43, "elapsed_time": "0:56:05", "remaining_time": "0:41:35", "throughput": 4252.31, "total_tokens": 14312696} {"current_steps": 21920, "total_steps": 38160, "loss": 0.3751, "lr": 0.0004574701755105862, "epoch": 11.48846960167715, "percentage": 57.44, "elapsed_time": "0:56:06", "remaining_time": "0:41:34", "throughput": 4252.34, "total_tokens": 14315736} {"current_steps": 21925, "total_steps": 38160, "loss": 0.3787, "lr": 0.00045724232305706066, "epoch": 11.491090146750524, "percentage": 57.46, "elapsed_time": "0:56:07", "remaining_time": "0:41:33", "throughput": 4252.32, "total_tokens": 14318488} {"current_steps": 21930, "total_steps": 38160, "loss": 0.4854, "lr": 0.00045701447954795343, "epoch": 11.4937106918239, "percentage": 57.47, "elapsed_time": "0:56:07", "remaining_time": "0:41:32", "throughput": 4252.3, "total_tokens": 14321240} {"current_steps": 21935, "total_steps": 38160, "loss": 0.4192, "lr": 0.0004567866450309268, "epoch": 11.496331236897275, "percentage": 57.48, "elapsed_time": "0:56:08", "remaining_time": "0:41:31", "throughput": 4252.28, "total_tokens": 14324024} {"current_steps": 21940, "total_steps": 38160, "loss": 0.4635, "lr": 0.00045655881955364086, "epoch": 11.49895178197065, "percentage": 57.49, "elapsed_time": "0:56:09", "remaining_time": "0:41:30", "throughput": 4252.35, "total_tokens": 14327320} {"current_steps": 21945, "total_steps": 38160, "loss": 0.4547, "lr": 0.0004563310031637543, "epoch": 11.501572327044025, "percentage": 57.51, "elapsed_time": "0:56:10", "remaining_time": "0:41:30", "throughput": 4252.39, "total_tokens": 14330584} {"current_steps": 21950, "total_steps": 38160, "loss": 0.4392, "lr": 0.00045610319590892365, "epoch": 11.5041928721174, "percentage": 57.52, "elapsed_time": "0:56:10", "remaining_time": "0:41:29", "throughput": 4252.42, "total_tokens": 14333592} {"current_steps": 21955, "total_steps": 38160, "loss": 0.3748, "lr": 0.00045587539783680366, "epoch": 11.506813417190775, "percentage": 57.53, "elapsed_time": "0:56:11", "remaining_time": "0:41:28", "throughput": 4252.56, "total_tokens": 14337496} {"current_steps": 21960, "total_steps": 38160, "loss": 0.3561, "lr": 0.00045564760899504715, "epoch": 11.50943396226415, "percentage": 57.55, "elapsed_time": "0:56:12", "remaining_time": "0:41:27", "throughput": 4252.68, "total_tokens": 14341304} {"current_steps": 21965, "total_steps": 38160, "loss": 0.3533, "lr": 0.00045541982943130466, "epoch": 11.512054507337526, "percentage": 57.56, "elapsed_time": "0:56:12", "remaining_time": "0:41:26", "throughput": 4252.71, "total_tokens": 14344312} {"current_steps": 21970, "total_steps": 38160, "loss": 0.3937, "lr": 0.00045519205919322534, "epoch": 11.514675052410901, "percentage": 57.57, "elapsed_time": "0:56:13", "remaining_time": "0:41:26", "throughput": 4252.63, "total_tokens": 14346648} {"current_steps": 21975, "total_steps": 38160, "loss": 0.3312, "lr": 0.00045496429832845594, "epoch": 11.517295597484276, "percentage": 57.59, "elapsed_time": "0:56:14", "remaining_time": "0:41:25", "throughput": 4252.67, "total_tokens": 14349816} {"current_steps": 21980, "total_steps": 38160, "loss": 0.5453, "lr": 0.0004547365468846416, "epoch": 11.519916142557651, "percentage": 57.6, "elapsed_time": "0:56:15", "remaining_time": "0:41:24", "throughput": 4252.81, "total_tokens": 14353656} {"current_steps": 21985, "total_steps": 38160, "loss": 0.5652, "lr": 0.0004545088049094252, "epoch": 11.522536687631026, "percentage": 57.61, "elapsed_time": "0:56:15", "remaining_time": "0:41:23", "throughput": 4252.94, "total_tokens": 14357624} {"current_steps": 21990, "total_steps": 38160, "loss": 0.4017, "lr": 0.00045428107245044805, "epoch": 11.525157232704402, "percentage": 57.63, "elapsed_time": "0:56:16", "remaining_time": "0:41:22", "throughput": 4252.96, "total_tokens": 14360664} {"current_steps": 21995, "total_steps": 38160, "loss": 0.3997, "lr": 0.0004540533495553488, "epoch": 11.527777777777779, "percentage": 57.64, "elapsed_time": "0:56:17", "remaining_time": "0:41:22", "throughput": 4253.02, "total_tokens": 14363960} {"current_steps": 22000, "total_steps": 38160, "loss": 0.3898, "lr": 0.00045382563627176454, "epoch": 11.530398322851154, "percentage": 57.65, "elapsed_time": "0:56:17", "remaining_time": "0:41:21", "throughput": 4252.96, "total_tokens": 14366424} {"current_steps": 22005, "total_steps": 38160, "loss": 0.6727, "lr": 0.0004535979326473304, "epoch": 11.533018867924529, "percentage": 57.67, "elapsed_time": "0:56:18", "remaining_time": "0:41:20", "throughput": 4253.11, "total_tokens": 14370232} {"current_steps": 22010, "total_steps": 38160, "loss": 0.5644, "lr": 0.00045337023872967945, "epoch": 11.535639412997904, "percentage": 57.68, "elapsed_time": "0:56:19", "remaining_time": "0:41:19", "throughput": 4253.21, "total_tokens": 14373976} {"current_steps": 22015, "total_steps": 38160, "loss": 0.4398, "lr": 0.0004531425545664425, "epoch": 11.53825995807128, "percentage": 57.69, "elapsed_time": "0:56:20", "remaining_time": "0:41:18", "throughput": 4253.18, "total_tokens": 14376568} {"current_steps": 22020, "total_steps": 38160, "loss": 0.4139, "lr": 0.0004529148802052488, "epoch": 11.540880503144654, "percentage": 57.7, "elapsed_time": "0:56:20", "remaining_time": "0:41:18", "throughput": 4253.15, "total_tokens": 14379256} {"current_steps": 22025, "total_steps": 38160, "loss": 0.3919, "lr": 0.00045268721569372483, "epoch": 11.54350104821803, "percentage": 57.72, "elapsed_time": "0:56:21", "remaining_time": "0:41:17", "throughput": 4253.09, "total_tokens": 14381752} {"current_steps": 22030, "total_steps": 38160, "loss": 0.4745, "lr": 0.00045245956107949547, "epoch": 11.546121593291405, "percentage": 57.73, "elapsed_time": "0:56:22", "remaining_time": "0:41:16", "throughput": 4253.15, "total_tokens": 14384984} {"current_steps": 22035, "total_steps": 38160, "loss": 0.4109, "lr": 0.0004522319164101837, "epoch": 11.54874213836478, "percentage": 57.74, "elapsed_time": "0:56:22", "remaining_time": "0:41:15", "throughput": 4253.23, "total_tokens": 14388504} {"current_steps": 22040, "total_steps": 38160, "loss": 0.4969, "lr": 0.00045200428173340987, "epoch": 11.551362683438155, "percentage": 57.76, "elapsed_time": "0:56:23", "remaining_time": "0:41:14", "throughput": 4253.22, "total_tokens": 14391256} {"current_steps": 22045, "total_steps": 38160, "loss": 0.4739, "lr": 0.00045177665709679286, "epoch": 11.55398322851153, "percentage": 57.77, "elapsed_time": "0:56:24", "remaining_time": "0:41:13", "throughput": 4253.19, "total_tokens": 14393880} {"current_steps": 22050, "total_steps": 38160, "loss": 0.4127, "lr": 0.0004515490425479492, "epoch": 11.556603773584905, "percentage": 57.78, "elapsed_time": "0:56:24", "remaining_time": "0:41:13", "throughput": 4253.11, "total_tokens": 14396248} {"current_steps": 22055, "total_steps": 38160, "loss": 0.4201, "lr": 0.0004513214381344928, "epoch": 11.55922431865828, "percentage": 57.8, "elapsed_time": "0:56:25", "remaining_time": "0:41:12", "throughput": 4253.04, "total_tokens": 14398616} {"current_steps": 22060, "total_steps": 38160, "loss": 0.5156, "lr": 0.00045109384390403635, "epoch": 11.561844863731656, "percentage": 57.81, "elapsed_time": "0:56:26", "remaining_time": "0:41:11", "throughput": 4253.04, "total_tokens": 14401496} {"current_steps": 22065, "total_steps": 38160, "loss": 0.3782, "lr": 0.0004508662599041896, "epoch": 11.564465408805031, "percentage": 57.82, "elapsed_time": "0:56:26", "remaining_time": "0:41:10", "throughput": 4253.01, "total_tokens": 14404216} {"current_steps": 22070, "total_steps": 38160, "loss": 0.6041, "lr": 0.0004506386861825609, "epoch": 11.567085953878406, "percentage": 57.84, "elapsed_time": "0:56:27", "remaining_time": "0:41:09", "throughput": 4253.12, "total_tokens": 14407864} {"current_steps": 22075, "total_steps": 38160, "loss": 0.4819, "lr": 0.00045041112278675603, "epoch": 11.569706498951781, "percentage": 57.85, "elapsed_time": "0:56:28", "remaining_time": "0:41:08", "throughput": 4253.21, "total_tokens": 14411416} {"current_steps": 22080, "total_steps": 38160, "loss": 0.4028, "lr": 0.00045018356976437836, "epoch": 11.572327044025156, "percentage": 57.86, "elapsed_time": "0:56:29", "remaining_time": "0:41:08", "throughput": 4253.19, "total_tokens": 14414168} {"current_steps": 22085, "total_steps": 38160, "loss": 0.4432, "lr": 0.0004499560271630295, "epoch": 11.574947589098532, "percentage": 57.87, "elapsed_time": "0:56:29", "remaining_time": "0:41:07", "throughput": 4253.36, "total_tokens": 14418456} {"current_steps": 22090, "total_steps": 38160, "loss": 0.4738, "lr": 0.00044972849503030894, "epoch": 11.577568134171909, "percentage": 57.89, "elapsed_time": "0:56:30", "remaining_time": "0:41:06", "throughput": 4253.41, "total_tokens": 14421624} {"current_steps": 22095, "total_steps": 38160, "loss": 0.4051, "lr": 0.00044950097341381356, "epoch": 11.580188679245284, "percentage": 57.9, "elapsed_time": "0:56:31", "remaining_time": "0:41:05", "throughput": 4253.35, "total_tokens": 14424120} {"current_steps": 22100, "total_steps": 38160, "loss": 0.5315, "lr": 0.0004492734623611385, "epoch": 11.582809224318659, "percentage": 57.91, "elapsed_time": "0:56:32", "remaining_time": "0:41:05", "throughput": 4253.49, "total_tokens": 14428120} {"current_steps": 22105, "total_steps": 38160, "loss": 0.6252, "lr": 0.0004490459619198766, "epoch": 11.585429769392034, "percentage": 57.93, "elapsed_time": "0:56:32", "remaining_time": "0:41:04", "throughput": 4253.53, "total_tokens": 14431288} {"current_steps": 22110, "total_steps": 38160, "loss": 0.3866, "lr": 0.00044881847213761787, "epoch": 11.58805031446541, "percentage": 57.94, "elapsed_time": "0:56:33", "remaining_time": "0:41:03", "throughput": 4253.53, "total_tokens": 14434104} {"current_steps": 22115, "total_steps": 38160, "loss": 0.4567, "lr": 0.000448590993061951, "epoch": 11.590670859538784, "percentage": 57.95, "elapsed_time": "0:56:34", "remaining_time": "0:41:02", "throughput": 4253.49, "total_tokens": 14436664} {"current_steps": 22120, "total_steps": 38160, "loss": 0.4246, "lr": 0.00044836352474046177, "epoch": 11.59329140461216, "percentage": 57.97, "elapsed_time": "0:56:35", "remaining_time": "0:41:02", "throughput": 4253.97, "total_tokens": 14443672} {"current_steps": 22125, "total_steps": 38160, "loss": 0.6585, "lr": 0.00044813606722073415, "epoch": 11.595911949685535, "percentage": 57.98, "elapsed_time": "0:56:35", "remaining_time": "0:41:01", "throughput": 4253.92, "total_tokens": 14446200} {"current_steps": 22130, "total_steps": 38160, "loss": 0.4541, "lr": 0.00044790862055034945, "epoch": 11.59853249475891, "percentage": 57.99, "elapsed_time": "0:56:36", "remaining_time": "0:41:00", "throughput": 4253.95, "total_tokens": 14449240} {"current_steps": 22135, "total_steps": 38160, "loss": 0.4664, "lr": 0.00044768118477688727, "epoch": 11.601153039832285, "percentage": 58.01, "elapsed_time": "0:56:37", "remaining_time": "0:40:59", "throughput": 4253.93, "total_tokens": 14452024} {"current_steps": 22140, "total_steps": 38160, "loss": 0.4385, "lr": 0.00044745375994792425, "epoch": 11.60377358490566, "percentage": 58.02, "elapsed_time": "0:56:38", "remaining_time": "0:40:58", "throughput": 4254.08, "total_tokens": 14455992} {"current_steps": 22145, "total_steps": 38160, "loss": 0.322, "lr": 0.00044722634611103507, "epoch": 11.606394129979035, "percentage": 58.03, "elapsed_time": "0:56:39", "remaining_time": "0:40:58", "throughput": 4254.31, "total_tokens": 14460536} {"current_steps": 22150, "total_steps": 38160, "loss": 0.4472, "lr": 0.0004469989433137923, "epoch": 11.60901467505241, "percentage": 58.05, "elapsed_time": "0:56:39", "remaining_time": "0:40:57", "throughput": 4254.24, "total_tokens": 14463000} {"current_steps": 22155, "total_steps": 38160, "loss": 0.4358, "lr": 0.00044677155160376586, "epoch": 11.611635220125786, "percentage": 58.06, "elapsed_time": "0:56:40", "remaining_time": "0:40:56", "throughput": 4254.39, "total_tokens": 14467032} {"current_steps": 22160, "total_steps": 38160, "loss": 0.4193, "lr": 0.00044654417102852375, "epoch": 11.614255765199161, "percentage": 58.07, "elapsed_time": "0:56:41", "remaining_time": "0:40:55", "throughput": 4254.43, "total_tokens": 14470232} {"current_steps": 22165, "total_steps": 38160, "loss": 0.5201, "lr": 0.0004463168016356309, "epoch": 11.616876310272536, "percentage": 58.08, "elapsed_time": "0:56:41", "remaining_time": "0:40:54", "throughput": 4254.53, "total_tokens": 14473880} {"current_steps": 22170, "total_steps": 38160, "loss": 0.4026, "lr": 0.00044608944347265095, "epoch": 11.619496855345911, "percentage": 58.1, "elapsed_time": "0:56:42", "remaining_time": "0:40:54", "throughput": 4254.54, "total_tokens": 14476792} {"current_steps": 22175, "total_steps": 38160, "loss": 0.4276, "lr": 0.0004458620965871442, "epoch": 11.622117400419286, "percentage": 58.11, "elapsed_time": "0:56:43", "remaining_time": "0:40:53", "throughput": 4254.52, "total_tokens": 14479544} {"current_steps": 22180, "total_steps": 38160, "loss": 0.4831, "lr": 0.00044563476102666935, "epoch": 11.624737945492662, "percentage": 58.12, "elapsed_time": "0:56:44", "remaining_time": "0:40:52", "throughput": 4254.53, "total_tokens": 14482424} {"current_steps": 22185, "total_steps": 38160, "loss": 0.318, "lr": 0.0004454074368387821, "epoch": 11.627358490566039, "percentage": 58.14, "elapsed_time": "0:56:44", "remaining_time": "0:40:51", "throughput": 4254.59, "total_tokens": 14485784} {"current_steps": 22190, "total_steps": 38160, "loss": 0.4052, "lr": 0.0004451801240710365, "epoch": 11.629979035639414, "percentage": 58.15, "elapsed_time": "0:56:45", "remaining_time": "0:40:50", "throughput": 4254.53, "total_tokens": 14488216} {"current_steps": 22195, "total_steps": 38160, "loss": 0.4202, "lr": 0.0004449528227709834, "epoch": 11.632599580712789, "percentage": 58.16, "elapsed_time": "0:56:46", "remaining_time": "0:40:50", "throughput": 4254.92, "total_tokens": 14494264} {"current_steps": 22200, "total_steps": 38160, "loss": 0.3935, "lr": 0.0004447255329861716, "epoch": 11.635220125786164, "percentage": 58.18, "elapsed_time": "0:56:47", "remaining_time": "0:40:49", "throughput": 4255.11, "total_tokens": 14498680} {"current_steps": 22205, "total_steps": 38160, "loss": 0.4109, "lr": 0.0004444982547641479, "epoch": 11.63784067085954, "percentage": 58.19, "elapsed_time": "0:56:48", "remaining_time": "0:40:48", "throughput": 4255.25, "total_tokens": 14502488} {"current_steps": 22210, "total_steps": 38160, "loss": 0.5409, "lr": 0.00044427098815245594, "epoch": 11.640461215932914, "percentage": 58.2, "elapsed_time": "0:56:48", "remaining_time": "0:40:48", "throughput": 4255.27, "total_tokens": 14505624} {"current_steps": 22215, "total_steps": 38160, "loss": 0.3641, "lr": 0.00044404373319863763, "epoch": 11.64308176100629, "percentage": 58.22, "elapsed_time": "0:56:49", "remaining_time": "0:40:47", "throughput": 4255.24, "total_tokens": 14508312} {"current_steps": 22220, "total_steps": 38160, "loss": 0.4023, "lr": 0.000443816489950232, "epoch": 11.645702306079665, "percentage": 58.23, "elapsed_time": "0:56:50", "remaining_time": "0:40:46", "throughput": 4255.26, "total_tokens": 14511320} {"current_steps": 22225, "total_steps": 38160, "loss": 0.3778, "lr": 0.00044358925845477547, "epoch": 11.64832285115304, "percentage": 58.24, "elapsed_time": "0:56:50", "remaining_time": "0:40:45", "throughput": 4255.35, "total_tokens": 14514840} {"current_steps": 22230, "total_steps": 38160, "loss": 0.3957, "lr": 0.0004433620387598027, "epoch": 11.650943396226415, "percentage": 58.25, "elapsed_time": "0:56:51", "remaining_time": "0:40:44", "throughput": 4255.38, "total_tokens": 14517944} {"current_steps": 22235, "total_steps": 38160, "loss": 0.4482, "lr": 0.00044313483091284507, "epoch": 11.65356394129979, "percentage": 58.27, "elapsed_time": "0:56:52", "remaining_time": "0:40:44", "throughput": 4255.46, "total_tokens": 14521432} {"current_steps": 22240, "total_steps": 38160, "loss": 0.3555, "lr": 0.0004429076349614321, "epoch": 11.656184486373165, "percentage": 58.28, "elapsed_time": "0:56:53", "remaining_time": "0:40:43", "throughput": 4255.45, "total_tokens": 14524248} {"current_steps": 22245, "total_steps": 38160, "loss": 0.4552, "lr": 0.0004426804509530907, "epoch": 11.65880503144654, "percentage": 58.29, "elapsed_time": "0:56:53", "remaining_time": "0:40:42", "throughput": 4255.49, "total_tokens": 14527448} {"current_steps": 22250, "total_steps": 38160, "loss": 0.5117, "lr": 0.000442453278935345, "epoch": 11.661425576519916, "percentage": 58.31, "elapsed_time": "0:56:54", "remaining_time": "0:40:41", "throughput": 4255.43, "total_tokens": 14529944} {"current_steps": 22255, "total_steps": 38160, "loss": 0.5132, "lr": 0.0004422261189557167, "epoch": 11.664046121593291, "percentage": 58.32, "elapsed_time": "0:56:55", "remaining_time": "0:40:40", "throughput": 4255.47, "total_tokens": 14533144} {"current_steps": 22260, "total_steps": 38160, "loss": 0.5217, "lr": 0.00044199897106172526, "epoch": 11.666666666666666, "percentage": 58.33, "elapsed_time": "0:56:55", "remaining_time": "0:40:39", "throughput": 4255.59, "total_tokens": 14536888} {"current_steps": 22265, "total_steps": 38160, "loss": 0.5053, "lr": 0.0004417718353008873, "epoch": 11.669287211740041, "percentage": 58.35, "elapsed_time": "0:56:57", "remaining_time": "0:40:39", "throughput": 4256.32, "total_tokens": 14545912} {"current_steps": 22270, "total_steps": 38160, "loss": 0.3705, "lr": 0.0004415447117207172, "epoch": 11.671907756813416, "percentage": 58.36, "elapsed_time": "0:56:58", "remaining_time": "0:40:38", "throughput": 4256.32, "total_tokens": 14548856} {"current_steps": 22275, "total_steps": 38160, "loss": 0.7268, "lr": 0.00044131760036872657, "epoch": 11.674528301886792, "percentage": 58.37, "elapsed_time": "0:56:58", "remaining_time": "0:40:38", "throughput": 4256.34, "total_tokens": 14551800} {"current_steps": 22280, "total_steps": 38160, "loss": 0.4701, "lr": 0.00044109050129242434, "epoch": 11.677148846960169, "percentage": 58.39, "elapsed_time": "0:56:59", "remaining_time": "0:40:37", "throughput": 4256.42, "total_tokens": 14555256} {"current_steps": 22285, "total_steps": 38160, "loss": 0.522, "lr": 0.00044086341453931715, "epoch": 11.679769392033544, "percentage": 58.4, "elapsed_time": "0:57:00", "remaining_time": "0:40:36", "throughput": 4256.52, "total_tokens": 14558840} {"current_steps": 22290, "total_steps": 38160, "loss": 0.3606, "lr": 0.00044063634015690893, "epoch": 11.682389937106919, "percentage": 58.41, "elapsed_time": "0:57:01", "remaining_time": "0:40:35", "throughput": 4256.54, "total_tokens": 14561848} {"current_steps": 22295, "total_steps": 38160, "loss": 0.3501, "lr": 0.0004404092781927012, "epoch": 11.685010482180294, "percentage": 58.43, "elapsed_time": "0:57:01", "remaining_time": "0:40:34", "throughput": 4256.63, "total_tokens": 14565464} {"current_steps": 22300, "total_steps": 38160, "loss": 0.5275, "lr": 0.00044018222869419255, "epoch": 11.68763102725367, "percentage": 58.44, "elapsed_time": "0:57:02", "remaining_time": "0:40:34", "throughput": 4256.67, "total_tokens": 14568664} {"current_steps": 22305, "total_steps": 38160, "loss": 0.4242, "lr": 0.00043995519170887936, "epoch": 11.690251572327044, "percentage": 58.45, "elapsed_time": "0:57:03", "remaining_time": "0:40:33", "throughput": 4256.65, "total_tokens": 14571384} {"current_steps": 22310, "total_steps": 38160, "loss": 0.4199, "lr": 0.00043972816728425504, "epoch": 11.69287211740042, "percentage": 58.46, "elapsed_time": "0:57:03", "remaining_time": "0:40:32", "throughput": 4256.73, "total_tokens": 14574808} {"current_steps": 22315, "total_steps": 38160, "loss": 0.4397, "lr": 0.0004395011554678103, "epoch": 11.695492662473795, "percentage": 58.48, "elapsed_time": "0:57:04", "remaining_time": "0:40:31", "throughput": 4256.72, "total_tokens": 14577624} {"current_steps": 22320, "total_steps": 38160, "loss": 0.3781, "lr": 0.00043927415630703364, "epoch": 11.69811320754717, "percentage": 58.49, "elapsed_time": "0:57:05", "remaining_time": "0:40:30", "throughput": 4256.79, "total_tokens": 14581016} {"current_steps": 22325, "total_steps": 38160, "loss": 0.4212, "lr": 0.0004390471698494108, "epoch": 11.700733752620545, "percentage": 58.5, "elapsed_time": "0:57:06", "remaining_time": "0:40:30", "throughput": 4256.75, "total_tokens": 14583736} {"current_steps": 22330, "total_steps": 38160, "loss": 0.4845, "lr": 0.0004388201961424248, "epoch": 11.70335429769392, "percentage": 58.52, "elapsed_time": "0:57:06", "remaining_time": "0:40:29", "throughput": 4256.84, "total_tokens": 14587352} {"current_steps": 22335, "total_steps": 38160, "loss": 0.4622, "lr": 0.0004385932352335555, "epoch": 11.705974842767295, "percentage": 58.53, "elapsed_time": "0:57:07", "remaining_time": "0:40:28", "throughput": 4256.93, "total_tokens": 14590808} {"current_steps": 22340, "total_steps": 38160, "loss": 0.3886, "lr": 0.000438366287170281, "epoch": 11.70859538784067, "percentage": 58.54, "elapsed_time": "0:57:08", "remaining_time": "0:40:27", "throughput": 4257.01, "total_tokens": 14594296} {"current_steps": 22345, "total_steps": 38160, "loss": 0.3395, "lr": 0.0004381393520000759, "epoch": 11.711215932914046, "percentage": 58.56, "elapsed_time": "0:57:09", "remaining_time": "0:40:26", "throughput": 4257.11, "total_tokens": 14597944} {"current_steps": 22350, "total_steps": 38160, "loss": 0.4036, "lr": 0.0004379124297704127, "epoch": 11.713836477987421, "percentage": 58.57, "elapsed_time": "0:57:09", "remaining_time": "0:40:26", "throughput": 4257.12, "total_tokens": 14600920} {"current_steps": 22355, "total_steps": 38160, "loss": 0.433, "lr": 0.0004376855205287609, "epoch": 11.716457023060796, "percentage": 58.58, "elapsed_time": "0:57:10", "remaining_time": "0:40:25", "throughput": 4257.21, "total_tokens": 14604504} {"current_steps": 22360, "total_steps": 38160, "loss": 0.4654, "lr": 0.0004374586243225874, "epoch": 11.719077568134171, "percentage": 58.6, "elapsed_time": "0:57:11", "remaining_time": "0:40:24", "throughput": 4257.29, "total_tokens": 14607928} {"current_steps": 22365, "total_steps": 38160, "loss": 0.505, "lr": 0.00043723174119935607, "epoch": 11.721698113207546, "percentage": 58.61, "elapsed_time": "0:57:11", "remaining_time": "0:40:23", "throughput": 4257.32, "total_tokens": 14611000} {"current_steps": 22370, "total_steps": 38160, "loss": 0.4542, "lr": 0.00043700487120652826, "epoch": 11.724318658280922, "percentage": 58.62, "elapsed_time": "0:57:12", "remaining_time": "0:40:23", "throughput": 4257.38, "total_tokens": 14614456} {"current_steps": 22375, "total_steps": 38160, "loss": 0.4098, "lr": 0.00043677801439156284, "epoch": 11.726939203354299, "percentage": 58.63, "elapsed_time": "0:57:13", "remaining_time": "0:40:22", "throughput": 4257.54, "total_tokens": 14618648} {"current_steps": 22380, "total_steps": 38160, "loss": 0.4281, "lr": 0.00043655117080191545, "epoch": 11.729559748427674, "percentage": 58.65, "elapsed_time": "0:57:14", "remaining_time": "0:40:21", "throughput": 4257.53, "total_tokens": 14621464} {"current_steps": 22385, "total_steps": 38160, "loss": 0.3414, "lr": 0.00043632434048503934, "epoch": 11.732180293501049, "percentage": 58.66, "elapsed_time": "0:57:14", "remaining_time": "0:40:20", "throughput": 4257.55, "total_tokens": 14624472} {"current_steps": 22390, "total_steps": 38160, "loss": 0.5636, "lr": 0.00043609752348838484, "epoch": 11.734800838574424, "percentage": 58.67, "elapsed_time": "0:57:15", "remaining_time": "0:40:19", "throughput": 4257.74, "total_tokens": 14628824} {"current_steps": 22395, "total_steps": 38160, "loss": 0.3721, "lr": 0.0004358707198593992, "epoch": 11.7374213836478, "percentage": 58.69, "elapsed_time": "0:57:16", "remaining_time": "0:40:19", "throughput": 4257.76, "total_tokens": 14631832} {"current_steps": 22400, "total_steps": 38160, "loss": 0.3471, "lr": 0.0004356439296455273, "epoch": 11.740041928721174, "percentage": 58.7, "elapsed_time": "0:57:17", "remaining_time": "0:40:18", "throughput": 4257.85, "total_tokens": 14635416} {"current_steps": 22405, "total_steps": 38160, "loss": 0.5697, "lr": 0.0004354171528942113, "epoch": 11.74266247379455, "percentage": 58.71, "elapsed_time": "0:57:17", "remaining_time": "0:40:17", "throughput": 4257.89, "total_tokens": 14638584} {"current_steps": 22410, "total_steps": 38160, "loss": 0.4739, "lr": 0.00043519038965288994, "epoch": 11.745283018867925, "percentage": 58.73, "elapsed_time": "0:57:18", "remaining_time": "0:40:16", "throughput": 4257.95, "total_tokens": 14641880} {"current_steps": 22415, "total_steps": 38160, "loss": 0.6024, "lr": 0.0004349636399689998, "epoch": 11.7479035639413, "percentage": 58.74, "elapsed_time": "0:57:19", "remaining_time": "0:40:15", "throughput": 4258.01, "total_tokens": 14645144} {"current_steps": 22420, "total_steps": 38160, "loss": 0.5772, "lr": 0.00043473690388997434, "epoch": 11.750524109014675, "percentage": 58.75, "elapsed_time": "0:57:20", "remaining_time": "0:40:15", "throughput": 4258.04, "total_tokens": 14648312} {"current_steps": 22425, "total_steps": 38160, "loss": 0.5057, "lr": 0.0004345101814632438, "epoch": 11.75314465408805, "percentage": 58.77, "elapsed_time": "0:57:20", "remaining_time": "0:40:14", "throughput": 4258.1, "total_tokens": 14651768} {"current_steps": 22430, "total_steps": 38160, "loss": 0.6211, "lr": 0.0004342834727362362, "epoch": 11.755765199161425, "percentage": 58.78, "elapsed_time": "0:57:21", "remaining_time": "0:40:13", "throughput": 4258.23, "total_tokens": 14655640} {"current_steps": 22435, "total_steps": 38160, "loss": 0.5526, "lr": 0.00043405677775637633, "epoch": 11.7583857442348, "percentage": 58.79, "elapsed_time": "0:57:22", "remaining_time": "0:40:12", "throughput": 4258.22, "total_tokens": 14658424} {"current_steps": 22440, "total_steps": 38160, "loss": 0.3738, "lr": 0.0004338300965710863, "epoch": 11.761006289308176, "percentage": 58.81, "elapsed_time": "0:57:23", "remaining_time": "0:40:11", "throughput": 4258.16, "total_tokens": 14660888} {"current_steps": 22445, "total_steps": 38160, "loss": 0.4356, "lr": 0.0004336034292277853, "epoch": 11.76362683438155, "percentage": 58.82, "elapsed_time": "0:57:23", "remaining_time": "0:40:11", "throughput": 4258.32, "total_tokens": 14664888} {"current_steps": 22450, "total_steps": 38160, "loss": 0.4749, "lr": 0.00043337677577388916, "epoch": 11.766247379454926, "percentage": 58.83, "elapsed_time": "0:57:24", "remaining_time": "0:40:10", "throughput": 4258.33, "total_tokens": 14667864} {"current_steps": 22455, "total_steps": 38160, "loss": 0.497, "lr": 0.0004331501362568116, "epoch": 11.768867924528301, "percentage": 58.84, "elapsed_time": "0:57:25", "remaining_time": "0:40:09", "throughput": 4258.27, "total_tokens": 14670296} {"current_steps": 22460, "total_steps": 38160, "loss": 0.4724, "lr": 0.00043292351072396273, "epoch": 11.771488469601676, "percentage": 58.86, "elapsed_time": "0:57:25", "remaining_time": "0:40:08", "throughput": 4258.33, "total_tokens": 14673592} {"current_steps": 22465, "total_steps": 38160, "loss": 0.4518, "lr": 0.0004326968992227503, "epoch": 11.774109014675052, "percentage": 58.87, "elapsed_time": "0:57:26", "remaining_time": "0:40:07", "throughput": 4258.35, "total_tokens": 14676664} {"current_steps": 22470, "total_steps": 38160, "loss": 0.4472, "lr": 0.0004324703018005786, "epoch": 11.776729559748428, "percentage": 58.88, "elapsed_time": "0:57:27", "remaining_time": "0:40:07", "throughput": 4258.36, "total_tokens": 14679704} {"current_steps": 22475, "total_steps": 38160, "loss": 0.5242, "lr": 0.00043224371850484955, "epoch": 11.779350104821804, "percentage": 58.9, "elapsed_time": "0:57:27", "remaining_time": "0:40:06", "throughput": 4258.31, "total_tokens": 14682360} {"current_steps": 22480, "total_steps": 38160, "loss": 0.378, "lr": 0.0004320171493829614, "epoch": 11.781970649895179, "percentage": 58.91, "elapsed_time": "0:57:28", "remaining_time": "0:40:05", "throughput": 4258.35, "total_tokens": 14685528} {"current_steps": 22485, "total_steps": 38160, "loss": 0.5829, "lr": 0.00043179059448231004, "epoch": 11.784591194968554, "percentage": 58.92, "elapsed_time": "0:57:29", "remaining_time": "0:40:04", "throughput": 4258.38, "total_tokens": 14688600} {"current_steps": 22490, "total_steps": 38160, "loss": 0.5765, "lr": 0.0004315640538502881, "epoch": 11.78721174004193, "percentage": 58.94, "elapsed_time": "0:57:30", "remaining_time": "0:40:03", "throughput": 4258.39, "total_tokens": 14691544} {"current_steps": 22495, "total_steps": 38160, "loss": 0.3459, "lr": 0.00043133752753428547, "epoch": 11.789832285115304, "percentage": 58.95, "elapsed_time": "0:57:30", "remaining_time": "0:40:03", "throughput": 4258.51, "total_tokens": 14695320} {"current_steps": 22500, "total_steps": 38160, "loss": 0.4982, "lr": 0.0004311110155816886, "epoch": 11.79245283018868, "percentage": 58.96, "elapsed_time": "0:57:31", "remaining_time": "0:40:02", "throughput": 4258.64, "total_tokens": 14699192} {"current_steps": 22505, "total_steps": 38160, "loss": 0.4018, "lr": 0.00043088451803988153, "epoch": 11.795073375262055, "percentage": 58.98, "elapsed_time": "0:57:32", "remaining_time": "0:40:01", "throughput": 4258.66, "total_tokens": 14702264} {"current_steps": 22510, "total_steps": 38160, "loss": 0.5669, "lr": 0.00043065803495624465, "epoch": 11.79769392033543, "percentage": 58.99, "elapsed_time": "0:57:33", "remaining_time": "0:40:00", "throughput": 4258.76, "total_tokens": 14705912} {"current_steps": 22515, "total_steps": 38160, "loss": 0.394, "lr": 0.00043043156637815575, "epoch": 11.800314465408805, "percentage": 59.0, "elapsed_time": "0:57:33", "remaining_time": "0:39:59", "throughput": 4258.76, "total_tokens": 14708888} {"current_steps": 22520, "total_steps": 38160, "loss": 0.3604, "lr": 0.00043020511235298956, "epoch": 11.80293501048218, "percentage": 59.01, "elapsed_time": "0:57:34", "remaining_time": "0:39:59", "throughput": 4258.86, "total_tokens": 14712440} {"current_steps": 22525, "total_steps": 38160, "loss": 0.5126, "lr": 0.00042997867292811744, "epoch": 11.805555555555555, "percentage": 59.03, "elapsed_time": "0:57:35", "remaining_time": "0:39:58", "throughput": 4258.8, "total_tokens": 14714968} {"current_steps": 22530, "total_steps": 38160, "loss": 0.5558, "lr": 0.00042975224815090834, "epoch": 11.80817610062893, "percentage": 59.04, "elapsed_time": "0:57:35", "remaining_time": "0:39:57", "throughput": 4258.72, "total_tokens": 14717240} {"current_steps": 22535, "total_steps": 38160, "loss": 0.4849, "lr": 0.0004295258380687274, "epoch": 11.810796645702306, "percentage": 59.05, "elapsed_time": "0:57:36", "remaining_time": "0:39:56", "throughput": 4258.73, "total_tokens": 14720248} {"current_steps": 22540, "total_steps": 38160, "loss": 0.4423, "lr": 0.000429299442728937, "epoch": 11.81341719077568, "percentage": 59.07, "elapsed_time": "0:57:37", "remaining_time": "0:39:55", "throughput": 4258.78, "total_tokens": 14723544} {"current_steps": 22545, "total_steps": 38160, "loss": 0.473, "lr": 0.0004290730621788967, "epoch": 11.816037735849056, "percentage": 59.08, "elapsed_time": "0:57:38", "remaining_time": "0:39:55", "throughput": 4258.91, "total_tokens": 14727416} {"current_steps": 22550, "total_steps": 38160, "loss": 0.4032, "lr": 0.0004288466964659625, "epoch": 11.818658280922431, "percentage": 59.09, "elapsed_time": "0:57:38", "remaining_time": "0:39:54", "throughput": 4258.9, "total_tokens": 14730328} {"current_steps": 22555, "total_steps": 38160, "loss": 0.3732, "lr": 0.0004286203456374877, "epoch": 11.821278825995806, "percentage": 59.11, "elapsed_time": "0:57:39", "remaining_time": "0:39:53", "throughput": 4258.86, "total_tokens": 14732952} {"current_steps": 22560, "total_steps": 38160, "loss": 0.544, "lr": 0.0004283940097408224, "epoch": 11.823899371069182, "percentage": 59.12, "elapsed_time": "0:57:40", "remaining_time": "0:39:52", "throughput": 4258.85, "total_tokens": 14735800} {"current_steps": 22565, "total_steps": 38160, "loss": 0.3865, "lr": 0.00042816768882331324, "epoch": 11.826519916142558, "percentage": 59.13, "elapsed_time": "0:57:40", "remaining_time": "0:39:51", "throughput": 4258.82, "total_tokens": 14738584} {"current_steps": 22570, "total_steps": 38160, "loss": 0.4264, "lr": 0.000427941382932304, "epoch": 11.829140461215934, "percentage": 59.15, "elapsed_time": "0:57:41", "remaining_time": "0:39:50", "throughput": 4258.88, "total_tokens": 14741944} {"current_steps": 22575, "total_steps": 38160, "loss": 0.472, "lr": 0.0004277150921151354, "epoch": 11.831761006289309, "percentage": 59.16, "elapsed_time": "0:57:42", "remaining_time": "0:39:50", "throughput": 4258.97, "total_tokens": 14745496} {"current_steps": 22580, "total_steps": 38160, "loss": 0.3723, "lr": 0.0004274888164191448, "epoch": 11.834381551362684, "percentage": 59.17, "elapsed_time": "0:57:42", "remaining_time": "0:39:49", "throughput": 4258.92, "total_tokens": 14748088} {"current_steps": 22585, "total_steps": 38160, "loss": 0.4577, "lr": 0.00042726255589166666, "epoch": 11.83700209643606, "percentage": 59.19, "elapsed_time": "0:57:43", "remaining_time": "0:39:48", "throughput": 4258.93, "total_tokens": 14751096} {"current_steps": 22590, "total_steps": 38160, "loss": 0.3897, "lr": 0.0004270363105800321, "epoch": 11.839622641509434, "percentage": 59.2, "elapsed_time": "0:57:44", "remaining_time": "0:39:47", "throughput": 4259.0, "total_tokens": 14754488} {"current_steps": 22595, "total_steps": 38160, "loss": 0.35, "lr": 0.0004268100805315688, "epoch": 11.84224318658281, "percentage": 59.21, "elapsed_time": "0:57:44", "remaining_time": "0:39:46", "throughput": 4258.95, "total_tokens": 14757016} {"current_steps": 22600, "total_steps": 38160, "loss": 0.6181, "lr": 0.00042658386579360165, "epoch": 11.844863731656185, "percentage": 59.22, "elapsed_time": "0:57:45", "remaining_time": "0:39:46", "throughput": 4259.0, "total_tokens": 14760280} {"current_steps": 22605, "total_steps": 38160, "loss": 0.4615, "lr": 0.00042635766641345213, "epoch": 11.84748427672956, "percentage": 59.24, "elapsed_time": "0:57:46", "remaining_time": "0:39:45", "throughput": 4258.95, "total_tokens": 14762840} {"current_steps": 22610, "total_steps": 38160, "loss": 0.3186, "lr": 0.0004261314824384388, "epoch": 11.850104821802935, "percentage": 59.25, "elapsed_time": "0:57:47", "remaining_time": "0:39:44", "throughput": 4259.05, "total_tokens": 14766392} {"current_steps": 22615, "total_steps": 38160, "loss": 0.3561, "lr": 0.00042590531391587666, "epoch": 11.85272536687631, "percentage": 59.26, "elapsed_time": "0:57:47", "remaining_time": "0:39:43", "throughput": 4259.18, "total_tokens": 14770264} {"current_steps": 22620, "total_steps": 38160, "loss": 0.3722, "lr": 0.00042567916089307733, "epoch": 11.855345911949685, "percentage": 59.28, "elapsed_time": "0:57:48", "remaining_time": "0:39:42", "throughput": 4259.19, "total_tokens": 14773336} {"current_steps": 22625, "total_steps": 38160, "loss": 0.3967, "lr": 0.00042545302341734977, "epoch": 11.85796645702306, "percentage": 59.29, "elapsed_time": "0:57:49", "remaining_time": "0:39:42", "throughput": 4259.31, "total_tokens": 14777080} {"current_steps": 22630, "total_steps": 38160, "loss": 0.5736, "lr": 0.0004252269015359991, "epoch": 11.860587002096436, "percentage": 59.3, "elapsed_time": "0:57:50", "remaining_time": "0:39:41", "throughput": 4259.34, "total_tokens": 14780280} {"current_steps": 22635, "total_steps": 38160, "loss": 0.452, "lr": 0.00042500079529632763, "epoch": 11.86320754716981, "percentage": 59.32, "elapsed_time": "0:57:50", "remaining_time": "0:39:40", "throughput": 4259.4, "total_tokens": 14783736} {"current_steps": 22640, "total_steps": 38160, "loss": 0.423, "lr": 0.0004247747047456342, "epoch": 11.865828092243186, "percentage": 59.33, "elapsed_time": "0:57:51", "remaining_time": "0:39:39", "throughput": 4259.43, "total_tokens": 14786872} {"current_steps": 22645, "total_steps": 38160, "loss": 0.3553, "lr": 0.0004245486299312144, "epoch": 11.868448637316561, "percentage": 59.34, "elapsed_time": "0:57:52", "remaining_time": "0:39:38", "throughput": 4259.34, "total_tokens": 14789176} {"current_steps": 22650, "total_steps": 38160, "loss": 0.4265, "lr": 0.0004243225709003602, "epoch": 11.871069182389936, "percentage": 59.36, "elapsed_time": "0:57:52", "remaining_time": "0:39:38", "throughput": 4259.34, "total_tokens": 14792152} {"current_steps": 22655, "total_steps": 38160, "loss": 0.5258, "lr": 0.000424096527700361, "epoch": 11.873689727463312, "percentage": 59.37, "elapsed_time": "0:57:53", "remaining_time": "0:39:37", "throughput": 4259.37, "total_tokens": 14795256} {"current_steps": 22660, "total_steps": 38160, "loss": 0.4848, "lr": 0.0004238705003785021, "epoch": 11.876310272536688, "percentage": 59.38, "elapsed_time": "0:57:54", "remaining_time": "0:39:36", "throughput": 4259.39, "total_tokens": 14798360} {"current_steps": 22665, "total_steps": 38160, "loss": 0.5136, "lr": 0.0004236444889820661, "epoch": 11.878930817610064, "percentage": 59.39, "elapsed_time": "0:57:55", "remaining_time": "0:39:35", "throughput": 4259.43, "total_tokens": 14801592} {"current_steps": 22670, "total_steps": 38160, "loss": 0.4938, "lr": 0.0004234184935583318, "epoch": 11.881551362683439, "percentage": 59.41, "elapsed_time": "0:57:55", "remaining_time": "0:39:34", "throughput": 4259.41, "total_tokens": 14804344} {"current_steps": 22675, "total_steps": 38160, "loss": 0.5306, "lr": 0.00042319251415457517, "epoch": 11.884171907756814, "percentage": 59.42, "elapsed_time": "0:57:56", "remaining_time": "0:39:34", "throughput": 4259.41, "total_tokens": 14807288} {"current_steps": 22680, "total_steps": 38160, "loss": 0.4019, "lr": 0.0004229665508180681, "epoch": 11.88679245283019, "percentage": 59.43, "elapsed_time": "0:57:57", "remaining_time": "0:39:33", "throughput": 4259.47, "total_tokens": 14810680} {"current_steps": 22685, "total_steps": 38160, "loss": 0.4963, "lr": 0.0004227406035960798, "epoch": 11.889412997903564, "percentage": 59.45, "elapsed_time": "0:57:57", "remaining_time": "0:39:32", "throughput": 4259.45, "total_tokens": 14813432} {"current_steps": 22690, "total_steps": 38160, "loss": 0.3628, "lr": 0.0004225146725358758, "epoch": 11.89203354297694, "percentage": 59.46, "elapsed_time": "0:57:58", "remaining_time": "0:39:31", "throughput": 4259.5, "total_tokens": 14816664} {"current_steps": 22695, "total_steps": 38160, "loss": 0.4159, "lr": 0.0004222887576847183, "epoch": 11.894654088050315, "percentage": 59.47, "elapsed_time": "0:57:59", "remaining_time": "0:39:30", "throughput": 4259.53, "total_tokens": 14819864} {"current_steps": 22700, "total_steps": 38160, "loss": 0.5369, "lr": 0.00042206285908986626, "epoch": 11.89727463312369, "percentage": 59.49, "elapsed_time": "0:58:00", "remaining_time": "0:39:30", "throughput": 4259.66, "total_tokens": 14823736} {"current_steps": 22705, "total_steps": 38160, "loss": 0.46, "lr": 0.00042183697679857484, "epoch": 11.899895178197065, "percentage": 59.5, "elapsed_time": "0:58:00", "remaining_time": "0:39:29", "throughput": 4259.7, "total_tokens": 14826904} {"current_steps": 22710, "total_steps": 38160, "loss": 0.5257, "lr": 0.00042161111085809604, "epoch": 11.90251572327044, "percentage": 59.51, "elapsed_time": "0:58:01", "remaining_time": "0:39:28", "throughput": 4259.74, "total_tokens": 14830168} {"current_steps": 22715, "total_steps": 38160, "loss": 0.4859, "lr": 0.00042138526131567855, "epoch": 11.905136268343815, "percentage": 59.53, "elapsed_time": "0:58:02", "remaining_time": "0:39:27", "throughput": 4259.94, "total_tokens": 14834520} {"current_steps": 22720, "total_steps": 38160, "loss": 0.4702, "lr": 0.0004211594282185677, "epoch": 11.90775681341719, "percentage": 59.54, "elapsed_time": "0:58:03", "remaining_time": "0:39:27", "throughput": 4260.01, "total_tokens": 14837944} {"current_steps": 22725, "total_steps": 38160, "loss": 0.4367, "lr": 0.0004209336116140048, "epoch": 11.910377358490566, "percentage": 59.55, "elapsed_time": "0:58:03", "remaining_time": "0:39:26", "throughput": 4260.21, "total_tokens": 14842168} {"current_steps": 22730, "total_steps": 38160, "loss": 0.3349, "lr": 0.00042070781154922857, "epoch": 11.91299790356394, "percentage": 59.56, "elapsed_time": "0:58:04", "remaining_time": "0:39:25", "throughput": 4260.21, "total_tokens": 14845112} {"current_steps": 22735, "total_steps": 38160, "loss": 0.5013, "lr": 0.0004204820280714734, "epoch": 11.915618448637316, "percentage": 59.58, "elapsed_time": "0:58:05", "remaining_time": "0:39:24", "throughput": 4260.16, "total_tokens": 14847608} {"current_steps": 22740, "total_steps": 38160, "loss": 0.5022, "lr": 0.00042025626122797066, "epoch": 11.918238993710691, "percentage": 59.59, "elapsed_time": "0:58:06", "remaining_time": "0:39:23", "throughput": 4260.35, "total_tokens": 14852024} {"current_steps": 22745, "total_steps": 38160, "loss": 0.4037, "lr": 0.0004200305110659484, "epoch": 11.920859538784066, "percentage": 59.6, "elapsed_time": "0:58:06", "remaining_time": "0:39:23", "throughput": 4260.4, "total_tokens": 14855288} {"current_steps": 22750, "total_steps": 38160, "loss": 0.3566, "lr": 0.0004198047776326308, "epoch": 11.923480083857442, "percentage": 59.62, "elapsed_time": "0:58:07", "remaining_time": "0:39:22", "throughput": 4260.47, "total_tokens": 14858776} {"current_steps": 22755, "total_steps": 38160, "loss": 0.5025, "lr": 0.00041957906097523897, "epoch": 11.926100628930818, "percentage": 59.63, "elapsed_time": "0:58:08", "remaining_time": "0:39:21", "throughput": 4260.63, "total_tokens": 14862872} {"current_steps": 22760, "total_steps": 38160, "loss": 0.4249, "lr": 0.00041935336114099013, "epoch": 11.928721174004194, "percentage": 59.64, "elapsed_time": "0:58:09", "remaining_time": "0:39:20", "throughput": 4260.59, "total_tokens": 14865496} {"current_steps": 22765, "total_steps": 38160, "loss": 0.4516, "lr": 0.0004191276781770979, "epoch": 11.931341719077569, "percentage": 59.66, "elapsed_time": "0:58:09", "remaining_time": "0:39:19", "throughput": 4260.58, "total_tokens": 14868408} {"current_steps": 22770, "total_steps": 38160, "loss": 0.4697, "lr": 0.00041890201213077286, "epoch": 11.933962264150944, "percentage": 59.67, "elapsed_time": "0:58:10", "remaining_time": "0:39:19", "throughput": 4260.62, "total_tokens": 14871544} {"current_steps": 22775, "total_steps": 38160, "loss": 0.5042, "lr": 0.00041867636304922153, "epoch": 11.93658280922432, "percentage": 59.68, "elapsed_time": "0:58:11", "remaining_time": "0:39:18", "throughput": 4260.63, "total_tokens": 14874520} {"current_steps": 22780, "total_steps": 38160, "loss": 0.5118, "lr": 0.00041845073097964737, "epoch": 11.939203354297694, "percentage": 59.7, "elapsed_time": "0:58:11", "remaining_time": "0:39:17", "throughput": 4260.79, "total_tokens": 14878552} {"current_steps": 22785, "total_steps": 38160, "loss": 0.4589, "lr": 0.0004182251159692498, "epoch": 11.94182389937107, "percentage": 59.71, "elapsed_time": "0:58:12", "remaining_time": "0:39:16", "throughput": 4260.75, "total_tokens": 14881144} {"current_steps": 22790, "total_steps": 38160, "loss": 0.3721, "lr": 0.0004179995180652253, "epoch": 11.944444444444445, "percentage": 59.72, "elapsed_time": "0:58:13", "remaining_time": "0:39:16", "throughput": 4260.96, "total_tokens": 14885560} {"current_steps": 22795, "total_steps": 38160, "loss": 0.4534, "lr": 0.00041777393731476587, "epoch": 11.94706498951782, "percentage": 59.74, "elapsed_time": "0:58:14", "remaining_time": "0:39:15", "throughput": 4261.01, "total_tokens": 14888888} {"current_steps": 22800, "total_steps": 38160, "loss": 0.5185, "lr": 0.0004175483737650608, "epoch": 11.949685534591195, "percentage": 59.75, "elapsed_time": "0:58:14", "remaining_time": "0:39:14", "throughput": 4261.0, "total_tokens": 14891672} {"current_steps": 22805, "total_steps": 38160, "loss": 0.4631, "lr": 0.0004173228274632951, "epoch": 11.95230607966457, "percentage": 59.76, "elapsed_time": "0:58:15", "remaining_time": "0:39:13", "throughput": 4261.02, "total_tokens": 14894680} {"current_steps": 22810, "total_steps": 38160, "loss": 0.4689, "lr": 0.00041709729845665084, "epoch": 11.954926624737945, "percentage": 59.77, "elapsed_time": "0:58:16", "remaining_time": "0:39:12", "throughput": 4261.28, "total_tokens": 14899704} {"current_steps": 22815, "total_steps": 38160, "loss": 0.3472, "lr": 0.0004168717867923061, "epoch": 11.95754716981132, "percentage": 59.79, "elapsed_time": "0:58:17", "remaining_time": "0:39:12", "throughput": 4261.31, "total_tokens": 14902776} {"current_steps": 22820, "total_steps": 38160, "loss": 0.4155, "lr": 0.00041664629251743487, "epoch": 11.960167714884696, "percentage": 59.8, "elapsed_time": "0:58:17", "remaining_time": "0:39:11", "throughput": 4261.29, "total_tokens": 14905560} {"current_steps": 22825, "total_steps": 38160, "loss": 0.4577, "lr": 0.0004164208156792084, "epoch": 11.96278825995807, "percentage": 59.81, "elapsed_time": "0:58:18", "remaining_time": "0:39:10", "throughput": 4261.24, "total_tokens": 14908216} {"current_steps": 22830, "total_steps": 38160, "loss": 0.3825, "lr": 0.00041619535632479374, "epoch": 11.965408805031446, "percentage": 59.83, "elapsed_time": "0:58:19", "remaining_time": "0:39:09", "throughput": 4261.17, "total_tokens": 14910552} {"current_steps": 22835, "total_steps": 38160, "loss": 0.4729, "lr": 0.00041596991450135445, "epoch": 11.968029350104821, "percentage": 59.84, "elapsed_time": "0:58:19", "remaining_time": "0:39:08", "throughput": 4261.26, "total_tokens": 14914232} {"current_steps": 22840, "total_steps": 38160, "loss": 0.4162, "lr": 0.0004157444902560504, "epoch": 11.970649895178196, "percentage": 59.85, "elapsed_time": "0:58:20", "remaining_time": "0:39:08", "throughput": 4261.33, "total_tokens": 14917592} {"current_steps": 22845, "total_steps": 38160, "loss": 0.4925, "lr": 0.00041551908363603786, "epoch": 11.973270440251572, "percentage": 59.87, "elapsed_time": "0:58:21", "remaining_time": "0:39:07", "throughput": 4261.27, "total_tokens": 14920088} {"current_steps": 22850, "total_steps": 38160, "loss": 0.4974, "lr": 0.00041529369468846914, "epoch": 11.975890985324948, "percentage": 59.88, "elapsed_time": "0:58:22", "remaining_time": "0:39:06", "throughput": 4261.37, "total_tokens": 14923768} {"current_steps": 22855, "total_steps": 38160, "loss": 0.4402, "lr": 0.00041506832346049303, "epoch": 11.978511530398324, "percentage": 59.89, "elapsed_time": "0:58:22", "remaining_time": "0:39:05", "throughput": 4261.33, "total_tokens": 14926328} {"current_steps": 22860, "total_steps": 38160, "loss": 0.3896, "lr": 0.00041484296999925476, "epoch": 11.981132075471699, "percentage": 59.91, "elapsed_time": "0:58:23", "remaining_time": "0:39:04", "throughput": 4261.48, "total_tokens": 14930488} {"current_steps": 22865, "total_steps": 38160, "loss": 0.5609, "lr": 0.00041461763435189555, "epoch": 11.983752620545074, "percentage": 59.92, "elapsed_time": "0:58:24", "remaining_time": "0:39:04", "throughput": 4261.46, "total_tokens": 14933240} {"current_steps": 22870, "total_steps": 38160, "loss": 0.3776, "lr": 0.00041439231656555315, "epoch": 11.98637316561845, "percentage": 59.93, "elapsed_time": "0:58:24", "remaining_time": "0:39:03", "throughput": 4261.52, "total_tokens": 14936568} {"current_steps": 22875, "total_steps": 38160, "loss": 0.3843, "lr": 0.0004141670166873617, "epoch": 11.988993710691824, "percentage": 59.94, "elapsed_time": "0:58:25", "remaining_time": "0:39:02", "throughput": 4261.53, "total_tokens": 14939608} {"current_steps": 22880, "total_steps": 38160, "loss": 0.4664, "lr": 0.00041394173476445097, "epoch": 11.9916142557652, "percentage": 59.96, "elapsed_time": "0:58:26", "remaining_time": "0:39:01", "throughput": 4261.54, "total_tokens": 14942584} {"current_steps": 22885, "total_steps": 38160, "loss": 0.4301, "lr": 0.00041371647084394744, "epoch": 11.994234800838575, "percentage": 59.97, "elapsed_time": "0:58:27", "remaining_time": "0:39:00", "throughput": 4261.53, "total_tokens": 14945336} {"current_steps": 22890, "total_steps": 38160, "loss": 0.3586, "lr": 0.00041349122497297394, "epoch": 11.99685534591195, "percentage": 59.98, "elapsed_time": "0:58:27", "remaining_time": "0:39:00", "throughput": 4261.51, "total_tokens": 14948120} {"current_steps": 22895, "total_steps": 38160, "loss": 0.4694, "lr": 0.0004132659971986491, "epoch": 11.999475890985325, "percentage": 60.0, "elapsed_time": "0:58:28", "remaining_time": "0:38:59", "throughput": 4261.56, "total_tokens": 14951480} {"current_steps": 22896, "total_steps": 38160, "eval_loss": 0.48665136098861694, "epoch": 12.0, "percentage": 60.0, "elapsed_time": "0:58:42", "remaining_time": "0:39:08", "throughput": 4244.73, "total_tokens": 14951560} {"current_steps": 22900, "total_steps": 38160, "loss": 0.3937, "lr": 0.00041304078756808837, "epoch": 12.0020964360587, "percentage": 60.01, "elapsed_time": "0:58:44", "remaining_time": "0:39:08", "throughput": 4242.64, "total_tokens": 14953448} {"current_steps": 22905, "total_steps": 38160, "loss": 0.4956, "lr": 0.0004128155961284027, "epoch": 12.004716981132075, "percentage": 60.02, "elapsed_time": "0:58:45", "remaining_time": "0:39:07", "throughput": 4242.81, "total_tokens": 14957736} {"current_steps": 22910, "total_steps": 38160, "loss": 0.3935, "lr": 0.0004125904229266996, "epoch": 12.00733752620545, "percentage": 60.04, "elapsed_time": "0:58:46", "remaining_time": "0:39:07", "throughput": 4242.8, "total_tokens": 14960648} {"current_steps": 22915, "total_steps": 38160, "loss": 0.4173, "lr": 0.0004123652680100828, "epoch": 12.009958071278826, "percentage": 60.05, "elapsed_time": "0:58:46", "remaining_time": "0:39:06", "throughput": 4242.87, "total_tokens": 14964072} {"current_steps": 22920, "total_steps": 38160, "loss": 0.3777, "lr": 0.0004121401314256521, "epoch": 12.0125786163522, "percentage": 60.06, "elapsed_time": "0:58:47", "remaining_time": "0:39:05", "throughput": 4242.84, "total_tokens": 14966696} {"current_steps": 22925, "total_steps": 38160, "loss": 0.4445, "lr": 0.00041191501322050363, "epoch": 12.015199161425576, "percentage": 60.08, "elapsed_time": "0:58:48", "remaining_time": "0:39:04", "throughput": 4242.83, "total_tokens": 14969480} {"current_steps": 22930, "total_steps": 38160, "loss": 0.5453, "lr": 0.0004116899134417296, "epoch": 12.017819706498951, "percentage": 60.09, "elapsed_time": "0:58:48", "remaining_time": "0:39:03", "throughput": 4242.78, "total_tokens": 14972008} {"current_steps": 22935, "total_steps": 38160, "loss": 0.4287, "lr": 0.00041146483213641793, "epoch": 12.020440251572326, "percentage": 60.1, "elapsed_time": "0:58:49", "remaining_time": "0:39:03", "throughput": 4242.81, "total_tokens": 14975176} {"current_steps": 22940, "total_steps": 38160, "loss": 0.3576, "lr": 0.00041123976935165355, "epoch": 12.023060796645701, "percentage": 60.12, "elapsed_time": "0:58:50", "remaining_time": "0:39:02", "throughput": 4242.83, "total_tokens": 14978184} {"current_steps": 22945, "total_steps": 38160, "loss": 0.4852, "lr": 0.0004110147251345165, "epoch": 12.025681341719078, "percentage": 60.13, "elapsed_time": "0:58:50", "remaining_time": "0:39:01", "throughput": 4242.92, "total_tokens": 14981704} {"current_steps": 22950, "total_steps": 38160, "loss": 0.3489, "lr": 0.0004107896995320839, "epoch": 12.028301886792454, "percentage": 60.14, "elapsed_time": "0:58:51", "remaining_time": "0:39:00", "throughput": 4243.0, "total_tokens": 14985192} {"current_steps": 22955, "total_steps": 38160, "loss": 0.4307, "lr": 0.0004105646925914284, "epoch": 12.030922431865829, "percentage": 60.15, "elapsed_time": "0:58:52", "remaining_time": "0:38:59", "throughput": 4242.92, "total_tokens": 14987560} {"current_steps": 22960, "total_steps": 38160, "loss": 0.3625, "lr": 0.00041033970435961904, "epoch": 12.033542976939204, "percentage": 60.17, "elapsed_time": "0:58:53", "remaining_time": "0:38:59", "throughput": 4243.02, "total_tokens": 14991272} {"current_steps": 22965, "total_steps": 38160, "loss": 0.4627, "lr": 0.00041011473488372044, "epoch": 12.036163522012579, "percentage": 60.18, "elapsed_time": "0:58:53", "remaining_time": "0:38:58", "throughput": 4243.11, "total_tokens": 14994792} {"current_steps": 22970, "total_steps": 38160, "loss": 0.3698, "lr": 0.0004098897842107939, "epoch": 12.038784067085954, "percentage": 60.19, "elapsed_time": "0:58:54", "remaining_time": "0:38:57", "throughput": 4243.07, "total_tokens": 14997352} {"current_steps": 22975, "total_steps": 38160, "loss": 0.5398, "lr": 0.00040966485238789634, "epoch": 12.04140461215933, "percentage": 60.21, "elapsed_time": "0:58:55", "remaining_time": "0:38:56", "throughput": 4243.12, "total_tokens": 15000584} {"current_steps": 22980, "total_steps": 38160, "loss": 0.4758, "lr": 0.00040943993946208126, "epoch": 12.044025157232705, "percentage": 60.22, "elapsed_time": "0:58:56", "remaining_time": "0:38:55", "throughput": 4243.25, "total_tokens": 15004488} {"current_steps": 22985, "total_steps": 38160, "loss": 0.4676, "lr": 0.00040921504548039765, "epoch": 12.04664570230608, "percentage": 60.23, "elapsed_time": "0:58:56", "remaining_time": "0:38:55", "throughput": 4243.29, "total_tokens": 15007656} {"current_steps": 22990, "total_steps": 38160, "loss": 0.6438, "lr": 0.00040899017048989073, "epoch": 12.049266247379455, "percentage": 60.25, "elapsed_time": "0:58:57", "remaining_time": "0:38:54", "throughput": 4243.43, "total_tokens": 15011720} {"current_steps": 22995, "total_steps": 38160, "loss": 0.4158, "lr": 0.00040876531453760186, "epoch": 12.05188679245283, "percentage": 60.26, "elapsed_time": "0:58:58", "remaining_time": "0:38:53", "throughput": 4243.41, "total_tokens": 15014376} {"current_steps": 23000, "total_steps": 38160, "loss": 0.5513, "lr": 0.00040854047767056824, "epoch": 12.054507337526205, "percentage": 60.27, "elapsed_time": "0:58:58", "remaining_time": "0:38:52", "throughput": 4243.4, "total_tokens": 15017192} {"current_steps": 23005, "total_steps": 38160, "loss": 0.3834, "lr": 0.00040831565993582335, "epoch": 12.05712788259958, "percentage": 60.29, "elapsed_time": "0:58:59", "remaining_time": "0:38:51", "throughput": 4243.42, "total_tokens": 15020232} {"current_steps": 23010, "total_steps": 38160, "loss": 0.4055, "lr": 0.0004080908613803964, "epoch": 12.059748427672956, "percentage": 60.3, "elapsed_time": "0:59:00", "remaining_time": "0:38:51", "throughput": 4243.56, "total_tokens": 15024104} {"current_steps": 23015, "total_steps": 38160, "loss": 0.4007, "lr": 0.0004078660820513128, "epoch": 12.06236897274633, "percentage": 60.31, "elapsed_time": "0:59:01", "remaining_time": "0:38:50", "throughput": 4243.7, "total_tokens": 15028104} {"current_steps": 23020, "total_steps": 38160, "loss": 0.3415, "lr": 0.0004076413219955937, "epoch": 12.064989517819706, "percentage": 60.32, "elapsed_time": "0:59:01", "remaining_time": "0:38:49", "throughput": 4243.68, "total_tokens": 15030760} {"current_steps": 23025, "total_steps": 38160, "loss": 0.442, "lr": 0.00040741658126025614, "epoch": 12.067610062893081, "percentage": 60.34, "elapsed_time": "0:59:02", "remaining_time": "0:38:48", "throughput": 4243.71, "total_tokens": 15033992} {"current_steps": 23030, "total_steps": 38160, "loss": 0.5042, "lr": 0.0004071918598923136, "epoch": 12.070230607966456, "percentage": 60.35, "elapsed_time": "0:59:03", "remaining_time": "0:38:47", "throughput": 4243.72, "total_tokens": 15036936} {"current_steps": 23035, "total_steps": 38160, "loss": 0.5054, "lr": 0.0004069671579387753, "epoch": 12.072851153039831, "percentage": 60.36, "elapsed_time": "0:59:04", "remaining_time": "0:38:47", "throughput": 4243.76, "total_tokens": 15040104} {"current_steps": 23040, "total_steps": 38160, "loss": 0.3401, "lr": 0.000406742475446646, "epoch": 12.075471698113208, "percentage": 60.38, "elapsed_time": "0:59:04", "remaining_time": "0:38:46", "throughput": 4243.74, "total_tokens": 15042856} {"current_steps": 23045, "total_steps": 38160, "loss": 0.5643, "lr": 0.0004065178124629272, "epoch": 12.078092243186584, "percentage": 60.39, "elapsed_time": "0:59:05", "remaining_time": "0:38:45", "throughput": 4243.74, "total_tokens": 15045736} {"current_steps": 23050, "total_steps": 38160, "loss": 0.4578, "lr": 0.0004062931690346153, "epoch": 12.080712788259959, "percentage": 60.4, "elapsed_time": "0:59:06", "remaining_time": "0:38:44", "throughput": 4243.73, "total_tokens": 15048616} {"current_steps": 23055, "total_steps": 38160, "loss": 0.3702, "lr": 0.0004060685452087034, "epoch": 12.083333333333334, "percentage": 60.42, "elapsed_time": "0:59:06", "remaining_time": "0:38:43", "throughput": 4243.71, "total_tokens": 15051272} {"current_steps": 23060, "total_steps": 38160, "loss": 0.5439, "lr": 0.00040584394103218026, "epoch": 12.085953878406709, "percentage": 60.43, "elapsed_time": "0:59:07", "remaining_time": "0:38:42", "throughput": 4243.76, "total_tokens": 15054504} {"current_steps": 23065, "total_steps": 38160, "loss": 0.4545, "lr": 0.0004056193565520304, "epoch": 12.088574423480084, "percentage": 60.44, "elapsed_time": "0:59:08", "remaining_time": "0:38:42", "throughput": 4243.7, "total_tokens": 15056968} {"current_steps": 23070, "total_steps": 38160, "loss": 0.5651, "lr": 0.0004053947918152344, "epoch": 12.09119496855346, "percentage": 60.46, "elapsed_time": "0:59:08", "remaining_time": "0:38:41", "throughput": 4243.84, "total_tokens": 15060904} {"current_steps": 23075, "total_steps": 38160, "loss": 0.3495, "lr": 0.0004051702468687688, "epoch": 12.093815513626835, "percentage": 60.47, "elapsed_time": "0:59:09", "remaining_time": "0:38:40", "throughput": 4243.88, "total_tokens": 15064136} {"current_steps": 23080, "total_steps": 38160, "loss": 0.4362, "lr": 0.0004049457217596055, "epoch": 12.09643605870021, "percentage": 60.48, "elapsed_time": "0:59:10", "remaining_time": "0:38:39", "throughput": 4243.9, "total_tokens": 15067240} {"current_steps": 23085, "total_steps": 38160, "loss": 0.4298, "lr": 0.0004047212165347129, "epoch": 12.099056603773585, "percentage": 60.5, "elapsed_time": "0:59:11", "remaining_time": "0:38:38", "throughput": 4243.99, "total_tokens": 15070888} {"current_steps": 23090, "total_steps": 38160, "loss": 0.458, "lr": 0.00040449673124105464, "epoch": 12.10167714884696, "percentage": 60.51, "elapsed_time": "0:59:11", "remaining_time": "0:38:38", "throughput": 4243.97, "total_tokens": 15073608} {"current_steps": 23095, "total_steps": 38160, "loss": 0.4388, "lr": 0.00040427226592559064, "epoch": 12.104297693920335, "percentage": 60.52, "elapsed_time": "0:59:12", "remaining_time": "0:38:37", "throughput": 4243.99, "total_tokens": 15076744} {"current_steps": 23100, "total_steps": 38160, "loss": 0.4061, "lr": 0.00040404782063527684, "epoch": 12.10691823899371, "percentage": 60.53, "elapsed_time": "0:59:13", "remaining_time": "0:38:36", "throughput": 4243.99, "total_tokens": 15079560} {"current_steps": 23105, "total_steps": 38160, "loss": 0.4334, "lr": 0.00040382339541706393, "epoch": 12.109538784067086, "percentage": 60.55, "elapsed_time": "0:59:13", "remaining_time": "0:38:35", "throughput": 4243.96, "total_tokens": 15082216} {"current_steps": 23110, "total_steps": 38160, "loss": 0.5261, "lr": 0.0004035989903178995, "epoch": 12.11215932914046, "percentage": 60.56, "elapsed_time": "0:59:14", "remaining_time": "0:38:34", "throughput": 4244.05, "total_tokens": 15085800} {"current_steps": 23115, "total_steps": 38160, "loss": 0.4223, "lr": 0.0004033746053847266, "epoch": 12.114779874213836, "percentage": 60.57, "elapsed_time": "0:59:15", "remaining_time": "0:38:34", "throughput": 4244.12, "total_tokens": 15089192} {"current_steps": 23120, "total_steps": 38160, "loss": 0.6173, "lr": 0.00040315024066448374, "epoch": 12.117400419287211, "percentage": 60.59, "elapsed_time": "0:59:16", "remaining_time": "0:38:33", "throughput": 4244.13, "total_tokens": 15092200} {"current_steps": 23125, "total_steps": 38160, "loss": 0.4896, "lr": 0.00040292589620410577, "epoch": 12.120020964360586, "percentage": 60.6, "elapsed_time": "0:59:16", "remaining_time": "0:38:32", "throughput": 4244.15, "total_tokens": 15095272} {"current_steps": 23130, "total_steps": 38160, "loss": 0.4982, "lr": 0.0004027015720505229, "epoch": 12.122641509433961, "percentage": 60.61, "elapsed_time": "0:59:17", "remaining_time": "0:38:31", "throughput": 4244.14, "total_tokens": 15098088} {"current_steps": 23135, "total_steps": 38160, "loss": 0.4235, "lr": 0.0004024772682506609, "epoch": 12.125262054507338, "percentage": 60.63, "elapsed_time": "0:59:18", "remaining_time": "0:38:30", "throughput": 4244.15, "total_tokens": 15101064} {"current_steps": 23140, "total_steps": 38160, "loss": 0.4127, "lr": 0.0004022529848514419, "epoch": 12.127882599580714, "percentage": 60.64, "elapsed_time": "0:59:18", "remaining_time": "0:38:30", "throughput": 4244.22, "total_tokens": 15104488} {"current_steps": 23145, "total_steps": 38160, "loss": 0.4615, "lr": 0.00040202872189978324, "epoch": 12.130503144654089, "percentage": 60.65, "elapsed_time": "0:59:19", "remaining_time": "0:38:29", "throughput": 4244.27, "total_tokens": 15107784} {"current_steps": 23150, "total_steps": 38160, "loss": 0.4271, "lr": 0.0004018044794425983, "epoch": 12.133123689727464, "percentage": 60.67, "elapsed_time": "0:59:20", "remaining_time": "0:38:28", "throughput": 4244.41, "total_tokens": 15111912} {"current_steps": 23155, "total_steps": 38160, "loss": 0.3526, "lr": 0.00040158025752679596, "epoch": 12.135744234800839, "percentage": 60.68, "elapsed_time": "0:59:21", "remaining_time": "0:38:27", "throughput": 4244.38, "total_tokens": 15114568} {"current_steps": 23160, "total_steps": 38160, "loss": 0.4931, "lr": 0.0004013560561992811, "epoch": 12.138364779874214, "percentage": 60.69, "elapsed_time": "0:59:21", "remaining_time": "0:38:26", "throughput": 4244.38, "total_tokens": 15117384} {"current_steps": 23165, "total_steps": 38160, "loss": 0.3721, "lr": 0.0004011318755069537, "epoch": 12.14098532494759, "percentage": 60.7, "elapsed_time": "0:59:22", "remaining_time": "0:38:26", "throughput": 4244.46, "total_tokens": 15120936} {"current_steps": 23170, "total_steps": 38160, "loss": 0.4157, "lr": 0.00040090771549670994, "epoch": 12.143605870020965, "percentage": 60.72, "elapsed_time": "0:59:23", "remaining_time": "0:38:25", "throughput": 4244.47, "total_tokens": 15123912} {"current_steps": 23175, "total_steps": 38160, "loss": 0.3658, "lr": 0.00040068357621544167, "epoch": 12.14622641509434, "percentage": 60.73, "elapsed_time": "0:59:23", "remaining_time": "0:38:24", "throughput": 4244.43, "total_tokens": 15126504} {"current_steps": 23180, "total_steps": 38160, "loss": 0.5105, "lr": 0.00040045945771003625, "epoch": 12.148846960167715, "percentage": 60.74, "elapsed_time": "0:59:24", "remaining_time": "0:38:23", "throughput": 4244.43, "total_tokens": 15129384} {"current_steps": 23185, "total_steps": 38160, "loss": 0.2965, "lr": 0.0004002353600273767, "epoch": 12.15146750524109, "percentage": 60.76, "elapsed_time": "0:59:25", "remaining_time": "0:38:22", "throughput": 4244.44, "total_tokens": 15132360} {"current_steps": 23190, "total_steps": 38160, "loss": 0.6678, "lr": 0.0004000112832143415, "epoch": 12.154088050314465, "percentage": 60.77, "elapsed_time": "0:59:25", "remaining_time": "0:38:21", "throughput": 4244.5, "total_tokens": 15135784} {"current_steps": 23195, "total_steps": 38160, "loss": 0.4359, "lr": 0.00039978722731780523, "epoch": 12.15670859538784, "percentage": 60.78, "elapsed_time": "0:59:26", "remaining_time": "0:38:21", "throughput": 4244.39, "total_tokens": 15137896} {"current_steps": 23200, "total_steps": 38160, "loss": 0.4467, "lr": 0.00039956319238463754, "epoch": 12.159329140461216, "percentage": 60.8, "elapsed_time": "0:59:27", "remaining_time": "0:38:20", "throughput": 4244.31, "total_tokens": 15140168} {"current_steps": 23205, "total_steps": 38160, "loss": 0.4147, "lr": 0.00039933917846170436, "epoch": 12.16194968553459, "percentage": 60.81, "elapsed_time": "0:59:27", "remaining_time": "0:38:19", "throughput": 4244.36, "total_tokens": 15143432} {"current_steps": 23210, "total_steps": 38160, "loss": 0.3771, "lr": 0.0003991151855958665, "epoch": 12.164570230607966, "percentage": 60.82, "elapsed_time": "0:59:28", "remaining_time": "0:38:18", "throughput": 4244.38, "total_tokens": 15146440} {"current_steps": 23215, "total_steps": 38160, "loss": 0.4521, "lr": 0.00039889121383398113, "epoch": 12.167190775681341, "percentage": 60.84, "elapsed_time": "0:59:29", "remaining_time": "0:38:17", "throughput": 4244.35, "total_tokens": 15149064} {"current_steps": 23220, "total_steps": 38160, "loss": 0.3694, "lr": 0.00039866726322290014, "epoch": 12.169811320754716, "percentage": 60.85, "elapsed_time": "0:59:29", "remaining_time": "0:38:16", "throughput": 4244.27, "total_tokens": 15151336} {"current_steps": 23225, "total_steps": 38160, "loss": 0.4842, "lr": 0.0003984433338094715, "epoch": 12.172431865828091, "percentage": 60.86, "elapsed_time": "0:59:30", "remaining_time": "0:38:16", "throughput": 4244.22, "total_tokens": 15153928} {"current_steps": 23230, "total_steps": 38160, "loss": 0.5913, "lr": 0.000398219425640539, "epoch": 12.175052410901468, "percentage": 60.88, "elapsed_time": "0:59:31", "remaining_time": "0:38:15", "throughput": 4244.33, "total_tokens": 15157736} {"current_steps": 23235, "total_steps": 38160, "loss": 0.5305, "lr": 0.0003979955387629413, "epoch": 12.177672955974844, "percentage": 60.89, "elapsed_time": "0:59:31", "remaining_time": "0:38:14", "throughput": 4244.33, "total_tokens": 15160616} {"current_steps": 23240, "total_steps": 38160, "loss": 0.4989, "lr": 0.0003977716732235133, "epoch": 12.180293501048219, "percentage": 60.9, "elapsed_time": "0:59:32", "remaining_time": "0:38:13", "throughput": 4244.37, "total_tokens": 15163784} {"current_steps": 23245, "total_steps": 38160, "loss": 0.3593, "lr": 0.000397547829069085, "epoch": 12.182914046121594, "percentage": 60.91, "elapsed_time": "0:59:33", "remaining_time": "0:38:12", "throughput": 4244.4, "total_tokens": 15166888} {"current_steps": 23250, "total_steps": 38160, "loss": 0.5148, "lr": 0.000397324006346482, "epoch": 12.185534591194969, "percentage": 60.93, "elapsed_time": "0:59:34", "remaining_time": "0:38:12", "throughput": 4244.39, "total_tokens": 15169768} {"current_steps": 23255, "total_steps": 38160, "loss": 0.5865, "lr": 0.0003971002051025253, "epoch": 12.188155136268344, "percentage": 60.94, "elapsed_time": "0:59:34", "remaining_time": "0:38:11", "throughput": 4244.32, "total_tokens": 15172168} {"current_steps": 23260, "total_steps": 38160, "loss": 0.3492, "lr": 0.000396876425384032, "epoch": 12.19077568134172, "percentage": 60.95, "elapsed_time": "0:59:35", "remaining_time": "0:38:10", "throughput": 4244.31, "total_tokens": 15174984} {"current_steps": 23265, "total_steps": 38160, "loss": 0.413, "lr": 0.00039665266723781377, "epoch": 12.193396226415095, "percentage": 60.97, "elapsed_time": "0:59:36", "remaining_time": "0:38:09", "throughput": 4244.37, "total_tokens": 15178344} {"current_steps": 23270, "total_steps": 38160, "loss": 0.4865, "lr": 0.00039642893071067877, "epoch": 12.19601677148847, "percentage": 60.98, "elapsed_time": "0:59:36", "remaining_time": "0:38:08", "throughput": 4244.53, "total_tokens": 15182408} {"current_steps": 23275, "total_steps": 38160, "loss": 0.2909, "lr": 0.0003962052158494298, "epoch": 12.198637316561845, "percentage": 60.99, "elapsed_time": "0:59:37", "remaining_time": "0:38:08", "throughput": 4244.65, "total_tokens": 15186216} {"current_steps": 23280, "total_steps": 38160, "loss": 0.5098, "lr": 0.00039598152270086534, "epoch": 12.20125786163522, "percentage": 61.01, "elapsed_time": "0:59:38", "remaining_time": "0:38:07", "throughput": 4244.7, "total_tokens": 15189480} {"current_steps": 23285, "total_steps": 38160, "loss": 0.4165, "lr": 0.00039575785131177975, "epoch": 12.203878406708595, "percentage": 61.02, "elapsed_time": "0:59:39", "remaining_time": "0:38:06", "throughput": 4244.68, "total_tokens": 15192168} {"current_steps": 23290, "total_steps": 38160, "loss": 0.3839, "lr": 0.0003955342017289624, "epoch": 12.20649895178197, "percentage": 61.03, "elapsed_time": "0:59:39", "remaining_time": "0:38:05", "throughput": 4244.69, "total_tokens": 15195240} {"current_steps": 23295, "total_steps": 38160, "loss": 0.5791, "lr": 0.0003953105739991982, "epoch": 12.209119496855346, "percentage": 61.05, "elapsed_time": "0:59:40", "remaining_time": "0:38:04", "throughput": 4244.67, "total_tokens": 15198056} {"current_steps": 23300, "total_steps": 38160, "loss": 0.4963, "lr": 0.0003950869681692678, "epoch": 12.21174004192872, "percentage": 61.06, "elapsed_time": "0:59:41", "remaining_time": "0:38:03", "throughput": 4244.73, "total_tokens": 15201320} {"current_steps": 23305, "total_steps": 38160, "loss": 0.4726, "lr": 0.0003948633842859465, "epoch": 12.214360587002096, "percentage": 61.07, "elapsed_time": "0:59:42", "remaining_time": "0:38:03", "throughput": 4244.89, "total_tokens": 15205576} {"current_steps": 23310, "total_steps": 38160, "loss": 0.3783, "lr": 0.00039463982239600575, "epoch": 12.216981132075471, "percentage": 61.08, "elapsed_time": "0:59:42", "remaining_time": "0:38:02", "throughput": 4244.87, "total_tokens": 15208232} {"current_steps": 23315, "total_steps": 38160, "loss": 0.3845, "lr": 0.00039441628254621215, "epoch": 12.219601677148846, "percentage": 61.1, "elapsed_time": "0:59:43", "remaining_time": "0:38:01", "throughput": 4245.02, "total_tokens": 15212264} {"current_steps": 23320, "total_steps": 38160, "loss": 0.4115, "lr": 0.00039419276478332773, "epoch": 12.222222222222221, "percentage": 61.11, "elapsed_time": "0:59:44", "remaining_time": "0:38:00", "throughput": 4245.02, "total_tokens": 15215144} {"current_steps": 23325, "total_steps": 38160, "loss": 0.4337, "lr": 0.0003939692691541097, "epoch": 12.224842767295598, "percentage": 61.12, "elapsed_time": "0:59:44", "remaining_time": "0:38:00", "throughput": 4244.98, "total_tokens": 15217864} {"current_steps": 23330, "total_steps": 38160, "loss": 0.3972, "lr": 0.00039374579570531114, "epoch": 12.227463312368974, "percentage": 61.14, "elapsed_time": "0:59:45", "remaining_time": "0:37:59", "throughput": 4245.03, "total_tokens": 15221096} {"current_steps": 23335, "total_steps": 38160, "loss": 0.4468, "lr": 0.0003935223444836797, "epoch": 12.230083857442349, "percentage": 61.15, "elapsed_time": "0:59:46", "remaining_time": "0:37:58", "throughput": 4245.11, "total_tokens": 15224584} {"current_steps": 23340, "total_steps": 38160, "loss": 0.3527, "lr": 0.0003932989155359591, "epoch": 12.232704402515724, "percentage": 61.16, "elapsed_time": "0:59:46", "remaining_time": "0:37:57", "throughput": 4245.03, "total_tokens": 15226888} {"current_steps": 23345, "total_steps": 38160, "loss": 0.4608, "lr": 0.000393075508908888, "epoch": 12.235324947589099, "percentage": 61.18, "elapsed_time": "0:59:47", "remaining_time": "0:37:56", "throughput": 4245.18, "total_tokens": 15231016} {"current_steps": 23350, "total_steps": 38160, "loss": 0.4293, "lr": 0.00039285212464920064, "epoch": 12.237945492662474, "percentage": 61.19, "elapsed_time": "0:59:48", "remaining_time": "0:37:56", "throughput": 4245.14, "total_tokens": 15233640} {"current_steps": 23355, "total_steps": 38160, "loss": 0.3966, "lr": 0.0003926287628036265, "epoch": 12.24056603773585, "percentage": 61.2, "elapsed_time": "0:59:49", "remaining_time": "0:37:55", "throughput": 4245.24, "total_tokens": 15237256} {"current_steps": 23360, "total_steps": 38160, "loss": 0.3149, "lr": 0.00039240542341889003, "epoch": 12.243186582809225, "percentage": 61.22, "elapsed_time": "0:59:49", "remaining_time": "0:37:54", "throughput": 4245.23, "total_tokens": 15240136} {"current_steps": 23365, "total_steps": 38160, "loss": 0.5136, "lr": 0.0003921821065417116, "epoch": 12.2458071278826, "percentage": 61.23, "elapsed_time": "0:59:50", "remaining_time": "0:37:53", "throughput": 4245.31, "total_tokens": 15243592} {"current_steps": 23370, "total_steps": 38160, "loss": 0.6334, "lr": 0.0003919588122188063, "epoch": 12.248427672955975, "percentage": 61.24, "elapsed_time": "0:59:51", "remaining_time": "0:37:52", "throughput": 4245.27, "total_tokens": 15246216} {"current_steps": 23375, "total_steps": 38160, "loss": 0.5423, "lr": 0.000391735540496885, "epoch": 12.25104821802935, "percentage": 61.26, "elapsed_time": "0:59:52", "remaining_time": "0:37:52", "throughput": 4245.31, "total_tokens": 15249384} {"current_steps": 23380, "total_steps": 38160, "loss": 0.386, "lr": 0.00039151229142265337, "epoch": 12.253668763102725, "percentage": 61.27, "elapsed_time": "0:59:52", "remaining_time": "0:37:51", "throughput": 4245.37, "total_tokens": 15252648} {"current_steps": 23385, "total_steps": 38160, "loss": 0.3963, "lr": 0.00039128906504281295, "epoch": 12.2562893081761, "percentage": 61.28, "elapsed_time": "0:59:53", "remaining_time": "0:37:50", "throughput": 4245.59, "total_tokens": 15257448} {"current_steps": 23390, "total_steps": 38160, "loss": 0.5658, "lr": 0.00039106586140405964, "epoch": 12.258909853249476, "percentage": 61.29, "elapsed_time": "0:59:54", "remaining_time": "0:37:49", "throughput": 4245.57, "total_tokens": 15260168} {"current_steps": 23395, "total_steps": 38160, "loss": 0.5233, "lr": 0.00039084268055308537, "epoch": 12.26153039832285, "percentage": 61.31, "elapsed_time": "0:59:55", "remaining_time": "0:37:49", "throughput": 4245.77, "total_tokens": 15264744} {"current_steps": 23400, "total_steps": 38160, "loss": 0.2595, "lr": 0.00039061952253657703, "epoch": 12.264150943396226, "percentage": 61.32, "elapsed_time": "0:59:55", "remaining_time": "0:37:48", "throughput": 4245.77, "total_tokens": 15267656} {"current_steps": 23405, "total_steps": 38160, "loss": 0.4194, "lr": 0.0003903963874012166, "epoch": 12.266771488469601, "percentage": 61.33, "elapsed_time": "0:59:56", "remaining_time": "0:37:47", "throughput": 4245.84, "total_tokens": 15271080} {"current_steps": 23410, "total_steps": 38160, "loss": 0.3253, "lr": 0.0003901732751936815, "epoch": 12.269392033542976, "percentage": 61.35, "elapsed_time": "0:59:57", "remaining_time": "0:37:46", "throughput": 4245.97, "total_tokens": 15274920} {"current_steps": 23415, "total_steps": 38160, "loss": 0.516, "lr": 0.00038995018596064447, "epoch": 12.272012578616351, "percentage": 61.36, "elapsed_time": "0:59:58", "remaining_time": "0:37:45", "throughput": 4245.92, "total_tokens": 15277384} {"current_steps": 23420, "total_steps": 38160, "loss": 0.4595, "lr": 0.00038972711974877294, "epoch": 12.274633123689728, "percentage": 61.37, "elapsed_time": "0:59:58", "remaining_time": "0:37:45", "throughput": 4246.05, "total_tokens": 15281352} {"current_steps": 23425, "total_steps": 38160, "loss": 0.3461, "lr": 0.0003895040766047298, "epoch": 12.277253668763104, "percentage": 61.39, "elapsed_time": "0:59:59", "remaining_time": "0:37:44", "throughput": 4246.0, "total_tokens": 15283816} {"current_steps": 23430, "total_steps": 38160, "loss": 0.3421, "lr": 0.0003892810565751733, "epoch": 12.279874213836479, "percentage": 61.4, "elapsed_time": "1:00:00", "remaining_time": "0:37:43", "throughput": 4245.97, "total_tokens": 15286472} {"current_steps": 23435, "total_steps": 38160, "loss": 0.3562, "lr": 0.0003890580597067566, "epoch": 12.282494758909854, "percentage": 61.41, "elapsed_time": "1:00:00", "remaining_time": "0:37:42", "throughput": 4246.07, "total_tokens": 15290088} {"current_steps": 23440, "total_steps": 38160, "loss": 0.4451, "lr": 0.0003888350860461281, "epoch": 12.285115303983229, "percentage": 61.43, "elapsed_time": "1:00:01", "remaining_time": "0:37:41", "throughput": 4246.1, "total_tokens": 15293192} {"current_steps": 23445, "total_steps": 38160, "loss": 0.3654, "lr": 0.0003886121356399315, "epoch": 12.287735849056604, "percentage": 61.44, "elapsed_time": "1:00:02", "remaining_time": "0:37:40", "throughput": 4246.09, "total_tokens": 15295976} {"current_steps": 23450, "total_steps": 38160, "loss": 0.4452, "lr": 0.0003883892085348052, "epoch": 12.29035639412998, "percentage": 61.45, "elapsed_time": "1:00:03", "remaining_time": "0:37:40", "throughput": 4246.06, "total_tokens": 15298664} {"current_steps": 23455, "total_steps": 38160, "loss": 0.5439, "lr": 0.0003881663047773832, "epoch": 12.292976939203355, "percentage": 61.46, "elapsed_time": "1:00:03", "remaining_time": "0:37:39", "throughput": 4246.09, "total_tokens": 15301864} {"current_steps": 23460, "total_steps": 38160, "loss": 0.3187, "lr": 0.00038794342441429426, "epoch": 12.29559748427673, "percentage": 61.48, "elapsed_time": "1:00:04", "remaining_time": "0:37:38", "throughput": 4246.16, "total_tokens": 15305288} {"current_steps": 23465, "total_steps": 38160, "loss": 0.531, "lr": 0.00038772056749216267, "epoch": 12.298218029350105, "percentage": 61.49, "elapsed_time": "1:00:05", "remaining_time": "0:37:37", "throughput": 4246.19, "total_tokens": 15308456} {"current_steps": 23470, "total_steps": 38160, "loss": 0.4306, "lr": 0.00038749773405760744, "epoch": 12.30083857442348, "percentage": 61.5, "elapsed_time": "1:00:05", "remaining_time": "0:37:36", "throughput": 4246.22, "total_tokens": 15311656} {"current_steps": 23475, "total_steps": 38160, "loss": 0.4054, "lr": 0.00038727492415724265, "epoch": 12.303459119496855, "percentage": 61.52, "elapsed_time": "1:00:06", "remaining_time": "0:37:36", "throughput": 4246.19, "total_tokens": 15314472} {"current_steps": 23480, "total_steps": 38160, "loss": 0.4681, "lr": 0.00038705213783767767, "epoch": 12.30607966457023, "percentage": 61.53, "elapsed_time": "1:00:07", "remaining_time": "0:37:35", "throughput": 4246.19, "total_tokens": 15317256} {"current_steps": 23485, "total_steps": 38160, "loss": 0.3279, "lr": 0.00038682937514551686, "epoch": 12.308700209643606, "percentage": 61.54, "elapsed_time": "1:00:07", "remaining_time": "0:37:34", "throughput": 4246.16, "total_tokens": 15319976} {"current_steps": 23490, "total_steps": 38160, "loss": 0.3945, "lr": 0.0003866066361273596, "epoch": 12.31132075471698, "percentage": 61.56, "elapsed_time": "1:00:08", "remaining_time": "0:37:33", "throughput": 4246.19, "total_tokens": 15323080} {"current_steps": 23495, "total_steps": 38160, "loss": 0.5033, "lr": 0.00038638392082980056, "epoch": 12.313941299790356, "percentage": 61.57, "elapsed_time": "1:00:09", "remaining_time": "0:37:32", "throughput": 4246.22, "total_tokens": 15326280} {"current_steps": 23500, "total_steps": 38160, "loss": 0.383, "lr": 0.0003861612292994292, "epoch": 12.316561844863731, "percentage": 61.58, "elapsed_time": "1:00:10", "remaining_time": "0:37:32", "throughput": 4246.19, "total_tokens": 15328872} {"current_steps": 23505, "total_steps": 38160, "loss": 0.4495, "lr": 0.0003859385615828297, "epoch": 12.319182389937106, "percentage": 61.6, "elapsed_time": "1:00:10", "remaining_time": "0:37:31", "throughput": 4246.21, "total_tokens": 15332008} {"current_steps": 23510, "total_steps": 38160, "loss": 0.5076, "lr": 0.00038571591772658186, "epoch": 12.321802935010481, "percentage": 61.61, "elapsed_time": "1:00:11", "remaining_time": "0:37:30", "throughput": 4246.45, "total_tokens": 15336712} {"current_steps": 23515, "total_steps": 38160, "loss": 0.5204, "lr": 0.0003854932977772602, "epoch": 12.324423480083858, "percentage": 61.62, "elapsed_time": "1:00:12", "remaining_time": "0:37:29", "throughput": 4246.42, "total_tokens": 15339368} {"current_steps": 23520, "total_steps": 38160, "loss": 0.2908, "lr": 0.00038527070178143435, "epoch": 12.327044025157234, "percentage": 61.64, "elapsed_time": "1:00:13", "remaining_time": "0:37:29", "throughput": 4246.61, "total_tokens": 15343656} {"current_steps": 23525, "total_steps": 38160, "loss": 0.4929, "lr": 0.00038504812978566873, "epoch": 12.329664570230609, "percentage": 61.65, "elapsed_time": "1:00:13", "remaining_time": "0:37:28", "throughput": 4246.7, "total_tokens": 15347368} {"current_steps": 23530, "total_steps": 38160, "loss": 0.3918, "lr": 0.00038482558183652307, "epoch": 12.332285115303984, "percentage": 61.66, "elapsed_time": "1:00:14", "remaining_time": "0:37:27", "throughput": 4246.74, "total_tokens": 15350536} {"current_steps": 23535, "total_steps": 38160, "loss": 0.4208, "lr": 0.00038460305798055164, "epoch": 12.334905660377359, "percentage": 61.67, "elapsed_time": "1:00:15", "remaining_time": "0:37:26", "throughput": 4246.72, "total_tokens": 15353448} {"current_steps": 23540, "total_steps": 38160, "loss": 0.5213, "lr": 0.00038438055826430385, "epoch": 12.337526205450734, "percentage": 61.69, "elapsed_time": "1:00:16", "remaining_time": "0:37:25", "throughput": 4246.85, "total_tokens": 15357288} {"current_steps": 23545, "total_steps": 38160, "loss": 0.3631, "lr": 0.0003841580827343243, "epoch": 12.34014675052411, "percentage": 61.7, "elapsed_time": "1:00:16", "remaining_time": "0:37:25", "throughput": 4246.85, "total_tokens": 15360200} {"current_steps": 23550, "total_steps": 38160, "loss": 0.4629, "lr": 0.00038393563143715215, "epoch": 12.342767295597485, "percentage": 61.71, "elapsed_time": "1:00:17", "remaining_time": "0:37:24", "throughput": 4246.9, "total_tokens": 15363496} {"current_steps": 23555, "total_steps": 38160, "loss": 0.7057, "lr": 0.00038371320441932195, "epoch": 12.34538784067086, "percentage": 61.73, "elapsed_time": "1:00:18", "remaining_time": "0:37:23", "throughput": 4246.86, "total_tokens": 15366120} {"current_steps": 23560, "total_steps": 38160, "loss": 0.4816, "lr": 0.00038349080172736267, "epoch": 12.348008385744235, "percentage": 61.74, "elapsed_time": "1:00:19", "remaining_time": "0:37:22", "throughput": 4246.98, "total_tokens": 15369960} {"current_steps": 23565, "total_steps": 38160, "loss": 0.3905, "lr": 0.00038326842340779833, "epoch": 12.35062893081761, "percentage": 61.75, "elapsed_time": "1:00:19", "remaining_time": "0:37:21", "throughput": 4247.0, "total_tokens": 15372904} {"current_steps": 23570, "total_steps": 38160, "loss": 0.4294, "lr": 0.00038304606950714803, "epoch": 12.353249475890985, "percentage": 61.77, "elapsed_time": "1:00:20", "remaining_time": "0:37:21", "throughput": 4247.01, "total_tokens": 15375880} {"current_steps": 23575, "total_steps": 38160, "loss": 0.4898, "lr": 0.0003828237400719259, "epoch": 12.35587002096436, "percentage": 61.78, "elapsed_time": "1:00:21", "remaining_time": "0:37:20", "throughput": 4247.03, "total_tokens": 15379016} {"current_steps": 23580, "total_steps": 38160, "loss": 0.4491, "lr": 0.00038260143514864037, "epoch": 12.358490566037736, "percentage": 61.79, "elapsed_time": "1:00:21", "remaining_time": "0:37:19", "throughput": 4247.0, "total_tokens": 15381704} {"current_steps": 23585, "total_steps": 38160, "loss": 0.4157, "lr": 0.0003823791547837955, "epoch": 12.36111111111111, "percentage": 61.81, "elapsed_time": "1:00:22", "remaining_time": "0:37:18", "throughput": 4246.99, "total_tokens": 15384488} {"current_steps": 23590, "total_steps": 38160, "loss": 0.5008, "lr": 0.0003821568990238894, "epoch": 12.363731656184486, "percentage": 61.82, "elapsed_time": "1:00:23", "remaining_time": "0:37:17", "throughput": 4247.02, "total_tokens": 15387688} {"current_steps": 23595, "total_steps": 38160, "loss": 0.3809, "lr": 0.0003819346679154155, "epoch": 12.366352201257861, "percentage": 61.83, "elapsed_time": "1:00:23", "remaining_time": "0:37:17", "throughput": 4247.09, "total_tokens": 15391176} {"current_steps": 23600, "total_steps": 38160, "loss": 0.3425, "lr": 0.0003817124615048623, "epoch": 12.368972746331236, "percentage": 61.84, "elapsed_time": "1:00:24", "remaining_time": "0:37:16", "throughput": 4247.17, "total_tokens": 15394600} {"current_steps": 23605, "total_steps": 38160, "loss": 0.4687, "lr": 0.00038149027983871243, "epoch": 12.371593291404611, "percentage": 61.86, "elapsed_time": "1:00:25", "remaining_time": "0:37:15", "throughput": 4247.17, "total_tokens": 15397448} {"current_steps": 23610, "total_steps": 38160, "loss": 0.4004, "lr": 0.00038126812296344415, "epoch": 12.374213836477987, "percentage": 61.87, "elapsed_time": "1:00:26", "remaining_time": "0:37:14", "throughput": 4247.28, "total_tokens": 15401096} {"current_steps": 23615, "total_steps": 38160, "loss": 0.4917, "lr": 0.0003810459909255301, "epoch": 12.376834381551364, "percentage": 61.88, "elapsed_time": "1:00:26", "remaining_time": "0:37:13", "throughput": 4247.26, "total_tokens": 15403912} {"current_steps": 23620, "total_steps": 38160, "loss": 0.5309, "lr": 0.0003808238837714374, "epoch": 12.379454926624739, "percentage": 61.9, "elapsed_time": "1:00:27", "remaining_time": "0:37:12", "throughput": 4247.25, "total_tokens": 15406632} {"current_steps": 23625, "total_steps": 38160, "loss": 0.4491, "lr": 0.0003806018015476287, "epoch": 12.382075471698114, "percentage": 61.91, "elapsed_time": "1:00:28", "remaining_time": "0:37:12", "throughput": 4247.43, "total_tokens": 15410888} {"current_steps": 23630, "total_steps": 38160, "loss": 0.5601, "lr": 0.0003803797443005609, "epoch": 12.384696016771489, "percentage": 61.92, "elapsed_time": "1:00:28", "remaining_time": "0:37:11", "throughput": 4247.43, "total_tokens": 15413864} {"current_steps": 23635, "total_steps": 38160, "loss": 0.3132, "lr": 0.0003801577120766859, "epoch": 12.387316561844864, "percentage": 61.94, "elapsed_time": "1:00:29", "remaining_time": "0:37:10", "throughput": 4247.46, "total_tokens": 15416936} {"current_steps": 23640, "total_steps": 38160, "loss": 0.4275, "lr": 0.0003799357049224505, "epoch": 12.38993710691824, "percentage": 61.95, "elapsed_time": "1:00:30", "remaining_time": "0:37:09", "throughput": 4247.56, "total_tokens": 15420648} {"current_steps": 23645, "total_steps": 38160, "loss": 0.3617, "lr": 0.0003797137228842956, "epoch": 12.392557651991615, "percentage": 61.96, "elapsed_time": "1:00:31", "remaining_time": "0:37:09", "throughput": 4247.52, "total_tokens": 15423240} {"current_steps": 23650, "total_steps": 38160, "loss": 0.4928, "lr": 0.0003794917660086576, "epoch": 12.39517819706499, "percentage": 61.98, "elapsed_time": "1:00:31", "remaining_time": "0:37:08", "throughput": 4247.64, "total_tokens": 15427240} {"current_steps": 23655, "total_steps": 38160, "loss": 0.4828, "lr": 0.0003792698343419674, "epoch": 12.397798742138365, "percentage": 61.99, "elapsed_time": "1:00:32", "remaining_time": "0:37:07", "throughput": 4247.72, "total_tokens": 15430696} {"current_steps": 23660, "total_steps": 38160, "loss": 0.4679, "lr": 0.0003790479279306505, "epoch": 12.40041928721174, "percentage": 62.0, "elapsed_time": "1:00:33", "remaining_time": "0:37:06", "throughput": 4247.86, "total_tokens": 15434696} {"current_steps": 23665, "total_steps": 38160, "loss": 0.5475, "lr": 0.0003788260468211271, "epoch": 12.403039832285115, "percentage": 62.02, "elapsed_time": "1:00:34", "remaining_time": "0:37:06", "throughput": 4248.01, "total_tokens": 15438824} {"current_steps": 23670, "total_steps": 38160, "loss": 0.4566, "lr": 0.0003786041910598125, "epoch": 12.40566037735849, "percentage": 62.03, "elapsed_time": "1:00:35", "remaining_time": "0:37:05", "throughput": 4248.02, "total_tokens": 15441736} {"current_steps": 23675, "total_steps": 38160, "loss": 0.5884, "lr": 0.0003783823606931159, "epoch": 12.408280922431866, "percentage": 62.04, "elapsed_time": "1:00:35", "remaining_time": "0:37:04", "throughput": 4247.96, "total_tokens": 15444200} {"current_steps": 23680, "total_steps": 38160, "loss": 0.4351, "lr": 0.0003781605557674421, "epoch": 12.41090146750524, "percentage": 62.05, "elapsed_time": "1:00:36", "remaining_time": "0:37:03", "throughput": 4247.99, "total_tokens": 15447432} {"current_steps": 23685, "total_steps": 38160, "loss": 0.3531, "lr": 0.0003779387763291899, "epoch": 12.413522012578616, "percentage": 62.07, "elapsed_time": "1:00:37", "remaining_time": "0:37:02", "throughput": 4248.1, "total_tokens": 15451240} {"current_steps": 23690, "total_steps": 38160, "loss": 0.5841, "lr": 0.0003777170224247533, "epoch": 12.416142557651991, "percentage": 62.08, "elapsed_time": "1:00:37", "remaining_time": "0:37:02", "throughput": 4248.09, "total_tokens": 15454024} {"current_steps": 23695, "total_steps": 38160, "loss": 0.399, "lr": 0.0003774952941005204, "epoch": 12.418763102725366, "percentage": 62.09, "elapsed_time": "1:00:38", "remaining_time": "0:37:01", "throughput": 4248.13, "total_tokens": 15457160} {"current_steps": 23700, "total_steps": 38160, "loss": 0.5963, "lr": 0.00037727359140287455, "epoch": 12.421383647798741, "percentage": 62.11, "elapsed_time": "1:00:39", "remaining_time": "0:37:00", "throughput": 4248.23, "total_tokens": 15460840} {"current_steps": 23705, "total_steps": 38160, "loss": 0.3715, "lr": 0.00037705191437819316, "epoch": 12.424004192872117, "percentage": 62.12, "elapsed_time": "1:00:40", "remaining_time": "0:36:59", "throughput": 4248.24, "total_tokens": 15463752} {"current_steps": 23710, "total_steps": 38160, "loss": 0.3637, "lr": 0.00037683026307284853, "epoch": 12.426624737945493, "percentage": 62.13, "elapsed_time": "1:00:40", "remaining_time": "0:36:58", "throughput": 4248.21, "total_tokens": 15466408} {"current_steps": 23715, "total_steps": 38160, "loss": 0.4374, "lr": 0.0003766086375332077, "epoch": 12.429245283018869, "percentage": 62.15, "elapsed_time": "1:00:41", "remaining_time": "0:36:58", "throughput": 4248.27, "total_tokens": 15469864} {"current_steps": 23720, "total_steps": 38160, "loss": 0.4101, "lr": 0.0003763870378056321, "epoch": 12.431865828092244, "percentage": 62.16, "elapsed_time": "1:00:42", "remaining_time": "0:36:57", "throughput": 4248.49, "total_tokens": 15474504} {"current_steps": 23725, "total_steps": 38160, "loss": 0.3931, "lr": 0.00037616546393647824, "epoch": 12.434486373165619, "percentage": 62.17, "elapsed_time": "1:00:43", "remaining_time": "0:36:56", "throughput": 4248.62, "total_tokens": 15478408} {"current_steps": 23730, "total_steps": 38160, "loss": 0.5243, "lr": 0.0003759439159720962, "epoch": 12.437106918238994, "percentage": 62.19, "elapsed_time": "1:00:43", "remaining_time": "0:36:55", "throughput": 4248.65, "total_tokens": 15481640} {"current_steps": 23735, "total_steps": 38160, "loss": 0.4379, "lr": 0.0003757223939588318, "epoch": 12.43972746331237, "percentage": 62.2, "elapsed_time": "1:00:44", "remaining_time": "0:36:55", "throughput": 4248.66, "total_tokens": 15484648} {"current_steps": 23740, "total_steps": 38160, "loss": 0.4271, "lr": 0.00037550089794302464, "epoch": 12.442348008385745, "percentage": 62.21, "elapsed_time": "1:00:45", "remaining_time": "0:36:54", "throughput": 4248.65, "total_tokens": 15487560} {"current_steps": 23745, "total_steps": 38160, "loss": 0.4045, "lr": 0.0003752794279710094, "epoch": 12.44496855345912, "percentage": 62.22, "elapsed_time": "1:00:46", "remaining_time": "0:36:53", "throughput": 4248.83, "total_tokens": 15491784} {"current_steps": 23750, "total_steps": 38160, "loss": 0.4926, "lr": 0.0003750579840891148, "epoch": 12.447589098532495, "percentage": 62.24, "elapsed_time": "1:00:46", "remaining_time": "0:36:52", "throughput": 4248.88, "total_tokens": 15495080} {"current_steps": 23755, "total_steps": 38160, "loss": 0.4608, "lr": 0.0003748365663436647, "epoch": 12.45020964360587, "percentage": 62.25, "elapsed_time": "1:00:47", "remaining_time": "0:36:51", "throughput": 4248.95, "total_tokens": 15498472} {"current_steps": 23760, "total_steps": 38160, "loss": 0.4011, "lr": 0.0003746151747809769, "epoch": 12.452830188679245, "percentage": 62.26, "elapsed_time": "1:00:48", "remaining_time": "0:36:51", "throughput": 4248.91, "total_tokens": 15501032} {"current_steps": 23765, "total_steps": 38160, "loss": 0.4272, "lr": 0.000374393809447364, "epoch": 12.45545073375262, "percentage": 62.28, "elapsed_time": "1:00:48", "remaining_time": "0:36:50", "throughput": 4248.91, "total_tokens": 15503944} {"current_steps": 23770, "total_steps": 38160, "loss": 0.427, "lr": 0.0003741724703891333, "epoch": 12.458071278825996, "percentage": 62.29, "elapsed_time": "1:00:49", "remaining_time": "0:36:49", "throughput": 4248.96, "total_tokens": 15507272} {"current_steps": 23775, "total_steps": 38160, "loss": 0.4214, "lr": 0.00037395115765258616, "epoch": 12.46069182389937, "percentage": 62.3, "elapsed_time": "1:00:50", "remaining_time": "0:36:48", "throughput": 4248.96, "total_tokens": 15510248} {"current_steps": 23780, "total_steps": 38160, "loss": 0.3605, "lr": 0.0003737298712840188, "epoch": 12.463312368972746, "percentage": 62.32, "elapsed_time": "1:00:51", "remaining_time": "0:36:47", "throughput": 4248.95, "total_tokens": 15512968} {"current_steps": 23785, "total_steps": 38160, "loss": 0.3302, "lr": 0.000373508611329722, "epoch": 12.465932914046121, "percentage": 62.33, "elapsed_time": "1:00:51", "remaining_time": "0:36:47", "throughput": 4249.11, "total_tokens": 15517160} {"current_steps": 23790, "total_steps": 38160, "loss": 0.4027, "lr": 0.00037328737783598036, "epoch": 12.468553459119496, "percentage": 62.34, "elapsed_time": "1:00:52", "remaining_time": "0:36:46", "throughput": 4249.17, "total_tokens": 15520520} {"current_steps": 23795, "total_steps": 38160, "loss": 0.4036, "lr": 0.0003730661708490738, "epoch": 12.471174004192871, "percentage": 62.36, "elapsed_time": "1:00:53", "remaining_time": "0:36:45", "throughput": 4249.3, "total_tokens": 15524488} {"current_steps": 23800, "total_steps": 38160, "loss": 0.4045, "lr": 0.0003728449904152761, "epoch": 12.473794549266247, "percentage": 62.37, "elapsed_time": "1:00:54", "remaining_time": "0:36:44", "throughput": 4249.3, "total_tokens": 15527400} {"current_steps": 23805, "total_steps": 38160, "loss": 0.4954, "lr": 0.00037262383658085563, "epoch": 12.476415094339623, "percentage": 62.38, "elapsed_time": "1:00:54", "remaining_time": "0:36:43", "throughput": 4249.32, "total_tokens": 15530472} {"current_steps": 23810, "total_steps": 38160, "loss": 0.2726, "lr": 0.00037240270939207555, "epoch": 12.479035639412999, "percentage": 62.4, "elapsed_time": "1:00:55", "remaining_time": "0:36:43", "throughput": 4249.58, "total_tokens": 15535912} {"current_steps": 23815, "total_steps": 38160, "loss": 0.3398, "lr": 0.000372181608895193, "epoch": 12.481656184486374, "percentage": 62.41, "elapsed_time": "1:00:56", "remaining_time": "0:36:42", "throughput": 4249.64, "total_tokens": 15539336} {"current_steps": 23820, "total_steps": 38160, "loss": 0.3063, "lr": 0.00037196053513645957, "epoch": 12.484276729559749, "percentage": 62.42, "elapsed_time": "1:00:57", "remaining_time": "0:36:41", "throughput": 4249.65, "total_tokens": 15542472} {"current_steps": 23825, "total_steps": 38160, "loss": 0.3766, "lr": 0.00037173948816212146, "epoch": 12.486897274633124, "percentage": 62.43, "elapsed_time": "1:00:58", "remaining_time": "0:36:40", "throughput": 4249.69, "total_tokens": 15545640} {"current_steps": 23830, "total_steps": 38160, "loss": 0.5186, "lr": 0.00037151846801841904, "epoch": 12.4895178197065, "percentage": 62.45, "elapsed_time": "1:00:58", "remaining_time": "0:36:40", "throughput": 4249.86, "total_tokens": 15550024} {"current_steps": 23835, "total_steps": 38160, "loss": 0.5506, "lr": 0.00037129747475158736, "epoch": 12.492138364779874, "percentage": 62.46, "elapsed_time": "1:00:59", "remaining_time": "0:36:39", "throughput": 4249.85, "total_tokens": 15552904} {"current_steps": 23840, "total_steps": 38160, "loss": 0.3315, "lr": 0.0003710765084078558, "epoch": 12.49475890985325, "percentage": 62.47, "elapsed_time": "1:01:00", "remaining_time": "0:36:38", "throughput": 4249.81, "total_tokens": 15555528} {"current_steps": 23845, "total_steps": 38160, "loss": 0.4432, "lr": 0.0003708555690334477, "epoch": 12.497379454926625, "percentage": 62.49, "elapsed_time": "1:01:01", "remaining_time": "0:36:37", "throughput": 4249.91, "total_tokens": 15559240} {"current_steps": 23850, "total_steps": 38160, "loss": 0.5439, "lr": 0.00037063465667458125, "epoch": 12.5, "percentage": 62.5, "elapsed_time": "1:01:01", "remaining_time": "0:36:37", "throughput": 4249.92, "total_tokens": 15562184} {"current_steps": 23855, "total_steps": 38160, "loss": 0.4724, "lr": 0.0003704137713774686, "epoch": 12.502620545073375, "percentage": 62.51, "elapsed_time": "1:01:02", "remaining_time": "0:36:36", "throughput": 4249.96, "total_tokens": 15565384} {"current_steps": 23860, "total_steps": 38160, "loss": 0.5023, "lr": 0.0003701929131883167, "epoch": 12.50524109014675, "percentage": 62.53, "elapsed_time": "1:01:03", "remaining_time": "0:36:35", "throughput": 4250.15, "total_tokens": 15569960} {"current_steps": 23865, "total_steps": 38160, "loss": 0.5079, "lr": 0.0003699720821533264, "epoch": 12.507861635220126, "percentage": 62.54, "elapsed_time": "1:01:04", "remaining_time": "0:36:34", "throughput": 4250.42, "total_tokens": 15575272} {"current_steps": 23870, "total_steps": 38160, "loss": 0.4735, "lr": 0.00036975127831869326, "epoch": 12.5104821802935, "percentage": 62.55, "elapsed_time": "1:01:05", "remaining_time": "0:36:34", "throughput": 4250.45, "total_tokens": 15578504} {"current_steps": 23875, "total_steps": 38160, "loss": 0.424, "lr": 0.0003695305017306066, "epoch": 12.513102725366876, "percentage": 62.57, "elapsed_time": "1:01:05", "remaining_time": "0:36:33", "throughput": 4250.42, "total_tokens": 15581224} {"current_steps": 23880, "total_steps": 38160, "loss": 0.4434, "lr": 0.00036930975243525046, "epoch": 12.515723270440251, "percentage": 62.58, "elapsed_time": "1:01:06", "remaining_time": "0:36:32", "throughput": 4250.51, "total_tokens": 15584744} {"current_steps": 23885, "total_steps": 38160, "loss": 0.3904, "lr": 0.00036908903047880304, "epoch": 12.518343815513626, "percentage": 62.59, "elapsed_time": "1:01:07", "remaining_time": "0:36:31", "throughput": 4250.51, "total_tokens": 15587624} {"current_steps": 23890, "total_steps": 38160, "loss": 0.4795, "lr": 0.00036886833590743707, "epoch": 12.520964360587001, "percentage": 62.6, "elapsed_time": "1:01:07", "remaining_time": "0:36:30", "throughput": 4250.53, "total_tokens": 15590792} {"current_steps": 23895, "total_steps": 38160, "loss": 0.4364, "lr": 0.00036864766876731913, "epoch": 12.523584905660378, "percentage": 62.62, "elapsed_time": "1:01:08", "remaining_time": "0:36:30", "throughput": 4250.48, "total_tokens": 15593320} {"current_steps": 23900, "total_steps": 38160, "loss": 0.4961, "lr": 0.00036842702910461054, "epoch": 12.526205450733752, "percentage": 62.63, "elapsed_time": "1:01:09", "remaining_time": "0:36:29", "throughput": 4250.6, "total_tokens": 15597192} {"current_steps": 23905, "total_steps": 38160, "loss": 0.4201, "lr": 0.0003682064169654663, "epoch": 12.528825995807129, "percentage": 62.64, "elapsed_time": "1:01:10", "remaining_time": "0:36:28", "throughput": 4250.75, "total_tokens": 15601288} {"current_steps": 23910, "total_steps": 38160, "loss": 0.4508, "lr": 0.00036798583239603587, "epoch": 12.531446540880504, "percentage": 62.66, "elapsed_time": "1:01:11", "remaining_time": "0:36:27", "throughput": 4250.84, "total_tokens": 15604872} {"current_steps": 23915, "total_steps": 38160, "loss": 0.5361, "lr": 0.0003677652754424634, "epoch": 12.534067085953879, "percentage": 62.67, "elapsed_time": "1:01:11", "remaining_time": "0:36:27", "throughput": 4250.86, "total_tokens": 15607880} {"current_steps": 23920, "total_steps": 38160, "loss": 0.4259, "lr": 0.0003675447461508865, "epoch": 12.536687631027254, "percentage": 62.68, "elapsed_time": "1:01:12", "remaining_time": "0:36:26", "throughput": 4250.81, "total_tokens": 15610408} {"current_steps": 23925, "total_steps": 38160, "loss": 0.4493, "lr": 0.00036732424456743784, "epoch": 12.53930817610063, "percentage": 62.7, "elapsed_time": "1:01:13", "remaining_time": "0:36:25", "throughput": 4250.83, "total_tokens": 15613416} {"current_steps": 23930, "total_steps": 38160, "loss": 0.4746, "lr": 0.0003671037707382435, "epoch": 12.541928721174004, "percentage": 62.71, "elapsed_time": "1:01:13", "remaining_time": "0:36:24", "throughput": 4250.95, "total_tokens": 15617288} {"current_steps": 23935, "total_steps": 38160, "loss": 0.4014, "lr": 0.000366883324709424, "epoch": 12.54454926624738, "percentage": 62.72, "elapsed_time": "1:01:14", "remaining_time": "0:36:23", "throughput": 4250.93, "total_tokens": 15620008} {"current_steps": 23940, "total_steps": 38160, "loss": 0.5529, "lr": 0.00036666290652709446, "epoch": 12.547169811320755, "percentage": 62.74, "elapsed_time": "1:01:15", "remaining_time": "0:36:23", "throughput": 4250.98, "total_tokens": 15623272} {"current_steps": 23945, "total_steps": 38160, "loss": 0.4215, "lr": 0.0003664425162373635, "epoch": 12.54979035639413, "percentage": 62.75, "elapsed_time": "1:01:15", "remaining_time": "0:36:22", "throughput": 4250.86, "total_tokens": 15625224} {"current_steps": 23950, "total_steps": 38160, "loss": 0.5847, "lr": 0.0003662221538863346, "epoch": 12.552410901467505, "percentage": 62.76, "elapsed_time": "1:01:16", "remaining_time": "0:36:21", "throughput": 4250.86, "total_tokens": 15628072} {"current_steps": 23955, "total_steps": 38160, "loss": 0.4951, "lr": 0.0003660018195201049, "epoch": 12.55503144654088, "percentage": 62.78, "elapsed_time": "1:01:17", "remaining_time": "0:36:20", "throughput": 4250.89, "total_tokens": 15631304} {"current_steps": 23960, "total_steps": 38160, "loss": 0.4268, "lr": 0.0003657815131847657, "epoch": 12.557651991614255, "percentage": 62.79, "elapsed_time": "1:01:17", "remaining_time": "0:36:19", "throughput": 4250.89, "total_tokens": 15634152} {"current_steps": 23965, "total_steps": 38160, "loss": 0.6297, "lr": 0.0003655612349264027, "epoch": 12.56027253668763, "percentage": 62.8, "elapsed_time": "1:01:18", "remaining_time": "0:36:18", "throughput": 4250.9, "total_tokens": 15637160} {"current_steps": 23970, "total_steps": 38160, "loss": 0.3665, "lr": 0.0003653409847910957, "epoch": 12.562893081761006, "percentage": 62.81, "elapsed_time": "1:01:19", "remaining_time": "0:36:18", "throughput": 4250.89, "total_tokens": 15639944} {"current_steps": 23975, "total_steps": 38160, "loss": 0.5287, "lr": 0.0003651207628249182, "epoch": 12.565513626834381, "percentage": 62.83, "elapsed_time": "1:01:20", "remaining_time": "0:36:17", "throughput": 4251.43, "total_tokens": 15647592} {"current_steps": 23980, "total_steps": 38160, "loss": 0.4001, "lr": 0.0003649005690739386, "epoch": 12.568134171907756, "percentage": 62.84, "elapsed_time": "1:01:21", "remaining_time": "0:36:16", "throughput": 4251.41, "total_tokens": 15650344} {"current_steps": 23985, "total_steps": 38160, "loss": 0.3852, "lr": 0.0003646804035842187, "epoch": 12.570754716981131, "percentage": 62.85, "elapsed_time": "1:01:21", "remaining_time": "0:36:16", "throughput": 4251.47, "total_tokens": 15653672} {"current_steps": 23990, "total_steps": 38160, "loss": 0.6509, "lr": 0.0003644602664018143, "epoch": 12.573375262054507, "percentage": 62.87, "elapsed_time": "1:01:22", "remaining_time": "0:36:15", "throughput": 4251.4, "total_tokens": 15656008} {"current_steps": 23995, "total_steps": 38160, "loss": 0.3971, "lr": 0.000364240157572776, "epoch": 12.575995807127882, "percentage": 62.88, "elapsed_time": "1:01:23", "remaining_time": "0:36:14", "throughput": 4251.49, "total_tokens": 15659656} {"current_steps": 24000, "total_steps": 38160, "loss": 0.3362, "lr": 0.0003640200771431478, "epoch": 12.578616352201259, "percentage": 62.89, "elapsed_time": "1:01:23", "remaining_time": "0:36:13", "throughput": 4251.38, "total_tokens": 15661736} {"current_steps": 24005, "total_steps": 38160, "loss": 0.3233, "lr": 0.0003638000251589683, "epoch": 12.581236897274634, "percentage": 62.91, "elapsed_time": "1:01:24", "remaining_time": "0:36:12", "throughput": 4251.46, "total_tokens": 15665288} {"current_steps": 24010, "total_steps": 38160, "loss": 0.425, "lr": 0.0003635800016662696, "epoch": 12.583857442348009, "percentage": 62.92, "elapsed_time": "1:01:25", "remaining_time": "0:36:11", "throughput": 4251.43, "total_tokens": 15667912} {"current_steps": 24015, "total_steps": 38160, "loss": 0.5754, "lr": 0.00036336000671107816, "epoch": 12.586477987421384, "percentage": 62.93, "elapsed_time": "1:01:26", "remaining_time": "0:36:11", "throughput": 4251.48, "total_tokens": 15671176} {"current_steps": 24020, "total_steps": 38160, "loss": 0.4249, "lr": 0.00036314004033941445, "epoch": 12.58909853249476, "percentage": 62.95, "elapsed_time": "1:01:26", "remaining_time": "0:36:10", "throughput": 4251.45, "total_tokens": 15673864} {"current_steps": 24025, "total_steps": 38160, "loss": 0.3581, "lr": 0.00036292010259729283, "epoch": 12.591719077568134, "percentage": 62.96, "elapsed_time": "1:01:27", "remaining_time": "0:36:09", "throughput": 4251.46, "total_tokens": 15676744} {"current_steps": 24030, "total_steps": 38160, "loss": 0.4418, "lr": 0.000362700193530722, "epoch": 12.59433962264151, "percentage": 62.97, "elapsed_time": "1:01:28", "remaining_time": "0:36:08", "throughput": 4251.52, "total_tokens": 15680168} {"current_steps": 24035, "total_steps": 38160, "loss": 0.3254, "lr": 0.0003624803131857042, "epoch": 12.596960167714885, "percentage": 62.98, "elapsed_time": "1:01:28", "remaining_time": "0:36:07", "throughput": 4251.56, "total_tokens": 15683336} {"current_steps": 24040, "total_steps": 38160, "loss": 0.6099, "lr": 0.0003622604616082361, "epoch": 12.59958071278826, "percentage": 63.0, "elapsed_time": "1:01:29", "remaining_time": "0:36:07", "throughput": 4251.55, "total_tokens": 15686216} {"current_steps": 24045, "total_steps": 38160, "loss": 0.5125, "lr": 0.0003620406388443078, "epoch": 12.602201257861635, "percentage": 63.01, "elapsed_time": "1:01:30", "remaining_time": "0:36:06", "throughput": 4251.61, "total_tokens": 15689544} {"current_steps": 24050, "total_steps": 38160, "loss": 0.3858, "lr": 0.00036182084493990407, "epoch": 12.60482180293501, "percentage": 63.02, "elapsed_time": "1:01:30", "remaining_time": "0:36:05", "throughput": 4251.62, "total_tokens": 15692424} {"current_steps": 24055, "total_steps": 38160, "loss": 0.4599, "lr": 0.0003616010799410031, "epoch": 12.607442348008385, "percentage": 63.04, "elapsed_time": "1:01:31", "remaining_time": "0:36:04", "throughput": 4251.61, "total_tokens": 15695368} {"current_steps": 24060, "total_steps": 38160, "loss": 0.5699, "lr": 0.0003613813438935773, "epoch": 12.61006289308176, "percentage": 63.05, "elapsed_time": "1:01:32", "remaining_time": "0:36:03", "throughput": 4251.68, "total_tokens": 15698696} {"current_steps": 24065, "total_steps": 38160, "loss": 0.2837, "lr": 0.0003611616368435928, "epoch": 12.612683438155136, "percentage": 63.06, "elapsed_time": "1:01:33", "remaining_time": "0:36:03", "throughput": 4251.69, "total_tokens": 15701640} {"current_steps": 24070, "total_steps": 38160, "loss": 0.5585, "lr": 0.0003609419588370102, "epoch": 12.615303983228511, "percentage": 63.08, "elapsed_time": "1:01:33", "remaining_time": "0:36:02", "throughput": 4251.72, "total_tokens": 15704776} {"current_steps": 24075, "total_steps": 38160, "loss": 0.4135, "lr": 0.00036072230991978326, "epoch": 12.617924528301886, "percentage": 63.09, "elapsed_time": "1:01:34", "remaining_time": "0:36:01", "throughput": 4251.7, "total_tokens": 15707496} {"current_steps": 24080, "total_steps": 38160, "loss": 0.4067, "lr": 0.00036050269013785996, "epoch": 12.620545073375261, "percentage": 63.1, "elapsed_time": "1:01:35", "remaining_time": "0:36:00", "throughput": 4251.7, "total_tokens": 15710440} {"current_steps": 24085, "total_steps": 38160, "loss": 0.4864, "lr": 0.0003602830995371825, "epoch": 12.623165618448636, "percentage": 63.12, "elapsed_time": "1:01:36", "remaining_time": "0:35:59", "throughput": 4251.95, "total_tokens": 15715336} {"current_steps": 24090, "total_steps": 38160, "loss": 0.4508, "lr": 0.0003600635381636866, "epoch": 12.625786163522012, "percentage": 63.13, "elapsed_time": "1:01:36", "remaining_time": "0:35:59", "throughput": 4251.95, "total_tokens": 15718216} {"current_steps": 24095, "total_steps": 38160, "loss": 0.3701, "lr": 0.0003598440060633022, "epoch": 12.628406708595389, "percentage": 63.14, "elapsed_time": "1:01:37", "remaining_time": "0:35:58", "throughput": 4252.09, "total_tokens": 15722280} {"current_steps": 24100, "total_steps": 38160, "loss": 0.3867, "lr": 0.00035962450328195264, "epoch": 12.631027253668764, "percentage": 63.16, "elapsed_time": "1:01:38", "remaining_time": "0:35:57", "throughput": 4252.16, "total_tokens": 15725608} {"current_steps": 24105, "total_steps": 38160, "loss": 0.5318, "lr": 0.00035940502986555543, "epoch": 12.633647798742139, "percentage": 63.17, "elapsed_time": "1:01:38", "remaining_time": "0:35:56", "throughput": 4252.11, "total_tokens": 15728072} {"current_steps": 24110, "total_steps": 38160, "loss": 0.4282, "lr": 0.00035918558586002205, "epoch": 12.636268343815514, "percentage": 63.18, "elapsed_time": "1:01:39", "remaining_time": "0:35:55", "throughput": 4252.12, "total_tokens": 15731048} {"current_steps": 24115, "total_steps": 38160, "loss": 0.31, "lr": 0.0003589661713112575, "epoch": 12.63888888888889, "percentage": 63.19, "elapsed_time": "1:01:40", "remaining_time": "0:35:55", "throughput": 4252.15, "total_tokens": 15734184} {"current_steps": 24120, "total_steps": 38160, "loss": 0.5139, "lr": 0.000358746786265161, "epoch": 12.641509433962264, "percentage": 63.21, "elapsed_time": "1:01:41", "remaining_time": "0:35:54", "throughput": 4252.24, "total_tokens": 15737896} {"current_steps": 24125, "total_steps": 38160, "loss": 0.4505, "lr": 0.0003585274307676254, "epoch": 12.64412997903564, "percentage": 63.22, "elapsed_time": "1:01:41", "remaining_time": "0:35:53", "throughput": 4252.37, "total_tokens": 15741800} {"current_steps": 24130, "total_steps": 38160, "loss": 0.4294, "lr": 0.00035830810486453725, "epoch": 12.646750524109015, "percentage": 63.23, "elapsed_time": "1:01:42", "remaining_time": "0:35:52", "throughput": 4252.39, "total_tokens": 15744808} {"current_steps": 24135, "total_steps": 38160, "loss": 0.4496, "lr": 0.00035808880860177696, "epoch": 12.64937106918239, "percentage": 63.25, "elapsed_time": "1:01:43", "remaining_time": "0:35:52", "throughput": 4252.42, "total_tokens": 15747976} {"current_steps": 24140, "total_steps": 38160, "loss": 0.3529, "lr": 0.00035786954202521895, "epoch": 12.651991614255765, "percentage": 63.26, "elapsed_time": "1:01:44", "remaining_time": "0:35:51", "throughput": 4252.49, "total_tokens": 15751336} {"current_steps": 24145, "total_steps": 38160, "loss": 0.4358, "lr": 0.00035765030518073116, "epoch": 12.65461215932914, "percentage": 63.27, "elapsed_time": "1:01:44", "remaining_time": "0:35:50", "throughput": 4252.44, "total_tokens": 15753896} {"current_steps": 24150, "total_steps": 38160, "loss": 0.4763, "lr": 0.0003574310981141756, "epoch": 12.657232704402515, "percentage": 63.29, "elapsed_time": "1:01:45", "remaining_time": "0:35:49", "throughput": 4252.49, "total_tokens": 15757192} {"current_steps": 24155, "total_steps": 38160, "loss": 0.4765, "lr": 0.00035721192087140796, "epoch": 12.65985324947589, "percentage": 63.3, "elapsed_time": "1:01:46", "remaining_time": "0:35:48", "throughput": 4252.52, "total_tokens": 15760296} {"current_steps": 24160, "total_steps": 38160, "loss": 0.5255, "lr": 0.00035699277349827724, "epoch": 12.662473794549266, "percentage": 63.31, "elapsed_time": "1:01:46", "remaining_time": "0:35:47", "throughput": 4252.52, "total_tokens": 15763176} {"current_steps": 24165, "total_steps": 38160, "loss": 0.5249, "lr": 0.0003567736560406269, "epoch": 12.665094339622641, "percentage": 63.33, "elapsed_time": "1:01:47", "remaining_time": "0:35:47", "throughput": 4252.59, "total_tokens": 15766600} {"current_steps": 24170, "total_steps": 38160, "loss": 0.4758, "lr": 0.0003565545685442936, "epoch": 12.667714884696016, "percentage": 63.34, "elapsed_time": "1:01:48", "remaining_time": "0:35:46", "throughput": 4252.6, "total_tokens": 15769640} {"current_steps": 24175, "total_steps": 38160, "loss": 0.3555, "lr": 0.00035633551105510806, "epoch": 12.670335429769391, "percentage": 63.35, "elapsed_time": "1:01:48", "remaining_time": "0:35:45", "throughput": 4252.58, "total_tokens": 15772296} {"current_steps": 24180, "total_steps": 38160, "loss": 0.3915, "lr": 0.00035611648361889457, "epoch": 12.672955974842766, "percentage": 63.36, "elapsed_time": "1:01:49", "remaining_time": "0:35:44", "throughput": 4252.54, "total_tokens": 15774952} {"current_steps": 24185, "total_steps": 38160, "loss": 0.4639, "lr": 0.00035589748628147145, "epoch": 12.675576519916142, "percentage": 63.38, "elapsed_time": "1:01:50", "remaining_time": "0:35:43", "throughput": 4252.53, "total_tokens": 15777800} {"current_steps": 24190, "total_steps": 38160, "loss": 0.2571, "lr": 0.00035567851908865, "epoch": 12.678197064989519, "percentage": 63.39, "elapsed_time": "1:01:50", "remaining_time": "0:35:43", "throughput": 4252.5, "total_tokens": 15780424} {"current_steps": 24195, "total_steps": 38160, "loss": 0.4413, "lr": 0.0003554595820862358, "epoch": 12.680817610062894, "percentage": 63.4, "elapsed_time": "1:01:51", "remaining_time": "0:35:42", "throughput": 4252.5, "total_tokens": 15783304} {"current_steps": 24200, "total_steps": 38160, "loss": 0.4019, "lr": 0.00035524067532002803, "epoch": 12.683438155136269, "percentage": 63.42, "elapsed_time": "1:01:52", "remaining_time": "0:35:41", "throughput": 4252.46, "total_tokens": 15785928} {"current_steps": 24205, "total_steps": 38160, "loss": 0.3855, "lr": 0.00035502179883581956, "epoch": 12.686058700209644, "percentage": 63.43, "elapsed_time": "1:01:52", "remaining_time": "0:35:40", "throughput": 4252.46, "total_tokens": 15788712} {"current_steps": 24210, "total_steps": 38160, "loss": 0.3641, "lr": 0.0003548029526793969, "epoch": 12.68867924528302, "percentage": 63.44, "elapsed_time": "1:01:53", "remaining_time": "0:35:39", "throughput": 4252.54, "total_tokens": 15792296} {"current_steps": 24215, "total_steps": 38160, "loss": 0.3962, "lr": 0.0003545841368965398, "epoch": 12.691299790356394, "percentage": 63.46, "elapsed_time": "1:01:54", "remaining_time": "0:35:38", "throughput": 4252.56, "total_tokens": 15795272} {"current_steps": 24220, "total_steps": 38160, "loss": 0.4551, "lr": 0.00035436535153302235, "epoch": 12.69392033542977, "percentage": 63.47, "elapsed_time": "1:01:54", "remaining_time": "0:35:38", "throughput": 4252.59, "total_tokens": 15798248} {"current_steps": 24225, "total_steps": 38160, "loss": 0.4094, "lr": 0.0003541465966346118, "epoch": 12.696540880503145, "percentage": 63.48, "elapsed_time": "1:01:55", "remaining_time": "0:35:37", "throughput": 4252.79, "total_tokens": 15802760} {"current_steps": 24230, "total_steps": 38160, "loss": 0.4692, "lr": 0.00035392787224706936, "epoch": 12.69916142557652, "percentage": 63.5, "elapsed_time": "1:01:56", "remaining_time": "0:35:36", "throughput": 4252.81, "total_tokens": 15805608} {"current_steps": 24235, "total_steps": 38160, "loss": 0.4225, "lr": 0.0003537091784161495, "epoch": 12.701781970649895, "percentage": 63.51, "elapsed_time": "1:01:57", "remaining_time": "0:35:35", "throughput": 4252.78, "total_tokens": 15808264} {"current_steps": 24240, "total_steps": 38160, "loss": 0.3983, "lr": 0.0003534905151876007, "epoch": 12.70440251572327, "percentage": 63.52, "elapsed_time": "1:01:57", "remaining_time": "0:35:35", "throughput": 4252.78, "total_tokens": 15811240} {"current_steps": 24245, "total_steps": 38160, "loss": 0.367, "lr": 0.0003532718826071646, "epoch": 12.707023060796645, "percentage": 63.54, "elapsed_time": "1:01:58", "remaining_time": "0:35:34", "throughput": 4252.83, "total_tokens": 15814504} {"current_steps": 24250, "total_steps": 38160, "loss": 0.3509, "lr": 0.00035305328072057654, "epoch": 12.70964360587002, "percentage": 63.55, "elapsed_time": "1:01:59", "remaining_time": "0:35:33", "throughput": 4252.92, "total_tokens": 15818056} {"current_steps": 24255, "total_steps": 38160, "loss": 0.4641, "lr": 0.00035283470957356576, "epoch": 12.712264150943396, "percentage": 63.56, "elapsed_time": "1:02:00", "remaining_time": "0:35:32", "throughput": 4253.05, "total_tokens": 15822024} {"current_steps": 24260, "total_steps": 38160, "loss": 0.4916, "lr": 0.0003526161692118548, "epoch": 12.714884696016771, "percentage": 63.57, "elapsed_time": "1:02:00", "remaining_time": "0:35:31", "throughput": 4253.16, "total_tokens": 15825768} {"current_steps": 24265, "total_steps": 38160, "loss": 0.4372, "lr": 0.0003523976596811597, "epoch": 12.717505241090146, "percentage": 63.59, "elapsed_time": "1:02:01", "remaining_time": "0:35:31", "throughput": 4253.28, "total_tokens": 15829576} {"current_steps": 24270, "total_steps": 38160, "loss": 0.272, "lr": 0.0003521791810271906, "epoch": 12.720125786163521, "percentage": 63.6, "elapsed_time": "1:02:02", "remaining_time": "0:35:30", "throughput": 4253.31, "total_tokens": 15832744} {"current_steps": 24275, "total_steps": 38160, "loss": 0.5343, "lr": 0.0003519607332956501, "epoch": 12.722746331236896, "percentage": 63.61, "elapsed_time": "1:02:03", "remaining_time": "0:35:29", "throughput": 4253.4, "total_tokens": 15836328} {"current_steps": 24280, "total_steps": 38160, "loss": 0.3503, "lr": 0.0003517423165322353, "epoch": 12.725366876310272, "percentage": 63.63, "elapsed_time": "1:02:03", "remaining_time": "0:35:28", "throughput": 4253.47, "total_tokens": 15839816} {"current_steps": 24285, "total_steps": 38160, "loss": 0.5683, "lr": 0.0003515239307826366, "epoch": 12.727987421383649, "percentage": 63.64, "elapsed_time": "1:02:04", "remaining_time": "0:35:28", "throughput": 4253.58, "total_tokens": 15843528} {"current_steps": 24290, "total_steps": 38160, "loss": 0.4605, "lr": 0.00035130557609253744, "epoch": 12.730607966457024, "percentage": 63.65, "elapsed_time": "1:02:05", "remaining_time": "0:35:27", "throughput": 4253.69, "total_tokens": 15847272} {"current_steps": 24295, "total_steps": 38160, "loss": 0.3439, "lr": 0.00035108725250761566, "epoch": 12.733228511530399, "percentage": 63.67, "elapsed_time": "1:02:06", "remaining_time": "0:35:26", "throughput": 4253.75, "total_tokens": 15850600} {"current_steps": 24300, "total_steps": 38160, "loss": 0.4745, "lr": 0.0003508689600735416, "epoch": 12.735849056603774, "percentage": 63.68, "elapsed_time": "1:02:06", "remaining_time": "0:35:25", "throughput": 4253.73, "total_tokens": 15853416} {"current_steps": 24305, "total_steps": 38160, "loss": 0.375, "lr": 0.0003506506988359797, "epoch": 12.73846960167715, "percentage": 63.69, "elapsed_time": "1:02:07", "remaining_time": "0:35:24", "throughput": 4253.77, "total_tokens": 15856648} {"current_steps": 24310, "total_steps": 38160, "loss": 0.3837, "lr": 0.0003504324688405878, "epoch": 12.741090146750524, "percentage": 63.71, "elapsed_time": "1:02:08", "remaining_time": "0:35:24", "throughput": 4253.86, "total_tokens": 15860232} {"current_steps": 24315, "total_steps": 38160, "loss": 0.4454, "lr": 0.000350214270133017, "epoch": 12.7437106918239, "percentage": 63.72, "elapsed_time": "1:02:09", "remaining_time": "0:35:23", "throughput": 4254.08, "total_tokens": 15865032} {"current_steps": 24320, "total_steps": 38160, "loss": 0.3995, "lr": 0.00034999610275891204, "epoch": 12.746331236897275, "percentage": 63.73, "elapsed_time": "1:02:10", "remaining_time": "0:35:22", "throughput": 4254.09, "total_tokens": 15868008} {"current_steps": 24325, "total_steps": 38160, "loss": 0.4502, "lr": 0.0003497779667639113, "epoch": 12.74895178197065, "percentage": 63.74, "elapsed_time": "1:02:10", "remaining_time": "0:35:21", "throughput": 4254.08, "total_tokens": 15870824} {"current_steps": 24330, "total_steps": 38160, "loss": 0.4802, "lr": 0.0003495598621936458, "epoch": 12.751572327044025, "percentage": 63.76, "elapsed_time": "1:02:11", "remaining_time": "0:35:21", "throughput": 4254.14, "total_tokens": 15874184} {"current_steps": 24335, "total_steps": 38160, "loss": 0.4618, "lr": 0.00034934178909374084, "epoch": 12.7541928721174, "percentage": 63.77, "elapsed_time": "1:02:12", "remaining_time": "0:35:20", "throughput": 4254.14, "total_tokens": 15877032} {"current_steps": 24340, "total_steps": 38160, "loss": 0.5044, "lr": 0.0003491237475098148, "epoch": 12.756813417190775, "percentage": 63.78, "elapsed_time": "1:02:12", "remaining_time": "0:35:19", "throughput": 4254.28, "total_tokens": 15881160} {"current_steps": 24345, "total_steps": 38160, "loss": 0.4781, "lr": 0.00034890573748747945, "epoch": 12.75943396226415, "percentage": 63.8, "elapsed_time": "1:02:13", "remaining_time": "0:35:18", "throughput": 4254.49, "total_tokens": 15885768} {"current_steps": 24350, "total_steps": 38160, "loss": 0.3829, "lr": 0.00034868775907234017, "epoch": 12.762054507337526, "percentage": 63.81, "elapsed_time": "1:02:14", "remaining_time": "0:35:18", "throughput": 4254.52, "total_tokens": 15888872} {"current_steps": 24355, "total_steps": 38160, "loss": 0.5179, "lr": 0.0003484698123099956, "epoch": 12.764675052410901, "percentage": 63.82, "elapsed_time": "1:02:15", "remaining_time": "0:35:17", "throughput": 4254.66, "total_tokens": 15892936} {"current_steps": 24360, "total_steps": 38160, "loss": 0.4909, "lr": 0.00034825189724603723, "epoch": 12.767295597484276, "percentage": 63.84, "elapsed_time": "1:02:16", "remaining_time": "0:35:16", "throughput": 4254.72, "total_tokens": 15896328} {"current_steps": 24365, "total_steps": 38160, "loss": 0.4607, "lr": 0.0003480340139260509, "epoch": 12.769916142557651, "percentage": 63.85, "elapsed_time": "1:02:16", "remaining_time": "0:35:15", "throughput": 4254.67, "total_tokens": 15898856} {"current_steps": 24370, "total_steps": 38160, "loss": 0.4291, "lr": 0.000347816162395615, "epoch": 12.772536687631026, "percentage": 63.86, "elapsed_time": "1:02:17", "remaining_time": "0:35:14", "throughput": 4254.78, "total_tokens": 15902632} {"current_steps": 24375, "total_steps": 38160, "loss": 0.4132, "lr": 0.00034759834270030185, "epoch": 12.775157232704402, "percentage": 63.88, "elapsed_time": "1:02:18", "remaining_time": "0:35:14", "throughput": 4254.77, "total_tokens": 15905448} {"current_steps": 24380, "total_steps": 38160, "loss": 0.3579, "lr": 0.0003473805548856768, "epoch": 12.777777777777779, "percentage": 63.89, "elapsed_time": "1:02:19", "remaining_time": "0:35:13", "throughput": 4255.17, "total_tokens": 15912168} {"current_steps": 24385, "total_steps": 38160, "loss": 0.486, "lr": 0.00034716279899729826, "epoch": 12.780398322851154, "percentage": 63.9, "elapsed_time": "1:02:20", "remaining_time": "0:35:12", "throughput": 4255.26, "total_tokens": 15915880} {"current_steps": 24390, "total_steps": 38160, "loss": 0.4769, "lr": 0.00034694507508071864, "epoch": 12.783018867924529, "percentage": 63.92, "elapsed_time": "1:02:21", "remaining_time": "0:35:12", "throughput": 4255.34, "total_tokens": 15919432} {"current_steps": 24395, "total_steps": 38160, "loss": 0.3687, "lr": 0.00034672738318148303, "epoch": 12.785639412997904, "percentage": 63.93, "elapsed_time": "1:02:21", "remaining_time": "0:35:11", "throughput": 4255.44, "total_tokens": 15923144} {"current_steps": 24400, "total_steps": 38160, "loss": 0.4032, "lr": 0.00034650972334513043, "epoch": 12.78825995807128, "percentage": 63.94, "elapsed_time": "1:02:22", "remaining_time": "0:35:10", "throughput": 4255.34, "total_tokens": 15925320} {"current_steps": 24405, "total_steps": 38160, "loss": 0.5678, "lr": 0.00034629209561719244, "epoch": 12.790880503144654, "percentage": 63.95, "elapsed_time": "1:02:23", "remaining_time": "0:35:09", "throughput": 4255.39, "total_tokens": 15928488} {"current_steps": 24410, "total_steps": 38160, "loss": 0.318, "lr": 0.0003460745000431946, "epoch": 12.79350104821803, "percentage": 63.97, "elapsed_time": "1:02:23", "remaining_time": "0:35:08", "throughput": 4255.43, "total_tokens": 15931816} {"current_steps": 24415, "total_steps": 38160, "loss": 0.3812, "lr": 0.00034585693666865525, "epoch": 12.796121593291405, "percentage": 63.98, "elapsed_time": "1:02:24", "remaining_time": "0:35:08", "throughput": 4255.46, "total_tokens": 15934856} {"current_steps": 24420, "total_steps": 38160, "loss": 0.4252, "lr": 0.00034563940553908605, "epoch": 12.79874213836478, "percentage": 63.99, "elapsed_time": "1:02:25", "remaining_time": "0:35:07", "throughput": 4255.49, "total_tokens": 15938024} {"current_steps": 24425, "total_steps": 38160, "loss": 0.5131, "lr": 0.00034542190669999216, "epoch": 12.801362683438155, "percentage": 64.01, "elapsed_time": "1:02:26", "remaining_time": "0:35:06", "throughput": 4255.53, "total_tokens": 15941224} {"current_steps": 24430, "total_steps": 38160, "loss": 0.5, "lr": 0.000345204440196872, "epoch": 12.80398322851153, "percentage": 64.02, "elapsed_time": "1:02:26", "remaining_time": "0:35:05", "throughput": 4255.57, "total_tokens": 15944424} {"current_steps": 24435, "total_steps": 38160, "loss": 0.3668, "lr": 0.00034498700607521693, "epoch": 12.806603773584905, "percentage": 64.03, "elapsed_time": "1:02:27", "remaining_time": "0:35:04", "throughput": 4255.47, "total_tokens": 15946568} {"current_steps": 24440, "total_steps": 38160, "loss": 0.3718, "lr": 0.00034476960438051187, "epoch": 12.80922431865828, "percentage": 64.05, "elapsed_time": "1:02:28", "remaining_time": "0:35:04", "throughput": 4255.59, "total_tokens": 15950408} {"current_steps": 24445, "total_steps": 38160, "loss": 0.4119, "lr": 0.00034455223515823444, "epoch": 12.811844863731656, "percentage": 64.06, "elapsed_time": "1:02:28", "remaining_time": "0:35:03", "throughput": 4255.6, "total_tokens": 15953384} {"current_steps": 24450, "total_steps": 38160, "loss": 0.3829, "lr": 0.0003443348984538559, "epoch": 12.814465408805031, "percentage": 64.07, "elapsed_time": "1:02:29", "remaining_time": "0:35:02", "throughput": 4255.68, "total_tokens": 15957032} {"current_steps": 24455, "total_steps": 38160, "loss": 0.4145, "lr": 0.0003441175943128407, "epoch": 12.817085953878406, "percentage": 64.09, "elapsed_time": "1:02:30", "remaining_time": "0:35:01", "throughput": 4255.88, "total_tokens": 15961480} {"current_steps": 24460, "total_steps": 38160, "loss": 0.5607, "lr": 0.0003439003227806464, "epoch": 12.819706498951781, "percentage": 64.1, "elapsed_time": "1:02:31", "remaining_time": "0:35:01", "throughput": 4255.97, "total_tokens": 15965000} {"current_steps": 24465, "total_steps": 38160, "loss": 0.4223, "lr": 0.00034368308390272386, "epoch": 12.822327044025156, "percentage": 64.11, "elapsed_time": "1:02:31", "remaining_time": "0:35:00", "throughput": 4255.93, "total_tokens": 15967624} {"current_steps": 24470, "total_steps": 38160, "loss": 0.5209, "lr": 0.0003434658777245167, "epoch": 12.824947589098532, "percentage": 64.12, "elapsed_time": "1:02:32", "remaining_time": "0:34:59", "throughput": 4255.87, "total_tokens": 15970056} {"current_steps": 24475, "total_steps": 38160, "loss": 0.4566, "lr": 0.000343248704291462, "epoch": 12.827568134171909, "percentage": 64.14, "elapsed_time": "1:02:33", "remaining_time": "0:34:58", "throughput": 4255.84, "total_tokens": 15972680} {"current_steps": 24480, "total_steps": 38160, "loss": 0.5034, "lr": 0.00034303156364899016, "epoch": 12.830188679245284, "percentage": 64.15, "elapsed_time": "1:02:33", "remaining_time": "0:34:57", "throughput": 4255.85, "total_tokens": 15975592} {"current_steps": 24485, "total_steps": 38160, "loss": 0.4114, "lr": 0.00034281445584252425, "epoch": 12.832809224318659, "percentage": 64.16, "elapsed_time": "1:02:34", "remaining_time": "0:34:56", "throughput": 4255.86, "total_tokens": 15978664} {"current_steps": 24490, "total_steps": 38160, "loss": 0.4316, "lr": 0.00034259738091748103, "epoch": 12.835429769392034, "percentage": 64.18, "elapsed_time": "1:02:35", "remaining_time": "0:34:56", "throughput": 4256.04, "total_tokens": 15983048} {"current_steps": 24495, "total_steps": 38160, "loss": 0.4461, "lr": 0.00034238033891927013, "epoch": 12.83805031446541, "percentage": 64.19, "elapsed_time": "1:02:36", "remaining_time": "0:34:55", "throughput": 4256.09, "total_tokens": 15986344} {"current_steps": 24500, "total_steps": 38160, "loss": 0.6127, "lr": 0.00034216332989329387, "epoch": 12.840670859538784, "percentage": 64.2, "elapsed_time": "1:02:36", "remaining_time": "0:34:54", "throughput": 4256.17, "total_tokens": 15989864} {"current_steps": 24505, "total_steps": 38160, "loss": 0.458, "lr": 0.00034194635388494835, "epoch": 12.84329140461216, "percentage": 64.22, "elapsed_time": "1:02:37", "remaining_time": "0:34:53", "throughput": 4256.23, "total_tokens": 15993224} {"current_steps": 24510, "total_steps": 38160, "loss": 0.4417, "lr": 0.00034172941093962237, "epoch": 12.845911949685535, "percentage": 64.23, "elapsed_time": "1:02:38", "remaining_time": "0:34:53", "throughput": 4256.25, "total_tokens": 15996296} {"current_steps": 24515, "total_steps": 38160, "loss": 0.4369, "lr": 0.00034151250110269805, "epoch": 12.84853249475891, "percentage": 64.24, "elapsed_time": "1:02:39", "remaining_time": "0:34:52", "throughput": 4256.34, "total_tokens": 15999944} {"current_steps": 24520, "total_steps": 38160, "loss": 0.3849, "lr": 0.00034129562441955044, "epoch": 12.851153039832285, "percentage": 64.26, "elapsed_time": "1:02:39", "remaining_time": "0:34:51", "throughput": 4256.37, "total_tokens": 16003112} {"current_steps": 24525, "total_steps": 38160, "loss": 0.503, "lr": 0.00034107878093554765, "epoch": 12.85377358490566, "percentage": 64.27, "elapsed_time": "1:02:40", "remaining_time": "0:34:50", "throughput": 4256.35, "total_tokens": 16005832} {"current_steps": 24530, "total_steps": 38160, "loss": 0.4698, "lr": 0.00034086197069605064, "epoch": 12.856394129979035, "percentage": 64.28, "elapsed_time": "1:02:41", "remaining_time": "0:34:49", "throughput": 4256.4, "total_tokens": 16009096} {"current_steps": 24535, "total_steps": 38160, "loss": 0.4131, "lr": 0.0003406451937464139, "epoch": 12.85901467505241, "percentage": 64.3, "elapsed_time": "1:02:41", "remaining_time": "0:34:49", "throughput": 4256.35, "total_tokens": 16011592} {"current_steps": 24540, "total_steps": 38160, "loss": 0.5143, "lr": 0.0003404284501319845, "epoch": 12.861635220125786, "percentage": 64.31, "elapsed_time": "1:02:42", "remaining_time": "0:34:48", "throughput": 4256.51, "total_tokens": 16015784} {"current_steps": 24545, "total_steps": 38160, "loss": 0.552, "lr": 0.00034021173989810306, "epoch": 12.864255765199161, "percentage": 64.32, "elapsed_time": "1:02:43", "remaining_time": "0:34:47", "throughput": 4256.58, "total_tokens": 16019208} {"current_steps": 24550, "total_steps": 38160, "loss": 0.4809, "lr": 0.0003399950630901025, "epoch": 12.866876310272536, "percentage": 64.33, "elapsed_time": "1:02:44", "remaining_time": "0:34:46", "throughput": 4256.67, "total_tokens": 16022856} {"current_steps": 24555, "total_steps": 38160, "loss": 0.4736, "lr": 0.0003397784197533095, "epoch": 12.869496855345911, "percentage": 64.35, "elapsed_time": "1:02:44", "remaining_time": "0:34:45", "throughput": 4256.63, "total_tokens": 16025480} {"current_steps": 24560, "total_steps": 38160, "loss": 0.4912, "lr": 0.0003395618099330431, "epoch": 12.872117400419286, "percentage": 64.36, "elapsed_time": "1:02:45", "remaining_time": "0:34:45", "throughput": 4256.6, "total_tokens": 16028072} {"current_steps": 24565, "total_steps": 38160, "loss": 0.5371, "lr": 0.0003393452336746156, "epoch": 12.874737945492662, "percentage": 64.37, "elapsed_time": "1:02:46", "remaining_time": "0:34:44", "throughput": 4256.67, "total_tokens": 16031592} {"current_steps": 24570, "total_steps": 38160, "loss": 0.3815, "lr": 0.00033912869102333237, "epoch": 12.877358490566039, "percentage": 64.39, "elapsed_time": "1:02:46", "remaining_time": "0:34:43", "throughput": 4256.76, "total_tokens": 16035048} {"current_steps": 24575, "total_steps": 38160, "loss": 0.5073, "lr": 0.00033891218202449164, "epoch": 12.879979035639414, "percentage": 64.4, "elapsed_time": "1:02:47", "remaining_time": "0:34:42", "throughput": 4256.98, "total_tokens": 16039720} {"current_steps": 24580, "total_steps": 38160, "loss": 0.391, "lr": 0.00033869570672338486, "epoch": 12.882599580712789, "percentage": 64.41, "elapsed_time": "1:02:48", "remaining_time": "0:34:42", "throughput": 4257.03, "total_tokens": 16043016} {"current_steps": 24585, "total_steps": 38160, "loss": 0.4342, "lr": 0.00033847926516529574, "epoch": 12.885220125786164, "percentage": 64.43, "elapsed_time": "1:02:49", "remaining_time": "0:34:41", "throughput": 4257.03, "total_tokens": 16045896} {"current_steps": 24590, "total_steps": 38160, "loss": 0.4211, "lr": 0.0003382628573955018, "epoch": 12.88784067085954, "percentage": 64.44, "elapsed_time": "1:02:49", "remaining_time": "0:34:40", "throughput": 4257.0, "total_tokens": 16048552} {"current_steps": 24595, "total_steps": 38160, "loss": 0.5317, "lr": 0.00033804648345927267, "epoch": 12.890461215932914, "percentage": 64.45, "elapsed_time": "1:02:50", "remaining_time": "0:34:39", "throughput": 4257.04, "total_tokens": 16051752} {"current_steps": 24600, "total_steps": 38160, "loss": 0.416, "lr": 0.00033783014340187166, "epoch": 12.89308176100629, "percentage": 64.47, "elapsed_time": "1:02:51", "remaining_time": "0:34:38", "throughput": 4257.06, "total_tokens": 16054760} {"current_steps": 24605, "total_steps": 38160, "loss": 0.3307, "lr": 0.0003376138372685545, "epoch": 12.895702306079665, "percentage": 64.48, "elapsed_time": "1:02:52", "remaining_time": "0:34:38", "throughput": 4257.06, "total_tokens": 16057672} {"current_steps": 24610, "total_steps": 38160, "loss": 0.4199, "lr": 0.00033739756510457015, "epoch": 12.89832285115304, "percentage": 64.49, "elapsed_time": "1:02:52", "remaining_time": "0:34:37", "throughput": 4257.09, "total_tokens": 16060744} {"current_steps": 24615, "total_steps": 38160, "loss": 0.4709, "lr": 0.00033718132695516003, "epoch": 12.900943396226415, "percentage": 64.5, "elapsed_time": "1:02:53", "remaining_time": "0:34:36", "throughput": 4257.1, "total_tokens": 16063720} {"current_steps": 24620, "total_steps": 38160, "loss": 0.4297, "lr": 0.00033696512286555865, "epoch": 12.90356394129979, "percentage": 64.52, "elapsed_time": "1:02:54", "remaining_time": "0:34:35", "throughput": 4257.42, "total_tokens": 16069448} {"current_steps": 24625, "total_steps": 38160, "loss": 0.2168, "lr": 0.0003367489528809936, "epoch": 12.906184486373165, "percentage": 64.53, "elapsed_time": "1:02:55", "remaining_time": "0:34:35", "throughput": 4257.63, "total_tokens": 16074280} {"current_steps": 24630, "total_steps": 38160, "loss": 0.4193, "lr": 0.00033653281704668515, "epoch": 12.90880503144654, "percentage": 64.54, "elapsed_time": "1:02:56", "remaining_time": "0:34:34", "throughput": 4257.73, "total_tokens": 16077896} {"current_steps": 24635, "total_steps": 38160, "loss": 0.5499, "lr": 0.0003363167154078465, "epoch": 12.911425576519916, "percentage": 64.56, "elapsed_time": "1:02:56", "remaining_time": "0:34:33", "throughput": 4257.71, "total_tokens": 16080680} {"current_steps": 24640, "total_steps": 38160, "loss": 0.5363, "lr": 0.0003361006480096837, "epoch": 12.914046121593291, "percentage": 64.57, "elapsed_time": "1:02:57", "remaining_time": "0:34:32", "throughput": 4257.72, "total_tokens": 16083656} {"current_steps": 24645, "total_steps": 38160, "loss": 0.3585, "lr": 0.0003358846148973953, "epoch": 12.916666666666666, "percentage": 64.58, "elapsed_time": "1:02:58", "remaining_time": "0:34:31", "throughput": 4257.8, "total_tokens": 16087144} {"current_steps": 24650, "total_steps": 38160, "loss": 0.5328, "lr": 0.0003356686161161732, "epoch": 12.919287211740041, "percentage": 64.6, "elapsed_time": "1:02:59", "remaining_time": "0:34:31", "throughput": 4257.97, "total_tokens": 16091400} {"current_steps": 24655, "total_steps": 38160, "loss": 0.3496, "lr": 0.00033545265171120163, "epoch": 12.921907756813416, "percentage": 64.61, "elapsed_time": "1:02:59", "remaining_time": "0:34:30", "throughput": 4257.93, "total_tokens": 16093864} {"current_steps": 24660, "total_steps": 38160, "loss": 0.3885, "lr": 0.0003352367217276582, "epoch": 12.924528301886792, "percentage": 64.62, "elapsed_time": "1:03:00", "remaining_time": "0:34:29", "throughput": 4257.89, "total_tokens": 16096520} {"current_steps": 24665, "total_steps": 38160, "loss": 0.4159, "lr": 0.0003350208262107131, "epoch": 12.927148846960169, "percentage": 64.64, "elapsed_time": "1:03:01", "remaining_time": "0:34:28", "throughput": 4257.93, "total_tokens": 16099688} {"current_steps": 24670, "total_steps": 38160, "loss": 0.5062, "lr": 0.00033480496520552874, "epoch": 12.929769392033544, "percentage": 64.65, "elapsed_time": "1:03:01", "remaining_time": "0:34:28", "throughput": 4258.04, "total_tokens": 16103528} {"current_steps": 24675, "total_steps": 38160, "loss": 0.6932, "lr": 0.00033458913875726093, "epoch": 12.932389937106919, "percentage": 64.66, "elapsed_time": "1:03:02", "remaining_time": "0:34:27", "throughput": 4258.11, "total_tokens": 16107080} {"current_steps": 24680, "total_steps": 38160, "loss": 0.4403, "lr": 0.00033437334691105837, "epoch": 12.935010482180294, "percentage": 64.68, "elapsed_time": "1:03:03", "remaining_time": "0:34:26", "throughput": 4258.13, "total_tokens": 16110120} {"current_steps": 24685, "total_steps": 38160, "loss": 0.3986, "lr": 0.0003341575897120619, "epoch": 12.93763102725367, "percentage": 64.69, "elapsed_time": "1:03:04", "remaining_time": "0:34:25", "throughput": 4258.21, "total_tokens": 16113640} {"current_steps": 24690, "total_steps": 38160, "loss": 0.4241, "lr": 0.00033394186720540577, "epoch": 12.940251572327044, "percentage": 64.7, "elapsed_time": "1:03:04", "remaining_time": "0:34:24", "throughput": 4258.2, "total_tokens": 16116520} {"current_steps": 24695, "total_steps": 38160, "loss": 0.4602, "lr": 0.00033372617943621665, "epoch": 12.94287211740042, "percentage": 64.71, "elapsed_time": "1:03:05", "remaining_time": "0:34:24", "throughput": 4258.18, "total_tokens": 16119208} {"current_steps": 24700, "total_steps": 38160, "loss": 0.5048, "lr": 0.00033351052644961353, "epoch": 12.945492662473795, "percentage": 64.73, "elapsed_time": "1:03:06", "remaining_time": "0:34:23", "throughput": 4258.16, "total_tokens": 16121960} {"current_steps": 24705, "total_steps": 38160, "loss": 0.3496, "lr": 0.00033329490829070907, "epoch": 12.94811320754717, "percentage": 64.74, "elapsed_time": "1:03:06", "remaining_time": "0:34:22", "throughput": 4258.3, "total_tokens": 16125960} {"current_steps": 24710, "total_steps": 38160, "loss": 0.4144, "lr": 0.0003330793250046078, "epoch": 12.950733752620545, "percentage": 64.75, "elapsed_time": "1:03:07", "remaining_time": "0:34:21", "throughput": 4258.29, "total_tokens": 16128744} {"current_steps": 24715, "total_steps": 38160, "loss": 0.6096, "lr": 0.0003328637766364075, "epoch": 12.95335429769392, "percentage": 64.77, "elapsed_time": "1:03:08", "remaining_time": "0:34:20", "throughput": 4258.34, "total_tokens": 16131944} {"current_steps": 24720, "total_steps": 38160, "loss": 0.5553, "lr": 0.00033264826323119824, "epoch": 12.955974842767295, "percentage": 64.78, "elapsed_time": "1:03:09", "remaining_time": "0:34:20", "throughput": 4258.44, "total_tokens": 16135624} {"current_steps": 24725, "total_steps": 38160, "loss": 0.3843, "lr": 0.00033243278483406326, "epoch": 12.95859538784067, "percentage": 64.79, "elapsed_time": "1:03:09", "remaining_time": "0:34:19", "throughput": 4258.54, "total_tokens": 16139304} {"current_steps": 24730, "total_steps": 38160, "loss": 0.4211, "lr": 0.00033221734149007785, "epoch": 12.961215932914046, "percentage": 64.81, "elapsed_time": "1:03:10", "remaining_time": "0:34:18", "throughput": 4258.56, "total_tokens": 16142312} {"current_steps": 24735, "total_steps": 38160, "loss": 0.4737, "lr": 0.0003320019332443104, "epoch": 12.963836477987421, "percentage": 64.82, "elapsed_time": "1:03:11", "remaining_time": "0:34:17", "throughput": 4258.7, "total_tokens": 16146376} {"current_steps": 24740, "total_steps": 38160, "loss": 0.3968, "lr": 0.00033178656014182185, "epoch": 12.966457023060796, "percentage": 64.83, "elapsed_time": "1:03:12", "remaining_time": "0:34:16", "throughput": 4258.71, "total_tokens": 16149384} {"current_steps": 24745, "total_steps": 38160, "loss": 0.3665, "lr": 0.00033157122222766597, "epoch": 12.969077568134171, "percentage": 64.85, "elapsed_time": "1:03:12", "remaining_time": "0:34:16", "throughput": 4258.88, "total_tokens": 16153768} {"current_steps": 24750, "total_steps": 38160, "loss": 0.3444, "lr": 0.0003313559195468889, "epoch": 12.971698113207546, "percentage": 64.86, "elapsed_time": "1:03:13", "remaining_time": "0:34:15", "throughput": 4259.1, "total_tokens": 16158536} {"current_steps": 24755, "total_steps": 38160, "loss": 0.4374, "lr": 0.0003311406521445293, "epoch": 12.974318658280922, "percentage": 64.87, "elapsed_time": "1:03:14", "remaining_time": "0:34:14", "throughput": 4259.2, "total_tokens": 16162312} {"current_steps": 24760, "total_steps": 38160, "loss": 0.5132, "lr": 0.000330925420065619, "epoch": 12.976939203354299, "percentage": 64.88, "elapsed_time": "1:03:15", "remaining_time": "0:34:14", "throughput": 4259.18, "total_tokens": 16165064} {"current_steps": 24765, "total_steps": 38160, "loss": 0.4186, "lr": 0.0003307102233551817, "epoch": 12.979559748427674, "percentage": 64.9, "elapsed_time": "1:03:15", "remaining_time": "0:34:13", "throughput": 4259.1, "total_tokens": 16167304} {"current_steps": 24770, "total_steps": 38160, "loss": 0.4842, "lr": 0.0003304950620582344, "epoch": 12.982180293501049, "percentage": 64.91, "elapsed_time": "1:03:16", "remaining_time": "0:34:12", "throughput": 4259.21, "total_tokens": 16171016} {"current_steps": 24775, "total_steps": 38160, "loss": 0.4199, "lr": 0.0003302799362197864, "epoch": 12.984800838574424, "percentage": 64.92, "elapsed_time": "1:03:17", "remaining_time": "0:34:11", "throughput": 4259.31, "total_tokens": 16174824} {"current_steps": 24780, "total_steps": 38160, "loss": 0.5065, "lr": 0.00033006484588483947, "epoch": 12.9874213836478, "percentage": 64.94, "elapsed_time": "1:03:18", "remaining_time": "0:34:10", "throughput": 4259.58, "total_tokens": 16179880} {"current_steps": 24785, "total_steps": 38160, "loss": 0.5328, "lr": 0.00032984979109838803, "epoch": 12.990041928721174, "percentage": 64.95, "elapsed_time": "1:03:19", "remaining_time": "0:34:10", "throughput": 4259.57, "total_tokens": 16182856} {"current_steps": 24790, "total_steps": 38160, "loss": 0.5173, "lr": 0.000329634771905419, "epoch": 12.99266247379455, "percentage": 64.96, "elapsed_time": "1:03:19", "remaining_time": "0:34:09", "throughput": 4259.55, "total_tokens": 16185672} {"current_steps": 24795, "total_steps": 38160, "loss": 0.3515, "lr": 0.0003294197883509122, "epoch": 12.995283018867925, "percentage": 64.98, "elapsed_time": "1:03:20", "remaining_time": "0:34:08", "throughput": 4259.54, "total_tokens": 16188392} {"current_steps": 24800, "total_steps": 38160, "loss": 0.471, "lr": 0.00032920484047983947, "epoch": 12.9979035639413, "percentage": 64.99, "elapsed_time": "1:03:21", "remaining_time": "0:34:07", "throughput": 4259.56, "total_tokens": 16191560} {"current_steps": 24804, "total_steps": 38160, "eval_loss": 0.48564380407333374, "epoch": 13.0, "percentage": 65.0, "elapsed_time": "1:03:35", "remaining_time": "0:34:14", "throughput": 4244.15, "total_tokens": 16193456} {"current_steps": 24805, "total_steps": 38160, "loss": 0.3282, "lr": 0.0003289899283371657, "epoch": 13.000524109014675, "percentage": 65.0, "elapsed_time": "1:03:37", "remaining_time": "0:34:15", "throughput": 4242.31, "total_tokens": 16194544} {"current_steps": 24810, "total_steps": 38160, "loss": 0.4105, "lr": 0.00032877505196784795, "epoch": 13.00314465408805, "percentage": 65.02, "elapsed_time": "1:03:38", "remaining_time": "0:34:14", "throughput": 4242.39, "total_tokens": 16198000} {"current_steps": 24815, "total_steps": 38160, "loss": 0.3907, "lr": 0.0003285602114168358, "epoch": 13.005765199161425, "percentage": 65.03, "elapsed_time": "1:03:38", "remaining_time": "0:34:13", "throughput": 4242.38, "total_tokens": 16200816} {"current_steps": 24820, "total_steps": 38160, "loss": 0.4899, "lr": 0.00032834540672907144, "epoch": 13.0083857442348, "percentage": 65.04, "elapsed_time": "1:03:39", "remaining_time": "0:34:13", "throughput": 4242.66, "total_tokens": 16206096} {"current_steps": 24825, "total_steps": 38160, "loss": 0.4096, "lr": 0.00032813063794948983, "epoch": 13.011006289308176, "percentage": 65.06, "elapsed_time": "1:03:40", "remaining_time": "0:34:12", "throughput": 4242.72, "total_tokens": 16209552} {"current_steps": 24830, "total_steps": 38160, "loss": 0.4326, "lr": 0.00032791590512301784, "epoch": 13.01362683438155, "percentage": 65.07, "elapsed_time": "1:03:41", "remaining_time": "0:34:11", "throughput": 4242.65, "total_tokens": 16211984} {"current_steps": 24835, "total_steps": 38160, "loss": 0.4477, "lr": 0.00032770120829457534, "epoch": 13.016247379454926, "percentage": 65.08, "elapsed_time": "1:03:42", "remaining_time": "0:34:10", "throughput": 4242.78, "total_tokens": 16215920} {"current_steps": 24840, "total_steps": 38160, "loss": 0.4736, "lr": 0.00032748654750907447, "epoch": 13.018867924528301, "percentage": 65.09, "elapsed_time": "1:03:42", "remaining_time": "0:34:09", "throughput": 4242.78, "total_tokens": 16218864} {"current_steps": 24845, "total_steps": 38160, "loss": 0.3878, "lr": 0.0003272719228114196, "epoch": 13.021488469601676, "percentage": 65.11, "elapsed_time": "1:03:43", "remaining_time": "0:34:09", "throughput": 4243.21, "total_tokens": 16225936} {"current_steps": 24850, "total_steps": 38160, "loss": 0.5126, "lr": 0.0003270573342465079, "epoch": 13.024109014675052, "percentage": 65.12, "elapsed_time": "1:03:44", "remaining_time": "0:34:08", "throughput": 4243.19, "total_tokens": 16228688} {"current_steps": 24855, "total_steps": 38160, "loss": 0.4544, "lr": 0.00032684278185922877, "epoch": 13.026729559748428, "percentage": 65.13, "elapsed_time": "1:03:45", "remaining_time": "0:34:07", "throughput": 4243.19, "total_tokens": 16231504} {"current_steps": 24860, "total_steps": 38160, "loss": 0.3571, "lr": 0.0003266282656944643, "epoch": 13.029350104821804, "percentage": 65.15, "elapsed_time": "1:03:46", "remaining_time": "0:34:06", "throughput": 4243.23, "total_tokens": 16234736} {"current_steps": 24865, "total_steps": 38160, "loss": 0.4022, "lr": 0.0003264137857970888, "epoch": 13.031970649895179, "percentage": 65.16, "elapsed_time": "1:03:46", "remaining_time": "0:34:06", "throughput": 4243.44, "total_tokens": 16239152} {"current_steps": 24870, "total_steps": 38160, "loss": 0.4134, "lr": 0.0003261993422119688, "epoch": 13.034591194968554, "percentage": 65.17, "elapsed_time": "1:03:47", "remaining_time": "0:34:05", "throughput": 4243.49, "total_tokens": 16242352} {"current_steps": 24875, "total_steps": 38160, "loss": 0.367, "lr": 0.00032598493498396365, "epoch": 13.03721174004193, "percentage": 65.19, "elapsed_time": "1:03:48", "remaining_time": "0:34:04", "throughput": 4243.64, "total_tokens": 16246416} {"current_steps": 24880, "total_steps": 38160, "loss": 0.3716, "lr": 0.0003257705641579247, "epoch": 13.039832285115304, "percentage": 65.2, "elapsed_time": "1:03:49", "remaining_time": "0:34:03", "throughput": 4243.75, "total_tokens": 16250192} {"current_steps": 24885, "total_steps": 38160, "loss": 0.406, "lr": 0.00032555622977869614, "epoch": 13.04245283018868, "percentage": 65.21, "elapsed_time": "1:03:50", "remaining_time": "0:34:03", "throughput": 4243.88, "total_tokens": 16254192} {"current_steps": 24890, "total_steps": 38160, "loss": 0.4259, "lr": 0.00032534193189111407, "epoch": 13.045073375262055, "percentage": 65.23, "elapsed_time": "1:03:50", "remaining_time": "0:34:02", "throughput": 4243.88, "total_tokens": 16257104} {"current_steps": 24895, "total_steps": 38160, "loss": 0.4329, "lr": 0.0003251276705400074, "epoch": 13.04769392033543, "percentage": 65.24, "elapsed_time": "1:03:51", "remaining_time": "0:34:01", "throughput": 4243.87, "total_tokens": 16259888} {"current_steps": 24900, "total_steps": 38160, "loss": 0.4168, "lr": 0.0003249134457701968, "epoch": 13.050314465408805, "percentage": 65.25, "elapsed_time": "1:03:52", "remaining_time": "0:34:00", "throughput": 4243.99, "total_tokens": 16263728} {"current_steps": 24905, "total_steps": 38160, "loss": 0.3518, "lr": 0.000324699257626496, "epoch": 13.05293501048218, "percentage": 65.26, "elapsed_time": "1:03:52", "remaining_time": "0:33:59", "throughput": 4243.97, "total_tokens": 16266576} {"current_steps": 24910, "total_steps": 38160, "loss": 0.3578, "lr": 0.00032448510615371045, "epoch": 13.055555555555555, "percentage": 65.28, "elapsed_time": "1:03:53", "remaining_time": "0:33:59", "throughput": 4243.92, "total_tokens": 16269104} {"current_steps": 24915, "total_steps": 38160, "loss": 0.5384, "lr": 0.0003242709913966384, "epoch": 13.05817610062893, "percentage": 65.29, "elapsed_time": "1:03:54", "remaining_time": "0:33:58", "throughput": 4243.93, "total_tokens": 16271984} {"current_steps": 24920, "total_steps": 38160, "loss": 0.5167, "lr": 0.00032405691340007, "epoch": 13.060796645702306, "percentage": 65.3, "elapsed_time": "1:03:55", "remaining_time": "0:33:57", "throughput": 4244.09, "total_tokens": 16276272} {"current_steps": 24925, "total_steps": 38160, "loss": 0.4383, "lr": 0.0003238428722087884, "epoch": 13.06341719077568, "percentage": 65.32, "elapsed_time": "1:03:55", "remaining_time": "0:33:56", "throughput": 4244.1, "total_tokens": 16279280} {"current_steps": 24930, "total_steps": 38160, "loss": 0.4051, "lr": 0.00032362886786756797, "epoch": 13.066037735849056, "percentage": 65.33, "elapsed_time": "1:03:56", "remaining_time": "0:33:56", "throughput": 4244.26, "total_tokens": 16283440} {"current_steps": 24935, "total_steps": 38160, "loss": 0.4695, "lr": 0.00032341490042117615, "epoch": 13.068658280922431, "percentage": 65.34, "elapsed_time": "1:03:57", "remaining_time": "0:33:55", "throughput": 4244.28, "total_tokens": 16286448} {"current_steps": 24940, "total_steps": 38160, "loss": 0.3277, "lr": 0.00032320096991437277, "epoch": 13.071278825995806, "percentage": 65.36, "elapsed_time": "1:03:57", "remaining_time": "0:33:54", "throughput": 4244.23, "total_tokens": 16289008} {"current_steps": 24945, "total_steps": 38160, "loss": 0.5603, "lr": 0.0003229870763919093, "epoch": 13.073899371069182, "percentage": 65.37, "elapsed_time": "1:03:58", "remaining_time": "0:33:53", "throughput": 4244.3, "total_tokens": 16292592} {"current_steps": 24950, "total_steps": 38160, "loss": 0.3735, "lr": 0.00032277321989853015, "epoch": 13.076519916142558, "percentage": 65.38, "elapsed_time": "1:03:59", "remaining_time": "0:33:52", "throughput": 4244.32, "total_tokens": 16295664} {"current_steps": 24955, "total_steps": 38160, "loss": 0.4121, "lr": 0.00032255940047897137, "epoch": 13.079140461215934, "percentage": 65.4, "elapsed_time": "1:04:00", "remaining_time": "0:33:51", "throughput": 4244.26, "total_tokens": 16298064} {"current_steps": 24960, "total_steps": 38160, "loss": 0.3194, "lr": 0.0003223456181779616, "epoch": 13.081761006289309, "percentage": 65.41, "elapsed_time": "1:04:00", "remaining_time": "0:33:51", "throughput": 4244.19, "total_tokens": 16300400} {"current_steps": 24965, "total_steps": 38160, "loss": 0.3916, "lr": 0.0003221318730402218, "epoch": 13.084381551362684, "percentage": 65.42, "elapsed_time": "1:04:01", "remaining_time": "0:33:50", "throughput": 4244.23, "total_tokens": 16303664} {"current_steps": 24970, "total_steps": 38160, "loss": 0.3964, "lr": 0.00032191816511046483, "epoch": 13.08700209643606, "percentage": 65.44, "elapsed_time": "1:04:02", "remaining_time": "0:33:49", "throughput": 4244.2, "total_tokens": 16306288} {"current_steps": 24975, "total_steps": 38160, "loss": 0.4815, "lr": 0.0003217044944333961, "epoch": 13.089622641509434, "percentage": 65.45, "elapsed_time": "1:04:02", "remaining_time": "0:33:48", "throughput": 4244.28, "total_tokens": 16309808} {"current_steps": 24980, "total_steps": 38160, "loss": 0.3674, "lr": 0.00032149086105371315, "epoch": 13.09224318658281, "percentage": 65.46, "elapsed_time": "1:04:03", "remaining_time": "0:33:47", "throughput": 4244.32, "total_tokens": 16313136} {"current_steps": 24985, "total_steps": 38160, "loss": 0.4199, "lr": 0.00032127726501610554, "epoch": 13.094863731656185, "percentage": 65.47, "elapsed_time": "1:04:04", "remaining_time": "0:33:47", "throughput": 4244.38, "total_tokens": 16316464} {"current_steps": 24990, "total_steps": 38160, "loss": 0.4312, "lr": 0.00032106370636525493, "epoch": 13.09748427672956, "percentage": 65.49, "elapsed_time": "1:04:04", "remaining_time": "0:33:46", "throughput": 4244.38, "total_tokens": 16319376} {"current_steps": 24995, "total_steps": 38160, "loss": 0.5762, "lr": 0.00032085018514583564, "epoch": 13.100104821802935, "percentage": 65.5, "elapsed_time": "1:04:05", "remaining_time": "0:33:45", "throughput": 4244.51, "total_tokens": 16323280} {"current_steps": 25000, "total_steps": 38160, "loss": 0.4152, "lr": 0.00032063670140251366, "epoch": 13.10272536687631, "percentage": 65.51, "elapsed_time": "1:04:06", "remaining_time": "0:33:44", "throughput": 4244.53, "total_tokens": 16326288} {"current_steps": 25005, "total_steps": 38160, "loss": 0.4534, "lr": 0.0003204232551799476, "epoch": 13.105345911949685, "percentage": 65.53, "elapsed_time": "1:04:07", "remaining_time": "0:33:43", "throughput": 4244.5, "total_tokens": 16329008} {"current_steps": 25010, "total_steps": 38160, "loss": 0.36, "lr": 0.00032020984652278797, "epoch": 13.10796645702306, "percentage": 65.54, "elapsed_time": "1:04:07", "remaining_time": "0:33:43", "throughput": 4244.44, "total_tokens": 16331408} {"current_steps": 25015, "total_steps": 38160, "loss": 0.4766, "lr": 0.000319996475475677, "epoch": 13.110587002096436, "percentage": 65.55, "elapsed_time": "1:04:08", "remaining_time": "0:33:42", "throughput": 4244.53, "total_tokens": 16335024} {"current_steps": 25020, "total_steps": 38160, "loss": 0.4278, "lr": 0.0003197831420832499, "epoch": 13.11320754716981, "percentage": 65.57, "elapsed_time": "1:04:09", "remaining_time": "0:33:41", "throughput": 4244.51, "total_tokens": 16337744} {"current_steps": 25025, "total_steps": 38160, "loss": 0.4648, "lr": 0.0003195698463901334, "epoch": 13.115828092243186, "percentage": 65.58, "elapsed_time": "1:04:09", "remaining_time": "0:33:40", "throughput": 4244.5, "total_tokens": 16340656} {"current_steps": 25030, "total_steps": 38160, "loss": 0.4759, "lr": 0.0003193565884409466, "epoch": 13.118448637316561, "percentage": 65.59, "elapsed_time": "1:04:10", "remaining_time": "0:33:39", "throughput": 4244.5, "total_tokens": 16343440} {"current_steps": 25035, "total_steps": 38160, "loss": 0.3356, "lr": 0.0003191433682803008, "epoch": 13.121069182389936, "percentage": 65.61, "elapsed_time": "1:04:11", "remaining_time": "0:33:39", "throughput": 4244.79, "total_tokens": 16349008} {"current_steps": 25040, "total_steps": 38160, "loss": 0.3522, "lr": 0.00031893018595279877, "epoch": 13.123689727463312, "percentage": 65.62, "elapsed_time": "1:04:12", "remaining_time": "0:33:38", "throughput": 4244.75, "total_tokens": 16351728} {"current_steps": 25045, "total_steps": 38160, "loss": 0.5028, "lr": 0.00031871704150303624, "epoch": 13.126310272536688, "percentage": 65.63, "elapsed_time": "1:04:12", "remaining_time": "0:33:37", "throughput": 4244.72, "total_tokens": 16354384} {"current_steps": 25050, "total_steps": 38160, "loss": 0.6667, "lr": 0.00031850393497560034, "epoch": 13.128930817610064, "percentage": 65.64, "elapsed_time": "1:04:13", "remaining_time": "0:33:36", "throughput": 4244.75, "total_tokens": 16357616} {"current_steps": 25055, "total_steps": 38160, "loss": 0.3956, "lr": 0.00031829086641507054, "epoch": 13.131551362683439, "percentage": 65.66, "elapsed_time": "1:04:14", "remaining_time": "0:33:35", "throughput": 4244.76, "total_tokens": 16360592} {"current_steps": 25060, "total_steps": 38160, "loss": 0.408, "lr": 0.00031807783586601865, "epoch": 13.134171907756814, "percentage": 65.67, "elapsed_time": "1:04:14", "remaining_time": "0:33:35", "throughput": 4244.78, "total_tokens": 16363600} {"current_steps": 25065, "total_steps": 38160, "loss": 0.3349, "lr": 0.00031786484337300805, "epoch": 13.13679245283019, "percentage": 65.68, "elapsed_time": "1:04:15", "remaining_time": "0:33:34", "throughput": 4244.76, "total_tokens": 16366352} {"current_steps": 25070, "total_steps": 38160, "loss": 0.3896, "lr": 0.0003176518889805941, "epoch": 13.139412997903564, "percentage": 65.7, "elapsed_time": "1:04:16", "remaining_time": "0:33:33", "throughput": 4244.73, "total_tokens": 16368944} {"current_steps": 25075, "total_steps": 38160, "loss": 0.3994, "lr": 0.0003174389727333248, "epoch": 13.14203354297694, "percentage": 65.71, "elapsed_time": "1:04:16", "remaining_time": "0:33:32", "throughput": 4244.74, "total_tokens": 16371952} {"current_steps": 25080, "total_steps": 38160, "loss": 0.4102, "lr": 0.00031722609467573946, "epoch": 13.144654088050315, "percentage": 65.72, "elapsed_time": "1:04:17", "remaining_time": "0:33:31", "throughput": 4244.73, "total_tokens": 16374704} {"current_steps": 25085, "total_steps": 38160, "loss": 0.4014, "lr": 0.0003170132548523701, "epoch": 13.14727463312369, "percentage": 65.74, "elapsed_time": "1:04:18", "remaining_time": "0:33:31", "throughput": 4244.73, "total_tokens": 16377584} {"current_steps": 25090, "total_steps": 38160, "loss": 0.531, "lr": 0.00031680045330774003, "epoch": 13.149895178197065, "percentage": 65.75, "elapsed_time": "1:04:19", "remaining_time": "0:33:30", "throughput": 4244.74, "total_tokens": 16380560} {"current_steps": 25095, "total_steps": 38160, "loss": 0.5134, "lr": 0.00031658769008636534, "epoch": 13.15251572327044, "percentage": 65.76, "elapsed_time": "1:04:19", "remaining_time": "0:33:29", "throughput": 4244.81, "total_tokens": 16384016} {"current_steps": 25100, "total_steps": 38160, "loss": 0.4428, "lr": 0.0003163749652327532, "epoch": 13.155136268343815, "percentage": 65.78, "elapsed_time": "1:04:20", "remaining_time": "0:33:28", "throughput": 4244.85, "total_tokens": 16387376} {"current_steps": 25105, "total_steps": 38160, "loss": 0.5026, "lr": 0.00031616227879140347, "epoch": 13.15775681341719, "percentage": 65.79, "elapsed_time": "1:04:21", "remaining_time": "0:33:27", "throughput": 4244.9, "total_tokens": 16390704} {"current_steps": 25110, "total_steps": 38160, "loss": 0.4012, "lr": 0.0003159496308068077, "epoch": 13.160377358490566, "percentage": 65.8, "elapsed_time": "1:04:22", "remaining_time": "0:33:27", "throughput": 4244.98, "total_tokens": 16394192} {"current_steps": 25115, "total_steps": 38160, "loss": 0.4016, "lr": 0.00031573702132344926, "epoch": 13.16299790356394, "percentage": 65.81, "elapsed_time": "1:04:22", "remaining_time": "0:33:26", "throughput": 4245.04, "total_tokens": 16397552} {"current_steps": 25120, "total_steps": 38160, "loss": 0.3799, "lr": 0.00031552445038580414, "epoch": 13.165618448637316, "percentage": 65.83, "elapsed_time": "1:04:23", "remaining_time": "0:33:25", "throughput": 4245.04, "total_tokens": 16400400} {"current_steps": 25125, "total_steps": 38160, "loss": 0.3673, "lr": 0.0003153119180383391, "epoch": 13.168238993710691, "percentage": 65.84, "elapsed_time": "1:04:24", "remaining_time": "0:33:24", "throughput": 4245.09, "total_tokens": 16403632} {"current_steps": 25130, "total_steps": 38160, "loss": 0.4368, "lr": 0.0003150994243255138, "epoch": 13.170859538784066, "percentage": 65.85, "elapsed_time": "1:04:24", "remaining_time": "0:33:23", "throughput": 4245.12, "total_tokens": 16406832} {"current_steps": 25135, "total_steps": 38160, "loss": 0.5263, "lr": 0.00031488696929177944, "epoch": 13.173480083857442, "percentage": 65.87, "elapsed_time": "1:04:25", "remaining_time": "0:33:23", "throughput": 4245.35, "total_tokens": 16411760} {"current_steps": 25140, "total_steps": 38160, "loss": 0.4141, "lr": 0.00031467455298157934, "epoch": 13.176100628930818, "percentage": 65.88, "elapsed_time": "1:04:26", "remaining_time": "0:33:22", "throughput": 4245.36, "total_tokens": 16414800} {"current_steps": 25145, "total_steps": 38160, "loss": 0.4173, "lr": 0.0003144621754393483, "epoch": 13.178721174004194, "percentage": 65.89, "elapsed_time": "1:04:27", "remaining_time": "0:33:21", "throughput": 4245.41, "total_tokens": 16418096} {"current_steps": 25150, "total_steps": 38160, "loss": 0.4796, "lr": 0.0003142498367095137, "epoch": 13.181341719077569, "percentage": 65.91, "elapsed_time": "1:04:28", "remaining_time": "0:33:20", "throughput": 4245.47, "total_tokens": 16421552} {"current_steps": 25155, "total_steps": 38160, "loss": 0.3749, "lr": 0.00031403753683649396, "epoch": 13.183962264150944, "percentage": 65.92, "elapsed_time": "1:04:28", "remaining_time": "0:33:20", "throughput": 4245.48, "total_tokens": 16424432} {"current_steps": 25160, "total_steps": 38160, "loss": 0.4403, "lr": 0.0003138252758646999, "epoch": 13.18658280922432, "percentage": 65.93, "elapsed_time": "1:04:29", "remaining_time": "0:33:19", "throughput": 4245.43, "total_tokens": 16426960} {"current_steps": 25165, "total_steps": 38160, "loss": 0.3188, "lr": 0.00031361305383853413, "epoch": 13.189203354297694, "percentage": 65.95, "elapsed_time": "1:04:30", "remaining_time": "0:33:18", "throughput": 4245.49, "total_tokens": 16430320} {"current_steps": 25170, "total_steps": 38160, "loss": 0.4474, "lr": 0.00031340087080239105, "epoch": 13.19182389937107, "percentage": 65.96, "elapsed_time": "1:04:30", "remaining_time": "0:33:17", "throughput": 4245.5, "total_tokens": 16433328} {"current_steps": 25175, "total_steps": 38160, "loss": 0.427, "lr": 0.0003131887268006571, "epoch": 13.194444444444445, "percentage": 65.97, "elapsed_time": "1:04:31", "remaining_time": "0:33:16", "throughput": 4245.55, "total_tokens": 16436688} {"current_steps": 25180, "total_steps": 38160, "loss": 0.3687, "lr": 0.00031297662187771026, "epoch": 13.19706498951782, "percentage": 65.99, "elapsed_time": "1:04:32", "remaining_time": "0:33:16", "throughput": 4245.59, "total_tokens": 16439856} {"current_steps": 25185, "total_steps": 38160, "loss": 0.3806, "lr": 0.0003127645560779203, "epoch": 13.199685534591195, "percentage": 66.0, "elapsed_time": "1:04:32", "remaining_time": "0:33:15", "throughput": 4245.55, "total_tokens": 16442480} {"current_steps": 25190, "total_steps": 38160, "loss": 0.3897, "lr": 0.0003125525294456492, "epoch": 13.20230607966457, "percentage": 66.01, "elapsed_time": "1:04:33", "remaining_time": "0:33:14", "throughput": 4245.66, "total_tokens": 16446192} {"current_steps": 25195, "total_steps": 38160, "loss": 0.3813, "lr": 0.0003123405420252503, "epoch": 13.204926624737945, "percentage": 66.02, "elapsed_time": "1:04:34", "remaining_time": "0:33:13", "throughput": 4245.67, "total_tokens": 16449200} {"current_steps": 25200, "total_steps": 38160, "loss": 0.5637, "lr": 0.00031212859386106927, "epoch": 13.20754716981132, "percentage": 66.04, "elapsed_time": "1:04:35", "remaining_time": "0:33:12", "throughput": 4245.68, "total_tokens": 16452112} {"current_steps": 25205, "total_steps": 38160, "loss": 0.5165, "lr": 0.00031191668499744286, "epoch": 13.210167714884696, "percentage": 66.05, "elapsed_time": "1:04:35", "remaining_time": "0:33:12", "throughput": 4245.77, "total_tokens": 16455760} {"current_steps": 25210, "total_steps": 38160, "loss": 0.4279, "lr": 0.00031170481547870046, "epoch": 13.21278825995807, "percentage": 66.06, "elapsed_time": "1:04:36", "remaining_time": "0:33:11", "throughput": 4245.78, "total_tokens": 16458704} {"current_steps": 25215, "total_steps": 38160, "loss": 0.4444, "lr": 0.00031149298534916215, "epoch": 13.215408805031446, "percentage": 66.08, "elapsed_time": "1:04:37", "remaining_time": "0:33:10", "throughput": 4245.79, "total_tokens": 16461680} {"current_steps": 25220, "total_steps": 38160, "loss": 0.4712, "lr": 0.00031128119465314094, "epoch": 13.218029350104821, "percentage": 66.09, "elapsed_time": "1:04:37", "remaining_time": "0:33:09", "throughput": 4245.79, "total_tokens": 16464496} {"current_steps": 25225, "total_steps": 38160, "loss": 0.3037, "lr": 0.0003110694434349406, "epoch": 13.220649895178196, "percentage": 66.1, "elapsed_time": "1:04:38", "remaining_time": "0:33:08", "throughput": 4245.74, "total_tokens": 16466992} {"current_steps": 25230, "total_steps": 38160, "loss": 0.4106, "lr": 0.0003108577317388574, "epoch": 13.223270440251572, "percentage": 66.12, "elapsed_time": "1:04:39", "remaining_time": "0:33:07", "throughput": 4245.68, "total_tokens": 16469392} {"current_steps": 25235, "total_steps": 38160, "loss": 0.539, "lr": 0.00031064605960917896, "epoch": 13.225890985324948, "percentage": 66.13, "elapsed_time": "1:04:39", "remaining_time": "0:33:07", "throughput": 4245.75, "total_tokens": 16472848} {"current_steps": 25240, "total_steps": 38160, "loss": 0.4651, "lr": 0.00031043442709018446, "epoch": 13.228511530398324, "percentage": 66.14, "elapsed_time": "1:04:40", "remaining_time": "0:33:06", "throughput": 4245.91, "total_tokens": 16477040} {"current_steps": 25245, "total_steps": 38160, "loss": 0.4954, "lr": 0.0003102228342261451, "epoch": 13.231132075471699, "percentage": 66.16, "elapsed_time": "1:04:41", "remaining_time": "0:33:05", "throughput": 4245.97, "total_tokens": 16480432} {"current_steps": 25250, "total_steps": 38160, "loss": 0.4277, "lr": 0.0003100112810613237, "epoch": 13.233752620545074, "percentage": 66.17, "elapsed_time": "1:04:42", "remaining_time": "0:33:04", "throughput": 4245.95, "total_tokens": 16483088} {"current_steps": 25255, "total_steps": 38160, "loss": 0.3725, "lr": 0.00030979976763997484, "epoch": 13.23637316561845, "percentage": 66.18, "elapsed_time": "1:04:42", "remaining_time": "0:33:04", "throughput": 4246.03, "total_tokens": 16486640} {"current_steps": 25260, "total_steps": 38160, "loss": 0.3411, "lr": 0.0003095882940063447, "epoch": 13.238993710691824, "percentage": 66.19, "elapsed_time": "1:04:43", "remaining_time": "0:33:03", "throughput": 4245.98, "total_tokens": 16489168} {"current_steps": 25265, "total_steps": 38160, "loss": 0.4978, "lr": 0.0003093768602046712, "epoch": 13.2416142557652, "percentage": 66.21, "elapsed_time": "1:04:44", "remaining_time": "0:33:02", "throughput": 4245.96, "total_tokens": 16491824} {"current_steps": 25270, "total_steps": 38160, "loss": 0.5388, "lr": 0.00030916546627918375, "epoch": 13.244234800838575, "percentage": 66.22, "elapsed_time": "1:04:44", "remaining_time": "0:33:01", "throughput": 4246.04, "total_tokens": 16495408} {"current_steps": 25275, "total_steps": 38160, "loss": 0.4264, "lr": 0.00030895411227410354, "epoch": 13.24685534591195, "percentage": 66.23, "elapsed_time": "1:04:45", "remaining_time": "0:33:00", "throughput": 4246.15, "total_tokens": 16499280} {"current_steps": 25280, "total_steps": 38160, "loss": 0.3821, "lr": 0.0003087427982336435, "epoch": 13.249475890985325, "percentage": 66.25, "elapsed_time": "1:04:46", "remaining_time": "0:33:00", "throughput": 4246.17, "total_tokens": 16502352} {"current_steps": 25285, "total_steps": 38160, "loss": 0.5734, "lr": 0.00030853152420200804, "epoch": 13.2520964360587, "percentage": 66.26, "elapsed_time": "1:04:47", "remaining_time": "0:32:59", "throughput": 4246.2, "total_tokens": 16505456} {"current_steps": 25290, "total_steps": 38160, "loss": 0.394, "lr": 0.0003083202902233932, "epoch": 13.254716981132075, "percentage": 66.27, "elapsed_time": "1:04:47", "remaining_time": "0:32:58", "throughput": 4246.22, "total_tokens": 16508464} {"current_steps": 25295, "total_steps": 38160, "loss": 0.3944, "lr": 0.00030810909634198727, "epoch": 13.25733752620545, "percentage": 66.29, "elapsed_time": "1:04:48", "remaining_time": "0:32:57", "throughput": 4246.23, "total_tokens": 16511440} {"current_steps": 25300, "total_steps": 38160, "loss": 0.3933, "lr": 0.00030789794260196893, "epoch": 13.259958071278826, "percentage": 66.3, "elapsed_time": "1:04:49", "remaining_time": "0:32:56", "throughput": 4246.29, "total_tokens": 16514800} {"current_steps": 25305, "total_steps": 38160, "loss": 0.3844, "lr": 0.00030768682904750935, "epoch": 13.2625786163522, "percentage": 66.31, "elapsed_time": "1:04:49", "remaining_time": "0:32:56", "throughput": 4246.25, "total_tokens": 16517488} {"current_steps": 25310, "total_steps": 38160, "loss": 0.4775, "lr": 0.00030747575572277107, "epoch": 13.265199161425576, "percentage": 66.33, "elapsed_time": "1:04:50", "remaining_time": "0:32:55", "throughput": 4246.27, "total_tokens": 16520528} {"current_steps": 25315, "total_steps": 38160, "loss": 0.3996, "lr": 0.0003072647226719083, "epoch": 13.267819706498951, "percentage": 66.34, "elapsed_time": "1:04:51", "remaining_time": "0:32:54", "throughput": 4246.36, "total_tokens": 16524144} {"current_steps": 25320, "total_steps": 38160, "loss": 0.3744, "lr": 0.0003070537299390669, "epoch": 13.270440251572326, "percentage": 66.35, "elapsed_time": "1:04:52", "remaining_time": "0:32:53", "throughput": 4246.33, "total_tokens": 16526768} {"current_steps": 25325, "total_steps": 38160, "loss": 0.5481, "lr": 0.0003068427775683838, "epoch": 13.273060796645701, "percentage": 66.37, "elapsed_time": "1:04:52", "remaining_time": "0:32:52", "throughput": 4246.49, "total_tokens": 16531088} {"current_steps": 25330, "total_steps": 38160, "loss": 0.4553, "lr": 0.00030663186560398793, "epoch": 13.275681341719078, "percentage": 66.38, "elapsed_time": "1:04:53", "remaining_time": "0:32:52", "throughput": 4246.48, "total_tokens": 16533904} {"current_steps": 25335, "total_steps": 38160, "loss": 0.5308, "lr": 0.0003064209940899998, "epoch": 13.278301886792454, "percentage": 66.39, "elapsed_time": "1:04:54", "remaining_time": "0:32:51", "throughput": 4246.52, "total_tokens": 16537104} {"current_steps": 25340, "total_steps": 38160, "loss": 0.3238, "lr": 0.00030621016307053105, "epoch": 13.280922431865829, "percentage": 66.4, "elapsed_time": "1:04:54", "remaining_time": "0:32:50", "throughput": 4246.55, "total_tokens": 16540240} {"current_steps": 25345, "total_steps": 38160, "loss": 0.4443, "lr": 0.0003059993725896855, "epoch": 13.283542976939204, "percentage": 66.42, "elapsed_time": "1:04:55", "remaining_time": "0:32:49", "throughput": 4246.55, "total_tokens": 16543248} {"current_steps": 25350, "total_steps": 38160, "loss": 0.4429, "lr": 0.0003057886226915581, "epoch": 13.286163522012579, "percentage": 66.43, "elapsed_time": "1:04:56", "remaining_time": "0:32:48", "throughput": 4246.58, "total_tokens": 16546544} {"current_steps": 25355, "total_steps": 38160, "loss": 0.4728, "lr": 0.00030557791342023476, "epoch": 13.288784067085954, "percentage": 66.44, "elapsed_time": "1:04:57", "remaining_time": "0:32:48", "throughput": 4246.62, "total_tokens": 16549744} {"current_steps": 25360, "total_steps": 38160, "loss": 0.5453, "lr": 0.0003053672448197941, "epoch": 13.29140461215933, "percentage": 66.46, "elapsed_time": "1:04:57", "remaining_time": "0:32:47", "throughput": 4246.62, "total_tokens": 16552656} {"current_steps": 25365, "total_steps": 38160, "loss": 0.7457, "lr": 0.0003051566169343052, "epoch": 13.294025157232705, "percentage": 66.47, "elapsed_time": "1:04:58", "remaining_time": "0:32:46", "throughput": 4246.65, "total_tokens": 16555824} {"current_steps": 25370, "total_steps": 38160, "loss": 0.4338, "lr": 0.00030494602980782917, "epoch": 13.29664570230608, "percentage": 66.48, "elapsed_time": "1:04:59", "remaining_time": "0:32:45", "throughput": 4246.7, "total_tokens": 16559056} {"current_steps": 25375, "total_steps": 38160, "loss": 0.3174, "lr": 0.00030473548348441845, "epoch": 13.299266247379455, "percentage": 66.5, "elapsed_time": "1:04:59", "remaining_time": "0:32:44", "throughput": 4246.67, "total_tokens": 16561744} {"current_steps": 25380, "total_steps": 38160, "loss": 0.4161, "lr": 0.000304524978008117, "epoch": 13.30188679245283, "percentage": 66.51, "elapsed_time": "1:05:00", "remaining_time": "0:32:44", "throughput": 4246.69, "total_tokens": 16564784} {"current_steps": 25385, "total_steps": 38160, "loss": 0.4984, "lr": 0.0003043145134229599, "epoch": 13.304507337526205, "percentage": 66.52, "elapsed_time": "1:05:01", "remaining_time": "0:32:43", "throughput": 4246.65, "total_tokens": 16567280} {"current_steps": 25390, "total_steps": 38160, "loss": 0.4461, "lr": 0.0003041040897729742, "epoch": 13.30712788259958, "percentage": 66.54, "elapsed_time": "1:05:01", "remaining_time": "0:32:42", "throughput": 4246.61, "total_tokens": 16569840} {"current_steps": 25395, "total_steps": 38160, "loss": 0.4929, "lr": 0.0003038937071021778, "epoch": 13.309748427672956, "percentage": 66.55, "elapsed_time": "1:05:02", "remaining_time": "0:32:41", "throughput": 4246.64, "total_tokens": 16572976} {"current_steps": 25400, "total_steps": 38160, "loss": 0.4637, "lr": 0.0003036833654545808, "epoch": 13.31236897274633, "percentage": 66.56, "elapsed_time": "1:05:03", "remaining_time": "0:32:40", "throughput": 4246.64, "total_tokens": 16575792} {"current_steps": 25405, "total_steps": 38160, "loss": 0.4486, "lr": 0.0003034730648741841, "epoch": 13.314989517819706, "percentage": 66.57, "elapsed_time": "1:05:03", "remaining_time": "0:32:40", "throughput": 4246.66, "total_tokens": 16578800} {"current_steps": 25410, "total_steps": 38160, "loss": 0.4268, "lr": 0.00030326280540497996, "epoch": 13.317610062893081, "percentage": 66.59, "elapsed_time": "1:05:04", "remaining_time": "0:32:39", "throughput": 4246.8, "total_tokens": 16582864} {"current_steps": 25415, "total_steps": 38160, "loss": 0.606, "lr": 0.0003030525870909525, "epoch": 13.320230607966456, "percentage": 66.6, "elapsed_time": "1:05:05", "remaining_time": "0:32:38", "throughput": 4246.83, "total_tokens": 16585968} {"current_steps": 25420, "total_steps": 38160, "loss": 0.4532, "lr": 0.0003028424099760768, "epoch": 13.322851153039831, "percentage": 66.61, "elapsed_time": "1:05:06", "remaining_time": "0:32:37", "throughput": 4247.23, "total_tokens": 16592752} {"current_steps": 25425, "total_steps": 38160, "loss": 0.5094, "lr": 0.0003026322741043198, "epoch": 13.325471698113208, "percentage": 66.63, "elapsed_time": "1:05:07", "remaining_time": "0:32:37", "throughput": 4247.23, "total_tokens": 16595632} {"current_steps": 25430, "total_steps": 38160, "loss": 0.4875, "lr": 0.0003024221795196393, "epoch": 13.328092243186584, "percentage": 66.64, "elapsed_time": "1:05:08", "remaining_time": "0:32:36", "throughput": 4247.18, "total_tokens": 16598096} {"current_steps": 25435, "total_steps": 38160, "loss": 0.413, "lr": 0.0003022121262659849, "epoch": 13.330712788259959, "percentage": 66.65, "elapsed_time": "1:05:08", "remaining_time": "0:32:35", "throughput": 4247.19, "total_tokens": 16601040} {"current_steps": 25440, "total_steps": 38160, "loss": 0.5357, "lr": 0.00030200211438729705, "epoch": 13.333333333333334, "percentage": 66.67, "elapsed_time": "1:05:09", "remaining_time": "0:32:34", "throughput": 4247.2, "total_tokens": 16603984} {"current_steps": 25445, "total_steps": 38160, "loss": 0.4883, "lr": 0.000301792143927508, "epoch": 13.335953878406709, "percentage": 66.68, "elapsed_time": "1:05:10", "remaining_time": "0:32:33", "throughput": 4247.25, "total_tokens": 16607280} {"current_steps": 25450, "total_steps": 38160, "loss": 0.4161, "lr": 0.0003015822149305411, "epoch": 13.338574423480084, "percentage": 66.69, "elapsed_time": "1:05:10", "remaining_time": "0:32:33", "throughput": 4247.31, "total_tokens": 16610576} {"current_steps": 25455, "total_steps": 38160, "loss": 0.4775, "lr": 0.0003013723274403113, "epoch": 13.34119496855346, "percentage": 66.71, "elapsed_time": "1:05:11", "remaining_time": "0:32:32", "throughput": 4247.55, "total_tokens": 16615728} {"current_steps": 25460, "total_steps": 38160, "loss": 0.47, "lr": 0.00030116248150072444, "epoch": 13.343815513626835, "percentage": 66.72, "elapsed_time": "1:05:12", "remaining_time": "0:32:31", "throughput": 4247.54, "total_tokens": 16618576} {"current_steps": 25465, "total_steps": 38160, "loss": 0.4333, "lr": 0.00030095267715567816, "epoch": 13.34643605870021, "percentage": 66.73, "elapsed_time": "1:05:13", "remaining_time": "0:32:30", "throughput": 4247.7, "total_tokens": 16622832} {"current_steps": 25470, "total_steps": 38160, "loss": 0.3891, "lr": 0.00030074291444906085, "epoch": 13.349056603773585, "percentage": 66.75, "elapsed_time": "1:05:13", "remaining_time": "0:32:30", "throughput": 4247.63, "total_tokens": 16625168} {"current_steps": 25475, "total_steps": 38160, "loss": 0.4146, "lr": 0.00030053319342475247, "epoch": 13.35167714884696, "percentage": 66.76, "elapsed_time": "1:05:14", "remaining_time": "0:32:29", "throughput": 4247.74, "total_tokens": 16628944} {"current_steps": 25480, "total_steps": 38160, "loss": 0.4132, "lr": 0.00030032351412662465, "epoch": 13.354297693920335, "percentage": 66.77, "elapsed_time": "1:05:15", "remaining_time": "0:32:28", "throughput": 4247.79, "total_tokens": 16632208} {"current_steps": 25485, "total_steps": 38160, "loss": 0.4333, "lr": 0.0003001138765985394, "epoch": 13.35691823899371, "percentage": 66.78, "elapsed_time": "1:05:16", "remaining_time": "0:32:27", "throughput": 4247.76, "total_tokens": 16634960} {"current_steps": 25490, "total_steps": 38160, "loss": 0.4132, "lr": 0.00029990428088435097, "epoch": 13.359538784067086, "percentage": 66.8, "elapsed_time": "1:05:16", "remaining_time": "0:32:26", "throughput": 4247.73, "total_tokens": 16637616} {"current_steps": 25495, "total_steps": 38160, "loss": 0.4864, "lr": 0.000299694727027904, "epoch": 13.36215932914046, "percentage": 66.81, "elapsed_time": "1:05:17", "remaining_time": "0:32:26", "throughput": 4247.77, "total_tokens": 16640880} {"current_steps": 25500, "total_steps": 38160, "loss": 0.4037, "lr": 0.00029948521507303495, "epoch": 13.364779874213836, "percentage": 66.82, "elapsed_time": "1:05:18", "remaining_time": "0:32:25", "throughput": 4247.73, "total_tokens": 16643504} {"current_steps": 25505, "total_steps": 38160, "loss": 0.4191, "lr": 0.0002992757450635714, "epoch": 13.367400419287211, "percentage": 66.84, "elapsed_time": "1:05:18", "remaining_time": "0:32:24", "throughput": 4247.82, "total_tokens": 16647120} {"current_steps": 25510, "total_steps": 38160, "loss": 0.446, "lr": 0.00029906631704333187, "epoch": 13.370020964360586, "percentage": 66.85, "elapsed_time": "1:05:19", "remaining_time": "0:32:23", "throughput": 4247.95, "total_tokens": 16651248} {"current_steps": 25515, "total_steps": 38160, "loss": 0.3254, "lr": 0.0002988569310561264, "epoch": 13.372641509433961, "percentage": 66.86, "elapsed_time": "1:05:20", "remaining_time": "0:32:22", "throughput": 4247.9, "total_tokens": 16653744} {"current_steps": 25520, "total_steps": 38160, "loss": 0.3403, "lr": 0.0002986475871457566, "epoch": 13.375262054507338, "percentage": 66.88, "elapsed_time": "1:05:21", "remaining_time": "0:32:22", "throughput": 4247.91, "total_tokens": 16656752} {"current_steps": 25525, "total_steps": 38160, "loss": 0.3861, "lr": 0.000298438285356014, "epoch": 13.377882599580714, "percentage": 66.89, "elapsed_time": "1:05:21", "remaining_time": "0:32:21", "throughput": 4247.94, "total_tokens": 16659984} {"current_steps": 25530, "total_steps": 38160, "loss": 0.4718, "lr": 0.00029822902573068257, "epoch": 13.380503144654089, "percentage": 66.9, "elapsed_time": "1:05:22", "remaining_time": "0:32:20", "throughput": 4248.01, "total_tokens": 16663440} {"current_steps": 25535, "total_steps": 38160, "loss": 0.4315, "lr": 0.0002980198083135372, "epoch": 13.383123689727464, "percentage": 66.92, "elapsed_time": "1:05:23", "remaining_time": "0:32:19", "throughput": 4248.14, "total_tokens": 16667440} {"current_steps": 25540, "total_steps": 38160, "loss": 0.4739, "lr": 0.0002978106331483435, "epoch": 13.385744234800839, "percentage": 66.93, "elapsed_time": "1:05:24", "remaining_time": "0:32:19", "throughput": 4248.13, "total_tokens": 16670256} {"current_steps": 25545, "total_steps": 38160, "loss": 0.4063, "lr": 0.00029760150027885874, "epoch": 13.388364779874214, "percentage": 66.94, "elapsed_time": "1:05:24", "remaining_time": "0:32:18", "throughput": 4248.12, "total_tokens": 16673040} {"current_steps": 25550, "total_steps": 38160, "loss": 0.4029, "lr": 0.0002973924097488311, "epoch": 13.39098532494759, "percentage": 66.95, "elapsed_time": "1:05:25", "remaining_time": "0:32:17", "throughput": 4248.13, "total_tokens": 16676016} {"current_steps": 25555, "total_steps": 38160, "loss": 0.4456, "lr": 0.00029718336160199977, "epoch": 13.393605870020965, "percentage": 66.97, "elapsed_time": "1:05:26", "remaining_time": "0:32:16", "throughput": 4248.2, "total_tokens": 16679536} {"current_steps": 25560, "total_steps": 38160, "loss": 0.4485, "lr": 0.00029697435588209537, "epoch": 13.39622641509434, "percentage": 66.98, "elapsed_time": "1:05:26", "remaining_time": "0:32:15", "throughput": 4248.23, "total_tokens": 16682672} {"current_steps": 25565, "total_steps": 38160, "loss": 0.3726, "lr": 0.00029676539263283943, "epoch": 13.398846960167715, "percentage": 66.99, "elapsed_time": "1:05:27", "remaining_time": "0:32:15", "throughput": 4248.22, "total_tokens": 16685424} {"current_steps": 25570, "total_steps": 38160, "loss": 0.5266, "lr": 0.0002965564718979448, "epoch": 13.40146750524109, "percentage": 67.01, "elapsed_time": "1:05:28", "remaining_time": "0:32:14", "throughput": 4248.33, "total_tokens": 16689328} {"current_steps": 25575, "total_steps": 38160, "loss": 0.3734, "lr": 0.0002963475937211151, "epoch": 13.404088050314465, "percentage": 67.02, "elapsed_time": "1:05:29", "remaining_time": "0:32:13", "throughput": 4248.39, "total_tokens": 16692656} {"current_steps": 25580, "total_steps": 38160, "loss": 0.4899, "lr": 0.0002961387581460456, "epoch": 13.40670859538784, "percentage": 67.03, "elapsed_time": "1:05:30", "remaining_time": "0:32:12", "throughput": 4248.54, "total_tokens": 16696912} {"current_steps": 25585, "total_steps": 38160, "loss": 0.4921, "lr": 0.0002959299652164221, "epoch": 13.409329140461216, "percentage": 67.05, "elapsed_time": "1:05:30", "remaining_time": "0:32:11", "throughput": 4248.52, "total_tokens": 16699600} {"current_steps": 25590, "total_steps": 38160, "loss": 0.5146, "lr": 0.00029572121497592154, "epoch": 13.41194968553459, "percentage": 67.06, "elapsed_time": "1:05:31", "remaining_time": "0:32:11", "throughput": 4248.53, "total_tokens": 16702608} {"current_steps": 25595, "total_steps": 38160, "loss": 0.3582, "lr": 0.00029551250746821236, "epoch": 13.414570230607966, "percentage": 67.07, "elapsed_time": "1:05:32", "remaining_time": "0:32:10", "throughput": 4248.58, "total_tokens": 16705968} {"current_steps": 25600, "total_steps": 38160, "loss": 0.4707, "lr": 0.0002953038427369537, "epoch": 13.417190775681341, "percentage": 67.09, "elapsed_time": "1:05:32", "remaining_time": "0:32:09", "throughput": 4248.76, "total_tokens": 16710320} {"current_steps": 25605, "total_steps": 38160, "loss": 0.437, "lr": 0.000295095220825796, "epoch": 13.419811320754716, "percentage": 67.1, "elapsed_time": "1:05:33", "remaining_time": "0:32:08", "throughput": 4248.76, "total_tokens": 16713200} {"current_steps": 25610, "total_steps": 38160, "loss": 0.4364, "lr": 0.00029488664177838023, "epoch": 13.422431865828091, "percentage": 67.11, "elapsed_time": "1:05:34", "remaining_time": "0:32:08", "throughput": 4248.77, "total_tokens": 16716176} {"current_steps": 25615, "total_steps": 38160, "loss": 0.3963, "lr": 0.0002946781056383391, "epoch": 13.425052410901468, "percentage": 67.13, "elapsed_time": "1:05:35", "remaining_time": "0:32:07", "throughput": 4248.81, "total_tokens": 16719504} {"current_steps": 25620, "total_steps": 38160, "loss": 0.419, "lr": 0.0002944696124492956, "epoch": 13.427672955974844, "percentage": 67.14, "elapsed_time": "1:05:36", "remaining_time": "0:32:06", "throughput": 4249.02, "total_tokens": 16724176} {"current_steps": 25625, "total_steps": 38160, "loss": 0.2662, "lr": 0.0002942611622548645, "epoch": 13.430293501048219, "percentage": 67.15, "elapsed_time": "1:05:36", "remaining_time": "0:32:05", "throughput": 4249.05, "total_tokens": 16727344} {"current_steps": 25630, "total_steps": 38160, "loss": 0.4267, "lr": 0.00029405275509865103, "epoch": 13.432914046121594, "percentage": 67.16, "elapsed_time": "1:05:37", "remaining_time": "0:32:04", "throughput": 4249.04, "total_tokens": 16730256} {"current_steps": 25635, "total_steps": 38160, "loss": 0.5198, "lr": 0.00029384439102425174, "epoch": 13.435534591194969, "percentage": 67.18, "elapsed_time": "1:05:38", "remaining_time": "0:32:04", "throughput": 4249.05, "total_tokens": 16733168} {"current_steps": 25640, "total_steps": 38160, "loss": 0.5226, "lr": 0.0002936360700752539, "epoch": 13.438155136268344, "percentage": 67.19, "elapsed_time": "1:05:38", "remaining_time": "0:32:03", "throughput": 4249.14, "total_tokens": 16736816} {"current_steps": 25645, "total_steps": 38160, "loss": 0.3794, "lr": 0.00029342779229523573, "epoch": 13.44077568134172, "percentage": 67.2, "elapsed_time": "1:05:39", "remaining_time": "0:32:02", "throughput": 4249.13, "total_tokens": 16739632} {"current_steps": 25650, "total_steps": 38160, "loss": 0.383, "lr": 0.00029321955772776675, "epoch": 13.443396226415095, "percentage": 67.22, "elapsed_time": "1:05:40", "remaining_time": "0:32:01", "throughput": 4249.28, "total_tokens": 16743792} {"current_steps": 25655, "total_steps": 38160, "loss": 0.3305, "lr": 0.00029301136641640723, "epoch": 13.44601677148847, "percentage": 67.23, "elapsed_time": "1:05:41", "remaining_time": "0:32:01", "throughput": 4249.37, "total_tokens": 16747504} {"current_steps": 25660, "total_steps": 38160, "loss": 0.3724, "lr": 0.0002928032184047085, "epoch": 13.448637316561845, "percentage": 67.24, "elapsed_time": "1:05:41", "remaining_time": "0:32:00", "throughput": 4249.48, "total_tokens": 16751312} {"current_steps": 25665, "total_steps": 38160, "loss": 0.4017, "lr": 0.0002925951137362126, "epoch": 13.45125786163522, "percentage": 67.26, "elapsed_time": "1:05:42", "remaining_time": "0:31:59", "throughput": 4249.55, "total_tokens": 16754768} {"current_steps": 25670, "total_steps": 38160, "loss": 0.4237, "lr": 0.00029238705245445264, "epoch": 13.453878406708595, "percentage": 67.27, "elapsed_time": "1:05:43", "remaining_time": "0:31:58", "throughput": 4249.53, "total_tokens": 16757488} {"current_steps": 25675, "total_steps": 38160, "loss": 0.4815, "lr": 0.0002921790346029527, "epoch": 13.45649895178197, "percentage": 67.28, "elapsed_time": "1:05:44", "remaining_time": "0:31:57", "throughput": 4249.48, "total_tokens": 16760048} {"current_steps": 25680, "total_steps": 38160, "loss": 0.5181, "lr": 0.0002919710602252279, "epoch": 13.459119496855346, "percentage": 67.3, "elapsed_time": "1:05:44", "remaining_time": "0:31:57", "throughput": 4249.51, "total_tokens": 16763152} {"current_steps": 25685, "total_steps": 38160, "loss": 0.4193, "lr": 0.0002917631293647838, "epoch": 13.46174004192872, "percentage": 67.31, "elapsed_time": "1:05:45", "remaining_time": "0:31:56", "throughput": 4249.59, "total_tokens": 16766608} {"current_steps": 25690, "total_steps": 38160, "loss": 0.7365, "lr": 0.0002915552420651176, "epoch": 13.464360587002096, "percentage": 67.32, "elapsed_time": "1:05:46", "remaining_time": "0:31:55", "throughput": 4249.99, "total_tokens": 16773584} {"current_steps": 25695, "total_steps": 38160, "loss": 0.3426, "lr": 0.00029134739836971657, "epoch": 13.466981132075471, "percentage": 67.33, "elapsed_time": "1:05:47", "remaining_time": "0:31:54", "throughput": 4250.04, "total_tokens": 16776976} {"current_steps": 25700, "total_steps": 38160, "loss": 0.3537, "lr": 0.0002911395983220595, "epoch": 13.469601677148846, "percentage": 67.35, "elapsed_time": "1:05:48", "remaining_time": "0:31:54", "throughput": 4250.0, "total_tokens": 16779568} {"current_steps": 25705, "total_steps": 38160, "loss": 0.5102, "lr": 0.0002909318419656154, "epoch": 13.472222222222221, "percentage": 67.36, "elapsed_time": "1:05:48", "remaining_time": "0:31:53", "throughput": 4250.02, "total_tokens": 16782576} {"current_steps": 25710, "total_steps": 38160, "loss": 0.4478, "lr": 0.00029072412934384484, "epoch": 13.474842767295598, "percentage": 67.37, "elapsed_time": "1:05:49", "remaining_time": "0:31:52", "throughput": 4250.08, "total_tokens": 16785968} {"current_steps": 25715, "total_steps": 38160, "loss": 0.52, "lr": 0.00029051646050019884, "epoch": 13.477463312368974, "percentage": 67.39, "elapsed_time": "1:05:50", "remaining_time": "0:31:51", "throughput": 4250.2, "total_tokens": 16789872} {"current_steps": 25720, "total_steps": 38160, "loss": 0.3665, "lr": 0.00029030883547811966, "epoch": 13.480083857442349, "percentage": 67.4, "elapsed_time": "1:05:51", "remaining_time": "0:31:51", "throughput": 4250.22, "total_tokens": 16792944} {"current_steps": 25725, "total_steps": 38160, "loss": 0.3392, "lr": 0.0002901012543210397, "epoch": 13.482704402515724, "percentage": 67.41, "elapsed_time": "1:05:51", "remaining_time": "0:31:50", "throughput": 4250.26, "total_tokens": 16796176} {"current_steps": 25730, "total_steps": 38160, "loss": 0.4537, "lr": 0.00028989371707238264, "epoch": 13.485324947589099, "percentage": 67.43, "elapsed_time": "1:05:52", "remaining_time": "0:31:49", "throughput": 4250.3, "total_tokens": 16799504} {"current_steps": 25735, "total_steps": 38160, "loss": 0.4152, "lr": 0.00028968622377556285, "epoch": 13.487945492662474, "percentage": 67.44, "elapsed_time": "1:05:53", "remaining_time": "0:31:48", "throughput": 4250.3, "total_tokens": 16802384} {"current_steps": 25740, "total_steps": 38160, "loss": 0.3576, "lr": 0.00028947877447398567, "epoch": 13.49056603773585, "percentage": 67.45, "elapsed_time": "1:05:53", "remaining_time": "0:31:47", "throughput": 4250.4, "total_tokens": 16806064} {"current_steps": 25745, "total_steps": 38160, "loss": 0.511, "lr": 0.00028927136921104733, "epoch": 13.493186582809225, "percentage": 67.47, "elapsed_time": "1:05:54", "remaining_time": "0:31:47", "throughput": 4250.36, "total_tokens": 16808560} {"current_steps": 25750, "total_steps": 38160, "loss": 0.606, "lr": 0.00028906400803013446, "epoch": 13.4958071278826, "percentage": 67.48, "elapsed_time": "1:05:55", "remaining_time": "0:31:46", "throughput": 4250.39, "total_tokens": 16811696} {"current_steps": 25755, "total_steps": 38160, "loss": 0.369, "lr": 0.00028885669097462435, "epoch": 13.498427672955975, "percentage": 67.49, "elapsed_time": "1:05:56", "remaining_time": "0:31:45", "throughput": 4250.51, "total_tokens": 16815600} {"current_steps": 25760, "total_steps": 38160, "loss": 0.3211, "lr": 0.0002886494180878857, "epoch": 13.50104821802935, "percentage": 67.51, "elapsed_time": "1:05:56", "remaining_time": "0:31:44", "throughput": 4250.46, "total_tokens": 16818064} {"current_steps": 25765, "total_steps": 38160, "loss": 0.4336, "lr": 0.00028844218941327757, "epoch": 13.503668763102725, "percentage": 67.52, "elapsed_time": "1:05:57", "remaining_time": "0:31:43", "throughput": 4250.48, "total_tokens": 16821104} {"current_steps": 25770, "total_steps": 38160, "loss": 0.3712, "lr": 0.0002882350049941498, "epoch": 13.5062893081761, "percentage": 67.53, "elapsed_time": "1:05:58", "remaining_time": "0:31:43", "throughput": 4250.59, "total_tokens": 16824848} {"current_steps": 25775, "total_steps": 38160, "loss": 0.3964, "lr": 0.0002880278648738432, "epoch": 13.508909853249476, "percentage": 67.54, "elapsed_time": "1:05:58", "remaining_time": "0:31:42", "throughput": 4250.64, "total_tokens": 16828144} {"current_steps": 25780, "total_steps": 38160, "loss": 0.4377, "lr": 0.0002878207690956891, "epoch": 13.51153039832285, "percentage": 67.56, "elapsed_time": "1:05:59", "remaining_time": "0:31:41", "throughput": 4250.68, "total_tokens": 16831408} {"current_steps": 25785, "total_steps": 38160, "loss": 0.5307, "lr": 0.00028761371770300915, "epoch": 13.514150943396226, "percentage": 67.57, "elapsed_time": "1:06:00", "remaining_time": "0:31:40", "throughput": 4250.72, "total_tokens": 16834544} {"current_steps": 25790, "total_steps": 38160, "loss": 0.5539, "lr": 0.0002874067107391164, "epoch": 13.516771488469601, "percentage": 67.58, "elapsed_time": "1:06:01", "remaining_time": "0:31:39", "throughput": 4250.72, "total_tokens": 16837360} {"current_steps": 25795, "total_steps": 38160, "loss": 0.3911, "lr": 0.00028719974824731445, "epoch": 13.519392033542976, "percentage": 67.6, "elapsed_time": "1:06:01", "remaining_time": "0:31:39", "throughput": 4250.7, "total_tokens": 16840176} {"current_steps": 25800, "total_steps": 38160, "loss": 0.4586, "lr": 0.0002869928302708975, "epoch": 13.522012578616351, "percentage": 67.61, "elapsed_time": "1:06:02", "remaining_time": "0:31:38", "throughput": 4250.82, "total_tokens": 16844080} {"current_steps": 25805, "total_steps": 38160, "loss": 0.3891, "lr": 0.00028678595685315044, "epoch": 13.524633123689728, "percentage": 67.62, "elapsed_time": "1:06:03", "remaining_time": "0:31:37", "throughput": 4250.82, "total_tokens": 16846928} {"current_steps": 25810, "total_steps": 38160, "loss": 0.4514, "lr": 0.00028657912803734854, "epoch": 13.527253668763104, "percentage": 67.64, "elapsed_time": "1:06:03", "remaining_time": "0:31:36", "throughput": 4250.82, "total_tokens": 16849840} {"current_steps": 25815, "total_steps": 38160, "loss": 0.3618, "lr": 0.00028637234386675816, "epoch": 13.529874213836479, "percentage": 67.65, "elapsed_time": "1:06:04", "remaining_time": "0:31:35", "throughput": 4250.88, "total_tokens": 16853328} {"current_steps": 25820, "total_steps": 38160, "loss": 0.4805, "lr": 0.00028616560438463626, "epoch": 13.532494758909854, "percentage": 67.66, "elapsed_time": "1:06:05", "remaining_time": "0:31:35", "throughput": 4250.87, "total_tokens": 16856080} {"current_steps": 25825, "total_steps": 38160, "loss": 0.3617, "lr": 0.00028595890963423057, "epoch": 13.535115303983229, "percentage": 67.68, "elapsed_time": "1:06:06", "remaining_time": "0:31:34", "throughput": 4250.88, "total_tokens": 16858992} {"current_steps": 25830, "total_steps": 38160, "loss": 0.4013, "lr": 0.0002857522596587789, "epoch": 13.537735849056604, "percentage": 67.69, "elapsed_time": "1:06:06", "remaining_time": "0:31:33", "throughput": 4250.88, "total_tokens": 16861968} {"current_steps": 25835, "total_steps": 38160, "loss": 0.3946, "lr": 0.00028554565450151045, "epoch": 13.54035639412998, "percentage": 67.7, "elapsed_time": "1:06:07", "remaining_time": "0:31:32", "throughput": 4250.94, "total_tokens": 16865232} {"current_steps": 25840, "total_steps": 38160, "loss": 0.3882, "lr": 0.00028533909420564417, "epoch": 13.542976939203355, "percentage": 67.71, "elapsed_time": "1:06:08", "remaining_time": "0:31:31", "throughput": 4250.97, "total_tokens": 16868432} {"current_steps": 25845, "total_steps": 38160, "loss": 0.4201, "lr": 0.00028513257881439047, "epoch": 13.54559748427673, "percentage": 67.73, "elapsed_time": "1:06:08", "remaining_time": "0:31:31", "throughput": 4250.99, "total_tokens": 16871408} {"current_steps": 25850, "total_steps": 38160, "loss": 0.4228, "lr": 0.00028492610837095003, "epoch": 13.548218029350105, "percentage": 67.74, "elapsed_time": "1:06:09", "remaining_time": "0:31:30", "throughput": 4251.09, "total_tokens": 16875184} {"current_steps": 25855, "total_steps": 38160, "loss": 0.3974, "lr": 0.00028471968291851407, "epoch": 13.55083857442348, "percentage": 67.75, "elapsed_time": "1:06:10", "remaining_time": "0:31:29", "throughput": 4251.09, "total_tokens": 16878064} {"current_steps": 25860, "total_steps": 38160, "loss": 0.5388, "lr": 0.0002845133025002645, "epoch": 13.553459119496855, "percentage": 67.77, "elapsed_time": "1:06:11", "remaining_time": "0:31:28", "throughput": 4251.1, "total_tokens": 16881104} {"current_steps": 25865, "total_steps": 38160, "loss": 0.5791, "lr": 0.0002843069671593734, "epoch": 13.55607966457023, "percentage": 67.78, "elapsed_time": "1:06:11", "remaining_time": "0:31:27", "throughput": 4251.13, "total_tokens": 16884272} {"current_steps": 25870, "total_steps": 38160, "loss": 0.4704, "lr": 0.000284100676939004, "epoch": 13.558700209643606, "percentage": 67.79, "elapsed_time": "1:06:12", "remaining_time": "0:31:27", "throughput": 4251.2, "total_tokens": 16887856} {"current_steps": 25875, "total_steps": 38160, "loss": 0.4171, "lr": 0.0002838944318823099, "epoch": 13.56132075471698, "percentage": 67.81, "elapsed_time": "1:06:13", "remaining_time": "0:31:26", "throughput": 4251.22, "total_tokens": 16890928} {"current_steps": 25880, "total_steps": 38160, "loss": 0.4286, "lr": 0.0002836882320324354, "epoch": 13.563941299790356, "percentage": 67.82, "elapsed_time": "1:06:13", "remaining_time": "0:31:25", "throughput": 4251.21, "total_tokens": 16893680} {"current_steps": 25885, "total_steps": 38160, "loss": 0.4829, "lr": 0.00028348207743251477, "epoch": 13.566561844863731, "percentage": 67.83, "elapsed_time": "1:06:14", "remaining_time": "0:31:24", "throughput": 4251.3, "total_tokens": 16897392} {"current_steps": 25890, "total_steps": 38160, "loss": 0.5186, "lr": 0.0002832759681256735, "epoch": 13.569182389937106, "percentage": 67.85, "elapsed_time": "1:06:15", "remaining_time": "0:31:24", "throughput": 4251.26, "total_tokens": 16900016} {"current_steps": 25895, "total_steps": 38160, "loss": 0.3666, "lr": 0.000283069904155027, "epoch": 13.571802935010481, "percentage": 67.86, "elapsed_time": "1:06:16", "remaining_time": "0:31:23", "throughput": 4251.43, "total_tokens": 16904400} {"current_steps": 25900, "total_steps": 38160, "loss": 0.544, "lr": 0.0002828638855636817, "epoch": 13.574423480083858, "percentage": 67.87, "elapsed_time": "1:06:16", "remaining_time": "0:31:22", "throughput": 4251.55, "total_tokens": 16908336} {"current_steps": 25905, "total_steps": 38160, "loss": 0.4132, "lr": 0.0002826579123947345, "epoch": 13.577044025157234, "percentage": 67.89, "elapsed_time": "1:06:17", "remaining_time": "0:31:21", "throughput": 4251.62, "total_tokens": 16911920} {"current_steps": 25910, "total_steps": 38160, "loss": 0.4442, "lr": 0.0002824519846912723, "epoch": 13.579664570230609, "percentage": 67.9, "elapsed_time": "1:06:18", "remaining_time": "0:31:20", "throughput": 4251.63, "total_tokens": 16914896} {"current_steps": 25915, "total_steps": 38160, "loss": 0.4446, "lr": 0.00028224610249637293, "epoch": 13.582285115303984, "percentage": 67.91, "elapsed_time": "1:06:19", "remaining_time": "0:31:20", "throughput": 4251.63, "total_tokens": 16917744} {"current_steps": 25920, "total_steps": 38160, "loss": 0.3888, "lr": 0.00028204026585310483, "epoch": 13.584905660377359, "percentage": 67.92, "elapsed_time": "1:06:19", "remaining_time": "0:31:19", "throughput": 4251.6, "total_tokens": 16920464} {"current_steps": 25925, "total_steps": 38160, "loss": 0.5066, "lr": 0.0002818344748045264, "epoch": 13.587526205450734, "percentage": 67.94, "elapsed_time": "1:06:20", "remaining_time": "0:31:18", "throughput": 4251.68, "total_tokens": 16923920} {"current_steps": 25930, "total_steps": 38160, "loss": 0.39, "lr": 0.0002816287293936868, "epoch": 13.59014675052411, "percentage": 67.95, "elapsed_time": "1:06:21", "remaining_time": "0:31:17", "throughput": 4251.8, "total_tokens": 16927856} {"current_steps": 25935, "total_steps": 38160, "loss": 0.6391, "lr": 0.0002814230296636259, "epoch": 13.592767295597485, "percentage": 67.96, "elapsed_time": "1:06:22", "remaining_time": "0:31:17", "throughput": 4251.79, "total_tokens": 16930672} {"current_steps": 25940, "total_steps": 38160, "loss": 0.4862, "lr": 0.0002812173756573734, "epoch": 13.59538784067086, "percentage": 67.98, "elapsed_time": "1:06:22", "remaining_time": "0:31:16", "throughput": 4251.8, "total_tokens": 16933584} {"current_steps": 25945, "total_steps": 38160, "loss": 0.4368, "lr": 0.00028101176741794984, "epoch": 13.598008385744235, "percentage": 67.99, "elapsed_time": "1:06:23", "remaining_time": "0:31:15", "throughput": 4251.74, "total_tokens": 16935952} {"current_steps": 25950, "total_steps": 38160, "loss": 0.3378, "lr": 0.0002808062049883664, "epoch": 13.60062893081761, "percentage": 68.0, "elapsed_time": "1:06:24", "remaining_time": "0:31:14", "throughput": 4251.76, "total_tokens": 16939024} {"current_steps": 25955, "total_steps": 38160, "loss": 0.4192, "lr": 0.00028060068841162403, "epoch": 13.603249475890985, "percentage": 68.02, "elapsed_time": "1:06:24", "remaining_time": "0:31:13", "throughput": 4251.83, "total_tokens": 16942576} {"current_steps": 25960, "total_steps": 38160, "loss": 0.4955, "lr": 0.00028039521773071477, "epoch": 13.60587002096436, "percentage": 68.03, "elapsed_time": "1:06:25", "remaining_time": "0:31:13", "throughput": 4251.86, "total_tokens": 16945808} {"current_steps": 25965, "total_steps": 38160, "loss": 0.4461, "lr": 0.0002801897929886204, "epoch": 13.608490566037736, "percentage": 68.04, "elapsed_time": "1:06:26", "remaining_time": "0:31:12", "throughput": 4251.87, "total_tokens": 16948752} {"current_steps": 25970, "total_steps": 38160, "loss": 0.4804, "lr": 0.0002799844142283135, "epoch": 13.61111111111111, "percentage": 68.06, "elapsed_time": "1:06:26", "remaining_time": "0:31:11", "throughput": 4251.88, "total_tokens": 16951856} {"current_steps": 25975, "total_steps": 38160, "loss": 0.3922, "lr": 0.00027977908149275733, "epoch": 13.613731656184486, "percentage": 68.07, "elapsed_time": "1:06:27", "remaining_time": "0:31:10", "throughput": 4251.92, "total_tokens": 16955088} {"current_steps": 25980, "total_steps": 38160, "loss": 0.3727, "lr": 0.00027957379482490476, "epoch": 13.616352201257861, "percentage": 68.08, "elapsed_time": "1:06:28", "remaining_time": "0:31:09", "throughput": 4251.98, "total_tokens": 16958576} {"current_steps": 25985, "total_steps": 38160, "loss": 0.4497, "lr": 0.0002793685542676997, "epoch": 13.618972746331236, "percentage": 68.09, "elapsed_time": "1:06:29", "remaining_time": "0:31:09", "throughput": 4252.02, "total_tokens": 16961904} {"current_steps": 25990, "total_steps": 38160, "loss": 0.5589, "lr": 0.0002791633598640758, "epoch": 13.621593291404611, "percentage": 68.11, "elapsed_time": "1:06:29", "remaining_time": "0:31:08", "throughput": 4252.05, "total_tokens": 16965008} {"current_steps": 25995, "total_steps": 38160, "loss": 0.5298, "lr": 0.0002789582116569576, "epoch": 13.624213836477988, "percentage": 68.12, "elapsed_time": "1:06:30", "remaining_time": "0:31:07", "throughput": 4252.12, "total_tokens": 16968592} {"current_steps": 26000, "total_steps": 38160, "loss": 0.3892, "lr": 0.0002787531096892597, "epoch": 13.626834381551364, "percentage": 68.13, "elapsed_time": "1:06:31", "remaining_time": "0:31:06", "throughput": 4252.1, "total_tokens": 16971280} {"current_steps": 26005, "total_steps": 38160, "loss": 0.4893, "lr": 0.0002785480540038874, "epoch": 13.629454926624739, "percentage": 68.15, "elapsed_time": "1:06:32", "remaining_time": "0:31:05", "throughput": 4252.28, "total_tokens": 16975696} {"current_steps": 26010, "total_steps": 38160, "loss": 0.476, "lr": 0.0002783430446437355, "epoch": 13.632075471698114, "percentage": 68.16, "elapsed_time": "1:06:32", "remaining_time": "0:31:05", "throughput": 4252.35, "total_tokens": 16979088} {"current_steps": 26015, "total_steps": 38160, "loss": 0.458, "lr": 0.00027813808165169006, "epoch": 13.634696016771489, "percentage": 68.17, "elapsed_time": "1:06:33", "remaining_time": "0:31:04", "throughput": 4252.3, "total_tokens": 16981552} {"current_steps": 26020, "total_steps": 38160, "loss": 0.2852, "lr": 0.00027793316507062667, "epoch": 13.637316561844864, "percentage": 68.19, "elapsed_time": "1:06:34", "remaining_time": "0:31:03", "throughput": 4252.27, "total_tokens": 16984208} {"current_steps": 26025, "total_steps": 38160, "loss": 0.468, "lr": 0.00027772829494341163, "epoch": 13.63993710691824, "percentage": 68.2, "elapsed_time": "1:06:34", "remaining_time": "0:31:02", "throughput": 4252.35, "total_tokens": 16987824} {"current_steps": 26030, "total_steps": 38160, "loss": 0.4537, "lr": 0.00027752347131290147, "epoch": 13.642557651991615, "percentage": 68.21, "elapsed_time": "1:06:35", "remaining_time": "0:31:02", "throughput": 4252.45, "total_tokens": 16991568} {"current_steps": 26035, "total_steps": 38160, "loss": 0.3679, "lr": 0.0002773186942219431, "epoch": 13.64517819706499, "percentage": 68.23, "elapsed_time": "1:06:36", "remaining_time": "0:31:01", "throughput": 4252.43, "total_tokens": 16994256} {"current_steps": 26040, "total_steps": 38160, "loss": 0.4545, "lr": 0.0002771139637133735, "epoch": 13.647798742138365, "percentage": 68.24, "elapsed_time": "1:06:37", "remaining_time": "0:31:00", "throughput": 4252.41, "total_tokens": 16996976} {"current_steps": 26045, "total_steps": 38160, "loss": 0.4453, "lr": 0.00027690927983001966, "epoch": 13.65041928721174, "percentage": 68.25, "elapsed_time": "1:06:37", "remaining_time": "0:30:59", "throughput": 4252.41, "total_tokens": 16999824} {"current_steps": 26050, "total_steps": 38160, "loss": 0.4558, "lr": 0.00027670464261469937, "epoch": 13.653039832285115, "percentage": 68.27, "elapsed_time": "1:06:38", "remaining_time": "0:30:58", "throughput": 4252.57, "total_tokens": 17004112} {"current_steps": 26055, "total_steps": 38160, "loss": 0.4527, "lr": 0.0002765000521102203, "epoch": 13.65566037735849, "percentage": 68.28, "elapsed_time": "1:06:39", "remaining_time": "0:30:57", "throughput": 4252.53, "total_tokens": 17006672} {"current_steps": 26060, "total_steps": 38160, "loss": 0.4398, "lr": 0.0002762955083593807, "epoch": 13.658280922431866, "percentage": 68.29, "elapsed_time": "1:06:39", "remaining_time": "0:30:57", "throughput": 4252.54, "total_tokens": 17009712} {"current_steps": 26065, "total_steps": 38160, "loss": 0.4832, "lr": 0.0002760910114049686, "epoch": 13.66090146750524, "percentage": 68.3, "elapsed_time": "1:06:40", "remaining_time": "0:30:56", "throughput": 4252.67, "total_tokens": 17013680} {"current_steps": 26070, "total_steps": 38160, "loss": 0.531, "lr": 0.0002758865612897623, "epoch": 13.663522012578616, "percentage": 68.32, "elapsed_time": "1:06:41", "remaining_time": "0:30:55", "throughput": 4252.71, "total_tokens": 17016880} {"current_steps": 26075, "total_steps": 38160, "loss": 0.5601, "lr": 0.00027568215805653045, "epoch": 13.666142557651991, "percentage": 68.33, "elapsed_time": "1:06:42", "remaining_time": "0:30:54", "throughput": 4252.65, "total_tokens": 17019312} {"current_steps": 26080, "total_steps": 38160, "loss": 0.5105, "lr": 0.00027547780174803205, "epoch": 13.668763102725366, "percentage": 68.34, "elapsed_time": "1:06:42", "remaining_time": "0:30:54", "throughput": 4252.65, "total_tokens": 17022032} {"current_steps": 26085, "total_steps": 38160, "loss": 0.4301, "lr": 0.0002752734924070161, "epoch": 13.671383647798741, "percentage": 68.36, "elapsed_time": "1:06:43", "remaining_time": "0:30:53", "throughput": 4252.81, "total_tokens": 17026384} {"current_steps": 26090, "total_steps": 38160, "loss": 0.5461, "lr": 0.00027506923007622177, "epoch": 13.674004192872118, "percentage": 68.37, "elapsed_time": "1:06:44", "remaining_time": "0:30:52", "throughput": 4252.72, "total_tokens": 17028688} {"current_steps": 26095, "total_steps": 38160, "loss": 0.3949, "lr": 0.00027486501479837846, "epoch": 13.676624737945493, "percentage": 68.38, "elapsed_time": "1:06:44", "remaining_time": "0:30:51", "throughput": 4252.75, "total_tokens": 17031792} {"current_steps": 26100, "total_steps": 38160, "loss": 0.5074, "lr": 0.0002746608466162053, "epoch": 13.679245283018869, "percentage": 68.4, "elapsed_time": "1:06:45", "remaining_time": "0:30:50", "throughput": 4252.79, "total_tokens": 17035088} {"current_steps": 26105, "total_steps": 38160, "loss": 0.3223, "lr": 0.0002744567255724123, "epoch": 13.681865828092244, "percentage": 68.41, "elapsed_time": "1:06:46", "remaining_time": "0:30:50", "throughput": 4252.81, "total_tokens": 17038128} {"current_steps": 26110, "total_steps": 38160, "loss": 0.4912, "lr": 0.0002742526517096992, "epoch": 13.684486373165619, "percentage": 68.42, "elapsed_time": "1:06:47", "remaining_time": "0:30:49", "throughput": 4252.89, "total_tokens": 17041744} {"current_steps": 26115, "total_steps": 38160, "loss": 0.4433, "lr": 0.000274048625070756, "epoch": 13.687106918238994, "percentage": 68.44, "elapsed_time": "1:06:47", "remaining_time": "0:30:48", "throughput": 4252.92, "total_tokens": 17044880} {"current_steps": 26120, "total_steps": 38160, "loss": 0.5657, "lr": 0.0002738446456982627, "epoch": 13.68972746331237, "percentage": 68.45, "elapsed_time": "1:06:48", "remaining_time": "0:30:47", "throughput": 4253.06, "total_tokens": 17049040} {"current_steps": 26125, "total_steps": 38160, "loss": 0.5425, "lr": 0.0002736407136348892, "epoch": 13.692348008385745, "percentage": 68.46, "elapsed_time": "1:06:49", "remaining_time": "0:30:47", "throughput": 4253.11, "total_tokens": 17052368} {"current_steps": 26130, "total_steps": 38160, "loss": 0.3682, "lr": 0.0002734368289232959, "epoch": 13.69496855345912, "percentage": 68.47, "elapsed_time": "1:06:50", "remaining_time": "0:30:46", "throughput": 4253.22, "total_tokens": 17056272} {"current_steps": 26135, "total_steps": 38160, "loss": 0.3802, "lr": 0.00027323299160613335, "epoch": 13.697589098532495, "percentage": 68.49, "elapsed_time": "1:06:50", "remaining_time": "0:30:45", "throughput": 4253.25, "total_tokens": 17059440} {"current_steps": 26140, "total_steps": 38160, "loss": 0.4128, "lr": 0.00027302920172604173, "epoch": 13.70020964360587, "percentage": 68.5, "elapsed_time": "1:06:51", "remaining_time": "0:30:44", "throughput": 4253.3, "total_tokens": 17062832} {"current_steps": 26145, "total_steps": 38160, "loss": 0.4744, "lr": 0.00027282545932565214, "epoch": 13.702830188679245, "percentage": 68.51, "elapsed_time": "1:06:52", "remaining_time": "0:30:43", "throughput": 4253.28, "total_tokens": 17065520} {"current_steps": 26150, "total_steps": 38160, "loss": 0.3971, "lr": 0.00027262176444758435, "epoch": 13.70545073375262, "percentage": 68.53, "elapsed_time": "1:06:53", "remaining_time": "0:30:43", "throughput": 4253.33, "total_tokens": 17068848} {"current_steps": 26155, "total_steps": 38160, "loss": 0.3293, "lr": 0.00027241811713444935, "epoch": 13.708071278825996, "percentage": 68.54, "elapsed_time": "1:06:53", "remaining_time": "0:30:42", "throughput": 4253.35, "total_tokens": 17071984} {"current_steps": 26160, "total_steps": 38160, "loss": 0.4758, "lr": 0.0002722145174288478, "epoch": 13.71069182389937, "percentage": 68.55, "elapsed_time": "1:06:54", "remaining_time": "0:30:41", "throughput": 4253.39, "total_tokens": 17075248} {"current_steps": 26165, "total_steps": 38160, "loss": 0.5049, "lr": 0.0002720109653733706, "epoch": 13.713312368972746, "percentage": 68.57, "elapsed_time": "1:06:55", "remaining_time": "0:30:40", "throughput": 4253.5, "total_tokens": 17079120} {"current_steps": 26170, "total_steps": 38160, "loss": 0.466, "lr": 0.00027180746101059856, "epoch": 13.715932914046121, "percentage": 68.58, "elapsed_time": "1:06:56", "remaining_time": "0:30:40", "throughput": 4253.7, "total_tokens": 17083856} {"current_steps": 26175, "total_steps": 38160, "loss": 0.4966, "lr": 0.0002716040043831023, "epoch": 13.718553459119496, "percentage": 68.59, "elapsed_time": "1:06:56", "remaining_time": "0:30:39", "throughput": 4253.74, "total_tokens": 17087056} {"current_steps": 26180, "total_steps": 38160, "loss": 0.4799, "lr": 0.0002714005955334424, "epoch": 13.721174004192871, "percentage": 68.61, "elapsed_time": "1:06:57", "remaining_time": "0:30:38", "throughput": 4253.83, "total_tokens": 17090800} {"current_steps": 26185, "total_steps": 38160, "loss": 0.3818, "lr": 0.00027119723450417, "epoch": 13.723794549266248, "percentage": 68.62, "elapsed_time": "1:06:58", "remaining_time": "0:30:37", "throughput": 4253.77, "total_tokens": 17093168} {"current_steps": 26190, "total_steps": 38160, "loss": 0.3703, "lr": 0.0002709939213378258, "epoch": 13.726415094339622, "percentage": 68.63, "elapsed_time": "1:06:59", "remaining_time": "0:30:36", "throughput": 4253.8, "total_tokens": 17096304} {"current_steps": 26195, "total_steps": 38160, "loss": 0.3505, "lr": 0.0002707906560769408, "epoch": 13.729035639412999, "percentage": 68.65, "elapsed_time": "1:06:59", "remaining_time": "0:30:36", "throughput": 4253.84, "total_tokens": 17099568} {"current_steps": 26200, "total_steps": 38160, "loss": 0.3803, "lr": 0.0002705874387640354, "epoch": 13.731656184486374, "percentage": 68.66, "elapsed_time": "1:07:00", "remaining_time": "0:30:35", "throughput": 4253.97, "total_tokens": 17103696} {"current_steps": 26205, "total_steps": 38160, "loss": 0.4141, "lr": 0.00027038426944162074, "epoch": 13.734276729559749, "percentage": 68.67, "elapsed_time": "1:07:01", "remaining_time": "0:30:34", "throughput": 4253.94, "total_tokens": 17106384} {"current_steps": 26210, "total_steps": 38160, "loss": 0.4473, "lr": 0.0002701811481521971, "epoch": 13.736897274633124, "percentage": 68.68, "elapsed_time": "1:07:01", "remaining_time": "0:30:33", "throughput": 4253.89, "total_tokens": 17109040} {"current_steps": 26215, "total_steps": 38160, "loss": 0.3732, "lr": 0.0002699780749382554, "epoch": 13.7395178197065, "percentage": 68.7, "elapsed_time": "1:07:02", "remaining_time": "0:30:32", "throughput": 4253.95, "total_tokens": 17112496} {"current_steps": 26220, "total_steps": 38160, "loss": 0.4831, "lr": 0.0002697750498422761, "epoch": 13.742138364779874, "percentage": 68.71, "elapsed_time": "1:07:03", "remaining_time": "0:30:32", "throughput": 4253.95, "total_tokens": 17115472} {"current_steps": 26225, "total_steps": 38160, "loss": 0.4105, "lr": 0.0002695720729067301, "epoch": 13.74475890985325, "percentage": 68.72, "elapsed_time": "1:07:04", "remaining_time": "0:30:31", "throughput": 4253.92, "total_tokens": 17118224} {"current_steps": 26230, "total_steps": 38160, "loss": 0.5263, "lr": 0.00026936914417407756, "epoch": 13.747379454926625, "percentage": 68.74, "elapsed_time": "1:07:04", "remaining_time": "0:30:30", "throughput": 4254.05, "total_tokens": 17122384} {"current_steps": 26235, "total_steps": 38160, "loss": 0.3596, "lr": 0.0002691662636867687, "epoch": 13.75, "percentage": 68.75, "elapsed_time": "1:07:05", "remaining_time": "0:30:29", "throughput": 4254.13, "total_tokens": 17125936} {"current_steps": 26240, "total_steps": 38160, "loss": 0.5523, "lr": 0.000268963431487244, "epoch": 13.752620545073375, "percentage": 68.76, "elapsed_time": "1:07:06", "remaining_time": "0:30:29", "throughput": 4254.15, "total_tokens": 17128976} {"current_steps": 26245, "total_steps": 38160, "loss": 0.443, "lr": 0.0002687606476179336, "epoch": 13.75524109014675, "percentage": 68.78, "elapsed_time": "1:07:07", "remaining_time": "0:30:28", "throughput": 4254.26, "total_tokens": 17132912} {"current_steps": 26250, "total_steps": 38160, "loss": 0.5324, "lr": 0.0002685579121212578, "epoch": 13.757861635220126, "percentage": 68.79, "elapsed_time": "1:07:07", "remaining_time": "0:30:27", "throughput": 4254.28, "total_tokens": 17136016} {"current_steps": 26255, "total_steps": 38160, "loss": 0.4102, "lr": 0.00026835522503962616, "epoch": 13.7604821802935, "percentage": 68.8, "elapsed_time": "1:07:08", "remaining_time": "0:30:26", "throughput": 4254.31, "total_tokens": 17139184} {"current_steps": 26260, "total_steps": 38160, "loss": 0.4259, "lr": 0.00026815258641543896, "epoch": 13.763102725366876, "percentage": 68.82, "elapsed_time": "1:07:09", "remaining_time": "0:30:25", "throughput": 4254.33, "total_tokens": 17142352} {"current_steps": 26265, "total_steps": 38160, "loss": 0.4399, "lr": 0.0002679499962910853, "epoch": 13.765723270440251, "percentage": 68.83, "elapsed_time": "1:07:10", "remaining_time": "0:30:25", "throughput": 4254.39, "total_tokens": 17145808} {"current_steps": 26270, "total_steps": 38160, "loss": 0.324, "lr": 0.0002677474547089451, "epoch": 13.768343815513626, "percentage": 68.84, "elapsed_time": "1:07:10", "remaining_time": "0:30:24", "throughput": 4254.38, "total_tokens": 17148720} {"current_steps": 26275, "total_steps": 38160, "loss": 0.5694, "lr": 0.000267544961711388, "epoch": 13.770964360587001, "percentage": 68.85, "elapsed_time": "1:07:11", "remaining_time": "0:30:23", "throughput": 4254.4, "total_tokens": 17151792} {"current_steps": 26280, "total_steps": 38160, "loss": 0.516, "lr": 0.0002673425173407726, "epoch": 13.773584905660378, "percentage": 68.87, "elapsed_time": "1:07:12", "remaining_time": "0:30:22", "throughput": 4254.41, "total_tokens": 17154896} {"current_steps": 26285, "total_steps": 38160, "loss": 0.4093, "lr": 0.00026714012163944826, "epoch": 13.776205450733752, "percentage": 68.88, "elapsed_time": "1:07:13", "remaining_time": "0:30:22", "throughput": 4254.48, "total_tokens": 17158352} {"current_steps": 26290, "total_steps": 38160, "loss": 0.4066, "lr": 0.0002669377746497541, "epoch": 13.778825995807129, "percentage": 68.89, "elapsed_time": "1:07:13", "remaining_time": "0:30:21", "throughput": 4254.53, "total_tokens": 17161648} {"current_steps": 26295, "total_steps": 38160, "loss": 0.3856, "lr": 0.0002667354764140184, "epoch": 13.781446540880504, "percentage": 68.91, "elapsed_time": "1:07:14", "remaining_time": "0:30:20", "throughput": 4254.55, "total_tokens": 17164784} {"current_steps": 26300, "total_steps": 38160, "loss": 0.3866, "lr": 0.00026653322697455987, "epoch": 13.784067085953879, "percentage": 68.92, "elapsed_time": "1:07:15", "remaining_time": "0:30:19", "throughput": 4254.52, "total_tokens": 17167408} {"current_steps": 26305, "total_steps": 38160, "loss": 0.3582, "lr": 0.00026633102637368684, "epoch": 13.786687631027254, "percentage": 68.93, "elapsed_time": "1:07:15", "remaining_time": "0:30:18", "throughput": 4254.57, "total_tokens": 17170704} {"current_steps": 26310, "total_steps": 38160, "loss": 0.3416, "lr": 0.00026612887465369704, "epoch": 13.78930817610063, "percentage": 68.95, "elapsed_time": "1:07:16", "remaining_time": "0:30:18", "throughput": 4254.54, "total_tokens": 17173328} {"current_steps": 26315, "total_steps": 38160, "loss": 0.4875, "lr": 0.0002659267718568786, "epoch": 13.791928721174004, "percentage": 68.96, "elapsed_time": "1:07:17", "remaining_time": "0:30:17", "throughput": 4254.59, "total_tokens": 17176752} {"current_steps": 26320, "total_steps": 38160, "loss": 0.4549, "lr": 0.0002657247180255091, "epoch": 13.79454926624738, "percentage": 68.97, "elapsed_time": "1:07:17", "remaining_time": "0:30:16", "throughput": 4254.62, "total_tokens": 17179824} {"current_steps": 26325, "total_steps": 38160, "loss": 0.3731, "lr": 0.0002655227132018558, "epoch": 13.797169811320755, "percentage": 68.99, "elapsed_time": "1:07:18", "remaining_time": "0:30:15", "throughput": 4254.9, "total_tokens": 17185200} {"current_steps": 26330, "total_steps": 38160, "loss": 0.4021, "lr": 0.00026532075742817594, "epoch": 13.79979035639413, "percentage": 69.0, "elapsed_time": "1:07:19", "remaining_time": "0:30:15", "throughput": 4255.04, "total_tokens": 17189360} {"current_steps": 26335, "total_steps": 38160, "loss": 0.4144, "lr": 0.0002651188507467161, "epoch": 13.802410901467505, "percentage": 69.01, "elapsed_time": "1:07:20", "remaining_time": "0:30:14", "throughput": 4255.04, "total_tokens": 17192208} {"current_steps": 26340, "total_steps": 38160, "loss": 0.5534, "lr": 0.00026491699319971303, "epoch": 13.80503144654088, "percentage": 69.03, "elapsed_time": "1:07:21", "remaining_time": "0:30:13", "throughput": 4255.19, "total_tokens": 17196336} {"current_steps": 26345, "total_steps": 38160, "loss": 0.4093, "lr": 0.00026471518482939317, "epoch": 13.807651991614255, "percentage": 69.04, "elapsed_time": "1:07:21", "remaining_time": "0:30:12", "throughput": 4255.21, "total_tokens": 17199536} {"current_steps": 26350, "total_steps": 38160, "loss": 0.4169, "lr": 0.0002645134256779722, "epoch": 13.81027253668763, "percentage": 69.05, "elapsed_time": "1:07:22", "remaining_time": "0:30:11", "throughput": 4255.16, "total_tokens": 17202064} {"current_steps": 26355, "total_steps": 38160, "loss": 0.4786, "lr": 0.00026431171578765624, "epoch": 13.812893081761006, "percentage": 69.06, "elapsed_time": "1:07:23", "remaining_time": "0:30:11", "throughput": 4255.18, "total_tokens": 17205072} {"current_steps": 26360, "total_steps": 38160, "loss": 0.4481, "lr": 0.0002641100552006402, "epoch": 13.815513626834381, "percentage": 69.08, "elapsed_time": "1:07:24", "remaining_time": "0:30:10", "throughput": 4255.29, "total_tokens": 17208976} {"current_steps": 26365, "total_steps": 38160, "loss": 0.4244, "lr": 0.0002639084439591095, "epoch": 13.818134171907756, "percentage": 69.09, "elapsed_time": "1:07:24", "remaining_time": "0:30:09", "throughput": 4255.35, "total_tokens": 17212272} {"current_steps": 26370, "total_steps": 38160, "loss": 0.5671, "lr": 0.00026370688210523873, "epoch": 13.820754716981131, "percentage": 69.1, "elapsed_time": "1:07:25", "remaining_time": "0:30:08", "throughput": 4255.39, "total_tokens": 17215632} {"current_steps": 26375, "total_steps": 38160, "loss": 0.4832, "lr": 0.00026350536968119275, "epoch": 13.823375262054507, "percentage": 69.12, "elapsed_time": "1:07:26", "remaining_time": "0:30:08", "throughput": 4255.44, "total_tokens": 17218992} {"current_steps": 26380, "total_steps": 38160, "loss": 0.5282, "lr": 0.0002633039067291252, "epoch": 13.825995807127882, "percentage": 69.13, "elapsed_time": "1:07:27", "remaining_time": "0:30:07", "throughput": 4255.51, "total_tokens": 17222480} {"current_steps": 26385, "total_steps": 38160, "loss": 0.4221, "lr": 0.00026310249329118007, "epoch": 13.828616352201259, "percentage": 69.14, "elapsed_time": "1:07:27", "remaining_time": "0:30:06", "throughput": 4255.51, "total_tokens": 17225424} {"current_steps": 26390, "total_steps": 38160, "loss": 0.5111, "lr": 0.0002629011294094905, "epoch": 13.831236897274634, "percentage": 69.16, "elapsed_time": "1:07:28", "remaining_time": "0:30:05", "throughput": 4255.58, "total_tokens": 17228784} {"current_steps": 26395, "total_steps": 38160, "loss": 0.4351, "lr": 0.0002626998151261798, "epoch": 13.833857442348009, "percentage": 69.17, "elapsed_time": "1:07:29", "remaining_time": "0:30:04", "throughput": 4255.63, "total_tokens": 17232144} {"current_steps": 26400, "total_steps": 38160, "loss": 0.3624, "lr": 0.0002624985504833604, "epoch": 13.836477987421384, "percentage": 69.18, "elapsed_time": "1:07:30", "remaining_time": "0:30:04", "throughput": 4255.8, "total_tokens": 17236560} {"current_steps": 26405, "total_steps": 38160, "loss": 0.4361, "lr": 0.0002622973355231349, "epoch": 13.83909853249476, "percentage": 69.2, "elapsed_time": "1:07:30", "remaining_time": "0:30:03", "throughput": 4255.96, "total_tokens": 17240784} {"current_steps": 26410, "total_steps": 38160, "loss": 0.5118, "lr": 0.00026209617028759497, "epoch": 13.841719077568134, "percentage": 69.21, "elapsed_time": "1:07:31", "remaining_time": "0:30:02", "throughput": 4255.99, "total_tokens": 17243856} {"current_steps": 26415, "total_steps": 38160, "loss": 0.5478, "lr": 0.00026189505481882184, "epoch": 13.84433962264151, "percentage": 69.22, "elapsed_time": "1:07:32", "remaining_time": "0:30:01", "throughput": 4256.06, "total_tokens": 17247536} {"current_steps": 26420, "total_steps": 38160, "loss": 0.4479, "lr": 0.00026169398915888687, "epoch": 13.846960167714885, "percentage": 69.23, "elapsed_time": "1:07:33", "remaining_time": "0:30:01", "throughput": 4256.11, "total_tokens": 17250832} {"current_steps": 26425, "total_steps": 38160, "loss": 0.3302, "lr": 0.0002614929733498506, "epoch": 13.84958071278826, "percentage": 69.25, "elapsed_time": "1:07:33", "remaining_time": "0:30:00", "throughput": 4256.18, "total_tokens": 17254256} {"current_steps": 26430, "total_steps": 38160, "loss": 0.3105, "lr": 0.0002612920074337634, "epoch": 13.852201257861635, "percentage": 69.26, "elapsed_time": "1:07:34", "remaining_time": "0:29:59", "throughput": 4256.15, "total_tokens": 17256976} {"current_steps": 26435, "total_steps": 38160, "loss": 0.4523, "lr": 0.00026109109145266496, "epoch": 13.85482180293501, "percentage": 69.27, "elapsed_time": "1:07:35", "remaining_time": "0:29:58", "throughput": 4256.12, "total_tokens": 17259664} {"current_steps": 26440, "total_steps": 38160, "loss": 0.5195, "lr": 0.00026089022544858445, "epoch": 13.857442348008385, "percentage": 69.29, "elapsed_time": "1:07:35", "remaining_time": "0:29:57", "throughput": 4256.14, "total_tokens": 17262736} {"current_steps": 26445, "total_steps": 38160, "loss": 0.492, "lr": 0.00026068940946354075, "epoch": 13.86006289308176, "percentage": 69.3, "elapsed_time": "1:07:36", "remaining_time": "0:29:57", "throughput": 4256.07, "total_tokens": 17265040} {"current_steps": 26450, "total_steps": 38160, "loss": 0.3667, "lr": 0.0002604886435395425, "epoch": 13.862683438155136, "percentage": 69.31, "elapsed_time": "1:07:37", "remaining_time": "0:29:56", "throughput": 4256.15, "total_tokens": 17268656} {"current_steps": 26455, "total_steps": 38160, "loss": 0.3571, "lr": 0.00026028792771858744, "epoch": 13.865303983228511, "percentage": 69.33, "elapsed_time": "1:07:38", "remaining_time": "0:29:55", "throughput": 4256.23, "total_tokens": 17272272} {"current_steps": 26460, "total_steps": 38160, "loss": 0.4686, "lr": 0.00026008726204266333, "epoch": 13.867924528301886, "percentage": 69.34, "elapsed_time": "1:07:38", "remaining_time": "0:29:54", "throughput": 4256.25, "total_tokens": 17275408} {"current_steps": 26465, "total_steps": 38160, "loss": 0.3434, "lr": 0.00025988664655374693, "epoch": 13.870545073375261, "percentage": 69.35, "elapsed_time": "1:07:39", "remaining_time": "0:29:53", "throughput": 4256.24, "total_tokens": 17278224} {"current_steps": 26470, "total_steps": 38160, "loss": 0.4071, "lr": 0.00025968608129380455, "epoch": 13.873165618448636, "percentage": 69.37, "elapsed_time": "1:07:40", "remaining_time": "0:29:53", "throughput": 4256.31, "total_tokens": 17281808} {"current_steps": 26475, "total_steps": 38160, "loss": 0.4825, "lr": 0.00025948556630479234, "epoch": 13.875786163522012, "percentage": 69.38, "elapsed_time": "1:07:41", "remaining_time": "0:29:52", "throughput": 4256.34, "total_tokens": 17285072} {"current_steps": 26480, "total_steps": 38160, "loss": 0.4175, "lr": 0.0002592851016286557, "epoch": 13.878406708595389, "percentage": 69.39, "elapsed_time": "1:07:41", "remaining_time": "0:29:51", "throughput": 4256.34, "total_tokens": 17287952} {"current_steps": 26485, "total_steps": 38160, "loss": 0.4012, "lr": 0.0002590846873073298, "epoch": 13.881027253668764, "percentage": 69.41, "elapsed_time": "1:07:42", "remaining_time": "0:29:50", "throughput": 4256.33, "total_tokens": 17290768} {"current_steps": 26490, "total_steps": 38160, "loss": 0.4462, "lr": 0.0002588843233827387, "epoch": 13.883647798742139, "percentage": 69.42, "elapsed_time": "1:07:43", "remaining_time": "0:29:49", "throughput": 4256.38, "total_tokens": 17294000} {"current_steps": 26495, "total_steps": 38160, "loss": 0.3816, "lr": 0.0002586840098967963, "epoch": 13.886268343815514, "percentage": 69.43, "elapsed_time": "1:07:43", "remaining_time": "0:29:49", "throughput": 4256.45, "total_tokens": 17297520} {"current_steps": 26500, "total_steps": 38160, "loss": 0.359, "lr": 0.00025848374689140587, "epoch": 13.88888888888889, "percentage": 69.44, "elapsed_time": "1:07:44", "remaining_time": "0:29:48", "throughput": 4256.5, "total_tokens": 17300816} {"current_steps": 26505, "total_steps": 38160, "loss": 0.5321, "lr": 0.0002582835344084602, "epoch": 13.891509433962264, "percentage": 69.46, "elapsed_time": "1:07:45", "remaining_time": "0:29:47", "throughput": 4256.67, "total_tokens": 17305232} {"current_steps": 26510, "total_steps": 38160, "loss": 0.344, "lr": 0.00025808337248984175, "epoch": 13.89412997903564, "percentage": 69.47, "elapsed_time": "1:07:46", "remaining_time": "0:29:46", "throughput": 4256.72, "total_tokens": 17308592} {"current_steps": 26515, "total_steps": 38160, "loss": 0.462, "lr": 0.00025788326117742185, "epoch": 13.896750524109015, "percentage": 69.48, "elapsed_time": "1:07:46", "remaining_time": "0:29:46", "throughput": 4256.8, "total_tokens": 17312144} {"current_steps": 26520, "total_steps": 38160, "loss": 0.4276, "lr": 0.00025768320051306127, "epoch": 13.89937106918239, "percentage": 69.5, "elapsed_time": "1:07:47", "remaining_time": "0:29:45", "throughput": 4256.78, "total_tokens": 17314960} {"current_steps": 26525, "total_steps": 38160, "loss": 0.4831, "lr": 0.00025748319053861063, "epoch": 13.901991614255765, "percentage": 69.51, "elapsed_time": "1:07:48", "remaining_time": "0:29:44", "throughput": 4256.86, "total_tokens": 17318512} {"current_steps": 26530, "total_steps": 38160, "loss": 0.4286, "lr": 0.0002572832312959098, "epoch": 13.90461215932914, "percentage": 69.52, "elapsed_time": "1:07:49", "remaining_time": "0:29:43", "throughput": 4256.8, "total_tokens": 17320912} {"current_steps": 26535, "total_steps": 38160, "loss": 0.3355, "lr": 0.0002570833228267879, "epoch": 13.907232704402515, "percentage": 69.54, "elapsed_time": "1:07:49", "remaining_time": "0:29:42", "throughput": 4256.81, "total_tokens": 17323920} {"current_steps": 26540, "total_steps": 38160, "loss": 0.3765, "lr": 0.00025688346517306366, "epoch": 13.90985324947589, "percentage": 69.55, "elapsed_time": "1:07:50", "remaining_time": "0:29:42", "throughput": 4256.86, "total_tokens": 17327344} {"current_steps": 26545, "total_steps": 38160, "loss": 0.4709, "lr": 0.00025668365837654497, "epoch": 13.912473794549266, "percentage": 69.56, "elapsed_time": "1:07:51", "remaining_time": "0:29:41", "throughput": 4256.84, "total_tokens": 17330096} {"current_steps": 26550, "total_steps": 38160, "loss": 0.5458, "lr": 0.0002564839024790288, "epoch": 13.915094339622641, "percentage": 69.58, "elapsed_time": "1:07:51", "remaining_time": "0:29:40", "throughput": 4256.81, "total_tokens": 17332816} {"current_steps": 26555, "total_steps": 38160, "loss": 0.4799, "lr": 0.000256284197522302, "epoch": 13.917714884696016, "percentage": 69.59, "elapsed_time": "1:07:52", "remaining_time": "0:29:39", "throughput": 4256.9, "total_tokens": 17336432} {"current_steps": 26560, "total_steps": 38160, "loss": 0.5024, "lr": 0.00025608454354814075, "epoch": 13.920335429769391, "percentage": 69.6, "elapsed_time": "1:07:53", "remaining_time": "0:29:39", "throughput": 4257.03, "total_tokens": 17340432} {"current_steps": 26565, "total_steps": 38160, "loss": 0.3809, "lr": 0.0002558849405983104, "epoch": 13.922955974842766, "percentage": 69.61, "elapsed_time": "1:07:54", "remaining_time": "0:29:38", "throughput": 4257.23, "total_tokens": 17345232} {"current_steps": 26570, "total_steps": 38160, "loss": 0.3945, "lr": 0.00025568538871456527, "epoch": 13.925576519916142, "percentage": 69.63, "elapsed_time": "1:07:55", "remaining_time": "0:29:37", "throughput": 4257.38, "total_tokens": 17349520} {"current_steps": 26575, "total_steps": 38160, "loss": 0.3912, "lr": 0.00025548588793864976, "epoch": 13.928197064989519, "percentage": 69.64, "elapsed_time": "1:07:55", "remaining_time": "0:29:36", "throughput": 4257.44, "total_tokens": 17353040} {"current_steps": 26580, "total_steps": 38160, "loss": 0.6175, "lr": 0.0002552864383122967, "epoch": 13.930817610062894, "percentage": 69.65, "elapsed_time": "1:07:56", "remaining_time": "0:29:36", "throughput": 4257.44, "total_tokens": 17356048} {"current_steps": 26585, "total_steps": 38160, "loss": 0.4119, "lr": 0.0002550870398772289, "epoch": 13.933438155136269, "percentage": 69.67, "elapsed_time": "1:07:57", "remaining_time": "0:29:35", "throughput": 4257.49, "total_tokens": 17359344} {"current_steps": 26590, "total_steps": 38160, "loss": 0.5819, "lr": 0.0002548876926751584, "epoch": 13.936058700209644, "percentage": 69.68, "elapsed_time": "1:07:58", "remaining_time": "0:29:34", "throughput": 4257.63, "total_tokens": 17363408} {"current_steps": 26595, "total_steps": 38160, "loss": 0.3801, "lr": 0.0002546883967477861, "epoch": 13.93867924528302, "percentage": 69.69, "elapsed_time": "1:07:58", "remaining_time": "0:29:33", "throughput": 4257.68, "total_tokens": 17366672} {"current_steps": 26600, "total_steps": 38160, "loss": 0.308, "lr": 0.00025448915213680245, "epoch": 13.941299790356394, "percentage": 69.71, "elapsed_time": "1:07:59", "remaining_time": "0:29:32", "throughput": 4257.55, "total_tokens": 17368592} {"current_steps": 26605, "total_steps": 38160, "loss": 0.4188, "lr": 0.0002542899588838875, "epoch": 13.94392033542977, "percentage": 69.72, "elapsed_time": "1:08:00", "remaining_time": "0:29:32", "throughput": 4257.51, "total_tokens": 17371152} {"current_steps": 26610, "total_steps": 38160, "loss": 0.4327, "lr": 0.0002540908170307097, "epoch": 13.946540880503145, "percentage": 69.73, "elapsed_time": "1:08:00", "remaining_time": "0:29:31", "throughput": 4257.5, "total_tokens": 17373872} {"current_steps": 26615, "total_steps": 38160, "loss": 0.392, "lr": 0.00025389172661892753, "epoch": 13.94916142557652, "percentage": 69.75, "elapsed_time": "1:08:01", "remaining_time": "0:29:30", "throughput": 4257.53, "total_tokens": 17377200} {"current_steps": 26620, "total_steps": 38160, "loss": 0.4872, "lr": 0.00025369268769018856, "epoch": 13.951781970649895, "percentage": 69.76, "elapsed_time": "1:08:02", "remaining_time": "0:29:29", "throughput": 4257.57, "total_tokens": 17380400} {"current_steps": 26625, "total_steps": 38160, "loss": 0.4194, "lr": 0.00025349370028612914, "epoch": 13.95440251572327, "percentage": 69.77, "elapsed_time": "1:08:02", "remaining_time": "0:29:28", "throughput": 4257.63, "total_tokens": 17383792} {"current_steps": 26630, "total_steps": 38160, "loss": 0.4433, "lr": 0.0002532947644483755, "epoch": 13.957023060796645, "percentage": 69.79, "elapsed_time": "1:08:03", "remaining_time": "0:29:28", "throughput": 4257.59, "total_tokens": 17386352} {"current_steps": 26635, "total_steps": 38160, "loss": 0.5065, "lr": 0.00025309588021854237, "epoch": 13.95964360587002, "percentage": 69.8, "elapsed_time": "1:08:04", "remaining_time": "0:29:27", "throughput": 4257.55, "total_tokens": 17388976} {"current_steps": 26640, "total_steps": 38160, "loss": 0.5132, "lr": 0.0002528970476382343, "epoch": 13.962264150943396, "percentage": 69.81, "elapsed_time": "1:08:05", "remaining_time": "0:29:26", "throughput": 4257.69, "total_tokens": 17393104} {"current_steps": 26645, "total_steps": 38160, "loss": 0.382, "lr": 0.00025269826674904493, "epoch": 13.964884696016771, "percentage": 69.82, "elapsed_time": "1:08:05", "remaining_time": "0:29:25", "throughput": 4257.65, "total_tokens": 17395728} {"current_steps": 26650, "total_steps": 38160, "loss": 0.4187, "lr": 0.0002524995375925566, "epoch": 13.967505241090146, "percentage": 69.84, "elapsed_time": "1:08:06", "remaining_time": "0:29:24", "throughput": 4257.69, "total_tokens": 17399024} {"current_steps": 26655, "total_steps": 38160, "loss": 0.4833, "lr": 0.0002523008602103414, "epoch": 13.970125786163521, "percentage": 69.85, "elapsed_time": "1:08:07", "remaining_time": "0:29:24", "throughput": 4257.83, "total_tokens": 17403312} {"current_steps": 26660, "total_steps": 38160, "loss": 0.3836, "lr": 0.00025210223464396055, "epoch": 13.972746331236896, "percentage": 69.86, "elapsed_time": "1:08:08", "remaining_time": "0:29:23", "throughput": 4257.84, "total_tokens": 17406320} {"current_steps": 26665, "total_steps": 38160, "loss": 0.4067, "lr": 0.00025190366093496376, "epoch": 13.975366876310272, "percentage": 69.88, "elapsed_time": "1:08:08", "remaining_time": "0:29:22", "throughput": 4257.82, "total_tokens": 17409040} {"current_steps": 26670, "total_steps": 38160, "loss": 0.5066, "lr": 0.0002517051391248909, "epoch": 13.977987421383649, "percentage": 69.89, "elapsed_time": "1:08:09", "remaining_time": "0:29:21", "throughput": 4257.81, "total_tokens": 17411824} {"current_steps": 26675, "total_steps": 38160, "loss": 0.4644, "lr": 0.0002515066692552701, "epoch": 13.980607966457024, "percentage": 69.9, "elapsed_time": "1:08:10", "remaining_time": "0:29:21", "throughput": 4257.88, "total_tokens": 17415472} {"current_steps": 26680, "total_steps": 38160, "loss": 0.4866, "lr": 0.00025130825136761916, "epoch": 13.983228511530399, "percentage": 69.92, "elapsed_time": "1:08:10", "remaining_time": "0:29:20", "throughput": 4257.89, "total_tokens": 17418416} {"current_steps": 26685, "total_steps": 38160, "loss": 0.4551, "lr": 0.0002511098855034447, "epoch": 13.985849056603774, "percentage": 69.93, "elapsed_time": "1:08:11", "remaining_time": "0:29:19", "throughput": 4257.95, "total_tokens": 17421904} {"current_steps": 26690, "total_steps": 38160, "loss": 0.4754, "lr": 0.00025091157170424296, "epoch": 13.98846960167715, "percentage": 69.94, "elapsed_time": "1:08:12", "remaining_time": "0:29:18", "throughput": 4257.96, "total_tokens": 17424912} {"current_steps": 26695, "total_steps": 38160, "loss": 0.4721, "lr": 0.0002507133100114984, "epoch": 13.991090146750524, "percentage": 69.96, "elapsed_time": "1:08:13", "remaining_time": "0:29:17", "throughput": 4258.03, "total_tokens": 17428496} {"current_steps": 26700, "total_steps": 38160, "loss": 0.5442, "lr": 0.0002505151004666857, "epoch": 13.9937106918239, "percentage": 69.97, "elapsed_time": "1:08:13", "remaining_time": "0:29:17", "throughput": 4258.1, "total_tokens": 17431920} {"current_steps": 26705, "total_steps": 38160, "loss": 0.3706, "lr": 0.0002503169431112674, "epoch": 13.996331236897275, "percentage": 69.98, "elapsed_time": "1:08:14", "remaining_time": "0:29:16", "throughput": 4258.14, "total_tokens": 17435152} {"current_steps": 26710, "total_steps": 38160, "loss": 0.4008, "lr": 0.0002501188379866961, "epoch": 13.99895178197065, "percentage": 69.99, "elapsed_time": "1:08:15", "remaining_time": "0:29:15", "throughput": 4258.09, "total_tokens": 17437680} {"current_steps": 26712, "total_steps": 38160, "eval_loss": 0.488889217376709, "epoch": 14.0, "percentage": 70.0, "elapsed_time": "1:08:29", "remaining_time": "0:29:21", "throughput": 4243.74, "total_tokens": 17439088} {"current_steps": 26715, "total_steps": 38160, "loss": 0.3368, "lr": 0.0002499207851344133, "epoch": 14.001572327044025, "percentage": 70.01, "elapsed_time": "1:08:31", "remaining_time": "0:29:21", "throughput": 4241.98, "total_tokens": 17441328} {"current_steps": 26720, "total_steps": 38160, "loss": 0.4754, "lr": 0.00024972278459584903, "epoch": 14.0041928721174, "percentage": 70.02, "elapsed_time": "1:08:32", "remaining_time": "0:29:20", "throughput": 4241.96, "total_tokens": 17444016} {"current_steps": 26725, "total_steps": 38160, "loss": 0.3599, "lr": 0.00024952483641242304, "epoch": 14.006813417190775, "percentage": 70.03, "elapsed_time": "1:08:32", "remaining_time": "0:29:19", "throughput": 4241.98, "total_tokens": 17447088} {"current_steps": 26730, "total_steps": 38160, "loss": 0.5022, "lr": 0.0002493269406255435, "epoch": 14.00943396226415, "percentage": 70.05, "elapsed_time": "1:08:33", "remaining_time": "0:29:19", "throughput": 4242.13, "total_tokens": 17451280} {"current_steps": 26735, "total_steps": 38160, "loss": 0.5289, "lr": 0.0002491290972766082, "epoch": 14.012054507337526, "percentage": 70.06, "elapsed_time": "1:08:34", "remaining_time": "0:29:18", "throughput": 4242.29, "total_tokens": 17455792} {"current_steps": 26740, "total_steps": 38160, "loss": 0.3316, "lr": 0.0002489313064070037, "epoch": 14.014675052410901, "percentage": 70.07, "elapsed_time": "1:08:35", "remaining_time": "0:29:17", "throughput": 4242.32, "total_tokens": 17458896} {"current_steps": 26745, "total_steps": 38160, "loss": 0.4803, "lr": 0.00024873356805810566, "epoch": 14.017295597484276, "percentage": 70.09, "elapsed_time": "1:08:36", "remaining_time": "0:29:16", "throughput": 4242.33, "total_tokens": 17461904} {"current_steps": 26750, "total_steps": 38160, "loss": 0.3655, "lr": 0.00024853588227127864, "epoch": 14.019916142557651, "percentage": 70.1, "elapsed_time": "1:08:36", "remaining_time": "0:29:16", "throughput": 4242.4, "total_tokens": 17465424} {"current_steps": 26755, "total_steps": 38160, "loss": 0.4328, "lr": 0.000248338249087876, "epoch": 14.022536687631026, "percentage": 70.11, "elapsed_time": "1:08:37", "remaining_time": "0:29:15", "throughput": 4242.46, "total_tokens": 17468784} {"current_steps": 26760, "total_steps": 38160, "loss": 0.3793, "lr": 0.0002481406685492405, "epoch": 14.025157232704403, "percentage": 70.13, "elapsed_time": "1:08:38", "remaining_time": "0:29:14", "throughput": 4242.44, "total_tokens": 17471632} {"current_steps": 26765, "total_steps": 38160, "loss": 0.3581, "lr": 0.00024794314069670383, "epoch": 14.027777777777779, "percentage": 70.14, "elapsed_time": "1:08:39", "remaining_time": "0:29:13", "throughput": 4242.51, "total_tokens": 17475024} {"current_steps": 26770, "total_steps": 38160, "loss": 0.4833, "lr": 0.0002477456655715865, "epoch": 14.030398322851154, "percentage": 70.15, "elapsed_time": "1:08:39", "remaining_time": "0:29:12", "throughput": 4242.51, "total_tokens": 17477904} {"current_steps": 26775, "total_steps": 38160, "loss": 0.3585, "lr": 0.0002475482432151982, "epoch": 14.033018867924529, "percentage": 70.17, "elapsed_time": "1:08:40", "remaining_time": "0:29:12", "throughput": 4242.47, "total_tokens": 17480464} {"current_steps": 26780, "total_steps": 38160, "loss": 0.4091, "lr": 0.00024735087366883733, "epoch": 14.035639412997904, "percentage": 70.18, "elapsed_time": "1:08:41", "remaining_time": "0:29:11", "throughput": 4242.48, "total_tokens": 17483440} {"current_steps": 26785, "total_steps": 38160, "loss": 0.4513, "lr": 0.00024715355697379115, "epoch": 14.03825995807128, "percentage": 70.19, "elapsed_time": "1:08:41", "remaining_time": "0:29:10", "throughput": 4242.45, "total_tokens": 17485968} {"current_steps": 26790, "total_steps": 38160, "loss": 0.5101, "lr": 0.0002469562931713362, "epoch": 14.040880503144654, "percentage": 70.2, "elapsed_time": "1:08:42", "remaining_time": "0:29:09", "throughput": 4242.47, "total_tokens": 17489104} {"current_steps": 26795, "total_steps": 38160, "loss": 0.4733, "lr": 0.00024675908230273785, "epoch": 14.04350104821803, "percentage": 70.22, "elapsed_time": "1:08:43", "remaining_time": "0:29:08", "throughput": 4242.63, "total_tokens": 17493264} {"current_steps": 26800, "total_steps": 38160, "loss": 0.4732, "lr": 0.00024656192440925055, "epoch": 14.046121593291405, "percentage": 70.23, "elapsed_time": "1:08:43", "remaining_time": "0:29:08", "throughput": 4242.7, "total_tokens": 17496880} {"current_steps": 26805, "total_steps": 38160, "loss": 0.3343, "lr": 0.0002463648195321173, "epoch": 14.04874213836478, "percentage": 70.24, "elapsed_time": "1:08:44", "remaining_time": "0:29:07", "throughput": 4242.61, "total_tokens": 17498992} {"current_steps": 26810, "total_steps": 38160, "loss": 0.314, "lr": 0.00024616776771257, "epoch": 14.051362683438155, "percentage": 70.26, "elapsed_time": "1:08:45", "remaining_time": "0:29:06", "throughput": 4242.92, "total_tokens": 17505136} {"current_steps": 26815, "total_steps": 38160, "loss": 0.3297, "lr": 0.00024597076899182977, "epoch": 14.05398322851153, "percentage": 70.27, "elapsed_time": "1:08:46", "remaining_time": "0:29:05", "throughput": 4243.05, "total_tokens": 17509200} {"current_steps": 26820, "total_steps": 38160, "loss": 0.5492, "lr": 0.0002457738234111066, "epoch": 14.056603773584905, "percentage": 70.28, "elapsed_time": "1:08:47", "remaining_time": "0:29:05", "throughput": 4243.05, "total_tokens": 17512080} {"current_steps": 26825, "total_steps": 38160, "loss": 0.386, "lr": 0.00024557693101159937, "epoch": 14.05922431865828, "percentage": 70.3, "elapsed_time": "1:08:47", "remaining_time": "0:29:04", "throughput": 4243.08, "total_tokens": 17515152} {"current_steps": 26830, "total_steps": 38160, "loss": 0.494, "lr": 0.00024538009183449553, "epoch": 14.061844863731656, "percentage": 70.31, "elapsed_time": "1:08:48", "remaining_time": "0:29:03", "throughput": 4243.14, "total_tokens": 17518576} {"current_steps": 26835, "total_steps": 38160, "loss": 0.3923, "lr": 0.0002451833059209715, "epoch": 14.064465408805031, "percentage": 70.32, "elapsed_time": "1:08:49", "remaining_time": "0:29:02", "throughput": 4243.11, "total_tokens": 17521264} {"current_steps": 26840, "total_steps": 38160, "loss": 0.3794, "lr": 0.00024498657331219274, "epoch": 14.067085953878406, "percentage": 70.34, "elapsed_time": "1:08:50", "remaining_time": "0:29:01", "throughput": 4243.11, "total_tokens": 17524176} {"current_steps": 26845, "total_steps": 38160, "loss": 0.4116, "lr": 0.0002447898940493135, "epoch": 14.069706498951781, "percentage": 70.35, "elapsed_time": "1:08:50", "remaining_time": "0:29:01", "throughput": 4243.17, "total_tokens": 17527600} {"current_steps": 26850, "total_steps": 38160, "loss": 0.4074, "lr": 0.00024459326817347684, "epoch": 14.072327044025156, "percentage": 70.36, "elapsed_time": "1:08:51", "remaining_time": "0:29:00", "throughput": 4243.1, "total_tokens": 17529904} {"current_steps": 26855, "total_steps": 38160, "loss": 0.5548, "lr": 0.0002443966957258148, "epoch": 14.074947589098532, "percentage": 70.37, "elapsed_time": "1:08:52", "remaining_time": "0:28:59", "throughput": 4243.08, "total_tokens": 17532624} {"current_steps": 26860, "total_steps": 38160, "loss": 0.3473, "lr": 0.000244200176747448, "epoch": 14.077568134171909, "percentage": 70.39, "elapsed_time": "1:08:52", "remaining_time": "0:28:58", "throughput": 4243.19, "total_tokens": 17536432} {"current_steps": 26865, "total_steps": 38160, "loss": 0.3697, "lr": 0.00024400371127948568, "epoch": 14.080188679245284, "percentage": 70.4, "elapsed_time": "1:08:53", "remaining_time": "0:28:57", "throughput": 4243.18, "total_tokens": 17539184} {"current_steps": 26870, "total_steps": 38160, "loss": 0.4115, "lr": 0.00024380729936302636, "epoch": 14.082809224318659, "percentage": 70.41, "elapsed_time": "1:08:54", "remaining_time": "0:28:57", "throughput": 4243.21, "total_tokens": 17542288} {"current_steps": 26875, "total_steps": 38160, "loss": 0.3676, "lr": 0.00024361094103915725, "epoch": 14.085429769392034, "percentage": 70.43, "elapsed_time": "1:08:54", "remaining_time": "0:28:56", "throughput": 4243.19, "total_tokens": 17545200} {"current_steps": 26880, "total_steps": 38160, "loss": 0.4023, "lr": 0.00024341463634895444, "epoch": 14.08805031446541, "percentage": 70.44, "elapsed_time": "1:08:55", "remaining_time": "0:28:55", "throughput": 4243.33, "total_tokens": 17549328} {"current_steps": 26885, "total_steps": 38160, "loss": 0.4667, "lr": 0.0002432183853334824, "epoch": 14.090670859538784, "percentage": 70.45, "elapsed_time": "1:08:56", "remaining_time": "0:28:54", "throughput": 4243.38, "total_tokens": 17552496} {"current_steps": 26890, "total_steps": 38160, "loss": 0.4917, "lr": 0.00024302218803379445, "epoch": 14.09329140461216, "percentage": 70.47, "elapsed_time": "1:08:57", "remaining_time": "0:28:53", "throughput": 4243.4, "total_tokens": 17555600} {"current_steps": 26895, "total_steps": 38160, "loss": 0.4314, "lr": 0.000242826044490933, "epoch": 14.095911949685535, "percentage": 70.48, "elapsed_time": "1:08:57", "remaining_time": "0:28:53", "throughput": 4243.45, "total_tokens": 17558928} {"current_steps": 26900, "total_steps": 38160, "loss": 0.4234, "lr": 0.00024262995474592903, "epoch": 14.09853249475891, "percentage": 70.49, "elapsed_time": "1:08:58", "remaining_time": "0:28:52", "throughput": 4243.41, "total_tokens": 17561456} {"current_steps": 26905, "total_steps": 38160, "loss": 0.361, "lr": 0.0002424339188398025, "epoch": 14.101153039832285, "percentage": 70.51, "elapsed_time": "1:08:59", "remaining_time": "0:28:51", "throughput": 4243.5, "total_tokens": 17565072} {"current_steps": 26910, "total_steps": 38160, "loss": 0.4404, "lr": 0.00024223793681356148, "epoch": 14.10377358490566, "percentage": 70.52, "elapsed_time": "1:08:59", "remaining_time": "0:28:50", "throughput": 4243.49, "total_tokens": 17567920} {"current_steps": 26915, "total_steps": 38160, "loss": 0.4768, "lr": 0.00024204200870820358, "epoch": 14.106394129979035, "percentage": 70.53, "elapsed_time": "1:09:00", "remaining_time": "0:28:49", "throughput": 4243.45, "total_tokens": 17570384} {"current_steps": 26920, "total_steps": 38160, "loss": 0.4258, "lr": 0.0002418461345647143, "epoch": 14.10901467505241, "percentage": 70.55, "elapsed_time": "1:09:01", "remaining_time": "0:28:49", "throughput": 4243.5, "total_tokens": 17573616} {"current_steps": 26925, "total_steps": 38160, "loss": 0.3882, "lr": 0.00024165031442406853, "epoch": 14.111635220125786, "percentage": 70.56, "elapsed_time": "1:09:02", "remaining_time": "0:28:48", "throughput": 4243.67, "total_tokens": 17578128} {"current_steps": 26930, "total_steps": 38160, "loss": 0.5445, "lr": 0.00024145454832722956, "epoch": 14.114255765199161, "percentage": 70.57, "elapsed_time": "1:09:02", "remaining_time": "0:28:47", "throughput": 4243.66, "total_tokens": 17580944} {"current_steps": 26935, "total_steps": 38160, "loss": 0.3367, "lr": 0.00024125883631514967, "epoch": 14.116876310272536, "percentage": 70.58, "elapsed_time": "1:09:03", "remaining_time": "0:28:46", "throughput": 4243.7, "total_tokens": 17584208} {"current_steps": 26940, "total_steps": 38160, "loss": 0.4987, "lr": 0.00024106317842876907, "epoch": 14.119496855345911, "percentage": 70.6, "elapsed_time": "1:09:04", "remaining_time": "0:28:46", "throughput": 4243.82, "total_tokens": 17588112} {"current_steps": 26945, "total_steps": 38160, "loss": 0.3558, "lr": 0.0002408675747090177, "epoch": 14.122117400419286, "percentage": 70.61, "elapsed_time": "1:09:05", "remaining_time": "0:28:45", "throughput": 4243.85, "total_tokens": 17591216} {"current_steps": 26950, "total_steps": 38160, "loss": 0.4596, "lr": 0.00024067202519681313, "epoch": 14.124737945492662, "percentage": 70.62, "elapsed_time": "1:09:05", "remaining_time": "0:28:44", "throughput": 4243.87, "total_tokens": 17594352} {"current_steps": 26955, "total_steps": 38160, "loss": 0.3296, "lr": 0.00024047652993306235, "epoch": 14.127358490566039, "percentage": 70.64, "elapsed_time": "1:09:06", "remaining_time": "0:28:43", "throughput": 4243.85, "total_tokens": 17596976} {"current_steps": 26960, "total_steps": 38160, "loss": 0.4031, "lr": 0.00024028108895866084, "epoch": 14.129979035639414, "percentage": 70.65, "elapsed_time": "1:09:07", "remaining_time": "0:28:42", "throughput": 4243.84, "total_tokens": 17599824} {"current_steps": 26965, "total_steps": 38160, "loss": 0.3583, "lr": 0.00024008570231449239, "epoch": 14.132599580712789, "percentage": 70.66, "elapsed_time": "1:09:07", "remaining_time": "0:28:42", "throughput": 4243.9, "total_tokens": 17603312} {"current_steps": 26970, "total_steps": 38160, "loss": 0.4526, "lr": 0.00023989037004142966, "epoch": 14.135220125786164, "percentage": 70.68, "elapsed_time": "1:09:08", "remaining_time": "0:28:41", "throughput": 4243.85, "total_tokens": 17605712} {"current_steps": 26975, "total_steps": 38160, "loss": 0.6139, "lr": 0.0002396950921803343, "epoch": 14.13784067085954, "percentage": 70.69, "elapsed_time": "1:09:09", "remaining_time": "0:28:40", "throughput": 4243.93, "total_tokens": 17609424} {"current_steps": 26980, "total_steps": 38160, "loss": 0.523, "lr": 0.0002394998687720557, "epoch": 14.140461215932914, "percentage": 70.7, "elapsed_time": "1:09:09", "remaining_time": "0:28:39", "throughput": 4243.88, "total_tokens": 17611952} {"current_steps": 26985, "total_steps": 38160, "loss": 0.4089, "lr": 0.0002393046998574328, "epoch": 14.14308176100629, "percentage": 70.72, "elapsed_time": "1:09:10", "remaining_time": "0:28:38", "throughput": 4243.9, "total_tokens": 17614960} {"current_steps": 26990, "total_steps": 38160, "loss": 0.3611, "lr": 0.0002391095854772924, "epoch": 14.145702306079665, "percentage": 70.73, "elapsed_time": "1:09:11", "remaining_time": "0:28:38", "throughput": 4244.04, "total_tokens": 17619152} {"current_steps": 26995, "total_steps": 38160, "loss": 0.4591, "lr": 0.00023891452567245027, "epoch": 14.14832285115304, "percentage": 70.74, "elapsed_time": "1:09:12", "remaining_time": "0:28:37", "throughput": 4244.15, "total_tokens": 17623024} {"current_steps": 27000, "total_steps": 38160, "loss": 0.3109, "lr": 0.00023871952048371093, "epoch": 14.150943396226415, "percentage": 70.75, "elapsed_time": "1:09:13", "remaining_time": "0:28:36", "throughput": 4244.25, "total_tokens": 17626736} {"current_steps": 27005, "total_steps": 38160, "loss": 0.4492, "lr": 0.00023852456995186684, "epoch": 14.15356394129979, "percentage": 70.77, "elapsed_time": "1:09:13", "remaining_time": "0:28:35", "throughput": 4244.27, "total_tokens": 17629808} {"current_steps": 27010, "total_steps": 38160, "loss": 0.5346, "lr": 0.0002383296741176997, "epoch": 14.156184486373165, "percentage": 70.78, "elapsed_time": "1:09:14", "remaining_time": "0:28:35", "throughput": 4244.33, "total_tokens": 17633168} {"current_steps": 27015, "total_steps": 38160, "loss": 0.5687, "lr": 0.00023813483302197964, "epoch": 14.15880503144654, "percentage": 70.79, "elapsed_time": "1:09:15", "remaining_time": "0:28:34", "throughput": 4244.37, "total_tokens": 17636560} {"current_steps": 27020, "total_steps": 38160, "loss": 0.4554, "lr": 0.00023794004670546476, "epoch": 14.161425576519916, "percentage": 70.81, "elapsed_time": "1:09:16", "remaining_time": "0:28:33", "throughput": 4244.52, "total_tokens": 17640784} {"current_steps": 27025, "total_steps": 38160, "loss": 0.3503, "lr": 0.00023774531520890242, "epoch": 14.164046121593291, "percentage": 70.82, "elapsed_time": "1:09:16", "remaining_time": "0:28:32", "throughput": 4244.55, "total_tokens": 17643984} {"current_steps": 27030, "total_steps": 38160, "loss": 0.4586, "lr": 0.00023755063857302833, "epoch": 14.166666666666666, "percentage": 70.83, "elapsed_time": "1:09:17", "remaining_time": "0:28:31", "throughput": 4244.59, "total_tokens": 17647184} {"current_steps": 27035, "total_steps": 38160, "loss": 0.3703, "lr": 0.00023735601683856628, "epoch": 14.169287211740041, "percentage": 70.85, "elapsed_time": "1:09:18", "remaining_time": "0:28:31", "throughput": 4244.55, "total_tokens": 17649808} {"current_steps": 27040, "total_steps": 38160, "loss": 0.4269, "lr": 0.0002371614500462293, "epoch": 14.171907756813416, "percentage": 70.86, "elapsed_time": "1:09:18", "remaining_time": "0:28:30", "throughput": 4244.49, "total_tokens": 17652112} {"current_steps": 27045, "total_steps": 38160, "loss": 0.4319, "lr": 0.00023696693823671816, "epoch": 14.174528301886792, "percentage": 70.87, "elapsed_time": "1:09:19", "remaining_time": "0:28:29", "throughput": 4244.52, "total_tokens": 17655312} {"current_steps": 27050, "total_steps": 38160, "loss": 0.4777, "lr": 0.00023677248145072272, "epoch": 14.177148846960169, "percentage": 70.89, "elapsed_time": "1:09:20", "remaining_time": "0:28:28", "throughput": 4244.69, "total_tokens": 17659792} {"current_steps": 27055, "total_steps": 38160, "loss": 0.3542, "lr": 0.0002365780797289211, "epoch": 14.179769392033544, "percentage": 70.9, "elapsed_time": "1:09:21", "remaining_time": "0:28:27", "throughput": 4244.73, "total_tokens": 17663056} {"current_steps": 27060, "total_steps": 38160, "loss": 0.5029, "lr": 0.00023638373311198014, "epoch": 14.182389937106919, "percentage": 70.91, "elapsed_time": "1:09:21", "remaining_time": "0:28:27", "throughput": 4244.72, "total_tokens": 17665904} {"current_steps": 27065, "total_steps": 38160, "loss": 0.3732, "lr": 0.00023618944164055468, "epoch": 14.185010482180294, "percentage": 70.93, "elapsed_time": "1:09:22", "remaining_time": "0:28:26", "throughput": 4244.72, "total_tokens": 17668912} {"current_steps": 27070, "total_steps": 38160, "loss": 0.3582, "lr": 0.00023599520535528813, "epoch": 14.18763102725367, "percentage": 70.94, "elapsed_time": "1:09:23", "remaining_time": "0:28:25", "throughput": 4244.74, "total_tokens": 17672080} {"current_steps": 27075, "total_steps": 38160, "loss": 0.482, "lr": 0.00023580102429681266, "epoch": 14.190251572327044, "percentage": 70.95, "elapsed_time": "1:09:23", "remaining_time": "0:28:24", "throughput": 4244.72, "total_tokens": 17674736} {"current_steps": 27080, "total_steps": 38160, "loss": 0.3552, "lr": 0.00023560689850574885, "epoch": 14.19287211740042, "percentage": 70.96, "elapsed_time": "1:09:24", "remaining_time": "0:28:24", "throughput": 4244.8, "total_tokens": 17678384} {"current_steps": 27085, "total_steps": 38160, "loss": 0.4382, "lr": 0.00023541282802270563, "epoch": 14.195492662473795, "percentage": 70.98, "elapsed_time": "1:09:25", "remaining_time": "0:28:23", "throughput": 4244.9, "total_tokens": 17682128} {"current_steps": 27090, "total_steps": 38160, "loss": 0.5291, "lr": 0.00023521881288828005, "epoch": 14.19811320754717, "percentage": 70.99, "elapsed_time": "1:09:26", "remaining_time": "0:28:22", "throughput": 4244.9, "total_tokens": 17684944} {"current_steps": 27095, "total_steps": 38160, "loss": 0.4457, "lr": 0.00023502485314305828, "epoch": 14.200733752620545, "percentage": 71.0, "elapsed_time": "1:09:26", "remaining_time": "0:28:21", "throughput": 4244.88, "total_tokens": 17687728} {"current_steps": 27100, "total_steps": 38160, "loss": 0.3825, "lr": 0.00023483094882761397, "epoch": 14.20335429769392, "percentage": 71.02, "elapsed_time": "1:09:27", "remaining_time": "0:28:20", "throughput": 4244.88, "total_tokens": 17690608} {"current_steps": 27105, "total_steps": 38160, "loss": 0.5177, "lr": 0.00023463709998250998, "epoch": 14.205974842767295, "percentage": 71.03, "elapsed_time": "1:09:28", "remaining_time": "0:28:20", "throughput": 4244.99, "total_tokens": 17694512} {"current_steps": 27110, "total_steps": 38160, "loss": 0.3662, "lr": 0.00023444330664829728, "epoch": 14.20859538784067, "percentage": 71.04, "elapsed_time": "1:09:29", "remaining_time": "0:28:19", "throughput": 4245.0, "total_tokens": 17697424} {"current_steps": 27115, "total_steps": 38160, "loss": 0.3149, "lr": 0.00023424956886551536, "epoch": 14.211215932914046, "percentage": 71.06, "elapsed_time": "1:09:29", "remaining_time": "0:28:18", "throughput": 4245.04, "total_tokens": 17700688} {"current_steps": 27120, "total_steps": 38160, "loss": 0.3947, "lr": 0.0002340558866746918, "epoch": 14.213836477987421, "percentage": 71.07, "elapsed_time": "1:09:30", "remaining_time": "0:28:17", "throughput": 4245.12, "total_tokens": 17704336} {"current_steps": 27125, "total_steps": 38160, "loss": 0.3388, "lr": 0.0002338622601163425, "epoch": 14.216457023060796, "percentage": 71.08, "elapsed_time": "1:09:31", "remaining_time": "0:28:16", "throughput": 4245.08, "total_tokens": 17706896} {"current_steps": 27130, "total_steps": 38160, "loss": 0.3415, "lr": 0.00023366868923097213, "epoch": 14.219077568134171, "percentage": 71.1, "elapsed_time": "1:09:31", "remaining_time": "0:28:16", "throughput": 4245.13, "total_tokens": 17710320} {"current_steps": 27135, "total_steps": 38160, "loss": 0.3883, "lr": 0.0002334751740590735, "epoch": 14.221698113207546, "percentage": 71.11, "elapsed_time": "1:09:32", "remaining_time": "0:28:15", "throughput": 4245.14, "total_tokens": 17713296} {"current_steps": 27140, "total_steps": 38160, "loss": 0.3164, "lr": 0.00023328171464112796, "epoch": 14.224318658280922, "percentage": 71.12, "elapsed_time": "1:09:33", "remaining_time": "0:28:14", "throughput": 4245.21, "total_tokens": 17716912} {"current_steps": 27145, "total_steps": 38160, "loss": 0.481, "lr": 0.00023308831101760485, "epoch": 14.226939203354299, "percentage": 71.13, "elapsed_time": "1:09:34", "remaining_time": "0:28:13", "throughput": 4245.19, "total_tokens": 17719632} {"current_steps": 27150, "total_steps": 38160, "loss": 0.4385, "lr": 0.00023289496322896174, "epoch": 14.229559748427674, "percentage": 71.15, "elapsed_time": "1:09:34", "remaining_time": "0:28:12", "throughput": 4245.24, "total_tokens": 17722960} {"current_steps": 27155, "total_steps": 38160, "loss": 0.4879, "lr": 0.00023270167131564512, "epoch": 14.232180293501049, "percentage": 71.16, "elapsed_time": "1:09:35", "remaining_time": "0:28:12", "throughput": 4245.29, "total_tokens": 17726288} {"current_steps": 27160, "total_steps": 38160, "loss": 0.3801, "lr": 0.0002325084353180893, "epoch": 14.234800838574424, "percentage": 71.17, "elapsed_time": "1:09:36", "remaining_time": "0:28:11", "throughput": 4245.32, "total_tokens": 17729488} {"current_steps": 27165, "total_steps": 38160, "loss": 0.4758, "lr": 0.00023231525527671716, "epoch": 14.2374213836478, "percentage": 71.19, "elapsed_time": "1:09:36", "remaining_time": "0:28:10", "throughput": 4245.33, "total_tokens": 17732496} {"current_steps": 27170, "total_steps": 38160, "loss": 0.333, "lr": 0.00023212213123193986, "epoch": 14.240041928721174, "percentage": 71.2, "elapsed_time": "1:09:38", "remaining_time": "0:28:10", "throughput": 4245.67, "total_tokens": 17739088} {"current_steps": 27175, "total_steps": 38160, "loss": 0.4062, "lr": 0.0002319290632241566, "epoch": 14.24266247379455, "percentage": 71.21, "elapsed_time": "1:09:38", "remaining_time": "0:28:09", "throughput": 4245.69, "total_tokens": 17742224} {"current_steps": 27180, "total_steps": 38160, "loss": 0.4419, "lr": 0.0002317360512937548, "epoch": 14.245283018867925, "percentage": 71.23, "elapsed_time": "1:09:39", "remaining_time": "0:28:08", "throughput": 4245.87, "total_tokens": 17746800} {"current_steps": 27185, "total_steps": 38160, "loss": 0.4865, "lr": 0.00023154309548111058, "epoch": 14.2479035639413, "percentage": 71.24, "elapsed_time": "1:09:40", "remaining_time": "0:28:07", "throughput": 4245.89, "total_tokens": 17749936} {"current_steps": 27190, "total_steps": 38160, "loss": 0.4761, "lr": 0.000231350195826588, "epoch": 14.250524109014675, "percentage": 71.25, "elapsed_time": "1:09:41", "remaining_time": "0:28:06", "throughput": 4245.9, "total_tokens": 17752848} {"current_steps": 27195, "total_steps": 38160, "loss": 0.3616, "lr": 0.00023115735237053982, "epoch": 14.25314465408805, "percentage": 71.27, "elapsed_time": "1:09:41", "remaining_time": "0:28:06", "throughput": 4245.98, "total_tokens": 17756592} {"current_steps": 27200, "total_steps": 38160, "loss": 0.5391, "lr": 0.00023096456515330632, "epoch": 14.255765199161425, "percentage": 71.28, "elapsed_time": "1:09:42", "remaining_time": "0:28:05", "throughput": 4246.01, "total_tokens": 17759728} {"current_steps": 27205, "total_steps": 38160, "loss": 0.4588, "lr": 0.0002307718342152163, "epoch": 14.2583857442348, "percentage": 71.29, "elapsed_time": "1:09:43", "remaining_time": "0:28:04", "throughput": 4245.97, "total_tokens": 17762320} {"current_steps": 27210, "total_steps": 38160, "loss": 0.3975, "lr": 0.0002305791595965871, "epoch": 14.261006289308176, "percentage": 71.31, "elapsed_time": "1:09:44", "remaining_time": "0:28:03", "throughput": 4245.99, "total_tokens": 17765424} {"current_steps": 27215, "total_steps": 38160, "loss": 0.4465, "lr": 0.00023038654133772395, "epoch": 14.26362683438155, "percentage": 71.32, "elapsed_time": "1:09:44", "remaining_time": "0:28:02", "throughput": 4246.02, "total_tokens": 17768528} {"current_steps": 27220, "total_steps": 38160, "loss": 0.3198, "lr": 0.00023019397947892062, "epoch": 14.266247379454926, "percentage": 71.33, "elapsed_time": "1:09:45", "remaining_time": "0:28:02", "throughput": 4246.0, "total_tokens": 17771184} {"current_steps": 27225, "total_steps": 38160, "loss": 0.306, "lr": 0.00023000147406045853, "epoch": 14.268867924528301, "percentage": 71.34, "elapsed_time": "1:09:46", "remaining_time": "0:28:01", "throughput": 4246.27, "total_tokens": 17776368} {"current_steps": 27230, "total_steps": 38160, "loss": 0.4554, "lr": 0.00022980902512260786, "epoch": 14.271488469601676, "percentage": 71.36, "elapsed_time": "1:09:47", "remaining_time": "0:28:00", "throughput": 4246.23, "total_tokens": 17779024} {"current_steps": 27235, "total_steps": 38160, "loss": 0.4261, "lr": 0.00022961663270562656, "epoch": 14.274109014675052, "percentage": 71.37, "elapsed_time": "1:09:47", "remaining_time": "0:27:59", "throughput": 4246.29, "total_tokens": 17782544} {"current_steps": 27240, "total_steps": 38160, "loss": 0.3274, "lr": 0.0002294242968497609, "epoch": 14.276729559748428, "percentage": 71.38, "elapsed_time": "1:09:48", "remaining_time": "0:27:59", "throughput": 4246.28, "total_tokens": 17785328} {"current_steps": 27245, "total_steps": 38160, "loss": 0.3651, "lr": 0.00022923201759524552, "epoch": 14.279350104821804, "percentage": 71.4, "elapsed_time": "1:09:49", "remaining_time": "0:27:58", "throughput": 4246.27, "total_tokens": 17788176} {"current_steps": 27250, "total_steps": 38160, "loss": 0.4101, "lr": 0.00022903979498230316, "epoch": 14.281970649895179, "percentage": 71.41, "elapsed_time": "1:09:49", "remaining_time": "0:27:57", "throughput": 4246.32, "total_tokens": 17791504} {"current_steps": 27255, "total_steps": 38160, "loss": 0.4288, "lr": 0.00022884762905114436, "epoch": 14.284591194968554, "percentage": 71.42, "elapsed_time": "1:09:50", "remaining_time": "0:27:56", "throughput": 4246.52, "total_tokens": 17796304} {"current_steps": 27260, "total_steps": 38160, "loss": 0.3499, "lr": 0.00022865551984196792, "epoch": 14.28721174004193, "percentage": 71.44, "elapsed_time": "1:09:51", "remaining_time": "0:27:55", "throughput": 4246.49, "total_tokens": 17798928} {"current_steps": 27265, "total_steps": 38160, "loss": 0.4843, "lr": 0.0002284634673949611, "epoch": 14.289832285115304, "percentage": 71.45, "elapsed_time": "1:09:52", "remaining_time": "0:27:55", "throughput": 4246.56, "total_tokens": 17802480} {"current_steps": 27270, "total_steps": 38160, "loss": 0.4198, "lr": 0.00022827147175029906, "epoch": 14.29245283018868, "percentage": 71.46, "elapsed_time": "1:09:52", "remaining_time": "0:27:54", "throughput": 4246.61, "total_tokens": 17805680} {"current_steps": 27275, "total_steps": 38160, "loss": 0.4185, "lr": 0.0002280795329481452, "epoch": 14.295073375262055, "percentage": 71.48, "elapsed_time": "1:09:53", "remaining_time": "0:27:53", "throughput": 4246.58, "total_tokens": 17808336} {"current_steps": 27280, "total_steps": 38160, "loss": 0.3922, "lr": 0.00022788765102865066, "epoch": 14.29769392033543, "percentage": 71.49, "elapsed_time": "1:09:54", "remaining_time": "0:27:52", "throughput": 4246.59, "total_tokens": 17811280} {"current_steps": 27285, "total_steps": 38160, "loss": 0.4046, "lr": 0.00022769582603195533, "epoch": 14.300314465408805, "percentage": 71.5, "elapsed_time": "1:09:55", "remaining_time": "0:27:52", "throughput": 4246.69, "total_tokens": 17815120} {"current_steps": 27290, "total_steps": 38160, "loss": 0.3822, "lr": 0.00022750405799818634, "epoch": 14.30293501048218, "percentage": 71.51, "elapsed_time": "1:09:55", "remaining_time": "0:27:51", "throughput": 4246.75, "total_tokens": 17818608} {"current_steps": 27295, "total_steps": 38160, "loss": 0.4243, "lr": 0.00022731234696745967, "epoch": 14.305555555555555, "percentage": 71.53, "elapsed_time": "1:09:56", "remaining_time": "0:27:50", "throughput": 4246.89, "total_tokens": 17822640} {"current_steps": 27300, "total_steps": 38160, "loss": 0.5681, "lr": 0.0002271206929798792, "epoch": 14.30817610062893, "percentage": 71.54, "elapsed_time": "1:09:57", "remaining_time": "0:27:49", "throughput": 4246.92, "total_tokens": 17825712} {"current_steps": 27305, "total_steps": 38160, "loss": 0.5637, "lr": 0.00022692909607553642, "epoch": 14.310796645702306, "percentage": 71.55, "elapsed_time": "1:09:58", "remaining_time": "0:27:48", "throughput": 4246.91, "total_tokens": 17828624} {"current_steps": 27310, "total_steps": 38160, "loss": 0.5243, "lr": 0.00022673755629451132, "epoch": 14.31341719077568, "percentage": 71.57, "elapsed_time": "1:09:58", "remaining_time": "0:27:48", "throughput": 4246.93, "total_tokens": 17831696} {"current_steps": 27315, "total_steps": 38160, "loss": 0.2973, "lr": 0.00022654607367687213, "epoch": 14.316037735849056, "percentage": 71.58, "elapsed_time": "1:09:59", "remaining_time": "0:27:47", "throughput": 4247.0, "total_tokens": 17835280} {"current_steps": 27320, "total_steps": 38160, "loss": 0.4992, "lr": 0.00022635464826267442, "epoch": 14.318658280922431, "percentage": 71.59, "elapsed_time": "1:10:00", "remaining_time": "0:27:46", "throughput": 4247.15, "total_tokens": 17839472} {"current_steps": 27325, "total_steps": 38160, "loss": 0.3817, "lr": 0.00022616328009196236, "epoch": 14.321278825995806, "percentage": 71.61, "elapsed_time": "1:10:01", "remaining_time": "0:27:45", "throughput": 4247.24, "total_tokens": 17843152} {"current_steps": 27330, "total_steps": 38160, "loss": 0.5328, "lr": 0.0002259719692047682, "epoch": 14.323899371069182, "percentage": 71.62, "elapsed_time": "1:10:01", "remaining_time": "0:27:45", "throughput": 4247.31, "total_tokens": 17846640} {"current_steps": 27335, "total_steps": 38160, "loss": 0.3739, "lr": 0.00022578071564111163, "epoch": 14.326519916142558, "percentage": 71.63, "elapsed_time": "1:10:02", "remaining_time": "0:27:44", "throughput": 4247.34, "total_tokens": 17849776} {"current_steps": 27340, "total_steps": 38160, "loss": 0.4772, "lr": 0.00022558951944100087, "epoch": 14.329140461215934, "percentage": 71.65, "elapsed_time": "1:10:03", "remaining_time": "0:27:43", "throughput": 4247.44, "total_tokens": 17853488} {"current_steps": 27345, "total_steps": 38160, "loss": 0.3493, "lr": 0.00022539838064443223, "epoch": 14.331761006289309, "percentage": 71.66, "elapsed_time": "1:10:03", "remaining_time": "0:27:42", "throughput": 4247.4, "total_tokens": 17855984} {"current_steps": 27350, "total_steps": 38160, "loss": 0.4171, "lr": 0.00022520729929138933, "epoch": 14.334381551362684, "percentage": 71.67, "elapsed_time": "1:10:04", "remaining_time": "0:27:41", "throughput": 4247.42, "total_tokens": 17858992} {"current_steps": 27355, "total_steps": 38160, "loss": 0.3724, "lr": 0.0002250162754218446, "epoch": 14.33700209643606, "percentage": 71.69, "elapsed_time": "1:10:05", "remaining_time": "0:27:41", "throughput": 4247.47, "total_tokens": 17862352} {"current_steps": 27360, "total_steps": 38160, "loss": 0.3881, "lr": 0.00022482530907575767, "epoch": 14.339622641509434, "percentage": 71.7, "elapsed_time": "1:10:06", "remaining_time": "0:27:40", "throughput": 4247.54, "total_tokens": 17865872} {"current_steps": 27365, "total_steps": 38160, "loss": 0.3507, "lr": 0.00022463440029307674, "epoch": 14.34224318658281, "percentage": 71.71, "elapsed_time": "1:10:06", "remaining_time": "0:27:39", "throughput": 4247.55, "total_tokens": 17868880} {"current_steps": 27370, "total_steps": 38160, "loss": 0.4915, "lr": 0.00022444354911373794, "epoch": 14.344863731656185, "percentage": 71.72, "elapsed_time": "1:10:07", "remaining_time": "0:27:38", "throughput": 4247.61, "total_tokens": 17872272} {"current_steps": 27375, "total_steps": 38160, "loss": 0.4061, "lr": 0.00022425275557766473, "epoch": 14.34748427672956, "percentage": 71.74, "elapsed_time": "1:10:08", "remaining_time": "0:27:37", "throughput": 4247.62, "total_tokens": 17875376} {"current_steps": 27380, "total_steps": 38160, "loss": 0.4094, "lr": 0.00022406201972476937, "epoch": 14.350104821802935, "percentage": 71.75, "elapsed_time": "1:10:09", "remaining_time": "0:27:37", "throughput": 4247.75, "total_tokens": 17879408} {"current_steps": 27385, "total_steps": 38160, "loss": 0.4041, "lr": 0.00022387134159495122, "epoch": 14.35272536687631, "percentage": 71.76, "elapsed_time": "1:10:09", "remaining_time": "0:27:36", "throughput": 4247.85, "total_tokens": 17883120} {"current_steps": 27390, "total_steps": 38160, "loss": 0.4827, "lr": 0.00022368072122809813, "epoch": 14.355345911949685, "percentage": 71.78, "elapsed_time": "1:10:10", "remaining_time": "0:27:35", "throughput": 4247.87, "total_tokens": 17886256} {"current_steps": 27395, "total_steps": 38160, "loss": 0.4087, "lr": 0.0002234901586640858, "epoch": 14.35796645702306, "percentage": 71.79, "elapsed_time": "1:10:11", "remaining_time": "0:27:34", "throughput": 4247.97, "total_tokens": 17890160} {"current_steps": 27400, "total_steps": 38160, "loss": 0.5357, "lr": 0.00022329965394277785, "epoch": 14.360587002096436, "percentage": 71.8, "elapsed_time": "1:10:12", "remaining_time": "0:27:34", "throughput": 4248.08, "total_tokens": 17893904} {"current_steps": 27405, "total_steps": 38160, "loss": 0.4048, "lr": 0.00022310920710402532, "epoch": 14.36320754716981, "percentage": 71.82, "elapsed_time": "1:10:12", "remaining_time": "0:27:33", "throughput": 4248.04, "total_tokens": 17896400} {"current_steps": 27410, "total_steps": 38160, "loss": 0.329, "lr": 0.00022291881818766796, "epoch": 14.365828092243186, "percentage": 71.83, "elapsed_time": "1:10:14", "remaining_time": "0:27:32", "throughput": 4248.43, "total_tokens": 17903056} {"current_steps": 27415, "total_steps": 38160, "loss": 0.583, "lr": 0.00022272848723353252, "epoch": 14.368448637316561, "percentage": 71.84, "elapsed_time": "1:10:14", "remaining_time": "0:27:31", "throughput": 4248.43, "total_tokens": 17906032} {"current_steps": 27420, "total_steps": 38160, "loss": 0.4427, "lr": 0.00022253821428143422, "epoch": 14.371069182389936, "percentage": 71.86, "elapsed_time": "1:10:15", "remaining_time": "0:27:31", "throughput": 4248.44, "total_tokens": 17909040} {"current_steps": 27425, "total_steps": 38160, "loss": 0.4625, "lr": 0.0002223479993711761, "epoch": 14.373689727463312, "percentage": 71.87, "elapsed_time": "1:10:16", "remaining_time": "0:27:30", "throughput": 4248.43, "total_tokens": 17911920} {"current_steps": 27430, "total_steps": 38160, "loss": 0.4982, "lr": 0.00022215784254254906, "epoch": 14.376310272536688, "percentage": 71.88, "elapsed_time": "1:10:16", "remaining_time": "0:27:29", "throughput": 4248.42, "total_tokens": 17914608} {"current_steps": 27435, "total_steps": 38160, "loss": 0.3412, "lr": 0.00022196774383533157, "epoch": 14.378930817610064, "percentage": 71.89, "elapsed_time": "1:10:17", "remaining_time": "0:27:28", "throughput": 4248.51, "total_tokens": 17918352} {"current_steps": 27440, "total_steps": 38160, "loss": 0.3611, "lr": 0.0002217777032892899, "epoch": 14.381551362683439, "percentage": 71.91, "elapsed_time": "1:10:18", "remaining_time": "0:27:28", "throughput": 4248.64, "total_tokens": 17922512} {"current_steps": 27445, "total_steps": 38160, "loss": 0.5707, "lr": 0.00022158772094417863, "epoch": 14.384171907756814, "percentage": 71.92, "elapsed_time": "1:10:19", "remaining_time": "0:27:27", "throughput": 4248.7, "total_tokens": 17925904} {"current_steps": 27450, "total_steps": 38160, "loss": 0.5187, "lr": 0.00022139779683973983, "epoch": 14.38679245283019, "percentage": 71.93, "elapsed_time": "1:10:19", "remaining_time": "0:27:26", "throughput": 4248.66, "total_tokens": 17928400} {"current_steps": 27455, "total_steps": 38160, "loss": 0.3943, "lr": 0.00022120793101570364, "epoch": 14.389412997903564, "percentage": 71.95, "elapsed_time": "1:10:20", "remaining_time": "0:27:25", "throughput": 4248.75, "total_tokens": 17932080} {"current_steps": 27460, "total_steps": 38160, "loss": 0.6396, "lr": 0.00022101812351178762, "epoch": 14.39203354297694, "percentage": 71.96, "elapsed_time": "1:10:21", "remaining_time": "0:27:24", "throughput": 4248.86, "total_tokens": 17936016} {"current_steps": 27465, "total_steps": 38160, "loss": 0.5971, "lr": 0.00022082837436769725, "epoch": 14.394654088050315, "percentage": 71.97, "elapsed_time": "1:10:22", "remaining_time": "0:27:24", "throughput": 4248.95, "total_tokens": 17939664} {"current_steps": 27470, "total_steps": 38160, "loss": 0.3858, "lr": 0.00022063868362312596, "epoch": 14.39727463312369, "percentage": 71.99, "elapsed_time": "1:10:22", "remaining_time": "0:27:23", "throughput": 4248.94, "total_tokens": 17942448} {"current_steps": 27475, "total_steps": 38160, "loss": 0.5047, "lr": 0.00022044905131775495, "epoch": 14.399895178197065, "percentage": 72.0, "elapsed_time": "1:10:23", "remaining_time": "0:27:22", "throughput": 4248.95, "total_tokens": 17945456} {"current_steps": 27480, "total_steps": 38160, "loss": 0.3964, "lr": 0.00022025947749125313, "epoch": 14.40251572327044, "percentage": 72.01, "elapsed_time": "1:10:24", "remaining_time": "0:27:21", "throughput": 4249.07, "total_tokens": 17949488} {"current_steps": 27485, "total_steps": 38160, "loss": 0.3688, "lr": 0.0002200699621832773, "epoch": 14.405136268343815, "percentage": 72.03, "elapsed_time": "1:10:25", "remaining_time": "0:27:20", "throughput": 4249.09, "total_tokens": 17952592} {"current_steps": 27490, "total_steps": 38160, "loss": 0.5905, "lr": 0.0002198805054334718, "epoch": 14.40775681341719, "percentage": 72.04, "elapsed_time": "1:10:25", "remaining_time": "0:27:20", "throughput": 4249.12, "total_tokens": 17955696} {"current_steps": 27495, "total_steps": 38160, "loss": 0.5963, "lr": 0.00021969110728146862, "epoch": 14.410377358490566, "percentage": 72.05, "elapsed_time": "1:10:26", "remaining_time": "0:27:19", "throughput": 4249.19, "total_tokens": 17959440} {"current_steps": 27500, "total_steps": 38160, "loss": 0.3618, "lr": 0.00021950176776688784, "epoch": 14.41299790356394, "percentage": 72.06, "elapsed_time": "1:10:27", "remaining_time": "0:27:18", "throughput": 4249.19, "total_tokens": 17962320} {"current_steps": 27505, "total_steps": 38160, "loss": 0.4749, "lr": 0.0002193124869293372, "epoch": 14.415618448637316, "percentage": 72.08, "elapsed_time": "1:10:27", "remaining_time": "0:27:17", "throughput": 4249.22, "total_tokens": 17965360} {"current_steps": 27510, "total_steps": 38160, "loss": 0.3914, "lr": 0.00021912326480841223, "epoch": 14.418238993710691, "percentage": 72.09, "elapsed_time": "1:10:28", "remaining_time": "0:27:17", "throughput": 4249.19, "total_tokens": 17968112} {"current_steps": 27515, "total_steps": 38160, "loss": 0.502, "lr": 0.0002189341014436958, "epoch": 14.420859538784066, "percentage": 72.1, "elapsed_time": "1:10:29", "remaining_time": "0:27:16", "throughput": 4249.23, "total_tokens": 17971344} {"current_steps": 27520, "total_steps": 38160, "loss": 0.3485, "lr": 0.00021874499687475857, "epoch": 14.423480083857442, "percentage": 72.12, "elapsed_time": "1:10:30", "remaining_time": "0:27:15", "throughput": 4249.26, "total_tokens": 17974480} {"current_steps": 27525, "total_steps": 38160, "loss": 0.5049, "lr": 0.00021855595114115935, "epoch": 14.426100628930818, "percentage": 72.13, "elapsed_time": "1:10:30", "remaining_time": "0:27:14", "throughput": 4249.34, "total_tokens": 17978128} {"current_steps": 27530, "total_steps": 38160, "loss": 0.3497, "lr": 0.00021836696428244418, "epoch": 14.428721174004194, "percentage": 72.14, "elapsed_time": "1:10:31", "remaining_time": "0:27:13", "throughput": 4249.43, "total_tokens": 17981808} {"current_steps": 27535, "total_steps": 38160, "loss": 0.4084, "lr": 0.0002181780363381473, "epoch": 14.431341719077569, "percentage": 72.16, "elapsed_time": "1:10:32", "remaining_time": "0:27:13", "throughput": 4249.42, "total_tokens": 17984624} {"current_steps": 27540, "total_steps": 38160, "loss": 0.3961, "lr": 0.00021798916734779, "epoch": 14.433962264150944, "percentage": 72.17, "elapsed_time": "1:10:32", "remaining_time": "0:27:12", "throughput": 4249.41, "total_tokens": 17987344} {"current_steps": 27545, "total_steps": 38160, "loss": 0.6958, "lr": 0.00021780035735088132, "epoch": 14.43658280922432, "percentage": 72.18, "elapsed_time": "1:10:33", "remaining_time": "0:27:11", "throughput": 4249.48, "total_tokens": 17990928} {"current_steps": 27550, "total_steps": 38160, "loss": 0.4041, "lr": 0.0002176116063869184, "epoch": 14.439203354297694, "percentage": 72.2, "elapsed_time": "1:10:34", "remaining_time": "0:27:10", "throughput": 4249.55, "total_tokens": 17994384} {"current_steps": 27555, "total_steps": 38160, "loss": 0.4656, "lr": 0.00021742291449538582, "epoch": 14.44182389937107, "percentage": 72.21, "elapsed_time": "1:10:35", "remaining_time": "0:27:09", "throughput": 4249.51, "total_tokens": 17996944} {"current_steps": 27560, "total_steps": 38160, "loss": 0.4641, "lr": 0.00021723428171575566, "epoch": 14.444444444444445, "percentage": 72.22, "elapsed_time": "1:10:35", "remaining_time": "0:27:09", "throughput": 4249.57, "total_tokens": 18000464} {"current_steps": 27565, "total_steps": 38160, "loss": 0.3922, "lr": 0.00021704570808748802, "epoch": 14.44706498951782, "percentage": 72.24, "elapsed_time": "1:10:36", "remaining_time": "0:27:08", "throughput": 4249.6, "total_tokens": 18003664} {"current_steps": 27570, "total_steps": 38160, "loss": 0.4248, "lr": 0.00021685719365003008, "epoch": 14.449685534591195, "percentage": 72.25, "elapsed_time": "1:10:37", "remaining_time": "0:27:07", "throughput": 4249.59, "total_tokens": 18006480} {"current_steps": 27575, "total_steps": 38160, "loss": 0.5848, "lr": 0.00021666873844281682, "epoch": 14.45230607966457, "percentage": 72.26, "elapsed_time": "1:10:37", "remaining_time": "0:27:06", "throughput": 4249.6, "total_tokens": 18009424} {"current_steps": 27580, "total_steps": 38160, "loss": 0.3376, "lr": 0.0002164803425052711, "epoch": 14.454926624737945, "percentage": 72.27, "elapsed_time": "1:10:38", "remaining_time": "0:27:05", "throughput": 4249.66, "total_tokens": 18012816} {"current_steps": 27585, "total_steps": 38160, "loss": 0.6486, "lr": 0.0002162920058768031, "epoch": 14.45754716981132, "percentage": 72.29, "elapsed_time": "1:10:39", "remaining_time": "0:27:05", "throughput": 4249.88, "total_tokens": 18017808} {"current_steps": 27590, "total_steps": 38160, "loss": 0.3762, "lr": 0.000216103728596811, "epoch": 14.460167714884696, "percentage": 72.3, "elapsed_time": "1:10:40", "remaining_time": "0:27:04", "throughput": 4249.94, "total_tokens": 18021168} {"current_steps": 27595, "total_steps": 38160, "loss": 0.5142, "lr": 0.00021591551070467975, "epoch": 14.46278825995807, "percentage": 72.31, "elapsed_time": "1:10:40", "remaining_time": "0:27:03", "throughput": 4249.93, "total_tokens": 18023920} {"current_steps": 27600, "total_steps": 38160, "loss": 0.3676, "lr": 0.0002157273522397829, "epoch": 14.465408805031446, "percentage": 72.33, "elapsed_time": "1:10:41", "remaining_time": "0:27:02", "throughput": 4249.98, "total_tokens": 18027248} {"current_steps": 27605, "total_steps": 38160, "loss": 0.46, "lr": 0.0002155392532414806, "epoch": 14.468029350104821, "percentage": 72.34, "elapsed_time": "1:10:42", "remaining_time": "0:27:02", "throughput": 4249.97, "total_tokens": 18030096} {"current_steps": 27610, "total_steps": 38160, "loss": 0.3913, "lr": 0.00021535121374912126, "epoch": 14.470649895178196, "percentage": 72.35, "elapsed_time": "1:10:43", "remaining_time": "0:27:01", "throughput": 4250.04, "total_tokens": 18033584} {"current_steps": 27615, "total_steps": 38160, "loss": 0.4215, "lr": 0.00021516323380204073, "epoch": 14.473270440251572, "percentage": 72.37, "elapsed_time": "1:10:44", "remaining_time": "0:27:00", "throughput": 4250.19, "total_tokens": 18037936} {"current_steps": 27620, "total_steps": 38160, "loss": 0.5958, "lr": 0.00021497531343956188, "epoch": 14.475890985324948, "percentage": 72.38, "elapsed_time": "1:10:44", "remaining_time": "0:26:59", "throughput": 4250.22, "total_tokens": 18041136} {"current_steps": 27625, "total_steps": 38160, "loss": 0.3933, "lr": 0.00021478745270099591, "epoch": 14.478511530398324, "percentage": 72.39, "elapsed_time": "1:10:45", "remaining_time": "0:26:59", "throughput": 4250.27, "total_tokens": 18044368} {"current_steps": 27630, "total_steps": 38160, "loss": 0.5094, "lr": 0.0002145996516256408, "epoch": 14.481132075471699, "percentage": 72.41, "elapsed_time": "1:10:46", "remaining_time": "0:26:58", "throughput": 4250.22, "total_tokens": 18046832} {"current_steps": 27635, "total_steps": 38160, "loss": 0.4683, "lr": 0.00021441191025278256, "epoch": 14.483752620545074, "percentage": 72.42, "elapsed_time": "1:10:46", "remaining_time": "0:26:57", "throughput": 4250.26, "total_tokens": 18050096} {"current_steps": 27640, "total_steps": 38160, "loss": 0.4459, "lr": 0.00021422422862169455, "epoch": 14.48637316561845, "percentage": 72.43, "elapsed_time": "1:10:47", "remaining_time": "0:26:56", "throughput": 4250.21, "total_tokens": 18052528} {"current_steps": 27645, "total_steps": 38160, "loss": 0.3308, "lr": 0.00021403660677163773, "epoch": 14.488993710691824, "percentage": 72.44, "elapsed_time": "1:10:48", "remaining_time": "0:26:55", "throughput": 4250.22, "total_tokens": 18055536} {"current_steps": 27650, "total_steps": 38160, "loss": 0.4092, "lr": 0.00021384904474186018, "epoch": 14.4916142557652, "percentage": 72.46, "elapsed_time": "1:10:48", "remaining_time": "0:26:55", "throughput": 4250.3, "total_tokens": 18059152} {"current_steps": 27655, "total_steps": 38160, "loss": 0.569, "lr": 0.00021366154257159808, "epoch": 14.494234800838575, "percentage": 72.47, "elapsed_time": "1:10:49", "remaining_time": "0:26:54", "throughput": 4250.29, "total_tokens": 18061936} {"current_steps": 27660, "total_steps": 38160, "loss": 0.4286, "lr": 0.00021347410030007435, "epoch": 14.49685534591195, "percentage": 72.48, "elapsed_time": "1:10:50", "remaining_time": "0:26:53", "throughput": 4250.35, "total_tokens": 18065264} {"current_steps": 27665, "total_steps": 38160, "loss": 0.4508, "lr": 0.0002132867179665, "epoch": 14.499475890985325, "percentage": 72.5, "elapsed_time": "1:10:51", "remaining_time": "0:26:52", "throughput": 4250.37, "total_tokens": 18068336} {"current_steps": 27670, "total_steps": 38160, "loss": 0.4374, "lr": 0.00021309939561007341, "epoch": 14.5020964360587, "percentage": 72.51, "elapsed_time": "1:10:51", "remaining_time": "0:26:51", "throughput": 4250.41, "total_tokens": 18071600} {"current_steps": 27675, "total_steps": 38160, "loss": 0.4274, "lr": 0.00021291213326997998, "epoch": 14.504716981132075, "percentage": 72.52, "elapsed_time": "1:10:52", "remaining_time": "0:26:51", "throughput": 4250.52, "total_tokens": 18075472} {"current_steps": 27680, "total_steps": 38160, "loss": 0.3908, "lr": 0.00021272493098539296, "epoch": 14.50733752620545, "percentage": 72.54, "elapsed_time": "1:10:53", "remaining_time": "0:26:50", "throughput": 4250.59, "total_tokens": 18078992} {"current_steps": 27685, "total_steps": 38160, "loss": 0.514, "lr": 0.0002125377887954732, "epoch": 14.509958071278826, "percentage": 72.55, "elapsed_time": "1:10:53", "remaining_time": "0:26:49", "throughput": 4250.59, "total_tokens": 18081872} {"current_steps": 27690, "total_steps": 38160, "loss": 0.3714, "lr": 0.00021235070673936824, "epoch": 14.5125786163522, "percentage": 72.56, "elapsed_time": "1:10:54", "remaining_time": "0:26:48", "throughput": 4250.61, "total_tokens": 18084944} {"current_steps": 27695, "total_steps": 38160, "loss": 0.5238, "lr": 0.00021216368485621394, "epoch": 14.515199161425576, "percentage": 72.58, "elapsed_time": "1:10:55", "remaining_time": "0:26:47", "throughput": 4250.63, "total_tokens": 18088016} {"current_steps": 27700, "total_steps": 38160, "loss": 0.5574, "lr": 0.00021197672318513282, "epoch": 14.517819706498951, "percentage": 72.59, "elapsed_time": "1:10:56", "remaining_time": "0:26:47", "throughput": 4250.66, "total_tokens": 18091216} {"current_steps": 27705, "total_steps": 38160, "loss": 0.4645, "lr": 0.00021178982176523525, "epoch": 14.520440251572326, "percentage": 72.6, "elapsed_time": "1:10:56", "remaining_time": "0:26:46", "throughput": 4250.72, "total_tokens": 18094736} {"current_steps": 27710, "total_steps": 38160, "loss": 0.4659, "lr": 0.0002116029806356189, "epoch": 14.523060796645701, "percentage": 72.62, "elapsed_time": "1:10:57", "remaining_time": "0:26:45", "throughput": 4250.69, "total_tokens": 18097392} {"current_steps": 27715, "total_steps": 38160, "loss": 0.4246, "lr": 0.00021141619983536893, "epoch": 14.525681341719078, "percentage": 72.63, "elapsed_time": "1:10:58", "remaining_time": "0:26:44", "throughput": 4250.65, "total_tokens": 18099888} {"current_steps": 27720, "total_steps": 38160, "loss": 0.3949, "lr": 0.00021122947940355747, "epoch": 14.528301886792454, "percentage": 72.64, "elapsed_time": "1:10:58", "remaining_time": "0:26:43", "throughput": 4250.69, "total_tokens": 18103248} {"current_steps": 27725, "total_steps": 38160, "loss": 0.4464, "lr": 0.00021104281937924462, "epoch": 14.530922431865829, "percentage": 72.65, "elapsed_time": "1:10:59", "remaining_time": "0:26:43", "throughput": 4250.66, "total_tokens": 18105808} {"current_steps": 27730, "total_steps": 38160, "loss": 0.4186, "lr": 0.00021085621980147716, "epoch": 14.533542976939204, "percentage": 72.67, "elapsed_time": "1:11:00", "remaining_time": "0:26:42", "throughput": 4250.67, "total_tokens": 18108880} {"current_steps": 27735, "total_steps": 38160, "loss": 0.4191, "lr": 0.00021066968070928982, "epoch": 14.536163522012579, "percentage": 72.68, "elapsed_time": "1:11:01", "remaining_time": "0:26:41", "throughput": 4250.75, "total_tokens": 18112496} {"current_steps": 27740, "total_steps": 38160, "loss": 0.3526, "lr": 0.00021048320214170463, "epoch": 14.538784067085954, "percentage": 72.69, "elapsed_time": "1:11:01", "remaining_time": "0:26:40", "throughput": 4250.85, "total_tokens": 18116272} {"current_steps": 27745, "total_steps": 38160, "loss": 0.3931, "lr": 0.00021029678413773034, "epoch": 14.54140461215933, "percentage": 72.71, "elapsed_time": "1:11:02", "remaining_time": "0:26:40", "throughput": 4250.91, "total_tokens": 18119696} {"current_steps": 27750, "total_steps": 38160, "loss": 0.4052, "lr": 0.0002101104267363639, "epoch": 14.544025157232705, "percentage": 72.72, "elapsed_time": "1:11:03", "remaining_time": "0:26:39", "throughput": 4251.1, "total_tokens": 18124464} {"current_steps": 27755, "total_steps": 38160, "loss": 0.355, "lr": 0.00020992412997658877, "epoch": 14.54664570230608, "percentage": 72.73, "elapsed_time": "1:11:04", "remaining_time": "0:26:38", "throughput": 4251.11, "total_tokens": 18127472} {"current_steps": 27760, "total_steps": 38160, "loss": 0.4528, "lr": 0.0002097378938973763, "epoch": 14.549266247379455, "percentage": 72.75, "elapsed_time": "1:11:04", "remaining_time": "0:26:37", "throughput": 4251.09, "total_tokens": 18130224} {"current_steps": 27765, "total_steps": 38160, "loss": 0.3677, "lr": 0.0002095517185376849, "epoch": 14.55188679245283, "percentage": 72.76, "elapsed_time": "1:11:05", "remaining_time": "0:26:36", "throughput": 4251.07, "total_tokens": 18132976} {"current_steps": 27770, "total_steps": 38160, "loss": 0.4321, "lr": 0.0002093656039364606, "epoch": 14.554507337526205, "percentage": 72.77, "elapsed_time": "1:11:06", "remaining_time": "0:26:36", "throughput": 4251.12, "total_tokens": 18136336} {"current_steps": 27775, "total_steps": 38160, "loss": 0.3491, "lr": 0.00020917955013263618, "epoch": 14.55712788259958, "percentage": 72.79, "elapsed_time": "1:11:06", "remaining_time": "0:26:35", "throughput": 4251.1, "total_tokens": 18139056} {"current_steps": 27780, "total_steps": 38160, "loss": 0.4062, "lr": 0.00020899355716513186, "epoch": 14.559748427672956, "percentage": 72.8, "elapsed_time": "1:11:07", "remaining_time": "0:26:34", "throughput": 4251.06, "total_tokens": 18141552} {"current_steps": 27785, "total_steps": 38160, "loss": 0.5064, "lr": 0.00020880762507285544, "epoch": 14.56236897274633, "percentage": 72.81, "elapsed_time": "1:11:08", "remaining_time": "0:26:33", "throughput": 4251.06, "total_tokens": 18144496} {"current_steps": 27790, "total_steps": 38160, "loss": 0.3658, "lr": 0.00020862175389470172, "epoch": 14.564989517819706, "percentage": 72.82, "elapsed_time": "1:11:08", "remaining_time": "0:26:32", "throughput": 4251.11, "total_tokens": 18147792} {"current_steps": 27795, "total_steps": 38160, "loss": 0.5015, "lr": 0.00020843594366955288, "epoch": 14.567610062893081, "percentage": 72.84, "elapsed_time": "1:11:09", "remaining_time": "0:26:32", "throughput": 4251.13, "total_tokens": 18150864} {"current_steps": 27800, "total_steps": 38160, "loss": 0.3773, "lr": 0.0002082501944362784, "epoch": 14.570230607966456, "percentage": 72.85, "elapsed_time": "1:11:10", "remaining_time": "0:26:31", "throughput": 4251.18, "total_tokens": 18154192} {"current_steps": 27805, "total_steps": 38160, "loss": 0.4562, "lr": 0.00020806450623373486, "epoch": 14.572851153039831, "percentage": 72.86, "elapsed_time": "1:11:11", "remaining_time": "0:26:30", "throughput": 4251.23, "total_tokens": 18157616} {"current_steps": 27810, "total_steps": 38160, "loss": 0.3914, "lr": 0.00020787887910076586, "epoch": 14.575471698113208, "percentage": 72.88, "elapsed_time": "1:11:11", "remaining_time": "0:26:29", "throughput": 4251.24, "total_tokens": 18160624} {"current_steps": 27815, "total_steps": 38160, "loss": 0.5241, "lr": 0.00020769331307620258, "epoch": 14.578092243186584, "percentage": 72.89, "elapsed_time": "1:11:12", "remaining_time": "0:26:29", "throughput": 4251.3, "total_tokens": 18164048} {"current_steps": 27820, "total_steps": 38160, "loss": 0.5825, "lr": 0.0002075078081988635, "epoch": 14.580712788259959, "percentage": 72.9, "elapsed_time": "1:11:13", "remaining_time": "0:26:28", "throughput": 4251.35, "total_tokens": 18167408} {"current_steps": 27825, "total_steps": 38160, "loss": 0.3209, "lr": 0.00020732236450755415, "epoch": 14.583333333333334, "percentage": 72.92, "elapsed_time": "1:11:14", "remaining_time": "0:26:27", "throughput": 4251.38, "total_tokens": 18170608} {"current_steps": 27830, "total_steps": 38160, "loss": 0.472, "lr": 0.00020713698204106708, "epoch": 14.585953878406709, "percentage": 72.93, "elapsed_time": "1:11:14", "remaining_time": "0:26:26", "throughput": 4251.34, "total_tokens": 18173136} {"current_steps": 27835, "total_steps": 38160, "loss": 0.5252, "lr": 0.00020695166083818206, "epoch": 14.588574423480084, "percentage": 72.94, "elapsed_time": "1:11:15", "remaining_time": "0:26:25", "throughput": 4251.34, "total_tokens": 18176048} {"current_steps": 27840, "total_steps": 38160, "loss": 0.5091, "lr": 0.0002067664009376663, "epoch": 14.59119496855346, "percentage": 72.96, "elapsed_time": "1:11:16", "remaining_time": "0:26:25", "throughput": 4251.4, "total_tokens": 18179440} {"current_steps": 27845, "total_steps": 38160, "loss": 0.4915, "lr": 0.0002065812023782741, "epoch": 14.593815513626835, "percentage": 72.97, "elapsed_time": "1:11:16", "remaining_time": "0:26:24", "throughput": 4251.37, "total_tokens": 18182032} {"current_steps": 27850, "total_steps": 38160, "loss": 0.4245, "lr": 0.00020639606519874703, "epoch": 14.59643605870021, "percentage": 72.98, "elapsed_time": "1:11:17", "remaining_time": "0:26:23", "throughput": 4251.34, "total_tokens": 18184656} {"current_steps": 27855, "total_steps": 38160, "loss": 0.4473, "lr": 0.00020621098943781352, "epoch": 14.599056603773585, "percentage": 73.0, "elapsed_time": "1:11:18", "remaining_time": "0:26:22", "throughput": 4251.29, "total_tokens": 18187088} {"current_steps": 27860, "total_steps": 38160, "loss": 0.3805, "lr": 0.0002060259751341891, "epoch": 14.60167714884696, "percentage": 73.01, "elapsed_time": "1:11:18", "remaining_time": "0:26:21", "throughput": 4251.29, "total_tokens": 18189936} {"current_steps": 27865, "total_steps": 38160, "loss": 0.3587, "lr": 0.00020584102232657688, "epoch": 14.604297693920335, "percentage": 73.02, "elapsed_time": "1:11:19", "remaining_time": "0:26:21", "throughput": 4251.34, "total_tokens": 18193360} {"current_steps": 27870, "total_steps": 38160, "loss": 0.2909, "lr": 0.0002056561310536668, "epoch": 14.60691823899371, "percentage": 73.03, "elapsed_time": "1:11:20", "remaining_time": "0:26:20", "throughput": 4251.32, "total_tokens": 18196080} {"current_steps": 27875, "total_steps": 38160, "loss": 0.3938, "lr": 0.0002054713013541361, "epoch": 14.609538784067086, "percentage": 73.05, "elapsed_time": "1:11:20", "remaining_time": "0:26:19", "throughput": 4251.35, "total_tokens": 18199248} {"current_steps": 27880, "total_steps": 38160, "loss": 0.3668, "lr": 0.00020528653326664915, "epoch": 14.61215932914046, "percentage": 73.06, "elapsed_time": "1:11:21", "remaining_time": "0:26:18", "throughput": 4251.46, "total_tokens": 18203088} {"current_steps": 27885, "total_steps": 38160, "loss": 0.4116, "lr": 0.00020510182682985717, "epoch": 14.614779874213836, "percentage": 73.07, "elapsed_time": "1:11:22", "remaining_time": "0:26:17", "throughput": 4251.44, "total_tokens": 18205936} {"current_steps": 27890, "total_steps": 38160, "loss": 0.4469, "lr": 0.00020491718208239847, "epoch": 14.617400419287211, "percentage": 73.09, "elapsed_time": "1:11:23", "remaining_time": "0:26:17", "throughput": 4251.55, "total_tokens": 18209712} {"current_steps": 27895, "total_steps": 38160, "loss": 0.45, "lr": 0.00020473259906289877, "epoch": 14.620020964360586, "percentage": 73.1, "elapsed_time": "1:11:24", "remaining_time": "0:26:16", "throughput": 4251.78, "total_tokens": 18214864} {"current_steps": 27900, "total_steps": 38160, "loss": 0.3866, "lr": 0.00020454807780997077, "epoch": 14.622641509433961, "percentage": 73.11, "elapsed_time": "1:11:24", "remaining_time": "0:26:15", "throughput": 4251.8, "total_tokens": 18218032} {"current_steps": 27905, "total_steps": 38160, "loss": 0.3935, "lr": 0.0002043636183622144, "epoch": 14.625262054507338, "percentage": 73.13, "elapsed_time": "1:11:25", "remaining_time": "0:26:14", "throughput": 4251.93, "total_tokens": 18222096} {"current_steps": 27910, "total_steps": 38160, "loss": 0.4527, "lr": 0.00020417922075821626, "epoch": 14.627882599580714, "percentage": 73.14, "elapsed_time": "1:11:26", "remaining_time": "0:26:14", "throughput": 4251.97, "total_tokens": 18225360} {"current_steps": 27915, "total_steps": 38160, "loss": 0.5327, "lr": 0.00020399488503655005, "epoch": 14.630503144654089, "percentage": 73.15, "elapsed_time": "1:11:27", "remaining_time": "0:26:13", "throughput": 4251.97, "total_tokens": 18228304} {"current_steps": 27920, "total_steps": 38160, "loss": 0.5401, "lr": 0.00020381061123577688, "epoch": 14.633123689727464, "percentage": 73.17, "elapsed_time": "1:11:27", "remaining_time": "0:26:12", "throughput": 4252.0, "total_tokens": 18231504} {"current_steps": 27925, "total_steps": 38160, "loss": 0.4637, "lr": 0.00020362639939444473, "epoch": 14.635744234800839, "percentage": 73.18, "elapsed_time": "1:11:28", "remaining_time": "0:26:11", "throughput": 4251.99, "total_tokens": 18234320} {"current_steps": 27930, "total_steps": 38160, "loss": 0.4121, "lr": 0.0002034422495510888, "epoch": 14.638364779874214, "percentage": 73.19, "elapsed_time": "1:11:29", "remaining_time": "0:26:10", "throughput": 4252.01, "total_tokens": 18237296} {"current_steps": 27935, "total_steps": 38160, "loss": 0.4625, "lr": 0.00020325816174423077, "epoch": 14.64098532494759, "percentage": 73.2, "elapsed_time": "1:11:29", "remaining_time": "0:26:10", "throughput": 4251.95, "total_tokens": 18239696} {"current_steps": 27940, "total_steps": 38160, "loss": 0.5882, "lr": 0.00020307413601238012, "epoch": 14.643605870020965, "percentage": 73.22, "elapsed_time": "1:11:30", "remaining_time": "0:26:09", "throughput": 4252.0, "total_tokens": 18243088} {"current_steps": 27945, "total_steps": 38160, "loss": 0.5, "lr": 0.00020289017239403246, "epoch": 14.64622641509434, "percentage": 73.23, "elapsed_time": "1:11:31", "remaining_time": "0:26:08", "throughput": 4252.02, "total_tokens": 18246096} {"current_steps": 27950, "total_steps": 38160, "loss": 0.3387, "lr": 0.0002027062709276712, "epoch": 14.648846960167715, "percentage": 73.24, "elapsed_time": "1:11:31", "remaining_time": "0:26:07", "throughput": 4252.07, "total_tokens": 18249424} {"current_steps": 27955, "total_steps": 38160, "loss": 0.3408, "lr": 0.00020252243165176632, "epoch": 14.65146750524109, "percentage": 73.26, "elapsed_time": "1:11:32", "remaining_time": "0:26:07", "throughput": 4252.14, "total_tokens": 18252976} {"current_steps": 27960, "total_steps": 38160, "loss": 0.4808, "lr": 0.00020233865460477508, "epoch": 14.654088050314465, "percentage": 73.27, "elapsed_time": "1:11:33", "remaining_time": "0:26:06", "throughput": 4252.1, "total_tokens": 18255568} {"current_steps": 27965, "total_steps": 38160, "loss": 0.3687, "lr": 0.00020215493982514128, "epoch": 14.65670859538784, "percentage": 73.28, "elapsed_time": "1:11:34", "remaining_time": "0:26:05", "throughput": 4252.22, "total_tokens": 18259664} {"current_steps": 27970, "total_steps": 38160, "loss": 0.3184, "lr": 0.00020197128735129622, "epoch": 14.659329140461216, "percentage": 73.3, "elapsed_time": "1:11:34", "remaining_time": "0:26:04", "throughput": 4252.25, "total_tokens": 18262896} {"current_steps": 27975, "total_steps": 38160, "loss": 0.4143, "lr": 0.0002017876972216575, "epoch": 14.66194968553459, "percentage": 73.31, "elapsed_time": "1:11:35", "remaining_time": "0:26:03", "throughput": 4252.25, "total_tokens": 18265776} {"current_steps": 27980, "total_steps": 38160, "loss": 0.4659, "lr": 0.00020160416947463046, "epoch": 14.664570230607966, "percentage": 73.32, "elapsed_time": "1:11:36", "remaining_time": "0:26:03", "throughput": 4252.21, "total_tokens": 18268336} {"current_steps": 27985, "total_steps": 38160, "loss": 0.4876, "lr": 0.00020142070414860702, "epoch": 14.667190775681341, "percentage": 73.34, "elapsed_time": "1:11:36", "remaining_time": "0:26:02", "throughput": 4252.22, "total_tokens": 18271312} {"current_steps": 27990, "total_steps": 38160, "loss": 0.3474, "lr": 0.0002012373012819657, "epoch": 14.669811320754716, "percentage": 73.35, "elapsed_time": "1:11:37", "remaining_time": "0:26:01", "throughput": 4252.22, "total_tokens": 18274224} {"current_steps": 27995, "total_steps": 38160, "loss": 0.4803, "lr": 0.00020105396091307247, "epoch": 14.672431865828091, "percentage": 73.36, "elapsed_time": "1:11:38", "remaining_time": "0:26:00", "throughput": 4252.23, "total_tokens": 18277200} {"current_steps": 28000, "total_steps": 38160, "loss": 0.4094, "lr": 0.0002008706830802803, "epoch": 14.675052410901468, "percentage": 73.38, "elapsed_time": "1:11:38", "remaining_time": "0:25:59", "throughput": 4252.21, "total_tokens": 18280016} {"current_steps": 28005, "total_steps": 38160, "loss": 0.4543, "lr": 0.00020068746782192837, "epoch": 14.677672955974844, "percentage": 73.39, "elapsed_time": "1:11:39", "remaining_time": "0:25:59", "throughput": 4252.26, "total_tokens": 18283312} {"current_steps": 28010, "total_steps": 38160, "loss": 0.4791, "lr": 0.00020050431517634366, "epoch": 14.680293501048219, "percentage": 73.4, "elapsed_time": "1:11:40", "remaining_time": "0:25:58", "throughput": 4252.24, "total_tokens": 18286064} {"current_steps": 28015, "total_steps": 38160, "loss": 0.6439, "lr": 0.00020032122518183915, "epoch": 14.682914046121594, "percentage": 73.41, "elapsed_time": "1:11:40", "remaining_time": "0:25:57", "throughput": 4252.18, "total_tokens": 18288496} {"current_steps": 28020, "total_steps": 38160, "loss": 0.4623, "lr": 0.00020013819787671538, "epoch": 14.685534591194969, "percentage": 73.43, "elapsed_time": "1:11:41", "remaining_time": "0:25:56", "throughput": 4252.11, "total_tokens": 18290768} {"current_steps": 28025, "total_steps": 38160, "loss": 0.4255, "lr": 0.00019995523329925985, "epoch": 14.688155136268344, "percentage": 73.44, "elapsed_time": "1:11:42", "remaining_time": "0:25:55", "throughput": 4252.15, "total_tokens": 18294096} {"current_steps": 28030, "total_steps": 38160, "loss": 0.4384, "lr": 0.00019977233148774627, "epoch": 14.69077568134172, "percentage": 73.45, "elapsed_time": "1:11:43", "remaining_time": "0:25:55", "throughput": 4252.18, "total_tokens": 18297296} {"current_steps": 28035, "total_steps": 38160, "loss": 0.3535, "lr": 0.00019958949248043573, "epoch": 14.693396226415095, "percentage": 73.47, "elapsed_time": "1:11:43", "remaining_time": "0:25:54", "throughput": 4252.19, "total_tokens": 18300176} {"current_steps": 28040, "total_steps": 38160, "loss": 0.5187, "lr": 0.00019940671631557628, "epoch": 14.69601677148847, "percentage": 73.48, "elapsed_time": "1:11:44", "remaining_time": "0:25:53", "throughput": 4252.21, "total_tokens": 18303280} {"current_steps": 28045, "total_steps": 38160, "loss": 0.4306, "lr": 0.0001992240030314022, "epoch": 14.698637316561845, "percentage": 73.49, "elapsed_time": "1:11:45", "remaining_time": "0:25:52", "throughput": 4252.23, "total_tokens": 18306320} {"current_steps": 28050, "total_steps": 38160, "loss": 0.4601, "lr": 0.00019904135266613532, "epoch": 14.70125786163522, "percentage": 73.51, "elapsed_time": "1:11:45", "remaining_time": "0:25:51", "throughput": 4252.24, "total_tokens": 18309264} {"current_steps": 28055, "total_steps": 38160, "loss": 0.389, "lr": 0.00019885876525798407, "epoch": 14.703878406708595, "percentage": 73.52, "elapsed_time": "1:11:46", "remaining_time": "0:25:51", "throughput": 4252.24, "total_tokens": 18312144} {"current_steps": 28060, "total_steps": 38160, "loss": 0.3739, "lr": 0.0001986762408451434, "epoch": 14.70649895178197, "percentage": 73.53, "elapsed_time": "1:11:47", "remaining_time": "0:25:50", "throughput": 4252.18, "total_tokens": 18314448} {"current_steps": 28065, "total_steps": 38160, "loss": 0.4019, "lr": 0.00019849377946579562, "epoch": 14.709119496855346, "percentage": 73.55, "elapsed_time": "1:11:47", "remaining_time": "0:25:49", "throughput": 4252.17, "total_tokens": 18317200} {"current_steps": 28070, "total_steps": 38160, "loss": 0.4763, "lr": 0.00019831138115810926, "epoch": 14.71174004192872, "percentage": 73.56, "elapsed_time": "1:11:48", "remaining_time": "0:25:48", "throughput": 4252.22, "total_tokens": 18320464} {"current_steps": 28075, "total_steps": 38160, "loss": 0.4822, "lr": 0.00019812904596024005, "epoch": 14.714360587002096, "percentage": 73.57, "elapsed_time": "1:11:49", "remaining_time": "0:25:47", "throughput": 4252.24, "total_tokens": 18323568} {"current_steps": 28080, "total_steps": 38160, "loss": 0.5554, "lr": 0.00019794677391033055, "epoch": 14.716981132075471, "percentage": 73.58, "elapsed_time": "1:11:49", "remaining_time": "0:25:47", "throughput": 4252.29, "total_tokens": 18326928} {"current_steps": 28085, "total_steps": 38160, "loss": 0.5122, "lr": 0.00019776456504651014, "epoch": 14.719601677148846, "percentage": 73.6, "elapsed_time": "1:11:50", "remaining_time": "0:25:46", "throughput": 4252.28, "total_tokens": 18329808} {"current_steps": 28090, "total_steps": 38160, "loss": 0.5033, "lr": 0.0001975824194068946, "epoch": 14.722222222222221, "percentage": 73.61, "elapsed_time": "1:11:51", "remaining_time": "0:25:45", "throughput": 4252.36, "total_tokens": 18333424} {"current_steps": 28095, "total_steps": 38160, "loss": 0.3356, "lr": 0.00019740033702958653, "epoch": 14.724842767295598, "percentage": 73.62, "elapsed_time": "1:11:52", "remaining_time": "0:25:44", "throughput": 4252.35, "total_tokens": 18336176} {"current_steps": 28100, "total_steps": 38160, "loss": 0.3632, "lr": 0.0001972183179526758, "epoch": 14.727463312368974, "percentage": 73.64, "elapsed_time": "1:11:52", "remaining_time": "0:25:43", "throughput": 4252.4, "total_tokens": 18339568} {"current_steps": 28105, "total_steps": 38160, "loss": 0.3456, "lr": 0.0001970363622142386, "epoch": 14.730083857442349, "percentage": 73.65, "elapsed_time": "1:11:53", "remaining_time": "0:25:43", "throughput": 4252.42, "total_tokens": 18342640} {"current_steps": 28110, "total_steps": 38160, "loss": 0.3701, "lr": 0.00019685446985233824, "epoch": 14.732704402515724, "percentage": 73.66, "elapsed_time": "1:11:54", "remaining_time": "0:25:42", "throughput": 4252.44, "total_tokens": 18345712} {"current_steps": 28115, "total_steps": 38160, "loss": 0.2969, "lr": 0.00019667264090502412, "epoch": 14.735324947589099, "percentage": 73.68, "elapsed_time": "1:11:54", "remaining_time": "0:25:41", "throughput": 4252.43, "total_tokens": 18348528} {"current_steps": 28120, "total_steps": 38160, "loss": 0.4981, "lr": 0.0001964908754103331, "epoch": 14.737945492662474, "percentage": 73.69, "elapsed_time": "1:11:55", "remaining_time": "0:25:40", "throughput": 4252.57, "total_tokens": 18352720} {"current_steps": 28125, "total_steps": 38160, "loss": 0.3792, "lr": 0.00019630917340628822, "epoch": 14.74056603773585, "percentage": 73.7, "elapsed_time": "1:11:56", "remaining_time": "0:25:40", "throughput": 4252.69, "total_tokens": 18356752} {"current_steps": 28130, "total_steps": 38160, "loss": 0.3193, "lr": 0.00019612753493089959, "epoch": 14.743186582809225, "percentage": 73.72, "elapsed_time": "1:11:57", "remaining_time": "0:25:39", "throughput": 4252.74, "total_tokens": 18360080} {"current_steps": 28135, "total_steps": 38160, "loss": 0.5289, "lr": 0.00019594596002216387, "epoch": 14.7458071278826, "percentage": 73.73, "elapsed_time": "1:11:57", "remaining_time": "0:25:38", "throughput": 4252.75, "total_tokens": 18363056} {"current_steps": 28140, "total_steps": 38160, "loss": 0.4409, "lr": 0.00019576444871806465, "epoch": 14.748427672955975, "percentage": 73.74, "elapsed_time": "1:11:58", "remaining_time": "0:25:37", "throughput": 4252.7, "total_tokens": 18365488} {"current_steps": 28145, "total_steps": 38160, "loss": 0.4176, "lr": 0.0001955830010565719, "epoch": 14.75104821802935, "percentage": 73.76, "elapsed_time": "1:11:59", "remaining_time": "0:25:36", "throughput": 4252.69, "total_tokens": 18368368} {"current_steps": 28150, "total_steps": 38160, "loss": 0.483, "lr": 0.00019540161707564213, "epoch": 14.753668763102725, "percentage": 73.77, "elapsed_time": "1:11:59", "remaining_time": "0:25:36", "throughput": 4252.74, "total_tokens": 18371696} {"current_steps": 28155, "total_steps": 38160, "loss": 0.4323, "lr": 0.000195220296813219, "epoch": 14.7562893081761, "percentage": 73.78, "elapsed_time": "1:12:00", "remaining_time": "0:25:35", "throughput": 4252.74, "total_tokens": 18374576} {"current_steps": 28160, "total_steps": 38160, "loss": 0.403, "lr": 0.00019503904030723274, "epoch": 14.758909853249476, "percentage": 73.79, "elapsed_time": "1:12:01", "remaining_time": "0:25:34", "throughput": 4252.85, "total_tokens": 18378512} {"current_steps": 28165, "total_steps": 38160, "loss": 0.5063, "lr": 0.00019485784759560004, "epoch": 14.76153039832285, "percentage": 73.81, "elapsed_time": "1:12:02", "remaining_time": "0:25:33", "throughput": 4252.92, "total_tokens": 18382032} {"current_steps": 28170, "total_steps": 38160, "loss": 0.3538, "lr": 0.0001946767187162247, "epoch": 14.764150943396226, "percentage": 73.82, "elapsed_time": "1:12:02", "remaining_time": "0:25:33", "throughput": 4252.98, "total_tokens": 18385520} {"current_steps": 28175, "total_steps": 38160, "loss": 0.4559, "lr": 0.00019449565370699618, "epoch": 14.766771488469601, "percentage": 73.83, "elapsed_time": "1:12:03", "remaining_time": "0:25:32", "throughput": 4252.94, "total_tokens": 18388016} {"current_steps": 28180, "total_steps": 38160, "loss": 0.3027, "lr": 0.00019431465260579152, "epoch": 14.769392033542976, "percentage": 73.85, "elapsed_time": "1:12:04", "remaining_time": "0:25:31", "throughput": 4252.94, "total_tokens": 18390928} {"current_steps": 28185, "total_steps": 38160, "loss": 0.2985, "lr": 0.00019413371545047404, "epoch": 14.772012578616351, "percentage": 73.86, "elapsed_time": "1:12:04", "remaining_time": "0:25:30", "throughput": 4252.86, "total_tokens": 18393072} {"current_steps": 28190, "total_steps": 38160, "loss": 0.4906, "lr": 0.00019395284227889382, "epoch": 14.774633123689728, "percentage": 73.87, "elapsed_time": "1:12:05", "remaining_time": "0:25:29", "throughput": 4252.83, "total_tokens": 18395728} {"current_steps": 28195, "total_steps": 38160, "loss": 0.4946, "lr": 0.00019377203312888764, "epoch": 14.777253668763104, "percentage": 73.89, "elapsed_time": "1:12:06", "remaining_time": "0:25:29", "throughput": 4252.84, "total_tokens": 18398704} {"current_steps": 28200, "total_steps": 38160, "loss": 0.4787, "lr": 0.0001935912880382784, "epoch": 14.779874213836479, "percentage": 73.9, "elapsed_time": "1:12:06", "remaining_time": "0:25:28", "throughput": 4252.9, "total_tokens": 18402096} {"current_steps": 28205, "total_steps": 38160, "loss": 0.4358, "lr": 0.00019341060704487596, "epoch": 14.782494758909854, "percentage": 73.91, "elapsed_time": "1:12:07", "remaining_time": "0:25:27", "throughput": 4253.04, "total_tokens": 18406256} {"current_steps": 28210, "total_steps": 38160, "loss": 0.5, "lr": 0.00019322999018647668, "epoch": 14.785115303983229, "percentage": 73.93, "elapsed_time": "1:12:08", "remaining_time": "0:25:26", "throughput": 4253.12, "total_tokens": 18409968} {"current_steps": 28215, "total_steps": 38160, "loss": 0.372, "lr": 0.00019304943750086362, "epoch": 14.787735849056604, "percentage": 73.94, "elapsed_time": "1:12:09", "remaining_time": "0:25:26", "throughput": 4253.46, "total_tokens": 18416272} {"current_steps": 28220, "total_steps": 38160, "loss": 0.5812, "lr": 0.0001928689490258066, "epoch": 14.79035639412998, "percentage": 73.95, "elapsed_time": "1:12:10", "remaining_time": "0:25:25", "throughput": 4253.46, "total_tokens": 18419248} {"current_steps": 28225, "total_steps": 38160, "loss": 0.5099, "lr": 0.00019268852479906146, "epoch": 14.792976939203355, "percentage": 73.96, "elapsed_time": "1:12:11", "remaining_time": "0:25:24", "throughput": 4253.44, "total_tokens": 18421968} {"current_steps": 28230, "total_steps": 38160, "loss": 0.361, "lr": 0.0001925081648583708, "epoch": 14.79559748427673, "percentage": 73.98, "elapsed_time": "1:12:11", "remaining_time": "0:25:23", "throughput": 4253.44, "total_tokens": 18424816} {"current_steps": 28235, "total_steps": 38160, "loss": 0.3564, "lr": 0.00019232786924146394, "epoch": 14.798218029350105, "percentage": 73.99, "elapsed_time": "1:12:12", "remaining_time": "0:25:22", "throughput": 4253.51, "total_tokens": 18428272} {"current_steps": 28240, "total_steps": 38160, "loss": 0.5927, "lr": 0.00019214763798605677, "epoch": 14.80083857442348, "percentage": 74.0, "elapsed_time": "1:12:13", "remaining_time": "0:25:22", "throughput": 4253.49, "total_tokens": 18431024} {"current_steps": 28245, "total_steps": 38160, "loss": 0.4123, "lr": 0.00019196747112985158, "epoch": 14.803459119496855, "percentage": 74.02, "elapsed_time": "1:12:13", "remaining_time": "0:25:21", "throughput": 4253.54, "total_tokens": 18434416} {"current_steps": 28250, "total_steps": 38160, "loss": 0.4507, "lr": 0.00019178736871053737, "epoch": 14.80607966457023, "percentage": 74.03, "elapsed_time": "1:12:14", "remaining_time": "0:25:20", "throughput": 4253.56, "total_tokens": 18437680} {"current_steps": 28255, "total_steps": 38160, "loss": 0.4178, "lr": 0.00019160733076578935, "epoch": 14.808700209643606, "percentage": 74.04, "elapsed_time": "1:12:15", "remaining_time": "0:25:19", "throughput": 4253.64, "total_tokens": 18441296} {"current_steps": 28260, "total_steps": 38160, "loss": 0.5899, "lr": 0.0001914273573332692, "epoch": 14.81132075471698, "percentage": 74.06, "elapsed_time": "1:12:16", "remaining_time": "0:25:19", "throughput": 4253.67, "total_tokens": 18444336} {"current_steps": 28265, "total_steps": 38160, "loss": 0.4666, "lr": 0.00019124744845062553, "epoch": 14.813941299790356, "percentage": 74.07, "elapsed_time": "1:12:16", "remaining_time": "0:25:18", "throughput": 4253.67, "total_tokens": 18447216} {"current_steps": 28270, "total_steps": 38160, "loss": 0.4863, "lr": 0.00019106760415549324, "epoch": 14.816561844863731, "percentage": 74.08, "elapsed_time": "1:12:17", "remaining_time": "0:25:17", "throughput": 4253.64, "total_tokens": 18449840} {"current_steps": 28275, "total_steps": 38160, "loss": 0.3588, "lr": 0.0001908878244854938, "epoch": 14.819182389937106, "percentage": 74.1, "elapsed_time": "1:12:18", "remaining_time": "0:25:16", "throughput": 4253.66, "total_tokens": 18452848} {"current_steps": 28280, "total_steps": 38160, "loss": 0.4351, "lr": 0.00019070810947823498, "epoch": 14.821802935010481, "percentage": 74.11, "elapsed_time": "1:12:18", "remaining_time": "0:25:15", "throughput": 4253.73, "total_tokens": 18456336} {"current_steps": 28285, "total_steps": 38160, "loss": 0.4117, "lr": 0.0001905284591713109, "epoch": 14.824423480083858, "percentage": 74.12, "elapsed_time": "1:12:19", "remaining_time": "0:25:15", "throughput": 4253.69, "total_tokens": 18458896} {"current_steps": 28290, "total_steps": 38160, "loss": 0.463, "lr": 0.00019034887360230246, "epoch": 14.827044025157234, "percentage": 74.14, "elapsed_time": "1:12:20", "remaining_time": "0:25:14", "throughput": 4253.74, "total_tokens": 18462224} {"current_steps": 28295, "total_steps": 38160, "loss": 0.423, "lr": 0.000190169352808777, "epoch": 14.829664570230609, "percentage": 74.15, "elapsed_time": "1:12:20", "remaining_time": "0:25:13", "throughput": 4253.77, "total_tokens": 18465424} {"current_steps": 28300, "total_steps": 38160, "loss": 0.3837, "lr": 0.00018998989682828844, "epoch": 14.832285115303984, "percentage": 74.16, "elapsed_time": "1:12:21", "remaining_time": "0:25:12", "throughput": 4253.87, "total_tokens": 18469328} {"current_steps": 28305, "total_steps": 38160, "loss": 0.3493, "lr": 0.00018981050569837643, "epoch": 14.834905660377359, "percentage": 74.17, "elapsed_time": "1:12:22", "remaining_time": "0:25:11", "throughput": 4253.84, "total_tokens": 18472016} {"current_steps": 28310, "total_steps": 38160, "loss": 0.4786, "lr": 0.000189631179456568, "epoch": 14.837526205450734, "percentage": 74.19, "elapsed_time": "1:12:23", "remaining_time": "0:25:11", "throughput": 4253.85, "total_tokens": 18474928} {"current_steps": 28315, "total_steps": 38160, "loss": 0.5456, "lr": 0.00018945191814037578, "epoch": 14.84014675052411, "percentage": 74.2, "elapsed_time": "1:12:23", "remaining_time": "0:25:10", "throughput": 4253.99, "total_tokens": 18479088} {"current_steps": 28320, "total_steps": 38160, "loss": 0.3567, "lr": 0.00018927272178729938, "epoch": 14.842767295597485, "percentage": 74.21, "elapsed_time": "1:12:24", "remaining_time": "0:25:09", "throughput": 4253.98, "total_tokens": 18481840} {"current_steps": 28325, "total_steps": 38160, "loss": 0.5811, "lr": 0.00018909359043482477, "epoch": 14.84538784067086, "percentage": 74.23, "elapsed_time": "1:12:25", "remaining_time": "0:25:08", "throughput": 4254.02, "total_tokens": 18485104} {"current_steps": 28330, "total_steps": 38160, "loss": 0.5143, "lr": 0.00018891452412042386, "epoch": 14.848008385744235, "percentage": 74.24, "elapsed_time": "1:12:26", "remaining_time": "0:25:08", "throughput": 4254.2, "total_tokens": 18489680} {"current_steps": 28335, "total_steps": 38160, "loss": 0.6819, "lr": 0.00018873552288155542, "epoch": 14.85062893081761, "percentage": 74.25, "elapsed_time": "1:12:26", "remaining_time": "0:25:07", "throughput": 4254.21, "total_tokens": 18492688} {"current_steps": 28340, "total_steps": 38160, "loss": 0.5184, "lr": 0.00018855658675566471, "epoch": 14.853249475890985, "percentage": 74.27, "elapsed_time": "1:12:28", "remaining_time": "0:25:06", "throughput": 4254.59, "total_tokens": 18499696} {"current_steps": 28345, "total_steps": 38160, "loss": 0.548, "lr": 0.00018837771578018275, "epoch": 14.85587002096436, "percentage": 74.28, "elapsed_time": "1:12:28", "remaining_time": "0:25:05", "throughput": 4254.55, "total_tokens": 18502192} {"current_steps": 28350, "total_steps": 38160, "loss": 0.4848, "lr": 0.00018819890999252747, "epoch": 14.858490566037736, "percentage": 74.29, "elapsed_time": "1:12:29", "remaining_time": "0:25:05", "throughput": 4254.66, "total_tokens": 18506128} {"current_steps": 28355, "total_steps": 38160, "loss": 0.5111, "lr": 0.0001880201694301032, "epoch": 14.86111111111111, "percentage": 74.31, "elapsed_time": "1:12:30", "remaining_time": "0:25:04", "throughput": 4254.73, "total_tokens": 18509680} {"current_steps": 28360, "total_steps": 38160, "loss": 0.4115, "lr": 0.00018784149413030005, "epoch": 14.863731656184486, "percentage": 74.32, "elapsed_time": "1:12:31", "remaining_time": "0:25:03", "throughput": 4254.79, "total_tokens": 18513264} {"current_steps": 28365, "total_steps": 38160, "loss": 0.3784, "lr": 0.00018766288413049503, "epoch": 14.866352201257861, "percentage": 74.33, "elapsed_time": "1:12:31", "remaining_time": "0:25:02", "throughput": 4254.82, "total_tokens": 18516464} {"current_steps": 28370, "total_steps": 38160, "loss": 0.5533, "lr": 0.00018748433946805148, "epoch": 14.868972746331236, "percentage": 74.34, "elapsed_time": "1:12:32", "remaining_time": "0:25:02", "throughput": 4254.88, "total_tokens": 18519920} {"current_steps": 28375, "total_steps": 38160, "loss": 0.3499, "lr": 0.00018730586018031854, "epoch": 14.871593291404611, "percentage": 74.36, "elapsed_time": "1:12:33", "remaining_time": "0:25:01", "throughput": 4254.99, "total_tokens": 18523888} {"current_steps": 28380, "total_steps": 38160, "loss": 0.3951, "lr": 0.00018712744630463248, "epoch": 14.874213836477988, "percentage": 74.37, "elapsed_time": "1:12:34", "remaining_time": "0:25:00", "throughput": 4255.17, "total_tokens": 18528560} {"current_steps": 28385, "total_steps": 38160, "loss": 0.4068, "lr": 0.000186949097878315, "epoch": 14.876834381551364, "percentage": 74.38, "elapsed_time": "1:12:35", "remaining_time": "0:24:59", "throughput": 4255.25, "total_tokens": 18532272} {"current_steps": 28390, "total_steps": 38160, "loss": 0.4779, "lr": 0.0001867708149386748, "epoch": 14.879454926624739, "percentage": 74.4, "elapsed_time": "1:12:35", "remaining_time": "0:24:58", "throughput": 4255.25, "total_tokens": 18535216} {"current_steps": 28395, "total_steps": 38160, "loss": 0.3157, "lr": 0.0001865925975230068, "epoch": 14.882075471698114, "percentage": 74.41, "elapsed_time": "1:12:36", "remaining_time": "0:24:58", "throughput": 4255.29, "total_tokens": 18538512} {"current_steps": 28400, "total_steps": 38160, "loss": 0.4064, "lr": 0.0001864144456685916, "epoch": 14.884696016771489, "percentage": 74.42, "elapsed_time": "1:12:37", "remaining_time": "0:24:57", "throughput": 4255.33, "total_tokens": 18541776} {"current_steps": 28405, "total_steps": 38160, "loss": 0.4717, "lr": 0.00018623635941269706, "epoch": 14.887316561844864, "percentage": 74.44, "elapsed_time": "1:12:38", "remaining_time": "0:24:56", "throughput": 4255.45, "total_tokens": 18545776} {"current_steps": 28410, "total_steps": 38160, "loss": 0.4383, "lr": 0.00018605833879257628, "epoch": 14.88993710691824, "percentage": 74.45, "elapsed_time": "1:12:38", "remaining_time": "0:24:55", "throughput": 4255.54, "total_tokens": 18549552} {"current_steps": 28415, "total_steps": 38160, "loss": 0.4376, "lr": 0.0001858803838454694, "epoch": 14.892557651991615, "percentage": 74.46, "elapsed_time": "1:12:39", "remaining_time": "0:24:55", "throughput": 4255.64, "total_tokens": 18553328} {"current_steps": 28420, "total_steps": 38160, "loss": 0.3934, "lr": 0.0001857024946086026, "epoch": 14.89517819706499, "percentage": 74.48, "elapsed_time": "1:12:40", "remaining_time": "0:24:54", "throughput": 4255.72, "total_tokens": 18557072} {"current_steps": 28425, "total_steps": 38160, "loss": 0.3635, "lr": 0.00018552467111918836, "epoch": 14.897798742138365, "percentage": 74.49, "elapsed_time": "1:12:41", "remaining_time": "0:24:53", "throughput": 4255.7, "total_tokens": 18559824} {"current_steps": 28430, "total_steps": 38160, "loss": 0.3774, "lr": 0.00018534691341442507, "epoch": 14.90041928721174, "percentage": 74.5, "elapsed_time": "1:12:41", "remaining_time": "0:24:52", "throughput": 4255.72, "total_tokens": 18562928} {"current_steps": 28435, "total_steps": 38160, "loss": 0.4597, "lr": 0.0001851692215314979, "epoch": 14.903039832285115, "percentage": 74.52, "elapsed_time": "1:12:42", "remaining_time": "0:24:52", "throughput": 4255.72, "total_tokens": 18565744} {"current_steps": 28440, "total_steps": 38160, "loss": 0.4863, "lr": 0.0001849915955075776, "epoch": 14.90566037735849, "percentage": 74.53, "elapsed_time": "1:12:43", "remaining_time": "0:24:51", "throughput": 4255.74, "total_tokens": 18568880} {"current_steps": 28445, "total_steps": 38160, "loss": 0.4629, "lr": 0.0001848140353798217, "epoch": 14.908280922431866, "percentage": 74.54, "elapsed_time": "1:12:43", "remaining_time": "0:24:50", "throughput": 4255.72, "total_tokens": 18571600} {"current_steps": 28450, "total_steps": 38160, "loss": 0.3894, "lr": 0.00018463654118537382, "epoch": 14.91090146750524, "percentage": 74.55, "elapsed_time": "1:12:44", "remaining_time": "0:24:49", "throughput": 4255.78, "total_tokens": 18575056} {"current_steps": 28455, "total_steps": 38160, "loss": 0.3638, "lr": 0.00018445911296136386, "epoch": 14.913522012578616, "percentage": 74.57, "elapsed_time": "1:12:45", "remaining_time": "0:24:48", "throughput": 4255.94, "total_tokens": 18579568} {"current_steps": 28460, "total_steps": 38160, "loss": 0.3952, "lr": 0.00018428175074490754, "epoch": 14.916142557651991, "percentage": 74.58, "elapsed_time": "1:12:46", "remaining_time": "0:24:48", "throughput": 4255.96, "total_tokens": 18582640} {"current_steps": 28465, "total_steps": 38160, "loss": 0.4886, "lr": 0.00018410445457310687, "epoch": 14.918763102725366, "percentage": 74.59, "elapsed_time": "1:12:46", "remaining_time": "0:24:47", "throughput": 4255.97, "total_tokens": 18585584} {"current_steps": 28470, "total_steps": 38160, "loss": 0.5693, "lr": 0.00018392722448305044, "epoch": 14.921383647798741, "percentage": 74.61, "elapsed_time": "1:12:47", "remaining_time": "0:24:46", "throughput": 4256.07, "total_tokens": 18589488} {"current_steps": 28475, "total_steps": 38160, "loss": 0.5592, "lr": 0.00018375006051181265, "epoch": 14.924004192872118, "percentage": 74.62, "elapsed_time": "1:12:48", "remaining_time": "0:24:45", "throughput": 4256.18, "total_tokens": 18593424} {"current_steps": 28480, "total_steps": 38160, "loss": 0.3375, "lr": 0.0001835729626964544, "epoch": 14.926624737945493, "percentage": 74.63, "elapsed_time": "1:12:49", "remaining_time": "0:24:45", "throughput": 4256.19, "total_tokens": 18596368} {"current_steps": 28485, "total_steps": 38160, "loss": 0.4387, "lr": 0.00018339593107402242, "epoch": 14.929245283018869, "percentage": 74.65, "elapsed_time": "1:12:50", "remaining_time": "0:24:44", "throughput": 4256.26, "total_tokens": 18599952} {"current_steps": 28490, "total_steps": 38160, "loss": 0.4033, "lr": 0.00018321896568154945, "epoch": 14.931865828092244, "percentage": 74.66, "elapsed_time": "1:12:50", "remaining_time": "0:24:43", "throughput": 4256.3, "total_tokens": 18603248} {"current_steps": 28495, "total_steps": 38160, "loss": 0.3808, "lr": 0.00018304206655605476, "epoch": 14.934486373165619, "percentage": 74.67, "elapsed_time": "1:12:51", "remaining_time": "0:24:42", "throughput": 4256.36, "total_tokens": 18606768} {"current_steps": 28500, "total_steps": 38160, "loss": 0.397, "lr": 0.00018286523373454378, "epoch": 14.937106918238994, "percentage": 74.69, "elapsed_time": "1:12:52", "remaining_time": "0:24:41", "throughput": 4256.36, "total_tokens": 18609648} {"current_steps": 28505, "total_steps": 38160, "loss": 0.4019, "lr": 0.00018268846725400783, "epoch": 14.93972746331237, "percentage": 74.7, "elapsed_time": "1:12:52", "remaining_time": "0:24:41", "throughput": 4256.36, "total_tokens": 18612624} {"current_steps": 28510, "total_steps": 38160, "loss": 0.4914, "lr": 0.00018251176715142458, "epoch": 14.942348008385745, "percentage": 74.71, "elapsed_time": "1:12:53", "remaining_time": "0:24:40", "throughput": 4256.38, "total_tokens": 18615728} {"current_steps": 28515, "total_steps": 38160, "loss": 0.2881, "lr": 0.00018233513346375756, "epoch": 14.94496855345912, "percentage": 74.72, "elapsed_time": "1:12:54", "remaining_time": "0:24:39", "throughput": 4256.39, "total_tokens": 18618832} {"current_steps": 28520, "total_steps": 38160, "loss": 0.4759, "lr": 0.00018215856622795634, "epoch": 14.947589098532495, "percentage": 74.74, "elapsed_time": "1:12:55", "remaining_time": "0:24:38", "throughput": 4256.54, "total_tokens": 18623056} {"current_steps": 28525, "total_steps": 38160, "loss": 0.3835, "lr": 0.00018198206548095697, "epoch": 14.95020964360587, "percentage": 74.75, "elapsed_time": "1:12:55", "remaining_time": "0:24:38", "throughput": 4256.55, "total_tokens": 18626032} {"current_steps": 28530, "total_steps": 38160, "loss": 0.383, "lr": 0.00018180563125968135, "epoch": 14.952830188679245, "percentage": 74.76, "elapsed_time": "1:12:56", "remaining_time": "0:24:37", "throughput": 4256.53, "total_tokens": 18628784} {"current_steps": 28535, "total_steps": 38160, "loss": 0.4505, "lr": 0.00018162926360103766, "epoch": 14.95545073375262, "percentage": 74.78, "elapsed_time": "1:12:57", "remaining_time": "0:24:36", "throughput": 4256.71, "total_tokens": 18633648} {"current_steps": 28540, "total_steps": 38160, "loss": 0.4821, "lr": 0.0001814529625419199, "epoch": 14.958071278825996, "percentage": 74.79, "elapsed_time": "1:12:58", "remaining_time": "0:24:35", "throughput": 4256.8, "total_tokens": 18637520} {"current_steps": 28545, "total_steps": 38160, "loss": 0.4906, "lr": 0.00018127672811920798, "epoch": 14.96069182389937, "percentage": 74.8, "elapsed_time": "1:12:59", "remaining_time": "0:24:35", "throughput": 4256.92, "total_tokens": 18641488} {"current_steps": 28550, "total_steps": 38160, "loss": 0.369, "lr": 0.00018110056036976834, "epoch": 14.963312368972746, "percentage": 74.82, "elapsed_time": "1:12:59", "remaining_time": "0:24:34", "throughput": 4256.91, "total_tokens": 18644336} {"current_steps": 28555, "total_steps": 38160, "loss": 0.3521, "lr": 0.00018092445933045332, "epoch": 14.965932914046121, "percentage": 74.83, "elapsed_time": "1:13:00", "remaining_time": "0:24:33", "throughput": 4257.0, "total_tokens": 18647984} {"current_steps": 28560, "total_steps": 38160, "loss": 0.4816, "lr": 0.00018074842503810118, "epoch": 14.968553459119496, "percentage": 74.84, "elapsed_time": "1:13:01", "remaining_time": "0:24:32", "throughput": 4256.98, "total_tokens": 18650704} {"current_steps": 28565, "total_steps": 38160, "loss": 0.4727, "lr": 0.00018057245752953666, "epoch": 14.971174004192871, "percentage": 74.86, "elapsed_time": "1:13:02", "remaining_time": "0:24:31", "throughput": 4257.09, "total_tokens": 18654640} {"current_steps": 28570, "total_steps": 38160, "loss": 0.5566, "lr": 0.00018039655684156948, "epoch": 14.973794549266248, "percentage": 74.87, "elapsed_time": "1:13:02", "remaining_time": "0:24:31", "throughput": 4257.07, "total_tokens": 18657392} {"current_steps": 28575, "total_steps": 38160, "loss": 0.371, "lr": 0.00018022072301099635, "epoch": 14.976415094339622, "percentage": 74.88, "elapsed_time": "1:13:03", "remaining_time": "0:24:30", "throughput": 4257.01, "total_tokens": 18659696} {"current_steps": 28580, "total_steps": 38160, "loss": 0.4108, "lr": 0.00018004495607459975, "epoch": 14.979035639412999, "percentage": 74.9, "elapsed_time": "1:13:03", "remaining_time": "0:24:29", "throughput": 4257.0, "total_tokens": 18662608} {"current_steps": 28585, "total_steps": 38160, "loss": 0.5954, "lr": 0.00017986925606914805, "epoch": 14.981656184486374, "percentage": 74.91, "elapsed_time": "1:13:04", "remaining_time": "0:24:28", "throughput": 4256.99, "total_tokens": 18665328} {"current_steps": 28590, "total_steps": 38160, "loss": 0.3526, "lr": 0.00017969362303139598, "epoch": 14.984276729559749, "percentage": 74.92, "elapsed_time": "1:13:05", "remaining_time": "0:24:27", "throughput": 4257.03, "total_tokens": 18668560} {"current_steps": 28595, "total_steps": 38160, "loss": 0.7004, "lr": 0.00017951805699808365, "epoch": 14.986897274633124, "percentage": 74.93, "elapsed_time": "1:13:06", "remaining_time": "0:24:27", "throughput": 4257.16, "total_tokens": 18672784} {"current_steps": 28600, "total_steps": 38160, "loss": 0.4813, "lr": 0.00017934255800593747, "epoch": 14.9895178197065, "percentage": 74.95, "elapsed_time": "1:13:06", "remaining_time": "0:24:26", "throughput": 4257.12, "total_tokens": 18675344} {"current_steps": 28605, "total_steps": 38160, "loss": 0.5485, "lr": 0.0001791671260916698, "epoch": 14.992138364779874, "percentage": 74.96, "elapsed_time": "1:13:07", "remaining_time": "0:24:25", "throughput": 4257.23, "total_tokens": 18679312} {"current_steps": 28610, "total_steps": 38160, "loss": 0.4369, "lr": 0.00017899176129197914, "epoch": 14.99475890985325, "percentage": 74.97, "elapsed_time": "1:13:08", "remaining_time": "0:24:24", "throughput": 4257.22, "total_tokens": 18682160} {"current_steps": 28615, "total_steps": 38160, "loss": 0.4837, "lr": 0.00017881646364354998, "epoch": 14.997379454926625, "percentage": 74.99, "elapsed_time": "1:13:09", "remaining_time": "0:24:24", "throughput": 4257.24, "total_tokens": 18685264} {"current_steps": 28620, "total_steps": 38160, "loss": 0.4933, "lr": 0.00017864123318305213, "epoch": 15.0, "percentage": 75.0, "elapsed_time": "1:13:09", "remaining_time": "0:24:23", "throughput": 4257.08, "total_tokens": 18687760} {"current_steps": 28620, "total_steps": 38160, "eval_loss": 0.4885338842868805, "epoch": 15.0, "percentage": 75.0, "elapsed_time": "1:13:23", "remaining_time": "0:24:27", "throughput": 4243.83, "total_tokens": 18687760} {"current_steps": 28625, "total_steps": 38160, "loss": 0.5488, "lr": 0.00017846606994714222, "epoch": 15.002620545073375, "percentage": 75.01, "elapsed_time": "1:13:25", "remaining_time": "0:24:27", "throughput": 4242.31, "total_tokens": 18691216} {"current_steps": 28630, "total_steps": 38160, "loss": 0.4591, "lr": 0.0001782909739724621, "epoch": 15.00524109014675, "percentage": 75.03, "elapsed_time": "1:13:26", "remaining_time": "0:24:26", "throughput": 4242.32, "total_tokens": 18694256} {"current_steps": 28635, "total_steps": 38160, "loss": 0.4116, "lr": 0.0001781159452956399, "epoch": 15.007861635220126, "percentage": 75.04, "elapsed_time": "1:13:27", "remaining_time": "0:24:26", "throughput": 4242.68, "total_tokens": 18701296} {"current_steps": 28640, "total_steps": 38160, "loss": 0.5121, "lr": 0.00017794098395328977, "epoch": 15.0104821802935, "percentage": 75.05, "elapsed_time": "1:13:28", "remaining_time": "0:24:25", "throughput": 4242.71, "total_tokens": 18704592} {"current_steps": 28645, "total_steps": 38160, "loss": 0.3881, "lr": 0.00017776608998201172, "epoch": 15.013102725366876, "percentage": 75.07, "elapsed_time": "1:13:29", "remaining_time": "0:24:24", "throughput": 4242.75, "total_tokens": 18707984} {"current_steps": 28650, "total_steps": 38160, "loss": 0.5712, "lr": 0.00017759126341839132, "epoch": 15.015723270440251, "percentage": 75.08, "elapsed_time": "1:13:30", "remaining_time": "0:24:23", "throughput": 4242.72, "total_tokens": 18710608} {"current_steps": 28655, "total_steps": 38160, "loss": 0.4356, "lr": 0.0001774165042990003, "epoch": 15.018343815513626, "percentage": 75.09, "elapsed_time": "1:13:30", "remaining_time": "0:24:23", "throughput": 4242.76, "total_tokens": 18713904} {"current_steps": 28660, "total_steps": 38160, "loss": 0.369, "lr": 0.00017724181266039635, "epoch": 15.020964360587001, "percentage": 75.1, "elapsed_time": "1:13:31", "remaining_time": "0:24:22", "throughput": 4242.77, "total_tokens": 18716816} {"current_steps": 28665, "total_steps": 38160, "loss": 0.6404, "lr": 0.00017706718853912292, "epoch": 15.023584905660377, "percentage": 75.12, "elapsed_time": "1:13:32", "remaining_time": "0:24:21", "throughput": 4242.77, "total_tokens": 18719696} {"current_steps": 28670, "total_steps": 38160, "loss": 0.3505, "lr": 0.00017689263197170964, "epoch": 15.026205450733753, "percentage": 75.13, "elapsed_time": "1:13:32", "remaining_time": "0:24:20", "throughput": 4242.87, "total_tokens": 18723600} {"current_steps": 28675, "total_steps": 38160, "loss": 0.4887, "lr": 0.00017671814299467136, "epoch": 15.028825995807129, "percentage": 75.14, "elapsed_time": "1:13:33", "remaining_time": "0:24:19", "throughput": 4242.93, "total_tokens": 18727088} {"current_steps": 28680, "total_steps": 38160, "loss": 0.5053, "lr": 0.00017654372164450954, "epoch": 15.031446540880504, "percentage": 75.16, "elapsed_time": "1:13:34", "remaining_time": "0:24:19", "throughput": 4242.98, "total_tokens": 18730576} {"current_steps": 28685, "total_steps": 38160, "loss": 0.4437, "lr": 0.0001763693679577108, "epoch": 15.034067085953879, "percentage": 75.17, "elapsed_time": "1:13:35", "remaining_time": "0:24:18", "throughput": 4243.01, "total_tokens": 18733840} {"current_steps": 28690, "total_steps": 38160, "loss": 0.415, "lr": 0.00017619508197074812, "epoch": 15.036687631027254, "percentage": 75.18, "elapsed_time": "1:13:35", "remaining_time": "0:24:17", "throughput": 4243.0, "total_tokens": 18736592} {"current_steps": 28695, "total_steps": 38160, "loss": 0.4597, "lr": 0.0001760208637200803, "epoch": 15.03930817610063, "percentage": 75.2, "elapsed_time": "1:13:36", "remaining_time": "0:24:16", "throughput": 4243.09, "total_tokens": 18740208} {"current_steps": 28700, "total_steps": 38160, "loss": 0.4325, "lr": 0.00017584671324215152, "epoch": 15.041928721174004, "percentage": 75.21, "elapsed_time": "1:13:37", "remaining_time": "0:24:16", "throughput": 4243.12, "total_tokens": 18743472} {"current_steps": 28705, "total_steps": 38160, "loss": 0.4106, "lr": 0.00017567263057339212, "epoch": 15.04454926624738, "percentage": 75.22, "elapsed_time": "1:13:38", "remaining_time": "0:24:15", "throughput": 4243.07, "total_tokens": 18745968} {"current_steps": 28710, "total_steps": 38160, "loss": 0.4217, "lr": 0.00017549861575021848, "epoch": 15.047169811320755, "percentage": 75.24, "elapsed_time": "1:13:38", "remaining_time": "0:24:14", "throughput": 4243.16, "total_tokens": 18749744} {"current_steps": 28715, "total_steps": 38160, "loss": 0.375, "lr": 0.00017532466880903214, "epoch": 15.04979035639413, "percentage": 75.25, "elapsed_time": "1:13:39", "remaining_time": "0:24:13", "throughput": 4243.17, "total_tokens": 18752752} {"current_steps": 28720, "total_steps": 38160, "loss": 0.347, "lr": 0.00017515078978622102, "epoch": 15.052410901467505, "percentage": 75.26, "elapsed_time": "1:13:40", "remaining_time": "0:24:12", "throughput": 4243.13, "total_tokens": 18755248} {"current_steps": 28725, "total_steps": 38160, "loss": 0.4537, "lr": 0.0001749769787181587, "epoch": 15.05503144654088, "percentage": 75.28, "elapsed_time": "1:13:40", "remaining_time": "0:24:12", "throughput": 4243.18, "total_tokens": 18758704} {"current_steps": 28730, "total_steps": 38160, "loss": 0.5111, "lr": 0.00017480323564120426, "epoch": 15.057651991614255, "percentage": 75.29, "elapsed_time": "1:13:41", "remaining_time": "0:24:11", "throughput": 4243.21, "total_tokens": 18761872} {"current_steps": 28735, "total_steps": 38160, "loss": 0.3957, "lr": 0.00017462956059170287, "epoch": 15.06027253668763, "percentage": 75.3, "elapsed_time": "1:13:42", "remaining_time": "0:24:10", "throughput": 4243.14, "total_tokens": 18764144} {"current_steps": 28740, "total_steps": 38160, "loss": 0.2815, "lr": 0.00017445595360598553, "epoch": 15.062893081761006, "percentage": 75.31, "elapsed_time": "1:13:43", "remaining_time": "0:24:09", "throughput": 4243.21, "total_tokens": 18767728} {"current_steps": 28745, "total_steps": 38160, "loss": 0.4478, "lr": 0.0001742824147203686, "epoch": 15.065513626834381, "percentage": 75.33, "elapsed_time": "1:13:43", "remaining_time": "0:24:08", "throughput": 4243.22, "total_tokens": 18770736} {"current_steps": 28750, "total_steps": 38160, "loss": 0.3451, "lr": 0.00017410894397115463, "epoch": 15.068134171907756, "percentage": 75.34, "elapsed_time": "1:13:44", "remaining_time": "0:24:08", "throughput": 4243.24, "total_tokens": 18773872} {"current_steps": 28755, "total_steps": 38160, "loss": 0.3551, "lr": 0.00017393554139463147, "epoch": 15.070754716981131, "percentage": 75.35, "elapsed_time": "1:13:45", "remaining_time": "0:24:07", "throughput": 4243.27, "total_tokens": 18777040} {"current_steps": 28760, "total_steps": 38160, "loss": 0.3662, "lr": 0.00017376220702707308, "epoch": 15.073375262054507, "percentage": 75.37, "elapsed_time": "1:13:45", "remaining_time": "0:24:06", "throughput": 4243.39, "total_tokens": 18781232} {"current_steps": 28765, "total_steps": 38160, "loss": 0.4136, "lr": 0.00017358894090473926, "epoch": 15.075995807127883, "percentage": 75.38, "elapsed_time": "1:13:46", "remaining_time": "0:24:05", "throughput": 4243.46, "total_tokens": 18784656} {"current_steps": 28770, "total_steps": 38160, "loss": 0.427, "lr": 0.00017341574306387492, "epoch": 15.078616352201259, "percentage": 75.39, "elapsed_time": "1:13:47", "remaining_time": "0:24:05", "throughput": 4243.59, "total_tokens": 18788848} {"current_steps": 28775, "total_steps": 38160, "loss": 0.3869, "lr": 0.00017324261354071147, "epoch": 15.081236897274634, "percentage": 75.41, "elapsed_time": "1:13:48", "remaining_time": "0:24:04", "throughput": 4243.64, "total_tokens": 18792368} {"current_steps": 28780, "total_steps": 38160, "loss": 0.2757, "lr": 0.00017306955237146522, "epoch": 15.083857442348009, "percentage": 75.42, "elapsed_time": "1:13:48", "remaining_time": "0:24:03", "throughput": 4243.55, "total_tokens": 18794480} {"current_steps": 28785, "total_steps": 38160, "loss": 0.5335, "lr": 0.0001728965595923388, "epoch": 15.086477987421384, "percentage": 75.43, "elapsed_time": "1:13:49", "remaining_time": "0:24:02", "throughput": 4243.57, "total_tokens": 18797680} {"current_steps": 28790, "total_steps": 38160, "loss": 0.3696, "lr": 0.00017272363523952033, "epoch": 15.08909853249476, "percentage": 75.45, "elapsed_time": "1:13:50", "remaining_time": "0:24:01", "throughput": 4243.57, "total_tokens": 18800656} {"current_steps": 28795, "total_steps": 38160, "loss": 0.4511, "lr": 0.0001725507793491838, "epoch": 15.091719077568134, "percentage": 75.46, "elapsed_time": "1:13:51", "remaining_time": "0:24:01", "throughput": 4243.58, "total_tokens": 18803792} {"current_steps": 28800, "total_steps": 38160, "loss": 0.4445, "lr": 0.00017237799195748827, "epoch": 15.09433962264151, "percentage": 75.47, "elapsed_time": "1:13:51", "remaining_time": "0:24:00", "throughput": 4243.59, "total_tokens": 18806768} {"current_steps": 28805, "total_steps": 38160, "loss": 0.3638, "lr": 0.00017220527310057927, "epoch": 15.096960167714885, "percentage": 75.48, "elapsed_time": "1:13:52", "remaining_time": "0:23:59", "throughput": 4243.6, "total_tokens": 18809680} {"current_steps": 28810, "total_steps": 38160, "loss": 0.3876, "lr": 0.0001720326228145873, "epoch": 15.09958071278826, "percentage": 75.5, "elapsed_time": "1:13:53", "remaining_time": "0:23:58", "throughput": 4243.67, "total_tokens": 18813296} {"current_steps": 28815, "total_steps": 38160, "loss": 0.3442, "lr": 0.00017186004113562903, "epoch": 15.102201257861635, "percentage": 75.51, "elapsed_time": "1:13:54", "remaining_time": "0:23:58", "throughput": 4243.75, "total_tokens": 18817040} {"current_steps": 28820, "total_steps": 38160, "loss": 0.446, "lr": 0.00017168752809980655, "epoch": 15.10482180293501, "percentage": 75.52, "elapsed_time": "1:13:54", "remaining_time": "0:23:57", "throughput": 4243.79, "total_tokens": 18820400} {"current_steps": 28825, "total_steps": 38160, "loss": 0.2906, "lr": 0.00017151508374320767, "epoch": 15.107442348008385, "percentage": 75.54, "elapsed_time": "1:13:55", "remaining_time": "0:23:56", "throughput": 4243.77, "total_tokens": 18823152} {"current_steps": 28830, "total_steps": 38160, "loss": 0.5056, "lr": 0.00017134270810190583, "epoch": 15.11006289308176, "percentage": 75.55, "elapsed_time": "1:13:56", "remaining_time": "0:23:55", "throughput": 4243.74, "total_tokens": 18825776} {"current_steps": 28835, "total_steps": 38160, "loss": 0.4419, "lr": 0.0001711704012119597, "epoch": 15.112683438155136, "percentage": 75.56, "elapsed_time": "1:13:56", "remaining_time": "0:23:54", "throughput": 4243.75, "total_tokens": 18828816} {"current_steps": 28840, "total_steps": 38160, "loss": 0.4313, "lr": 0.0001709981631094142, "epoch": 15.115303983228511, "percentage": 75.58, "elapsed_time": "1:13:57", "remaining_time": "0:23:54", "throughput": 4243.83, "total_tokens": 18832624} {"current_steps": 28845, "total_steps": 38160, "loss": 0.4224, "lr": 0.00017082599383029946, "epoch": 15.117924528301886, "percentage": 75.59, "elapsed_time": "1:13:58", "remaining_time": "0:23:53", "throughput": 4243.97, "total_tokens": 18836848} {"current_steps": 28850, "total_steps": 38160, "loss": 0.535, "lr": 0.0001706538934106316, "epoch": 15.120545073375261, "percentage": 75.6, "elapsed_time": "1:13:59", "remaining_time": "0:23:52", "throughput": 4243.98, "total_tokens": 18839824} {"current_steps": 28855, "total_steps": 38160, "loss": 0.5364, "lr": 0.00017048186188641185, "epoch": 15.123165618448636, "percentage": 75.62, "elapsed_time": "1:13:59", "remaining_time": "0:23:51", "throughput": 4243.94, "total_tokens": 18842416} {"current_steps": 28860, "total_steps": 38160, "loss": 0.363, "lr": 0.0001703098992936271, "epoch": 15.125786163522013, "percentage": 75.63, "elapsed_time": "1:14:00", "remaining_time": "0:23:50", "throughput": 4243.95, "total_tokens": 18845424} {"current_steps": 28865, "total_steps": 38160, "loss": 0.4947, "lr": 0.00017013800566825012, "epoch": 15.128406708595389, "percentage": 75.64, "elapsed_time": "1:14:01", "remaining_time": "0:23:50", "throughput": 4243.96, "total_tokens": 18848592} {"current_steps": 28870, "total_steps": 38160, "loss": 0.467, "lr": 0.00016996618104623905, "epoch": 15.131027253668764, "percentage": 75.66, "elapsed_time": "1:14:01", "remaining_time": "0:23:49", "throughput": 4243.95, "total_tokens": 18851408} {"current_steps": 28875, "total_steps": 38160, "loss": 0.4333, "lr": 0.00016979442546353774, "epoch": 15.133647798742139, "percentage": 75.67, "elapsed_time": "1:14:02", "remaining_time": "0:23:48", "throughput": 4243.97, "total_tokens": 18854512} {"current_steps": 28880, "total_steps": 38160, "loss": 0.4992, "lr": 0.00016962273895607555, "epoch": 15.136268343815514, "percentage": 75.68, "elapsed_time": "1:14:03", "remaining_time": "0:23:47", "throughput": 4244.08, "total_tokens": 18858704} {"current_steps": 28885, "total_steps": 38160, "loss": 0.4566, "lr": 0.00016945112155976723, "epoch": 15.13888888888889, "percentage": 75.69, "elapsed_time": "1:14:04", "remaining_time": "0:23:47", "throughput": 4244.15, "total_tokens": 18862256} {"current_steps": 28890, "total_steps": 38160, "loss": 0.4819, "lr": 0.000169279573310513, "epoch": 15.141509433962264, "percentage": 75.71, "elapsed_time": "1:14:05", "remaining_time": "0:23:46", "throughput": 4244.31, "total_tokens": 18866640} {"current_steps": 28895, "total_steps": 38160, "loss": 0.2971, "lr": 0.00016910809424419904, "epoch": 15.14412997903564, "percentage": 75.72, "elapsed_time": "1:14:05", "remaining_time": "0:23:45", "throughput": 4244.28, "total_tokens": 18869392} {"current_steps": 28900, "total_steps": 38160, "loss": 0.4439, "lr": 0.00016893668439669674, "epoch": 15.146750524109015, "percentage": 75.73, "elapsed_time": "1:14:06", "remaining_time": "0:23:44", "throughput": 4244.29, "total_tokens": 18872336} {"current_steps": 28905, "total_steps": 38160, "loss": 0.4975, "lr": 0.0001687653438038632, "epoch": 15.14937106918239, "percentage": 75.75, "elapsed_time": "1:14:07", "remaining_time": "0:23:43", "throughput": 4244.36, "total_tokens": 18876016} {"current_steps": 28910, "total_steps": 38160, "loss": 0.4004, "lr": 0.00016859407250154084, "epoch": 15.151991614255765, "percentage": 75.76, "elapsed_time": "1:14:08", "remaining_time": "0:23:43", "throughput": 4244.35, "total_tokens": 18878896} {"current_steps": 28915, "total_steps": 38160, "loss": 0.4212, "lr": 0.0001684228705255575, "epoch": 15.15461215932914, "percentage": 75.77, "elapsed_time": "1:14:08", "remaining_time": "0:23:42", "throughput": 4244.34, "total_tokens": 18881680} {"current_steps": 28920, "total_steps": 38160, "loss": 0.3506, "lr": 0.00016825173791172677, "epoch": 15.157232704402515, "percentage": 75.79, "elapsed_time": "1:14:09", "remaining_time": "0:23:41", "throughput": 4244.38, "total_tokens": 18884912} {"current_steps": 28925, "total_steps": 38160, "loss": 0.4028, "lr": 0.0001680806746958477, "epoch": 15.15985324947589, "percentage": 75.8, "elapsed_time": "1:14:10", "remaining_time": "0:23:40", "throughput": 4244.4, "total_tokens": 18888048} {"current_steps": 28930, "total_steps": 38160, "loss": 0.5457, "lr": 0.00016790968091370494, "epoch": 15.162473794549266, "percentage": 75.81, "elapsed_time": "1:14:11", "remaining_time": "0:23:40", "throughput": 4244.58, "total_tokens": 18892656} {"current_steps": 28935, "total_steps": 38160, "loss": 0.4306, "lr": 0.00016773875660106824, "epoch": 15.165094339622641, "percentage": 75.83, "elapsed_time": "1:14:11", "remaining_time": "0:23:39", "throughput": 4244.55, "total_tokens": 18895312} {"current_steps": 28940, "total_steps": 38160, "loss": 0.4367, "lr": 0.0001675679017936928, "epoch": 15.167714884696016, "percentage": 75.84, "elapsed_time": "1:14:12", "remaining_time": "0:23:38", "throughput": 4244.5, "total_tokens": 18897712} {"current_steps": 28945, "total_steps": 38160, "loss": 0.4676, "lr": 0.00016739711652731976, "epoch": 15.170335429769391, "percentage": 75.85, "elapsed_time": "1:14:12", "remaining_time": "0:23:37", "throughput": 4244.45, "total_tokens": 18900112} {"current_steps": 28950, "total_steps": 38160, "loss": 0.3495, "lr": 0.00016722640083767542, "epoch": 15.172955974842766, "percentage": 75.86, "elapsed_time": "1:14:13", "remaining_time": "0:23:36", "throughput": 4244.56, "total_tokens": 18903920} {"current_steps": 28955, "total_steps": 38160, "loss": 0.5532, "lr": 0.00016705575476047153, "epoch": 15.175576519916143, "percentage": 75.88, "elapsed_time": "1:14:14", "remaining_time": "0:23:36", "throughput": 4244.93, "total_tokens": 18911056} {"current_steps": 28960, "total_steps": 38160, "loss": 0.4506, "lr": 0.0001668851783314055, "epoch": 15.178197064989519, "percentage": 75.89, "elapsed_time": "1:14:15", "remaining_time": "0:23:35", "throughput": 4244.87, "total_tokens": 18913360} {"current_steps": 28965, "total_steps": 38160, "loss": 0.5377, "lr": 0.00016671467158615977, "epoch": 15.180817610062894, "percentage": 75.9, "elapsed_time": "1:14:16", "remaining_time": "0:23:34", "throughput": 4245.01, "total_tokens": 18917648} {"current_steps": 28970, "total_steps": 38160, "loss": 0.6281, "lr": 0.00016654423456040224, "epoch": 15.183438155136269, "percentage": 75.92, "elapsed_time": "1:14:17", "remaining_time": "0:23:33", "throughput": 4245.05, "total_tokens": 18921008} {"current_steps": 28975, "total_steps": 38160, "loss": 0.3589, "lr": 0.0001663738672897866, "epoch": 15.186058700209644, "percentage": 75.93, "elapsed_time": "1:14:17", "remaining_time": "0:23:33", "throughput": 4245.14, "total_tokens": 18924816} {"current_steps": 28980, "total_steps": 38160, "loss": 0.4208, "lr": 0.0001662035698099517, "epoch": 15.18867924528302, "percentage": 75.94, "elapsed_time": "1:14:18", "remaining_time": "0:23:32", "throughput": 4245.13, "total_tokens": 18927664} {"current_steps": 28985, "total_steps": 38160, "loss": 0.3598, "lr": 0.00016603334215652206, "epoch": 15.191299790356394, "percentage": 75.96, "elapsed_time": "1:14:19", "remaining_time": "0:23:31", "throughput": 4245.11, "total_tokens": 18930384} {"current_steps": 28990, "total_steps": 38160, "loss": 0.4989, "lr": 0.0001658631843651069, "epoch": 15.19392033542977, "percentage": 75.97, "elapsed_time": "1:14:20", "remaining_time": "0:23:30", "throughput": 4245.12, "total_tokens": 18933488} {"current_steps": 28995, "total_steps": 38160, "loss": 0.4271, "lr": 0.00016569309647130177, "epoch": 15.196540880503145, "percentage": 75.98, "elapsed_time": "1:14:20", "remaining_time": "0:23:29", "throughput": 4245.09, "total_tokens": 18936080} {"current_steps": 29000, "total_steps": 38160, "loss": 0.4355, "lr": 0.00016552307851068666, "epoch": 15.19916142557652, "percentage": 76.0, "elapsed_time": "1:14:21", "remaining_time": "0:23:29", "throughput": 4245.2, "total_tokens": 18940112} {"current_steps": 29005, "total_steps": 38160, "loss": 0.3741, "lr": 0.00016535313051882765, "epoch": 15.201781970649895, "percentage": 76.01, "elapsed_time": "1:14:22", "remaining_time": "0:23:28", "throughput": 4245.31, "total_tokens": 18944144} {"current_steps": 29010, "total_steps": 38160, "loss": 0.3702, "lr": 0.00016518325253127604, "epoch": 15.20440251572327, "percentage": 76.02, "elapsed_time": "1:14:23", "remaining_time": "0:23:27", "throughput": 4245.43, "total_tokens": 18948112} {"current_steps": 29015, "total_steps": 38160, "loss": 0.3239, "lr": 0.00016501344458356803, "epoch": 15.207023060796645, "percentage": 76.04, "elapsed_time": "1:14:23", "remaining_time": "0:23:26", "throughput": 4245.51, "total_tokens": 18951792} {"current_steps": 29020, "total_steps": 38160, "loss": 0.4435, "lr": 0.00016484370671122588, "epoch": 15.20964360587002, "percentage": 76.05, "elapsed_time": "1:14:24", "remaining_time": "0:23:26", "throughput": 4245.57, "total_tokens": 18955248} {"current_steps": 29025, "total_steps": 38160, "loss": 0.4672, "lr": 0.00016467403894975641, "epoch": 15.212264150943396, "percentage": 76.06, "elapsed_time": "1:14:25", "remaining_time": "0:23:25", "throughput": 4245.6, "total_tokens": 18958384} {"current_steps": 29030, "total_steps": 38160, "loss": 0.351, "lr": 0.0001645044413346524, "epoch": 15.214884696016771, "percentage": 76.07, "elapsed_time": "1:14:26", "remaining_time": "0:23:24", "throughput": 4245.63, "total_tokens": 18961584} {"current_steps": 29035, "total_steps": 38160, "loss": 0.3327, "lr": 0.00016433491390139177, "epoch": 15.217505241090146, "percentage": 76.09, "elapsed_time": "1:14:26", "remaining_time": "0:23:23", "throughput": 4245.66, "total_tokens": 18964720} {"current_steps": 29040, "total_steps": 38160, "loss": 0.5405, "lr": 0.00016416545668543786, "epoch": 15.220125786163521, "percentage": 76.1, "elapsed_time": "1:14:27", "remaining_time": "0:23:23", "throughput": 4245.68, "total_tokens": 18967888} {"current_steps": 29045, "total_steps": 38160, "loss": 0.3949, "lr": 0.0001639960697222388, "epoch": 15.222746331236896, "percentage": 76.11, "elapsed_time": "1:14:28", "remaining_time": "0:23:22", "throughput": 4245.63, "total_tokens": 18970384} {"current_steps": 29050, "total_steps": 38160, "loss": 0.3285, "lr": 0.00016382675304722877, "epoch": 15.225366876310272, "percentage": 76.13, "elapsed_time": "1:14:28", "remaining_time": "0:23:21", "throughput": 4245.6, "total_tokens": 18973072} {"current_steps": 29055, "total_steps": 38160, "loss": 0.3735, "lr": 0.00016365750669582662, "epoch": 15.227987421383649, "percentage": 76.14, "elapsed_time": "1:14:29", "remaining_time": "0:23:20", "throughput": 4245.6, "total_tokens": 18976016} {"current_steps": 29060, "total_steps": 38160, "loss": 0.4216, "lr": 0.00016348833070343682, "epoch": 15.230607966457024, "percentage": 76.15, "elapsed_time": "1:14:30", "remaining_time": "0:23:19", "throughput": 4245.61, "total_tokens": 18978992} {"current_steps": 29065, "total_steps": 38160, "loss": 0.4699, "lr": 0.00016331922510544932, "epoch": 15.233228511530399, "percentage": 76.17, "elapsed_time": "1:14:31", "remaining_time": "0:23:19", "throughput": 4245.67, "total_tokens": 18982480} {"current_steps": 29070, "total_steps": 38160, "loss": 0.4248, "lr": 0.0001631501899372387, "epoch": 15.235849056603774, "percentage": 76.18, "elapsed_time": "1:14:31", "remaining_time": "0:23:18", "throughput": 4245.72, "total_tokens": 18985936} {"current_steps": 29075, "total_steps": 38160, "loss": 0.4733, "lr": 0.0001629812252341653, "epoch": 15.23846960167715, "percentage": 76.19, "elapsed_time": "1:14:32", "remaining_time": "0:23:17", "throughput": 4245.74, "total_tokens": 18989072} {"current_steps": 29080, "total_steps": 38160, "loss": 0.3176, "lr": 0.0001628123310315749, "epoch": 15.241090146750524, "percentage": 76.21, "elapsed_time": "1:14:33", "remaining_time": "0:23:16", "throughput": 4245.75, "total_tokens": 18992080} {"current_steps": 29085, "total_steps": 38160, "loss": 0.5097, "lr": 0.00016264350736479777, "epoch": 15.2437106918239, "percentage": 76.22, "elapsed_time": "1:14:33", "remaining_time": "0:23:15", "throughput": 4245.76, "total_tokens": 18995120} {"current_steps": 29090, "total_steps": 38160, "loss": 0.5032, "lr": 0.00016247475426915038, "epoch": 15.246331236897275, "percentage": 76.23, "elapsed_time": "1:14:34", "remaining_time": "0:23:15", "throughput": 4245.72, "total_tokens": 18997712} {"current_steps": 29095, "total_steps": 38160, "loss": 0.401, "lr": 0.0001623060717799335, "epoch": 15.24895178197065, "percentage": 76.24, "elapsed_time": "1:14:35", "remaining_time": "0:23:14", "throughput": 4245.7, "total_tokens": 19000368} {"current_steps": 29100, "total_steps": 38160, "loss": 0.3558, "lr": 0.0001621374599324338, "epoch": 15.251572327044025, "percentage": 76.26, "elapsed_time": "1:14:35", "remaining_time": "0:23:13", "throughput": 4245.76, "total_tokens": 19003856} {"current_steps": 29105, "total_steps": 38160, "loss": 0.3611, "lr": 0.00016196891876192292, "epoch": 15.2541928721174, "percentage": 76.27, "elapsed_time": "1:14:36", "remaining_time": "0:23:12", "throughput": 4245.72, "total_tokens": 19006448} {"current_steps": 29110, "total_steps": 38160, "loss": 0.42, "lr": 0.00016180044830365798, "epoch": 15.256813417190775, "percentage": 76.28, "elapsed_time": "1:14:37", "remaining_time": "0:23:11", "throughput": 4245.76, "total_tokens": 19009712} {"current_steps": 29115, "total_steps": 38160, "loss": 0.4396, "lr": 0.00016163204859288066, "epoch": 15.25943396226415, "percentage": 76.3, "elapsed_time": "1:14:38", "remaining_time": "0:23:11", "throughput": 4245.76, "total_tokens": 19012688} {"current_steps": 29120, "total_steps": 38160, "loss": 0.3575, "lr": 0.00016146371966481866, "epoch": 15.262054507337526, "percentage": 76.31, "elapsed_time": "1:14:38", "remaining_time": "0:23:10", "throughput": 4245.81, "total_tokens": 19016112} {"current_steps": 29125, "total_steps": 38160, "loss": 0.4792, "lr": 0.00016129546155468411, "epoch": 15.264675052410901, "percentage": 76.32, "elapsed_time": "1:14:39", "remaining_time": "0:23:09", "throughput": 4245.94, "total_tokens": 19020304} {"current_steps": 29130, "total_steps": 38160, "loss": 0.4235, "lr": 0.00016112727429767483, "epoch": 15.267295597484276, "percentage": 76.34, "elapsed_time": "1:14:40", "remaining_time": "0:23:08", "throughput": 4245.86, "total_tokens": 19022512} {"current_steps": 29135, "total_steps": 38160, "loss": 0.4834, "lr": 0.00016095915792897392, "epoch": 15.269916142557651, "percentage": 76.35, "elapsed_time": "1:14:40", "remaining_time": "0:23:08", "throughput": 4245.87, "total_tokens": 19025552} {"current_steps": 29140, "total_steps": 38160, "loss": 0.3912, "lr": 0.000160791112483749, "epoch": 15.272536687631026, "percentage": 76.36, "elapsed_time": "1:14:41", "remaining_time": "0:23:07", "throughput": 4245.87, "total_tokens": 19028496} {"current_steps": 29145, "total_steps": 38160, "loss": 0.4226, "lr": 0.00016062313799715362, "epoch": 15.275157232704402, "percentage": 76.38, "elapsed_time": "1:14:42", "remaining_time": "0:23:06", "throughput": 4245.86, "total_tokens": 19031280} {"current_steps": 29150, "total_steps": 38160, "loss": 0.4944, "lr": 0.00016045523450432576, "epoch": 15.277777777777779, "percentage": 76.39, "elapsed_time": "1:14:42", "remaining_time": "0:23:05", "throughput": 4245.83, "total_tokens": 19033872} {"current_steps": 29155, "total_steps": 38160, "loss": 0.4383, "lr": 0.0001602874020403891, "epoch": 15.280398322851154, "percentage": 76.4, "elapsed_time": "1:14:43", "remaining_time": "0:23:04", "throughput": 4245.81, "total_tokens": 19036688} {"current_steps": 29160, "total_steps": 38160, "loss": 0.4051, "lr": 0.00016011964064045232, "epoch": 15.283018867924529, "percentage": 76.42, "elapsed_time": "1:14:44", "remaining_time": "0:23:04", "throughput": 4245.83, "total_tokens": 19039792} {"current_steps": 29165, "total_steps": 38160, "loss": 0.3988, "lr": 0.00015995195033960936, "epoch": 15.285639412997904, "percentage": 76.43, "elapsed_time": "1:14:45", "remaining_time": "0:23:03", "throughput": 4245.92, "total_tokens": 19043696} {"current_steps": 29170, "total_steps": 38160, "loss": 0.3418, "lr": 0.00015978433117293884, "epoch": 15.28825995807128, "percentage": 76.44, "elapsed_time": "1:14:45", "remaining_time": "0:23:02", "throughput": 4245.92, "total_tokens": 19046512} {"current_steps": 29175, "total_steps": 38160, "loss": 0.4569, "lr": 0.0001596167831755047, "epoch": 15.290880503144654, "percentage": 76.45, "elapsed_time": "1:14:46", "remaining_time": "0:23:01", "throughput": 4245.98, "total_tokens": 19050128} {"current_steps": 29180, "total_steps": 38160, "loss": 0.3238, "lr": 0.00015944930638235626, "epoch": 15.29350104821803, "percentage": 76.47, "elapsed_time": "1:14:47", "remaining_time": "0:23:00", "throughput": 4245.95, "total_tokens": 19052848} {"current_steps": 29185, "total_steps": 38160, "loss": 0.3002, "lr": 0.00015928190082852773, "epoch": 15.296121593291405, "percentage": 76.48, "elapsed_time": "1:14:47", "remaining_time": "0:23:00", "throughput": 4245.95, "total_tokens": 19055792} {"current_steps": 29190, "total_steps": 38160, "loss": 0.4481, "lr": 0.0001591145665490384, "epoch": 15.29874213836478, "percentage": 76.49, "elapsed_time": "1:14:48", "remaining_time": "0:22:59", "throughput": 4245.97, "total_tokens": 19058992} {"current_steps": 29195, "total_steps": 38160, "loss": 0.4776, "lr": 0.00015894730357889287, "epoch": 15.301362683438155, "percentage": 76.51, "elapsed_time": "1:14:49", "remaining_time": "0:22:58", "throughput": 4246.11, "total_tokens": 19063280} {"current_steps": 29200, "total_steps": 38160, "loss": 0.4965, "lr": 0.0001587801119530805, "epoch": 15.30398322851153, "percentage": 76.52, "elapsed_time": "1:14:50", "remaining_time": "0:22:57", "throughput": 4246.21, "total_tokens": 19067312} {"current_steps": 29205, "total_steps": 38160, "loss": 0.4676, "lr": 0.00015861299170657572, "epoch": 15.306603773584905, "percentage": 76.53, "elapsed_time": "1:14:51", "remaining_time": "0:22:57", "throughput": 4246.28, "total_tokens": 19070992} {"current_steps": 29210, "total_steps": 38160, "loss": 0.4726, "lr": 0.00015844594287433834, "epoch": 15.30922431865828, "percentage": 76.55, "elapsed_time": "1:14:51", "remaining_time": "0:22:56", "throughput": 4246.23, "total_tokens": 19073520} {"current_steps": 29215, "total_steps": 38160, "loss": 0.3916, "lr": 0.00015827896549131304, "epoch": 15.311844863731656, "percentage": 76.56, "elapsed_time": "1:14:52", "remaining_time": "0:22:55", "throughput": 4246.15, "total_tokens": 19075664} {"current_steps": 29220, "total_steps": 38160, "loss": 0.5275, "lr": 0.0001581120595924298, "epoch": 15.314465408805031, "percentage": 76.57, "elapsed_time": "1:14:53", "remaining_time": "0:22:54", "throughput": 4246.15, "total_tokens": 19078704} {"current_steps": 29225, "total_steps": 38160, "loss": 0.4648, "lr": 0.00015794522521260317, "epoch": 15.317085953878406, "percentage": 76.59, "elapsed_time": "1:14:53", "remaining_time": "0:22:53", "throughput": 4246.23, "total_tokens": 19082416} {"current_steps": 29230, "total_steps": 38160, "loss": 0.4344, "lr": 0.00015777846238673293, "epoch": 15.319706498951781, "percentage": 76.6, "elapsed_time": "1:14:54", "remaining_time": "0:22:53", "throughput": 4246.2, "total_tokens": 19085040} {"current_steps": 29235, "total_steps": 38160, "loss": 0.4983, "lr": 0.00015761177114970404, "epoch": 15.322327044025156, "percentage": 76.61, "elapsed_time": "1:14:55", "remaining_time": "0:22:52", "throughput": 4246.3, "total_tokens": 19089008} {"current_steps": 29240, "total_steps": 38160, "loss": 0.3898, "lr": 0.0001574451515363865, "epoch": 15.324947589098532, "percentage": 76.62, "elapsed_time": "1:14:56", "remaining_time": "0:22:51", "throughput": 4246.37, "total_tokens": 19092560} {"current_steps": 29245, "total_steps": 38160, "loss": 0.3615, "lr": 0.00015727860358163536, "epoch": 15.327568134171909, "percentage": 76.64, "elapsed_time": "1:14:56", "remaining_time": "0:22:50", "throughput": 4246.3, "total_tokens": 19094832} {"current_steps": 29250, "total_steps": 38160, "loss": 0.4101, "lr": 0.00015711212732029035, "epoch": 15.330188679245284, "percentage": 76.65, "elapsed_time": "1:14:57", "remaining_time": "0:22:50", "throughput": 4246.35, "total_tokens": 19098192} {"current_steps": 29255, "total_steps": 38160, "loss": 0.3535, "lr": 0.00015694572278717627, "epoch": 15.332809224318659, "percentage": 76.66, "elapsed_time": "1:14:58", "remaining_time": "0:22:49", "throughput": 4246.43, "total_tokens": 19101808} {"current_steps": 29260, "total_steps": 38160, "loss": 0.3131, "lr": 0.00015677939001710323, "epoch": 15.335429769392034, "percentage": 76.68, "elapsed_time": "1:14:58", "remaining_time": "0:22:48", "throughput": 4246.39, "total_tokens": 19104336} {"current_steps": 29265, "total_steps": 38160, "loss": 0.4022, "lr": 0.00015661312904486613, "epoch": 15.33805031446541, "percentage": 76.69, "elapsed_time": "1:14:59", "remaining_time": "0:22:47", "throughput": 4246.44, "total_tokens": 19107600} {"current_steps": 29270, "total_steps": 38160, "loss": 0.4827, "lr": 0.00015644693990524483, "epoch": 15.340670859538784, "percentage": 76.7, "elapsed_time": "1:15:00", "remaining_time": "0:22:46", "throughput": 4246.45, "total_tokens": 19110640} {"current_steps": 29275, "total_steps": 38160, "loss": 0.2954, "lr": 0.00015628082263300448, "epoch": 15.34329140461216, "percentage": 76.72, "elapsed_time": "1:15:01", "remaining_time": "0:22:46", "throughput": 4246.45, "total_tokens": 19113552} {"current_steps": 29280, "total_steps": 38160, "loss": 0.4814, "lr": 0.00015611477726289465, "epoch": 15.345911949685535, "percentage": 76.73, "elapsed_time": "1:15:01", "remaining_time": "0:22:45", "throughput": 4246.51, "total_tokens": 19117104} {"current_steps": 29285, "total_steps": 38160, "loss": 0.4881, "lr": 0.00015594880382964994, "epoch": 15.34853249475891, "percentage": 76.74, "elapsed_time": "1:15:02", "remaining_time": "0:22:44", "throughput": 4246.49, "total_tokens": 19119856} {"current_steps": 29290, "total_steps": 38160, "loss": 0.4139, "lr": 0.00015578290236799037, "epoch": 15.351153039832285, "percentage": 76.76, "elapsed_time": "1:15:03", "remaining_time": "0:22:43", "throughput": 4246.5, "total_tokens": 19122864} {"current_steps": 29295, "total_steps": 38160, "loss": 0.4468, "lr": 0.00015561707291262061, "epoch": 15.35377358490566, "percentage": 76.77, "elapsed_time": "1:15:03", "remaining_time": "0:22:42", "throughput": 4246.52, "total_tokens": 19125872} {"current_steps": 29300, "total_steps": 38160, "loss": 0.5134, "lr": 0.00015545131549823043, "epoch": 15.356394129979035, "percentage": 76.78, "elapsed_time": "1:15:04", "remaining_time": "0:22:42", "throughput": 4246.48, "total_tokens": 19128400} {"current_steps": 29305, "total_steps": 38160, "loss": 0.4517, "lr": 0.0001552856301594942, "epoch": 15.35901467505241, "percentage": 76.8, "elapsed_time": "1:15:05", "remaining_time": "0:22:41", "throughput": 4246.48, "total_tokens": 19131280} {"current_steps": 29310, "total_steps": 38160, "loss": 0.3303, "lr": 0.00015512001693107126, "epoch": 15.361635220125786, "percentage": 76.81, "elapsed_time": "1:15:05", "remaining_time": "0:22:40", "throughput": 4246.46, "total_tokens": 19134032} {"current_steps": 29315, "total_steps": 38160, "loss": 0.3757, "lr": 0.0001549544758476062, "epoch": 15.364255765199161, "percentage": 76.82, "elapsed_time": "1:15:06", "remaining_time": "0:22:39", "throughput": 4246.57, "total_tokens": 19137904} {"current_steps": 29320, "total_steps": 38160, "loss": 0.4704, "lr": 0.00015478900694372832, "epoch": 15.366876310272536, "percentage": 76.83, "elapsed_time": "1:15:07", "remaining_time": "0:22:39", "throughput": 4246.74, "total_tokens": 19142544} {"current_steps": 29325, "total_steps": 38160, "loss": 0.4689, "lr": 0.00015462361025405196, "epoch": 15.369496855345911, "percentage": 76.85, "elapsed_time": "1:15:08", "remaining_time": "0:22:38", "throughput": 4246.77, "total_tokens": 19145712} {"current_steps": 29330, "total_steps": 38160, "loss": 0.3993, "lr": 0.0001544582858131759, "epoch": 15.372117400419286, "percentage": 76.86, "elapsed_time": "1:15:09", "remaining_time": "0:22:37", "throughput": 4246.84, "total_tokens": 19149328} {"current_steps": 29335, "total_steps": 38160, "loss": 0.3401, "lr": 0.00015429303365568448, "epoch": 15.374737945492662, "percentage": 76.87, "elapsed_time": "1:15:09", "remaining_time": "0:22:36", "throughput": 4246.91, "total_tokens": 19152912} {"current_steps": 29340, "total_steps": 38160, "loss": 0.5934, "lr": 0.00015412785381614625, "epoch": 15.377358490566039, "percentage": 76.89, "elapsed_time": "1:15:10", "remaining_time": "0:22:35", "throughput": 4246.98, "total_tokens": 19156496} {"current_steps": 29345, "total_steps": 38160, "loss": 0.4191, "lr": 0.000153962746329115, "epoch": 15.379979035639414, "percentage": 76.9, "elapsed_time": "1:15:11", "remaining_time": "0:22:35", "throughput": 4247.27, "total_tokens": 19162224} {"current_steps": 29350, "total_steps": 38160, "loss": 0.5305, "lr": 0.0001537977112291295, "epoch": 15.382599580712789, "percentage": 76.91, "elapsed_time": "1:15:12", "remaining_time": "0:22:34", "throughput": 4247.36, "total_tokens": 19166000} {"current_steps": 29355, "total_steps": 38160, "loss": 0.4798, "lr": 0.00015363274855071323, "epoch": 15.385220125786164, "percentage": 76.93, "elapsed_time": "1:15:13", "remaining_time": "0:22:33", "throughput": 4247.34, "total_tokens": 19168720} {"current_steps": 29360, "total_steps": 38160, "loss": 0.3575, "lr": 0.0001534678583283743, "epoch": 15.38784067085954, "percentage": 76.94, "elapsed_time": "1:15:13", "remaining_time": "0:22:32", "throughput": 4247.36, "total_tokens": 19171824} {"current_steps": 29365, "total_steps": 38160, "loss": 0.4041, "lr": 0.00015330304059660605, "epoch": 15.390461215932914, "percentage": 76.95, "elapsed_time": "1:15:14", "remaining_time": "0:22:32", "throughput": 4247.45, "total_tokens": 19175536} {"current_steps": 29370, "total_steps": 38160, "loss": 0.4355, "lr": 0.00015313829538988628, "epoch": 15.39308176100629, "percentage": 76.97, "elapsed_time": "1:15:15", "remaining_time": "0:22:31", "throughput": 4247.51, "total_tokens": 19179120} {"current_steps": 29375, "total_steps": 38160, "loss": 0.4362, "lr": 0.00015297362274267783, "epoch": 15.395702306079665, "percentage": 76.98, "elapsed_time": "1:15:16", "remaining_time": "0:22:30", "throughput": 4247.64, "total_tokens": 19183344} {"current_steps": 29380, "total_steps": 38160, "loss": 0.4215, "lr": 0.00015280902268942866, "epoch": 15.39832285115304, "percentage": 76.99, "elapsed_time": "1:15:17", "remaining_time": "0:22:29", "throughput": 4247.76, "total_tokens": 19187600} {"current_steps": 29385, "total_steps": 38160, "loss": 0.4462, "lr": 0.00015264449526457074, "epoch": 15.400943396226415, "percentage": 77.0, "elapsed_time": "1:15:17", "remaining_time": "0:22:29", "throughput": 4247.85, "total_tokens": 19191440} {"current_steps": 29390, "total_steps": 38160, "loss": 0.4672, "lr": 0.00015248004050252178, "epoch": 15.40356394129979, "percentage": 77.02, "elapsed_time": "1:15:18", "remaining_time": "0:22:28", "throughput": 4247.85, "total_tokens": 19194352} {"current_steps": 29395, "total_steps": 38160, "loss": 0.4159, "lr": 0.00015231565843768348, "epoch": 15.406184486373165, "percentage": 77.03, "elapsed_time": "1:15:19", "remaining_time": "0:22:27", "throughput": 4247.82, "total_tokens": 19197040} {"current_steps": 29400, "total_steps": 38160, "loss": 0.3992, "lr": 0.00015215134910444284, "epoch": 15.40880503144654, "percentage": 77.04, "elapsed_time": "1:15:20", "remaining_time": "0:22:26", "throughput": 4247.89, "total_tokens": 19200624} {"current_steps": 29405, "total_steps": 38160, "loss": 0.5715, "lr": 0.00015198711253717163, "epoch": 15.411425576519916, "percentage": 77.06, "elapsed_time": "1:15:20", "remaining_time": "0:22:25", "throughput": 4247.9, "total_tokens": 19203600} {"current_steps": 29410, "total_steps": 38160, "loss": 0.3287, "lr": 0.00015182294877022596, "epoch": 15.414046121593291, "percentage": 77.07, "elapsed_time": "1:15:21", "remaining_time": "0:22:25", "throughput": 4247.85, "total_tokens": 19206032} {"current_steps": 29415, "total_steps": 38160, "loss": 0.3791, "lr": 0.00015165885783794726, "epoch": 15.416666666666666, "percentage": 77.08, "elapsed_time": "1:15:22", "remaining_time": "0:22:24", "throughput": 4247.8, "total_tokens": 19208624} {"current_steps": 29420, "total_steps": 38160, "loss": 0.3376, "lr": 0.0001514948397746615, "epoch": 15.419287211740041, "percentage": 77.1, "elapsed_time": "1:15:22", "remaining_time": "0:22:23", "throughput": 4247.73, "total_tokens": 19210896} {"current_steps": 29425, "total_steps": 38160, "loss": 0.4489, "lr": 0.0001513308946146792, "epoch": 15.421907756813416, "percentage": 77.11, "elapsed_time": "1:15:23", "remaining_time": "0:22:22", "throughput": 4247.73, "total_tokens": 19213680} {"current_steps": 29430, "total_steps": 38160, "loss": 0.4185, "lr": 0.0001511670223922959, "epoch": 15.424528301886792, "percentage": 77.12, "elapsed_time": "1:15:23", "remaining_time": "0:22:21", "throughput": 4247.72, "total_tokens": 19216464} {"current_steps": 29435, "total_steps": 38160, "loss": 0.4732, "lr": 0.000151003223141792, "epoch": 15.427148846960169, "percentage": 77.14, "elapsed_time": "1:15:24", "remaining_time": "0:22:21", "throughput": 4247.69, "total_tokens": 19219184} {"current_steps": 29440, "total_steps": 38160, "loss": 0.4356, "lr": 0.00015083949689743202, "epoch": 15.429769392033544, "percentage": 77.15, "elapsed_time": "1:15:25", "remaining_time": "0:22:20", "throughput": 4247.71, "total_tokens": 19222288} {"current_steps": 29445, "total_steps": 38160, "loss": 0.4084, "lr": 0.00015067584369346594, "epoch": 15.432389937106919, "percentage": 77.16, "elapsed_time": "1:15:26", "remaining_time": "0:22:19", "throughput": 4247.76, "total_tokens": 19225776} {"current_steps": 29450, "total_steps": 38160, "loss": 0.3511, "lr": 0.00015051226356412818, "epoch": 15.435010482180294, "percentage": 77.18, "elapsed_time": "1:15:26", "remaining_time": "0:22:18", "throughput": 4247.75, "total_tokens": 19228496} {"current_steps": 29455, "total_steps": 38160, "loss": 0.4635, "lr": 0.00015034875654363754, "epoch": 15.43763102725367, "percentage": 77.19, "elapsed_time": "1:15:27", "remaining_time": "0:22:18", "throughput": 4247.83, "total_tokens": 19232272} {"current_steps": 29460, "total_steps": 38160, "loss": 0.4897, "lr": 0.00015018532266619818, "epoch": 15.440251572327044, "percentage": 77.2, "elapsed_time": "1:15:28", "remaining_time": "0:22:17", "throughput": 4247.87, "total_tokens": 19235568} {"current_steps": 29465, "total_steps": 38160, "loss": 0.4255, "lr": 0.00015002196196599828, "epoch": 15.44287211740042, "percentage": 77.21, "elapsed_time": "1:15:28", "remaining_time": "0:22:16", "throughput": 4247.86, "total_tokens": 19238352} {"current_steps": 29470, "total_steps": 38160, "loss": 0.5226, "lr": 0.00014985867447721114, "epoch": 15.445492662473795, "percentage": 77.23, "elapsed_time": "1:15:29", "remaining_time": "0:22:15", "throughput": 4247.89, "total_tokens": 19241616} {"current_steps": 29475, "total_steps": 38160, "loss": 0.3538, "lr": 0.00014969546023399467, "epoch": 15.44811320754717, "percentage": 77.24, "elapsed_time": "1:15:30", "remaining_time": "0:22:14", "throughput": 4248.09, "total_tokens": 19246512} {"current_steps": 29480, "total_steps": 38160, "loss": 0.3973, "lr": 0.00014953231927049165, "epoch": 15.450733752620545, "percentage": 77.25, "elapsed_time": "1:15:31", "remaining_time": "0:22:14", "throughput": 4248.17, "total_tokens": 19250128} {"current_steps": 29485, "total_steps": 38160, "loss": 0.4912, "lr": 0.00014936925162082904, "epoch": 15.45335429769392, "percentage": 77.27, "elapsed_time": "1:15:32", "remaining_time": "0:22:13", "throughput": 4248.17, "total_tokens": 19252976} {"current_steps": 29490, "total_steps": 38160, "loss": 0.4989, "lr": 0.00014920625731911863, "epoch": 15.455974842767295, "percentage": 77.28, "elapsed_time": "1:15:32", "remaining_time": "0:22:12", "throughput": 4248.15, "total_tokens": 19255664} {"current_steps": 29495, "total_steps": 38160, "loss": 0.3421, "lr": 0.00014904333639945716, "epoch": 15.45859538784067, "percentage": 77.29, "elapsed_time": "1:15:33", "remaining_time": "0:22:11", "throughput": 4248.2, "total_tokens": 19259088} {"current_steps": 29500, "total_steps": 38160, "loss": 0.4446, "lr": 0.00014888048889592575, "epoch": 15.461215932914046, "percentage": 77.31, "elapsed_time": "1:15:34", "remaining_time": "0:22:11", "throughput": 4248.38, "total_tokens": 19263792} {"current_steps": 29505, "total_steps": 38160, "loss": 0.3507, "lr": 0.00014871771484259046, "epoch": 15.463836477987421, "percentage": 77.32, "elapsed_time": "1:15:35", "remaining_time": "0:22:10", "throughput": 4248.45, "total_tokens": 19267312} {"current_steps": 29510, "total_steps": 38160, "loss": 0.5406, "lr": 0.00014855501427350144, "epoch": 15.466457023060796, "percentage": 77.33, "elapsed_time": "1:15:35", "remaining_time": "0:22:09", "throughput": 4248.46, "total_tokens": 19270256} {"current_steps": 29515, "total_steps": 38160, "loss": 0.5137, "lr": 0.00014839238722269405, "epoch": 15.469077568134171, "percentage": 77.35, "elapsed_time": "1:15:36", "remaining_time": "0:22:08", "throughput": 4248.46, "total_tokens": 19273200} {"current_steps": 29520, "total_steps": 38160, "loss": 0.4439, "lr": 0.00014822983372418774, "epoch": 15.471698113207546, "percentage": 77.36, "elapsed_time": "1:15:37", "remaining_time": "0:22:07", "throughput": 4248.48, "total_tokens": 19276240} {"current_steps": 29525, "total_steps": 38160, "loss": 0.4049, "lr": 0.00014806735381198705, "epoch": 15.474318658280922, "percentage": 77.37, "elapsed_time": "1:15:38", "remaining_time": "0:22:07", "throughput": 4248.65, "total_tokens": 19280656} {"current_steps": 29530, "total_steps": 38160, "loss": 0.3863, "lr": 0.00014790494752008087, "epoch": 15.476939203354299, "percentage": 77.38, "elapsed_time": "1:15:38", "remaining_time": "0:22:06", "throughput": 4248.75, "total_tokens": 19284656} {"current_steps": 29535, "total_steps": 38160, "loss": 0.4347, "lr": 0.00014774261488244295, "epoch": 15.479559748427674, "percentage": 77.4, "elapsed_time": "1:15:39", "remaining_time": "0:22:05", "throughput": 4248.78, "total_tokens": 19287888} {"current_steps": 29540, "total_steps": 38160, "loss": 0.4399, "lr": 0.00014758035593303114, "epoch": 15.482180293501049, "percentage": 77.41, "elapsed_time": "1:15:40", "remaining_time": "0:22:04", "throughput": 4248.77, "total_tokens": 19290704} {"current_steps": 29545, "total_steps": 38160, "loss": 0.4091, "lr": 0.00014741817070578817, "epoch": 15.484800838574424, "percentage": 77.42, "elapsed_time": "1:15:41", "remaining_time": "0:22:04", "throughput": 4248.81, "total_tokens": 19293968} {"current_steps": 29550, "total_steps": 38160, "loss": 0.5227, "lr": 0.0001472560592346414, "epoch": 15.4874213836478, "percentage": 77.44, "elapsed_time": "1:15:41", "remaining_time": "0:22:03", "throughput": 4248.86, "total_tokens": 19297360} {"current_steps": 29555, "total_steps": 38160, "loss": 0.4502, "lr": 0.0001470940215535027, "epoch": 15.490041928721174, "percentage": 77.45, "elapsed_time": "1:15:42", "remaining_time": "0:22:02", "throughput": 4248.91, "total_tokens": 19300688} {"current_steps": 29560, "total_steps": 38160, "loss": 0.3507, "lr": 0.00014693205769626878, "epoch": 15.49266247379455, "percentage": 77.46, "elapsed_time": "1:15:43", "remaining_time": "0:22:01", "throughput": 4248.94, "total_tokens": 19303888} {"current_steps": 29565, "total_steps": 38160, "loss": 0.4811, "lr": 0.00014677016769682028, "epoch": 15.495283018867925, "percentage": 77.48, "elapsed_time": "1:15:43", "remaining_time": "0:22:01", "throughput": 4249.0, "total_tokens": 19307344} {"current_steps": 29570, "total_steps": 38160, "loss": 0.4277, "lr": 0.00014660835158902268, "epoch": 15.4979035639413, "percentage": 77.49, "elapsed_time": "1:15:44", "remaining_time": "0:22:00", "throughput": 4249.1, "total_tokens": 19311312} {"current_steps": 29575, "total_steps": 38160, "loss": 0.4081, "lr": 0.00014644660940672628, "epoch": 15.500524109014675, "percentage": 77.5, "elapsed_time": "1:15:45", "remaining_time": "0:21:59", "throughput": 4249.15, "total_tokens": 19314768} {"current_steps": 29580, "total_steps": 38160, "loss": 0.474, "lr": 0.0001462849411837656, "epoch": 15.50314465408805, "percentage": 77.52, "elapsed_time": "1:15:46", "remaining_time": "0:21:58", "throughput": 4249.15, "total_tokens": 19317744} {"current_steps": 29585, "total_steps": 38160, "loss": 0.471, "lr": 0.00014612334695395985, "epoch": 15.505765199161425, "percentage": 77.53, "elapsed_time": "1:15:47", "remaining_time": "0:21:57", "throughput": 4249.28, "total_tokens": 19321840} {"current_steps": 29590, "total_steps": 38160, "loss": 0.3769, "lr": 0.0001459618267511128, "epoch": 15.5083857442348, "percentage": 77.54, "elapsed_time": "1:15:47", "remaining_time": "0:21:57", "throughput": 4249.33, "total_tokens": 19325232} {"current_steps": 29595, "total_steps": 38160, "loss": 0.4163, "lr": 0.00014580038060901256, "epoch": 15.511006289308176, "percentage": 77.56, "elapsed_time": "1:15:48", "remaining_time": "0:21:56", "throughput": 4249.34, "total_tokens": 19328240} {"current_steps": 29600, "total_steps": 38160, "loss": 0.3352, "lr": 0.00014563900856143157, "epoch": 15.51362683438155, "percentage": 77.57, "elapsed_time": "1:15:49", "remaining_time": "0:21:55", "throughput": 4249.34, "total_tokens": 19331216} {"current_steps": 29605, "total_steps": 38160, "loss": 0.4891, "lr": 0.0001454777106421273, "epoch": 15.516247379454926, "percentage": 77.58, "elapsed_time": "1:15:50", "remaining_time": "0:21:54", "throughput": 4249.51, "total_tokens": 19335760} {"current_steps": 29610, "total_steps": 38160, "loss": 0.4058, "lr": 0.00014531648688484127, "epoch": 15.518867924528301, "percentage": 77.59, "elapsed_time": "1:15:50", "remaining_time": "0:21:54", "throughput": 4249.51, "total_tokens": 19338672} {"current_steps": 29615, "total_steps": 38160, "loss": 0.4931, "lr": 0.0001451553373233, "epoch": 15.521488469601676, "percentage": 77.61, "elapsed_time": "1:15:51", "remaining_time": "0:21:53", "throughput": 4249.5, "total_tokens": 19341424} {"current_steps": 29620, "total_steps": 38160, "loss": 0.3959, "lr": 0.00014499426199121379, "epoch": 15.524109014675052, "percentage": 77.62, "elapsed_time": "1:15:52", "remaining_time": "0:21:52", "throughput": 4249.57, "total_tokens": 19345104} {"current_steps": 29625, "total_steps": 38160, "loss": 0.4159, "lr": 0.0001448332609222777, "epoch": 15.526729559748428, "percentage": 77.63, "elapsed_time": "1:15:53", "remaining_time": "0:21:51", "throughput": 4249.64, "total_tokens": 19348688} {"current_steps": 29630, "total_steps": 38160, "loss": 0.4304, "lr": 0.0001446723341501715, "epoch": 15.529350104821804, "percentage": 77.65, "elapsed_time": "1:15:53", "remaining_time": "0:21:50", "throughput": 4249.74, "total_tokens": 19352560} {"current_steps": 29635, "total_steps": 38160, "loss": 0.3851, "lr": 0.00014451148170855922, "epoch": 15.531970649895179, "percentage": 77.66, "elapsed_time": "1:15:54", "remaining_time": "0:21:50", "throughput": 4249.74, "total_tokens": 19355600} {"current_steps": 29640, "total_steps": 38160, "loss": 0.4061, "lr": 0.0001443507036310895, "epoch": 15.534591194968554, "percentage": 77.67, "elapsed_time": "1:15:55", "remaining_time": "0:21:49", "throughput": 4249.82, "total_tokens": 19359280} {"current_steps": 29645, "total_steps": 38160, "loss": 0.389, "lr": 0.00014418999995139493, "epoch": 15.53721174004193, "percentage": 77.69, "elapsed_time": "1:15:56", "remaining_time": "0:21:48", "throughput": 4249.96, "total_tokens": 19363600} {"current_steps": 29650, "total_steps": 38160, "loss": 0.4415, "lr": 0.00014402937070309325, "epoch": 15.539832285115304, "percentage": 77.7, "elapsed_time": "1:15:56", "remaining_time": "0:21:47", "throughput": 4249.96, "total_tokens": 19366608} {"current_steps": 29655, "total_steps": 38160, "loss": 0.5023, "lr": 0.0001438688159197859, "epoch": 15.54245283018868, "percentage": 77.71, "elapsed_time": "1:15:57", "remaining_time": "0:21:47", "throughput": 4250.0, "total_tokens": 19369936} {"current_steps": 29660, "total_steps": 38160, "loss": 0.3541, "lr": 0.0001437083356350593, "epoch": 15.545073375262055, "percentage": 77.73, "elapsed_time": "1:15:58", "remaining_time": "0:21:46", "throughput": 4250.11, "total_tokens": 19373968} {"current_steps": 29665, "total_steps": 38160, "loss": 0.6039, "lr": 0.0001435479298824841, "epoch": 15.54769392033543, "percentage": 77.74, "elapsed_time": "1:15:59", "remaining_time": "0:21:45", "throughput": 4250.08, "total_tokens": 19376528} {"current_steps": 29670, "total_steps": 38160, "loss": 0.4405, "lr": 0.00014338759869561557, "epoch": 15.550314465408805, "percentage": 77.75, "elapsed_time": "1:15:59", "remaining_time": "0:21:44", "throughput": 4250.2, "total_tokens": 19380752} {"current_steps": 29675, "total_steps": 38160, "loss": 0.4055, "lr": 0.00014322734210799287, "epoch": 15.55293501048218, "percentage": 77.76, "elapsed_time": "1:16:00", "remaining_time": "0:21:44", "throughput": 4250.22, "total_tokens": 19383824} {"current_steps": 29680, "total_steps": 38160, "loss": 0.5299, "lr": 0.0001430671601531398, "epoch": 15.555555555555555, "percentage": 77.78, "elapsed_time": "1:16:01", "remaining_time": "0:21:43", "throughput": 4250.26, "total_tokens": 19387184} {"current_steps": 29685, "total_steps": 38160, "loss": 0.414, "lr": 0.00014290705286456473, "epoch": 15.55817610062893, "percentage": 77.79, "elapsed_time": "1:16:02", "remaining_time": "0:21:42", "throughput": 4250.33, "total_tokens": 19390704} {"current_steps": 29690, "total_steps": 38160, "loss": 0.3137, "lr": 0.00014274702027576024, "epoch": 15.560796645702306, "percentage": 77.8, "elapsed_time": "1:16:02", "remaining_time": "0:21:41", "throughput": 4250.31, "total_tokens": 19393456} {"current_steps": 29695, "total_steps": 38160, "loss": 0.3485, "lr": 0.00014258706242020354, "epoch": 15.56341719077568, "percentage": 77.82, "elapsed_time": "1:16:03", "remaining_time": "0:21:40", "throughput": 4250.26, "total_tokens": 19395920} {"current_steps": 29700, "total_steps": 38160, "loss": 0.3749, "lr": 0.00014242717933135558, "epoch": 15.566037735849056, "percentage": 77.83, "elapsed_time": "1:16:04", "remaining_time": "0:21:40", "throughput": 4250.2, "total_tokens": 19398288} {"current_steps": 29705, "total_steps": 38160, "loss": 0.3887, "lr": 0.0001422673710426625, "epoch": 15.568658280922431, "percentage": 77.84, "elapsed_time": "1:16:04", "remaining_time": "0:21:39", "throughput": 4250.22, "total_tokens": 19401488} {"current_steps": 29710, "total_steps": 38160, "loss": 0.5705, "lr": 0.00014210763758755403, "epoch": 15.571278825995806, "percentage": 77.86, "elapsed_time": "1:16:05", "remaining_time": "0:21:38", "throughput": 4250.34, "total_tokens": 19405584} {"current_steps": 29715, "total_steps": 38160, "loss": 0.519, "lr": 0.00014194797899944468, "epoch": 15.573899371069182, "percentage": 77.87, "elapsed_time": "1:16:06", "remaining_time": "0:21:37", "throughput": 4250.42, "total_tokens": 19409328} {"current_steps": 29720, "total_steps": 38160, "loss": 0.3863, "lr": 0.00014178839531173344, "epoch": 15.576519916142558, "percentage": 77.88, "elapsed_time": "1:16:07", "remaining_time": "0:21:36", "throughput": 4250.43, "total_tokens": 19412304} {"current_steps": 29725, "total_steps": 38160, "loss": 0.323, "lr": 0.00014162888655780303, "epoch": 15.579140461215934, "percentage": 77.9, "elapsed_time": "1:16:07", "remaining_time": "0:21:36", "throughput": 4250.48, "total_tokens": 19415792} {"current_steps": 29730, "total_steps": 38160, "loss": 0.4624, "lr": 0.00014146945277102108, "epoch": 15.581761006289309, "percentage": 77.91, "elapsed_time": "1:16:08", "remaining_time": "0:21:35", "throughput": 4250.56, "total_tokens": 19419440} {"current_steps": 29735, "total_steps": 38160, "loss": 0.4577, "lr": 0.00014131009398473938, "epoch": 15.584381551362684, "percentage": 77.92, "elapsed_time": "1:16:09", "remaining_time": "0:21:34", "throughput": 4250.54, "total_tokens": 19422256} {"current_steps": 29740, "total_steps": 38160, "loss": 0.485, "lr": 0.00014115081023229376, "epoch": 15.58700209643606, "percentage": 77.94, "elapsed_time": "1:16:10", "remaining_time": "0:21:33", "throughput": 4250.58, "total_tokens": 19425680} {"current_steps": 29745, "total_steps": 38160, "loss": 0.3569, "lr": 0.00014099160154700462, "epoch": 15.589622641509434, "percentage": 77.95, "elapsed_time": "1:16:10", "remaining_time": "0:21:33", "throughput": 4250.66, "total_tokens": 19429200} {"current_steps": 29750, "total_steps": 38160, "loss": 0.4202, "lr": 0.00014083246796217684, "epoch": 15.59224318658281, "percentage": 77.96, "elapsed_time": "1:16:11", "remaining_time": "0:21:32", "throughput": 4250.69, "total_tokens": 19432528} {"current_steps": 29755, "total_steps": 38160, "loss": 0.3941, "lr": 0.00014067340951109898, "epoch": 15.594863731656185, "percentage": 77.97, "elapsed_time": "1:16:12", "remaining_time": "0:21:31", "throughput": 4250.76, "total_tokens": 19436112} {"current_steps": 29760, "total_steps": 38160, "loss": 0.4531, "lr": 0.00014051442622704447, "epoch": 15.59748427672956, "percentage": 77.99, "elapsed_time": "1:16:13", "remaining_time": "0:21:30", "throughput": 4250.78, "total_tokens": 19439120} {"current_steps": 29765, "total_steps": 38160, "loss": 0.5349, "lr": 0.0001403555181432709, "epoch": 15.600104821802935, "percentage": 78.0, "elapsed_time": "1:16:13", "remaining_time": "0:21:30", "throughput": 4250.8, "total_tokens": 19442256} {"current_steps": 29770, "total_steps": 38160, "loss": 0.3953, "lr": 0.00014019668529301977, "epoch": 15.60272536687631, "percentage": 78.01, "elapsed_time": "1:16:14", "remaining_time": "0:21:29", "throughput": 4250.78, "total_tokens": 19445040} {"current_steps": 29775, "total_steps": 38160, "loss": 0.5115, "lr": 0.00014003792770951733, "epoch": 15.605345911949685, "percentage": 78.03, "elapsed_time": "1:16:15", "remaining_time": "0:21:28", "throughput": 4250.73, "total_tokens": 19447472} {"current_steps": 29780, "total_steps": 38160, "loss": 0.5159, "lr": 0.00013987924542597363, "epoch": 15.60796645702306, "percentage": 78.04, "elapsed_time": "1:16:15", "remaining_time": "0:21:27", "throughput": 4250.67, "total_tokens": 19449840} {"current_steps": 29785, "total_steps": 38160, "loss": 0.4579, "lr": 0.0001397206384755833, "epoch": 15.610587002096436, "percentage": 78.05, "elapsed_time": "1:16:16", "remaining_time": "0:21:26", "throughput": 4250.7, "total_tokens": 19453040} {"current_steps": 29790, "total_steps": 38160, "loss": 0.5498, "lr": 0.00013956210689152526, "epoch": 15.61320754716981, "percentage": 78.07, "elapsed_time": "1:16:17", "remaining_time": "0:21:26", "throughput": 4250.68, "total_tokens": 19455792} {"current_steps": 29795, "total_steps": 38160, "loss": 0.4811, "lr": 0.0001394036507069622, "epoch": 15.615828092243186, "percentage": 78.08, "elapsed_time": "1:16:17", "remaining_time": "0:21:25", "throughput": 4250.7, "total_tokens": 19458928} {"current_steps": 29800, "total_steps": 38160, "loss": 0.3913, "lr": 0.00013924526995504172, "epoch": 15.618448637316561, "percentage": 78.09, "elapsed_time": "1:16:18", "remaining_time": "0:21:24", "throughput": 4250.73, "total_tokens": 19462128} {"current_steps": 29805, "total_steps": 38160, "loss": 0.3915, "lr": 0.00013908696466889486, "epoch": 15.621069182389936, "percentage": 78.11, "elapsed_time": "1:16:19", "remaining_time": "0:21:23", "throughput": 4250.66, "total_tokens": 19464368} {"current_steps": 29810, "total_steps": 38160, "loss": 0.4034, "lr": 0.0001389287348816375, "epoch": 15.623689727463312, "percentage": 78.12, "elapsed_time": "1:16:19", "remaining_time": "0:21:22", "throughput": 4250.71, "total_tokens": 19467792} {"current_steps": 29815, "total_steps": 38160, "loss": 0.3856, "lr": 0.00013877058062636944, "epoch": 15.626310272536688, "percentage": 78.13, "elapsed_time": "1:16:20", "remaining_time": "0:21:22", "throughput": 4250.97, "total_tokens": 19473584} {"current_steps": 29820, "total_steps": 38160, "loss": 0.4936, "lr": 0.00013861250193617498, "epoch": 15.628930817610064, "percentage": 78.14, "elapsed_time": "1:16:21", "remaining_time": "0:21:21", "throughput": 4251.11, "total_tokens": 19477936} {"current_steps": 29825, "total_steps": 38160, "loss": 0.4599, "lr": 0.00013845449884412203, "epoch": 15.631551362683439, "percentage": 78.16, "elapsed_time": "1:16:22", "remaining_time": "0:21:20", "throughput": 4251.18, "total_tokens": 19481488} {"current_steps": 29830, "total_steps": 38160, "loss": 0.5806, "lr": 0.00013829657138326334, "epoch": 15.634171907756814, "percentage": 78.17, "elapsed_time": "1:16:23", "remaining_time": "0:21:19", "throughput": 4251.18, "total_tokens": 19484432} {"current_steps": 29835, "total_steps": 38160, "loss": 0.4234, "lr": 0.00013813871958663526, "epoch": 15.63679245283019, "percentage": 78.18, "elapsed_time": "1:16:23", "remaining_time": "0:21:19", "throughput": 4251.18, "total_tokens": 19487376} {"current_steps": 29840, "total_steps": 38160, "loss": 0.4108, "lr": 0.0001379809434872587, "epoch": 15.639412997903564, "percentage": 78.2, "elapsed_time": "1:16:24", "remaining_time": "0:21:18", "throughput": 4251.16, "total_tokens": 19490224} {"current_steps": 29845, "total_steps": 38160, "loss": 0.3899, "lr": 0.0001378232431181386, "epoch": 15.64203354297694, "percentage": 78.21, "elapsed_time": "1:16:25", "remaining_time": "0:21:17", "throughput": 4251.16, "total_tokens": 19493072} {"current_steps": 29850, "total_steps": 38160, "loss": 0.3395, "lr": 0.00013766561851226428, "epoch": 15.644654088050315, "percentage": 78.22, "elapsed_time": "1:16:26", "remaining_time": "0:21:16", "throughput": 4251.15, "total_tokens": 19495952} {"current_steps": 29855, "total_steps": 38160, "loss": 0.5679, "lr": 0.00013750806970260886, "epoch": 15.64727463312369, "percentage": 78.24, "elapsed_time": "1:16:26", "remaining_time": "0:21:15", "throughput": 4251.21, "total_tokens": 19499440} {"current_steps": 29860, "total_steps": 38160, "loss": 0.4042, "lr": 0.00013735059672212959, "epoch": 15.649895178197065, "percentage": 78.25, "elapsed_time": "1:16:27", "remaining_time": "0:21:15", "throughput": 4251.16, "total_tokens": 19501904} {"current_steps": 29865, "total_steps": 38160, "loss": 0.5306, "lr": 0.00013719319960376808, "epoch": 15.65251572327044, "percentage": 78.26, "elapsed_time": "1:16:28", "remaining_time": "0:21:14", "throughput": 4251.19, "total_tokens": 19505200} {"current_steps": 29870, "total_steps": 38160, "loss": 0.3832, "lr": 0.00013703587838045017, "epoch": 15.655136268343815, "percentage": 78.28, "elapsed_time": "1:16:28", "remaining_time": "0:21:13", "throughput": 4251.25, "total_tokens": 19508784} {"current_steps": 29875, "total_steps": 38160, "loss": 0.3627, "lr": 0.00013687863308508568, "epoch": 15.65775681341719, "percentage": 78.29, "elapsed_time": "1:16:29", "remaining_time": "0:21:12", "throughput": 4251.21, "total_tokens": 19511312} {"current_steps": 29880, "total_steps": 38160, "loss": 0.3632, "lr": 0.00013672146375056849, "epoch": 15.660377358490566, "percentage": 78.3, "elapsed_time": "1:16:30", "remaining_time": "0:21:11", "throughput": 4251.2, "total_tokens": 19514064} {"current_steps": 29885, "total_steps": 38160, "loss": 0.4446, "lr": 0.00013656437040977643, "epoch": 15.66299790356394, "percentage": 78.31, "elapsed_time": "1:16:30", "remaining_time": "0:21:11", "throughput": 4251.18, "total_tokens": 19516816} {"current_steps": 29890, "total_steps": 38160, "loss": 0.4131, "lr": 0.00013640735309557178, "epoch": 15.665618448637316, "percentage": 78.33, "elapsed_time": "1:16:31", "remaining_time": "0:21:10", "throughput": 4251.2, "total_tokens": 19519888} {"current_steps": 29895, "total_steps": 38160, "loss": 0.4133, "lr": 0.00013625041184080078, "epoch": 15.668238993710691, "percentage": 78.34, "elapsed_time": "1:16:32", "remaining_time": "0:21:09", "throughput": 4251.28, "total_tokens": 19523472} {"current_steps": 29900, "total_steps": 38160, "loss": 0.308, "lr": 0.00013609354667829378, "epoch": 15.670859538784066, "percentage": 78.35, "elapsed_time": "1:16:33", "remaining_time": "0:21:08", "throughput": 4251.36, "total_tokens": 19527184} {"current_steps": 29905, "total_steps": 38160, "loss": 0.3918, "lr": 0.00013593675764086521, "epoch": 15.673480083857442, "percentage": 78.37, "elapsed_time": "1:16:33", "remaining_time": "0:21:08", "throughput": 4251.46, "total_tokens": 19531056} {"current_steps": 29910, "total_steps": 38160, "loss": 0.5211, "lr": 0.00013578004476131356, "epoch": 15.676100628930818, "percentage": 78.38, "elapsed_time": "1:16:34", "remaining_time": "0:21:07", "throughput": 4251.54, "total_tokens": 19534832} {"current_steps": 29915, "total_steps": 38160, "loss": 0.4078, "lr": 0.00013562340807242112, "epoch": 15.678721174004194, "percentage": 78.39, "elapsed_time": "1:16:35", "remaining_time": "0:21:06", "throughput": 4251.57, "total_tokens": 19538064} {"current_steps": 29920, "total_steps": 38160, "loss": 0.3275, "lr": 0.00013546684760695472, "epoch": 15.681341719077569, "percentage": 78.41, "elapsed_time": "1:16:36", "remaining_time": "0:21:05", "throughput": 4251.62, "total_tokens": 19541584} {"current_steps": 29925, "total_steps": 38160, "loss": 0.5082, "lr": 0.00013531036339766494, "epoch": 15.683962264150944, "percentage": 78.42, "elapsed_time": "1:16:36", "remaining_time": "0:21:05", "throughput": 4251.66, "total_tokens": 19544816} {"current_steps": 29930, "total_steps": 38160, "loss": 0.4756, "lr": 0.00013515395547728675, "epoch": 15.68658280922432, "percentage": 78.43, "elapsed_time": "1:16:37", "remaining_time": "0:21:04", "throughput": 4251.63, "total_tokens": 19547440} {"current_steps": 29935, "total_steps": 38160, "loss": 0.3949, "lr": 0.00013499762387853866, "epoch": 15.689203354297694, "percentage": 78.45, "elapsed_time": "1:16:38", "remaining_time": "0:21:03", "throughput": 4251.64, "total_tokens": 19550480} {"current_steps": 29940, "total_steps": 38160, "loss": 0.3888, "lr": 0.00013484136863412333, "epoch": 15.69182389937107, "percentage": 78.46, "elapsed_time": "1:16:39", "remaining_time": "0:21:02", "throughput": 4251.73, "total_tokens": 19554416} {"current_steps": 29945, "total_steps": 38160, "loss": 0.4122, "lr": 0.00013468518977672773, "epoch": 15.694444444444445, "percentage": 78.47, "elapsed_time": "1:16:39", "remaining_time": "0:21:01", "throughput": 4251.72, "total_tokens": 19557200} {"current_steps": 29950, "total_steps": 38160, "loss": 0.3794, "lr": 0.0001345290873390227, "epoch": 15.69706498951782, "percentage": 78.49, "elapsed_time": "1:16:40", "remaining_time": "0:21:01", "throughput": 4251.74, "total_tokens": 19560368} {"current_steps": 29955, "total_steps": 38160, "loss": 0.3317, "lr": 0.00013437306135366322, "epoch": 15.699685534591195, "percentage": 78.5, "elapsed_time": "1:16:41", "remaining_time": "0:21:00", "throughput": 4251.76, "total_tokens": 19563536} {"current_steps": 29960, "total_steps": 38160, "loss": 0.3918, "lr": 0.00013421711185328806, "epoch": 15.70230607966457, "percentage": 78.51, "elapsed_time": "1:16:41", "remaining_time": "0:20:59", "throughput": 4251.76, "total_tokens": 19566448} {"current_steps": 29965, "total_steps": 38160, "loss": 0.4233, "lr": 0.00013406123887051984, "epoch": 15.704926624737945, "percentage": 78.52, "elapsed_time": "1:16:42", "remaining_time": "0:20:58", "throughput": 4251.74, "total_tokens": 19569104} {"current_steps": 29970, "total_steps": 38160, "loss": 0.316, "lr": 0.0001339054424379656, "epoch": 15.70754716981132, "percentage": 78.54, "elapsed_time": "1:16:43", "remaining_time": "0:20:58", "throughput": 4252.08, "total_tokens": 19575952} {"current_steps": 29975, "total_steps": 38160, "loss": 0.5069, "lr": 0.00013374972258821621, "epoch": 15.710167714884696, "percentage": 78.55, "elapsed_time": "1:16:44", "remaining_time": "0:20:57", "throughput": 4252.08, "total_tokens": 19578864} {"current_steps": 29980, "total_steps": 38160, "loss": 0.43, "lr": 0.00013359407935384642, "epoch": 15.71278825995807, "percentage": 78.56, "elapsed_time": "1:16:45", "remaining_time": "0:20:56", "throughput": 4252.12, "total_tokens": 19582160} {"current_steps": 29985, "total_steps": 38160, "loss": 0.502, "lr": 0.0001334385127674152, "epoch": 15.715408805031446, "percentage": 78.58, "elapsed_time": "1:16:46", "remaining_time": "0:20:55", "throughput": 4252.14, "total_tokens": 19585392} {"current_steps": 29990, "total_steps": 38160, "loss": 0.5646, "lr": 0.00013328302286146515, "epoch": 15.718029350104821, "percentage": 78.59, "elapsed_time": "1:16:46", "remaining_time": "0:20:55", "throughput": 4252.2, "total_tokens": 19588976} {"current_steps": 29995, "total_steps": 38160, "loss": 0.4608, "lr": 0.00013312760966852283, "epoch": 15.720649895178196, "percentage": 78.6, "elapsed_time": "1:16:47", "remaining_time": "0:20:54", "throughput": 4252.25, "total_tokens": 19592496} {"current_steps": 30000, "total_steps": 38160, "loss": 0.5499, "lr": 0.00013297227322109912, "epoch": 15.723270440251572, "percentage": 78.62, "elapsed_time": "1:16:48", "remaining_time": "0:20:53", "throughput": 4252.3, "total_tokens": 19595888} {"current_steps": 30005, "total_steps": 38160, "loss": 0.3561, "lr": 0.00013281701355168852, "epoch": 15.725890985324948, "percentage": 78.63, "elapsed_time": "1:16:49", "remaining_time": "0:20:52", "throughput": 4252.45, "total_tokens": 19600272} {"current_steps": 30010, "total_steps": 38160, "loss": 0.3745, "lr": 0.00013266183069276982, "epoch": 15.728511530398324, "percentage": 78.64, "elapsed_time": "1:16:49", "remaining_time": "0:20:51", "throughput": 4252.55, "total_tokens": 19604272} {"current_steps": 30015, "total_steps": 38160, "loss": 0.4434, "lr": 0.00013250672467680514, "epoch": 15.731132075471699, "percentage": 78.66, "elapsed_time": "1:16:50", "remaining_time": "0:20:51", "throughput": 4252.65, "total_tokens": 19608176} {"current_steps": 30020, "total_steps": 38160, "loss": 0.3698, "lr": 0.00013235169553624127, "epoch": 15.733752620545074, "percentage": 78.67, "elapsed_time": "1:16:51", "remaining_time": "0:20:50", "throughput": 4252.72, "total_tokens": 19611728} {"current_steps": 30025, "total_steps": 38160, "loss": 0.3517, "lr": 0.00013219674330350816, "epoch": 15.73637316561845, "percentage": 78.68, "elapsed_time": "1:16:52", "remaining_time": "0:20:49", "throughput": 4252.74, "total_tokens": 19614896} {"current_steps": 30030, "total_steps": 38160, "loss": 0.4442, "lr": 0.00013204186801102024, "epoch": 15.738993710691824, "percentage": 78.69, "elapsed_time": "1:16:53", "remaining_time": "0:20:48", "throughput": 4252.86, "total_tokens": 19619024} {"current_steps": 30035, "total_steps": 38160, "loss": 0.4936, "lr": 0.0001318870696911758, "epoch": 15.7416142557652, "percentage": 78.71, "elapsed_time": "1:16:53", "remaining_time": "0:20:48", "throughput": 4252.91, "total_tokens": 19622448} {"current_steps": 30040, "total_steps": 38160, "loss": 0.4844, "lr": 0.00013173234837635656, "epoch": 15.744234800838575, "percentage": 78.72, "elapsed_time": "1:16:54", "remaining_time": "0:20:47", "throughput": 4252.98, "total_tokens": 19626096} {"current_steps": 30045, "total_steps": 38160, "loss": 0.4055, "lr": 0.00013157770409892878, "epoch": 15.74685534591195, "percentage": 78.73, "elapsed_time": "1:16:55", "remaining_time": "0:20:46", "throughput": 4253.0, "total_tokens": 19629168} {"current_steps": 30050, "total_steps": 38160, "loss": 0.3401, "lr": 0.00013142313689124197, "epoch": 15.749475890985325, "percentage": 78.75, "elapsed_time": "1:16:56", "remaining_time": "0:20:45", "throughput": 4253.03, "total_tokens": 19632464} {"current_steps": 30055, "total_steps": 38160, "loss": 0.5991, "lr": 0.00013126864678562994, "epoch": 15.7520964360587, "percentage": 78.76, "elapsed_time": "1:16:56", "remaining_time": "0:20:45", "throughput": 4253.09, "total_tokens": 19636016} {"current_steps": 30060, "total_steps": 38160, "loss": 0.4501, "lr": 0.00013111423381441034, "epoch": 15.754716981132075, "percentage": 78.77, "elapsed_time": "1:16:57", "remaining_time": "0:20:44", "throughput": 4253.11, "total_tokens": 19639184} {"current_steps": 30065, "total_steps": 38160, "loss": 0.3918, "lr": 0.00013095989800988468, "epoch": 15.75733752620545, "percentage": 78.79, "elapsed_time": "1:16:58", "remaining_time": "0:20:43", "throughput": 4253.06, "total_tokens": 19641648} {"current_steps": 30070, "total_steps": 38160, "loss": 0.4776, "lr": 0.000130805639404338, "epoch": 15.759958071278826, "percentage": 78.8, "elapsed_time": "1:16:58", "remaining_time": "0:20:42", "throughput": 4253.08, "total_tokens": 19644816} {"current_steps": 30075, "total_steps": 38160, "loss": 0.4493, "lr": 0.0001306514580300397, "epoch": 15.7625786163522, "percentage": 78.81, "elapsed_time": "1:16:59", "remaining_time": "0:20:41", "throughput": 4253.06, "total_tokens": 19647504} {"current_steps": 30080, "total_steps": 38160, "loss": 0.3845, "lr": 0.00013049735391924244, "epoch": 15.765199161425576, "percentage": 78.83, "elapsed_time": "1:17:00", "remaining_time": "0:20:41", "throughput": 4253.06, "total_tokens": 19650480} {"current_steps": 30085, "total_steps": 38160, "loss": 0.4496, "lr": 0.00013034332710418328, "epoch": 15.767819706498951, "percentage": 78.84, "elapsed_time": "1:17:01", "remaining_time": "0:20:40", "throughput": 4253.09, "total_tokens": 19653712} {"current_steps": 30090, "total_steps": 38160, "loss": 0.4409, "lr": 0.00013018937761708298, "epoch": 15.770440251572326, "percentage": 78.85, "elapsed_time": "1:17:01", "remaining_time": "0:20:39", "throughput": 4253.04, "total_tokens": 19656144} {"current_steps": 30095, "total_steps": 38160, "loss": 0.5713, "lr": 0.0001300355054901457, "epoch": 15.773060796645701, "percentage": 78.87, "elapsed_time": "1:17:02", "remaining_time": "0:20:38", "throughput": 4252.99, "total_tokens": 19658640} {"current_steps": 30100, "total_steps": 38160, "loss": 0.5243, "lr": 0.0001298817107555599, "epoch": 15.775681341719078, "percentage": 78.88, "elapsed_time": "1:17:03", "remaining_time": "0:20:37", "throughput": 4253.03, "total_tokens": 19661872} {"current_steps": 30105, "total_steps": 38160, "loss": 0.4038, "lr": 0.0001297279934454978, "epoch": 15.778301886792454, "percentage": 78.89, "elapsed_time": "1:17:03", "remaining_time": "0:20:37", "throughput": 4253.06, "total_tokens": 19665136} {"current_steps": 30110, "total_steps": 38160, "loss": 0.4387, "lr": 0.000129574353592115, "epoch": 15.780922431865829, "percentage": 78.9, "elapsed_time": "1:17:04", "remaining_time": "0:20:36", "throughput": 4253.06, "total_tokens": 19668112} {"current_steps": 30115, "total_steps": 38160, "loss": 0.3652, "lr": 0.00012942079122755162, "epoch": 15.783542976939204, "percentage": 78.92, "elapsed_time": "1:17:05", "remaining_time": "0:20:35", "throughput": 4253.1, "total_tokens": 19671312} {"current_steps": 30120, "total_steps": 38160, "loss": 0.4187, "lr": 0.00012926730638393075, "epoch": 15.786163522012579, "percentage": 78.93, "elapsed_time": "1:17:05", "remaining_time": "0:20:34", "throughput": 4253.08, "total_tokens": 19674064} {"current_steps": 30125, "total_steps": 38160, "loss": 0.3944, "lr": 0.0001291138990933598, "epoch": 15.788784067085954, "percentage": 78.94, "elapsed_time": "1:17:06", "remaining_time": "0:20:33", "throughput": 4253.05, "total_tokens": 19676752} {"current_steps": 30130, "total_steps": 38160, "loss": 0.4309, "lr": 0.00012896056938792994, "epoch": 15.79140461215933, "percentage": 78.96, "elapsed_time": "1:17:07", "remaining_time": "0:20:33", "throughput": 4253.02, "total_tokens": 19679376} {"current_steps": 30135, "total_steps": 38160, "loss": 0.4614, "lr": 0.000128807317299716, "epoch": 15.794025157232705, "percentage": 78.97, "elapsed_time": "1:17:07", "remaining_time": "0:20:32", "throughput": 4252.97, "total_tokens": 19681872} {"current_steps": 30140, "total_steps": 38160, "loss": 0.5544, "lr": 0.00012865414286077637, "epoch": 15.79664570230608, "percentage": 78.98, "elapsed_time": "1:17:08", "remaining_time": "0:20:31", "throughput": 4252.98, "total_tokens": 19684816} {"current_steps": 30145, "total_steps": 38160, "loss": 0.4126, "lr": 0.00012850104610315365, "epoch": 15.799266247379455, "percentage": 79.0, "elapsed_time": "1:17:09", "remaining_time": "0:20:30", "throughput": 4253.23, "total_tokens": 19690224} {"current_steps": 30150, "total_steps": 38160, "loss": 0.4515, "lr": 0.00012834802705887372, "epoch": 15.80188679245283, "percentage": 79.01, "elapsed_time": "1:17:10", "remaining_time": "0:20:30", "throughput": 4253.21, "total_tokens": 19693040} {"current_steps": 30155, "total_steps": 38160, "loss": 0.3173, "lr": 0.00012819508575994643, "epoch": 15.804507337526205, "percentage": 79.02, "elapsed_time": "1:17:10", "remaining_time": "0:20:29", "throughput": 4253.21, "total_tokens": 19695952} {"current_steps": 30160, "total_steps": 38160, "loss": 0.3793, "lr": 0.0001280422222383656, "epoch": 15.80712788259958, "percentage": 79.04, "elapsed_time": "1:17:11", "remaining_time": "0:20:28", "throughput": 4253.24, "total_tokens": 19699216} {"current_steps": 30165, "total_steps": 38160, "loss": 0.4826, "lr": 0.00012788943652610818, "epoch": 15.809748427672956, "percentage": 79.05, "elapsed_time": "1:17:12", "remaining_time": "0:20:27", "throughput": 4253.31, "total_tokens": 19702832} {"current_steps": 30170, "total_steps": 38160, "loss": 0.4683, "lr": 0.0001277367286551356, "epoch": 15.81236897274633, "percentage": 79.06, "elapsed_time": "1:17:13", "remaining_time": "0:20:26", "throughput": 4253.29, "total_tokens": 19705552} {"current_steps": 30175, "total_steps": 38160, "loss": 0.4527, "lr": 0.00012758409865739213, "epoch": 15.814989517819706, "percentage": 79.07, "elapsed_time": "1:17:13", "remaining_time": "0:20:26", "throughput": 4253.36, "total_tokens": 19709104} {"current_steps": 30180, "total_steps": 38160, "loss": 0.3915, "lr": 0.00012743154656480655, "epoch": 15.817610062893081, "percentage": 79.09, "elapsed_time": "1:17:14", "remaining_time": "0:20:25", "throughput": 4253.51, "total_tokens": 19713424} {"current_steps": 30185, "total_steps": 38160, "loss": 0.5219, "lr": 0.00012727907240929094, "epoch": 15.820230607966456, "percentage": 79.1, "elapsed_time": "1:17:15", "remaining_time": "0:20:24", "throughput": 4253.58, "total_tokens": 19716976} {"current_steps": 30190, "total_steps": 38160, "loss": 0.4243, "lr": 0.00012712667622274127, "epoch": 15.822851153039831, "percentage": 79.11, "elapsed_time": "1:17:16", "remaining_time": "0:20:23", "throughput": 4253.6, "total_tokens": 19720048} {"current_steps": 30195, "total_steps": 38160, "loss": 0.4477, "lr": 0.000126974358037037, "epoch": 15.825471698113208, "percentage": 79.13, "elapsed_time": "1:17:16", "remaining_time": "0:20:23", "throughput": 4253.57, "total_tokens": 19722704} {"current_steps": 30200, "total_steps": 38160, "loss": 0.4198, "lr": 0.00012682211788404114, "epoch": 15.828092243186584, "percentage": 79.14, "elapsed_time": "1:17:17", "remaining_time": "0:20:22", "throughput": 4253.6, "total_tokens": 19725872} {"current_steps": 30205, "total_steps": 38160, "loss": 0.5915, "lr": 0.0001266699557956008, "epoch": 15.830712788259959, "percentage": 79.15, "elapsed_time": "1:17:18", "remaining_time": "0:20:21", "throughput": 4253.56, "total_tokens": 19728336} {"current_steps": 30210, "total_steps": 38160, "loss": 0.3167, "lr": 0.00012651787180354657, "epoch": 15.833333333333334, "percentage": 79.17, "elapsed_time": "1:17:18", "remaining_time": "0:20:20", "throughput": 4253.66, "total_tokens": 19732304} {"current_steps": 30215, "total_steps": 38160, "loss": 0.3588, "lr": 0.00012636586593969262, "epoch": 15.835953878406709, "percentage": 79.18, "elapsed_time": "1:17:19", "remaining_time": "0:20:20", "throughput": 4253.72, "total_tokens": 19735952} {"current_steps": 30220, "total_steps": 38160, "loss": 0.4124, "lr": 0.000126213938235837, "epoch": 15.838574423480084, "percentage": 79.19, "elapsed_time": "1:17:20", "remaining_time": "0:20:19", "throughput": 4253.81, "total_tokens": 19739792} {"current_steps": 30225, "total_steps": 38160, "loss": 0.3513, "lr": 0.0001260620887237611, "epoch": 15.84119496855346, "percentage": 79.21, "elapsed_time": "1:17:21", "remaining_time": "0:20:18", "throughput": 4253.8, "total_tokens": 19742640} {"current_steps": 30230, "total_steps": 38160, "loss": 0.489, "lr": 0.00012591031743523006, "epoch": 15.843815513626835, "percentage": 79.22, "elapsed_time": "1:17:21", "remaining_time": "0:20:17", "throughput": 4253.76, "total_tokens": 19745200} {"current_steps": 30235, "total_steps": 38160, "loss": 0.3807, "lr": 0.00012575862440199277, "epoch": 15.84643605870021, "percentage": 79.23, "elapsed_time": "1:17:22", "remaining_time": "0:20:16", "throughput": 4253.75, "total_tokens": 19748080} {"current_steps": 30240, "total_steps": 38160, "loss": 0.3993, "lr": 0.00012560700965578165, "epoch": 15.849056603773585, "percentage": 79.25, "elapsed_time": "1:17:23", "remaining_time": "0:20:16", "throughput": 4253.75, "total_tokens": 19750960} {"current_steps": 30245, "total_steps": 38160, "loss": 0.3764, "lr": 0.0001254554732283129, "epoch": 15.85167714884696, "percentage": 79.26, "elapsed_time": "1:17:24", "remaining_time": "0:20:15", "throughput": 4253.9, "total_tokens": 19755408} {"current_steps": 30250, "total_steps": 38160, "loss": 0.4874, "lr": 0.0001253040151512862, "epoch": 15.854297693920335, "percentage": 79.27, "elapsed_time": "1:17:24", "remaining_time": "0:20:14", "throughput": 4253.93, "total_tokens": 19758608} {"current_steps": 30255, "total_steps": 38160, "loss": 0.4399, "lr": 0.0001251526354563846, "epoch": 15.85691823899371, "percentage": 79.28, "elapsed_time": "1:17:25", "remaining_time": "0:20:13", "throughput": 4253.97, "total_tokens": 19762064} {"current_steps": 30260, "total_steps": 38160, "loss": 0.4557, "lr": 0.0001250013341752752, "epoch": 15.859538784067086, "percentage": 79.3, "elapsed_time": "1:17:26", "remaining_time": "0:20:13", "throughput": 4253.98, "total_tokens": 19765072} {"current_steps": 30265, "total_steps": 38160, "loss": 0.3975, "lr": 0.00012485011133960843, "epoch": 15.86215932914046, "percentage": 79.31, "elapsed_time": "1:17:27", "remaining_time": "0:20:12", "throughput": 4254.04, "total_tokens": 19768624} {"current_steps": 30270, "total_steps": 38160, "loss": 0.4004, "lr": 0.00012469896698101863, "epoch": 15.864779874213836, "percentage": 79.32, "elapsed_time": "1:17:27", "remaining_time": "0:20:11", "throughput": 4254.09, "total_tokens": 19771984} {"current_steps": 30275, "total_steps": 38160, "loss": 0.5666, "lr": 0.00012454790113112325, "epoch": 15.867400419287211, "percentage": 79.34, "elapsed_time": "1:17:28", "remaining_time": "0:20:10", "throughput": 4254.27, "total_tokens": 19776720} {"current_steps": 30280, "total_steps": 38160, "loss": 0.5333, "lr": 0.00012439691382152345, "epoch": 15.870020964360586, "percentage": 79.35, "elapsed_time": "1:17:29", "remaining_time": "0:20:09", "throughput": 4254.3, "total_tokens": 19779984} {"current_steps": 30285, "total_steps": 38160, "loss": 0.4412, "lr": 0.00012424600508380412, "epoch": 15.872641509433961, "percentage": 79.36, "elapsed_time": "1:17:30", "remaining_time": "0:20:09", "throughput": 4254.27, "total_tokens": 19782544} {"current_steps": 30290, "total_steps": 38160, "loss": 0.4035, "lr": 0.00012409517494953377, "epoch": 15.875262054507338, "percentage": 79.38, "elapsed_time": "1:17:30", "remaining_time": "0:20:08", "throughput": 4254.27, "total_tokens": 19785456} {"current_steps": 30295, "total_steps": 38160, "loss": 0.448, "lr": 0.00012394442345026418, "epoch": 15.877882599580714, "percentage": 79.39, "elapsed_time": "1:17:31", "remaining_time": "0:20:07", "throughput": 4254.29, "total_tokens": 19788624} {"current_steps": 30300, "total_steps": 38160, "loss": 0.3957, "lr": 0.00012379375061753118, "epoch": 15.880503144654089, "percentage": 79.4, "elapsed_time": "1:17:32", "remaining_time": "0:20:06", "throughput": 4254.24, "total_tokens": 19791088} {"current_steps": 30305, "total_steps": 38160, "loss": 0.3259, "lr": 0.00012364315648285353, "epoch": 15.883123689727464, "percentage": 79.42, "elapsed_time": "1:17:32", "remaining_time": "0:20:06", "throughput": 4254.29, "total_tokens": 19794576} {"current_steps": 30310, "total_steps": 38160, "loss": 0.3468, "lr": 0.00012349264107773363, "epoch": 15.885744234800839, "percentage": 79.43, "elapsed_time": "1:17:33", "remaining_time": "0:20:05", "throughput": 4254.36, "total_tokens": 19798160} {"current_steps": 30315, "total_steps": 38160, "loss": 0.3858, "lr": 0.00012334220443365785, "epoch": 15.888364779874214, "percentage": 79.44, "elapsed_time": "1:17:34", "remaining_time": "0:20:04", "throughput": 4254.35, "total_tokens": 19801040} {"current_steps": 30320, "total_steps": 38160, "loss": 0.3763, "lr": 0.00012319184658209575, "epoch": 15.89098532494759, "percentage": 79.45, "elapsed_time": "1:17:34", "remaining_time": "0:20:03", "throughput": 4254.36, "total_tokens": 19804016} {"current_steps": 30325, "total_steps": 38160, "loss": 0.4152, "lr": 0.00012304156755450063, "epoch": 15.893605870020965, "percentage": 79.47, "elapsed_time": "1:17:35", "remaining_time": "0:20:02", "throughput": 4254.4, "total_tokens": 19807504} {"current_steps": 30330, "total_steps": 38160, "loss": 0.5289, "lr": 0.00012289136738230906, "epoch": 15.89622641509434, "percentage": 79.48, "elapsed_time": "1:17:36", "remaining_time": "0:20:02", "throughput": 4254.33, "total_tokens": 19809712} {"current_steps": 30335, "total_steps": 38160, "loss": 0.3882, "lr": 0.00012274124609694092, "epoch": 15.898846960167715, "percentage": 79.49, "elapsed_time": "1:17:37", "remaining_time": "0:20:01", "throughput": 4254.31, "total_tokens": 19812496} {"current_steps": 30340, "total_steps": 38160, "loss": 0.4432, "lr": 0.00012259120372980014, "epoch": 15.90146750524109, "percentage": 79.51, "elapsed_time": "1:17:37", "remaining_time": "0:20:00", "throughput": 4254.31, "total_tokens": 19815568} {"current_steps": 30345, "total_steps": 38160, "loss": 0.3441, "lr": 0.0001224412403122739, "epoch": 15.904088050314465, "percentage": 79.52, "elapsed_time": "1:17:38", "remaining_time": "0:19:59", "throughput": 4254.24, "total_tokens": 19817808} {"current_steps": 30350, "total_steps": 38160, "loss": 0.3779, "lr": 0.0001222913558757328, "epoch": 15.90670859538784, "percentage": 79.53, "elapsed_time": "1:17:39", "remaining_time": "0:19:58", "throughput": 4254.21, "total_tokens": 19820432} {"current_steps": 30355, "total_steps": 38160, "loss": 0.527, "lr": 0.00012214155045153085, "epoch": 15.909329140461216, "percentage": 79.55, "elapsed_time": "1:17:39", "remaining_time": "0:19:58", "throughput": 4254.24, "total_tokens": 19823696} {"current_steps": 30360, "total_steps": 38160, "loss": 0.3824, "lr": 0.00012199182407100584, "epoch": 15.91194968553459, "percentage": 79.56, "elapsed_time": "1:17:40", "remaining_time": "0:19:57", "throughput": 4254.32, "total_tokens": 19827408} {"current_steps": 30365, "total_steps": 38160, "loss": 0.3972, "lr": 0.00012184217676547855, "epoch": 15.914570230607966, "percentage": 79.57, "elapsed_time": "1:17:41", "remaining_time": "0:19:56", "throughput": 4254.32, "total_tokens": 19830384} {"current_steps": 30370, "total_steps": 38160, "loss": 0.4529, "lr": 0.00012169260856625358, "epoch": 15.917190775681341, "percentage": 79.59, "elapsed_time": "1:17:41", "remaining_time": "0:19:55", "throughput": 4254.34, "total_tokens": 19833520} {"current_steps": 30375, "total_steps": 38160, "loss": 0.4195, "lr": 0.000121543119504619, "epoch": 15.919811320754716, "percentage": 79.6, "elapsed_time": "1:17:42", "remaining_time": "0:19:55", "throughput": 4254.43, "total_tokens": 19837360} {"current_steps": 30380, "total_steps": 38160, "loss": 0.4524, "lr": 0.00012139370961184626, "epoch": 15.922431865828091, "percentage": 79.61, "elapsed_time": "1:17:43", "remaining_time": "0:19:54", "throughput": 4254.53, "total_tokens": 19841232} {"current_steps": 30385, "total_steps": 38160, "loss": 0.4941, "lr": 0.00012124437891918994, "epoch": 15.925052410901468, "percentage": 79.63, "elapsed_time": "1:17:44", "remaining_time": "0:19:53", "throughput": 4254.48, "total_tokens": 19843728} {"current_steps": 30390, "total_steps": 38160, "loss": 0.4516, "lr": 0.0001210951274578887, "epoch": 15.927672955974844, "percentage": 79.64, "elapsed_time": "1:17:44", "remaining_time": "0:19:52", "throughput": 4254.47, "total_tokens": 19846512} {"current_steps": 30395, "total_steps": 38160, "loss": 0.4062, "lr": 0.00012094595525916379, "epoch": 15.930293501048219, "percentage": 79.65, "elapsed_time": "1:17:45", "remaining_time": "0:19:51", "throughput": 4254.46, "total_tokens": 19849360} {"current_steps": 30400, "total_steps": 38160, "loss": 0.4661, "lr": 0.0001207968623542206, "epoch": 15.932914046121594, "percentage": 79.66, "elapsed_time": "1:17:46", "remaining_time": "0:19:51", "throughput": 4254.51, "total_tokens": 19852720} {"current_steps": 30405, "total_steps": 38160, "loss": 0.4615, "lr": 0.00012064784877424778, "epoch": 15.935534591194969, "percentage": 79.68, "elapsed_time": "1:17:47", "remaining_time": "0:19:50", "throughput": 4254.6, "total_tokens": 19856592} {"current_steps": 30410, "total_steps": 38160, "loss": 0.4508, "lr": 0.00012049891455041695, "epoch": 15.938155136268344, "percentage": 79.69, "elapsed_time": "1:17:47", "remaining_time": "0:19:49", "throughput": 4254.62, "total_tokens": 19859728} {"current_steps": 30415, "total_steps": 38160, "loss": 0.5123, "lr": 0.00012035005971388379, "epoch": 15.94077568134172, "percentage": 79.7, "elapsed_time": "1:17:48", "remaining_time": "0:19:48", "throughput": 4254.66, "total_tokens": 19863120} {"current_steps": 30420, "total_steps": 38160, "loss": 0.4417, "lr": 0.0001202012842957867, "epoch": 15.943396226415095, "percentage": 79.72, "elapsed_time": "1:17:49", "remaining_time": "0:19:48", "throughput": 4254.68, "total_tokens": 19866256} {"current_steps": 30425, "total_steps": 38160, "loss": 0.4893, "lr": 0.00012005258832724797, "epoch": 15.94601677148847, "percentage": 79.73, "elapsed_time": "1:17:49", "remaining_time": "0:19:47", "throughput": 4254.66, "total_tokens": 19869008} {"current_steps": 30430, "total_steps": 38160, "loss": 0.4502, "lr": 0.00011990397183937324, "epoch": 15.948637316561845, "percentage": 79.74, "elapsed_time": "1:17:50", "remaining_time": "0:19:46", "throughput": 4254.62, "total_tokens": 19871600} {"current_steps": 30435, "total_steps": 38160, "loss": 0.4739, "lr": 0.00011975543486325108, "epoch": 15.95125786163522, "percentage": 79.76, "elapsed_time": "1:17:51", "remaining_time": "0:19:45", "throughput": 4254.58, "total_tokens": 19874224} {"current_steps": 30440, "total_steps": 38160, "loss": 0.3962, "lr": 0.00011960697742995392, "epoch": 15.953878406708595, "percentage": 79.77, "elapsed_time": "1:17:51", "remaining_time": "0:19:44", "throughput": 4254.54, "total_tokens": 19876848} {"current_steps": 30445, "total_steps": 38160, "loss": 0.3827, "lr": 0.00011945859957053746, "epoch": 15.95649895178197, "percentage": 79.78, "elapsed_time": "1:17:52", "remaining_time": "0:19:44", "throughput": 4254.6, "total_tokens": 19880432} {"current_steps": 30450, "total_steps": 38160, "loss": 0.3652, "lr": 0.00011931030131604036, "epoch": 15.959119496855346, "percentage": 79.8, "elapsed_time": "1:17:53", "remaining_time": "0:19:43", "throughput": 4254.59, "total_tokens": 19883184} {"current_steps": 30455, "total_steps": 38160, "loss": 0.316, "lr": 0.00011916208269748507, "epoch": 15.96174004192872, "percentage": 79.81, "elapsed_time": "1:17:54", "remaining_time": "0:19:42", "throughput": 4254.62, "total_tokens": 19886416} {"current_steps": 30460, "total_steps": 38160, "loss": 0.4162, "lr": 0.00011901394374587743, "epoch": 15.964360587002096, "percentage": 79.82, "elapsed_time": "1:17:54", "remaining_time": "0:19:41", "throughput": 4254.66, "total_tokens": 19889776} {"current_steps": 30465, "total_steps": 38160, "loss": 0.4118, "lr": 0.00011886588449220609, "epoch": 15.966981132075471, "percentage": 79.83, "elapsed_time": "1:17:55", "remaining_time": "0:19:40", "throughput": 4254.74, "total_tokens": 19893488} {"current_steps": 30470, "total_steps": 38160, "loss": 0.3591, "lr": 0.00011871790496744351, "epoch": 15.969601677148846, "percentage": 79.85, "elapsed_time": "1:17:56", "remaining_time": "0:19:40", "throughput": 4254.79, "total_tokens": 19896848} {"current_steps": 30475, "total_steps": 38160, "loss": 0.3762, "lr": 0.00011857000520254546, "epoch": 15.972222222222221, "percentage": 79.86, "elapsed_time": "1:17:57", "remaining_time": "0:19:39", "throughput": 4254.98, "total_tokens": 19901808} {"current_steps": 30480, "total_steps": 38160, "loss": 0.4045, "lr": 0.0001184221852284506, "epoch": 15.974842767295598, "percentage": 79.87, "elapsed_time": "1:17:58", "remaining_time": "0:19:38", "throughput": 4255.01, "total_tokens": 19905040} {"current_steps": 30485, "total_steps": 38160, "loss": 0.5211, "lr": 0.00011827444507608143, "epoch": 15.977463312368974, "percentage": 79.89, "elapsed_time": "1:17:58", "remaining_time": "0:19:37", "throughput": 4255.05, "total_tokens": 19908368} {"current_steps": 30490, "total_steps": 38160, "loss": 0.4026, "lr": 0.00011812678477634325, "epoch": 15.980083857442349, "percentage": 79.9, "elapsed_time": "1:17:59", "remaining_time": "0:19:37", "throughput": 4255.07, "total_tokens": 19911440} {"current_steps": 30495, "total_steps": 38160, "loss": 0.3329, "lr": 0.0001179792043601251, "epoch": 15.982704402515724, "percentage": 79.91, "elapsed_time": "1:18:00", "remaining_time": "0:19:36", "throughput": 4255.15, "total_tokens": 19915184} {"current_steps": 30500, "total_steps": 38160, "loss": 0.3127, "lr": 0.00011783170385829905, "epoch": 15.985324947589099, "percentage": 79.93, "elapsed_time": "1:18:01", "remaining_time": "0:19:35", "throughput": 4255.23, "total_tokens": 19918896} {"current_steps": 30505, "total_steps": 38160, "loss": 0.4243, "lr": 0.00011768428330172071, "epoch": 15.987945492662474, "percentage": 79.94, "elapsed_time": "1:18:01", "remaining_time": "0:19:34", "throughput": 4255.26, "total_tokens": 19922128} {"current_steps": 30510, "total_steps": 38160, "loss": 0.4916, "lr": 0.00011753694272122856, "epoch": 15.99056603773585, "percentage": 79.95, "elapsed_time": "1:18:02", "remaining_time": "0:19:34", "throughput": 4255.21, "total_tokens": 19924688} {"current_steps": 30515, "total_steps": 38160, "loss": 0.3634, "lr": 0.00011738968214764456, "epoch": 15.993186582809225, "percentage": 79.97, "elapsed_time": "1:18:03", "remaining_time": "0:19:33", "throughput": 4255.32, "total_tokens": 19928816} {"current_steps": 30520, "total_steps": 38160, "loss": 0.4268, "lr": 0.00011724250161177391, "epoch": 15.9958071278826, "percentage": 79.98, "elapsed_time": "1:18:03", "remaining_time": "0:19:32", "throughput": 4255.33, "total_tokens": 19931792} {"current_steps": 30525, "total_steps": 38160, "loss": 0.3565, "lr": 0.00011709540114440525, "epoch": 15.998427672955975, "percentage": 79.99, "elapsed_time": "1:18:04", "remaining_time": "0:19:31", "throughput": 4255.28, "total_tokens": 19934288} {"current_steps": 30528, "total_steps": 38160, "eval_loss": 0.4923257529735565, "epoch": 16.0, "percentage": 80.0, "elapsed_time": "1:18:18", "remaining_time": "0:19:34", "throughput": 4242.72, "total_tokens": 19936088} {"current_steps": 30530, "total_steps": 38160, "loss": 0.415, "lr": 0.00011694838077631043, "epoch": 16.00104821802935, "percentage": 80.01, "elapsed_time": "1:18:20", "remaining_time": "0:19:34", "throughput": 4241.1, "total_tokens": 19936984} {"current_steps": 30535, "total_steps": 38160, "loss": 0.4216, "lr": 0.0001168014405382441, "epoch": 16.003668763102727, "percentage": 80.02, "elapsed_time": "1:18:21", "remaining_time": "0:19:34", "throughput": 4241.08, "total_tokens": 19939704} {"current_steps": 30540, "total_steps": 38160, "loss": 0.4092, "lr": 0.0001166545804609448, "epoch": 16.0062893081761, "percentage": 80.03, "elapsed_time": "1:18:22", "remaining_time": "0:19:33", "throughput": 4241.2, "total_tokens": 19943928} {"current_steps": 30545, "total_steps": 38160, "loss": 0.5021, "lr": 0.00011650780057513367, "epoch": 16.008909853249477, "percentage": 80.04, "elapsed_time": "1:18:23", "remaining_time": "0:19:32", "throughput": 4241.32, "total_tokens": 19948088} {"current_steps": 30550, "total_steps": 38160, "loss": 0.514, "lr": 0.00011636110091151553, "epoch": 16.01153039832285, "percentage": 80.06, "elapsed_time": "1:18:23", "remaining_time": "0:19:31", "throughput": 4241.31, "total_tokens": 19950968} {"current_steps": 30555, "total_steps": 38160, "loss": 0.3633, "lr": 0.00011621448150077834, "epoch": 16.014150943396228, "percentage": 80.07, "elapsed_time": "1:18:24", "remaining_time": "0:19:30", "throughput": 4241.23, "total_tokens": 19953048} {"current_steps": 30560, "total_steps": 38160, "loss": 0.3872, "lr": 0.0001160679423735933, "epoch": 16.0167714884696, "percentage": 80.08, "elapsed_time": "1:18:25", "remaining_time": "0:19:30", "throughput": 4241.31, "total_tokens": 19956888} {"current_steps": 30565, "total_steps": 38160, "loss": 0.4271, "lr": 0.00011592148356061455, "epoch": 16.019392033542978, "percentage": 80.1, "elapsed_time": "1:18:26", "remaining_time": "0:19:29", "throughput": 4241.34, "total_tokens": 19960152} {"current_steps": 30570, "total_steps": 38160, "loss": 0.2645, "lr": 0.00011577510509247951, "epoch": 16.02201257861635, "percentage": 80.11, "elapsed_time": "1:18:26", "remaining_time": "0:19:28", "throughput": 4241.29, "total_tokens": 19962584} {"current_steps": 30575, "total_steps": 38160, "loss": 0.4472, "lr": 0.00011562880699980904, "epoch": 16.02463312368973, "percentage": 80.12, "elapsed_time": "1:18:27", "remaining_time": "0:19:27", "throughput": 4241.3, "total_tokens": 19965560} {"current_steps": 30580, "total_steps": 38160, "loss": 0.3832, "lr": 0.00011548258931320704, "epoch": 16.0272536687631, "percentage": 80.14, "elapsed_time": "1:18:28", "remaining_time": "0:19:27", "throughput": 4241.29, "total_tokens": 19968408} {"current_steps": 30585, "total_steps": 38160, "loss": 0.4308, "lr": 0.00011533645206326049, "epoch": 16.02987421383648, "percentage": 80.15, "elapsed_time": "1:18:28", "remaining_time": "0:19:26", "throughput": 4241.39, "total_tokens": 19972504} {"current_steps": 30590, "total_steps": 38160, "loss": 0.4075, "lr": 0.00011519039528053999, "epoch": 16.032494758909852, "percentage": 80.16, "elapsed_time": "1:18:29", "remaining_time": "0:19:25", "throughput": 4241.36, "total_tokens": 19975224} {"current_steps": 30595, "total_steps": 38160, "loss": 0.5058, "lr": 0.00011504441899559837, "epoch": 16.03511530398323, "percentage": 80.18, "elapsed_time": "1:18:30", "remaining_time": "0:19:24", "throughput": 4241.45, "total_tokens": 19979096} {"current_steps": 30600, "total_steps": 38160, "loss": 0.4247, "lr": 0.00011489852323897249, "epoch": 16.037735849056602, "percentage": 80.19, "elapsed_time": "1:18:31", "remaining_time": "0:19:23", "throughput": 4241.46, "total_tokens": 19982232} {"current_steps": 30605, "total_steps": 38160, "loss": 0.6223, "lr": 0.0001147527080411821, "epoch": 16.04035639412998, "percentage": 80.2, "elapsed_time": "1:18:31", "remaining_time": "0:19:23", "throughput": 4241.52, "total_tokens": 19985816} {"current_steps": 30610, "total_steps": 38160, "loss": 0.4858, "lr": 0.00011460697343273002, "epoch": 16.042976939203353, "percentage": 80.21, "elapsed_time": "1:18:32", "remaining_time": "0:19:22", "throughput": 4241.45, "total_tokens": 19987960} {"current_steps": 30615, "total_steps": 38160, "loss": 0.4379, "lr": 0.00011446131944410249, "epoch": 16.04559748427673, "percentage": 80.23, "elapsed_time": "1:18:33", "remaining_time": "0:19:21", "throughput": 4241.47, "total_tokens": 19991096} {"current_steps": 30620, "total_steps": 38160, "loss": 0.486, "lr": 0.00011431574610576844, "epoch": 16.048218029350103, "percentage": 80.24, "elapsed_time": "1:18:33", "remaining_time": "0:19:20", "throughput": 4241.43, "total_tokens": 19993656} {"current_steps": 30625, "total_steps": 38160, "loss": 0.5278, "lr": 0.00011417025344818005, "epoch": 16.05083857442348, "percentage": 80.25, "elapsed_time": "1:18:34", "remaining_time": "0:19:20", "throughput": 4241.53, "total_tokens": 19997624} {"current_steps": 30630, "total_steps": 38160, "loss": 0.5246, "lr": 0.00011402484150177289, "epoch": 16.053459119496857, "percentage": 80.27, "elapsed_time": "1:18:35", "remaining_time": "0:19:19", "throughput": 4241.5, "total_tokens": 20000248} {"current_steps": 30635, "total_steps": 38160, "loss": 0.3825, "lr": 0.00011387951029696542, "epoch": 16.05607966457023, "percentage": 80.28, "elapsed_time": "1:18:36", "remaining_time": "0:19:18", "throughput": 4241.51, "total_tokens": 20003352} {"current_steps": 30640, "total_steps": 38160, "loss": 0.3341, "lr": 0.00011373425986415941, "epoch": 16.058700209643607, "percentage": 80.29, "elapsed_time": "1:18:36", "remaining_time": "0:19:17", "throughput": 4241.58, "total_tokens": 20006968} {"current_steps": 30645, "total_steps": 38160, "loss": 0.3459, "lr": 0.00011358909023373953, "epoch": 16.06132075471698, "percentage": 80.31, "elapsed_time": "1:18:37", "remaining_time": "0:19:16", "throughput": 4241.62, "total_tokens": 20010296} {"current_steps": 30650, "total_steps": 38160, "loss": 0.4384, "lr": 0.00011344400143607342, "epoch": 16.063941299790358, "percentage": 80.32, "elapsed_time": "1:18:38", "remaining_time": "0:19:16", "throughput": 4241.71, "total_tokens": 20014136} {"current_steps": 30655, "total_steps": 38160, "loss": 0.3388, "lr": 0.00011329899350151212, "epoch": 16.06656184486373, "percentage": 80.33, "elapsed_time": "1:18:39", "remaining_time": "0:19:15", "throughput": 4241.79, "total_tokens": 20017848} {"current_steps": 30660, "total_steps": 38160, "loss": 0.4232, "lr": 0.00011315406646038973, "epoch": 16.069182389937108, "percentage": 80.35, "elapsed_time": "1:18:39", "remaining_time": "0:19:14", "throughput": 4241.8, "total_tokens": 20020984} {"current_steps": 30665, "total_steps": 38160, "loss": 0.5275, "lr": 0.0001130092203430232, "epoch": 16.07180293501048, "percentage": 80.36, "elapsed_time": "1:18:40", "remaining_time": "0:19:13", "throughput": 4241.89, "total_tokens": 20024792} {"current_steps": 30670, "total_steps": 38160, "loss": 0.4638, "lr": 0.00011286445517971289, "epoch": 16.07442348008386, "percentage": 80.37, "elapsed_time": "1:18:41", "remaining_time": "0:19:13", "throughput": 4242.02, "total_tokens": 20029208} {"current_steps": 30675, "total_steps": 38160, "loss": 0.4941, "lr": 0.00011271977100074188, "epoch": 16.07704402515723, "percentage": 80.39, "elapsed_time": "1:18:42", "remaining_time": "0:19:12", "throughput": 4242.02, "total_tokens": 20032120} {"current_steps": 30680, "total_steps": 38160, "loss": 0.332, "lr": 0.00011257516783637633, "epoch": 16.07966457023061, "percentage": 80.4, "elapsed_time": "1:18:43", "remaining_time": "0:19:11", "throughput": 4242.09, "total_tokens": 20035896} {"current_steps": 30685, "total_steps": 38160, "loss": 0.381, "lr": 0.00011243064571686573, "epoch": 16.082285115303982, "percentage": 80.41, "elapsed_time": "1:18:43", "remaining_time": "0:19:10", "throughput": 4242.03, "total_tokens": 20038232} {"current_steps": 30690, "total_steps": 38160, "loss": 0.5784, "lr": 0.00011228620467244238, "epoch": 16.08490566037736, "percentage": 80.42, "elapsed_time": "1:18:44", "remaining_time": "0:19:09", "throughput": 4242.02, "total_tokens": 20041016} {"current_steps": 30695, "total_steps": 38160, "loss": 0.3291, "lr": 0.00011214184473332183, "epoch": 16.087526205450732, "percentage": 80.44, "elapsed_time": "1:18:45", "remaining_time": "0:19:09", "throughput": 4242.0, "total_tokens": 20043832} {"current_steps": 30700, "total_steps": 38160, "loss": 0.4055, "lr": 0.0001119975659297025, "epoch": 16.09014675052411, "percentage": 80.45, "elapsed_time": "1:18:45", "remaining_time": "0:19:08", "throughput": 4242.08, "total_tokens": 20047576} {"current_steps": 30705, "total_steps": 38160, "loss": 0.4921, "lr": 0.00011185336829176568, "epoch": 16.092767295597483, "percentage": 80.46, "elapsed_time": "1:18:46", "remaining_time": "0:19:07", "throughput": 4242.16, "total_tokens": 20051288} {"current_steps": 30710, "total_steps": 38160, "loss": 0.3525, "lr": 0.00011170925184967601, "epoch": 16.09538784067086, "percentage": 80.48, "elapsed_time": "1:18:47", "remaining_time": "0:19:06", "throughput": 4242.17, "total_tokens": 20054264} {"current_steps": 30715, "total_steps": 38160, "loss": 0.5081, "lr": 0.00011156521663358094, "epoch": 16.098008385744233, "percentage": 80.49, "elapsed_time": "1:18:48", "remaining_time": "0:19:06", "throughput": 4242.16, "total_tokens": 20057112} {"current_steps": 30720, "total_steps": 38160, "loss": 0.4813, "lr": 0.00011142126267361124, "epoch": 16.10062893081761, "percentage": 80.5, "elapsed_time": "1:18:48", "remaining_time": "0:19:05", "throughput": 4242.12, "total_tokens": 20059608} {"current_steps": 30725, "total_steps": 38160, "loss": 0.3561, "lr": 0.00011127738999988007, "epoch": 16.103249475890987, "percentage": 80.52, "elapsed_time": "1:18:49", "remaining_time": "0:19:04", "throughput": 4242.16, "total_tokens": 20063064} {"current_steps": 30730, "total_steps": 38160, "loss": 0.418, "lr": 0.00011113359864248429, "epoch": 16.10587002096436, "percentage": 80.53, "elapsed_time": "1:18:50", "remaining_time": "0:19:03", "throughput": 4242.23, "total_tokens": 20066616} {"current_steps": 30735, "total_steps": 38160, "loss": 0.3658, "lr": 0.00011098988863150317, "epoch": 16.108490566037737, "percentage": 80.54, "elapsed_time": "1:18:50", "remaining_time": "0:19:02", "throughput": 4242.26, "total_tokens": 20069848} {"current_steps": 30740, "total_steps": 38160, "loss": 0.4763, "lr": 0.0001108462599969992, "epoch": 16.11111111111111, "percentage": 80.56, "elapsed_time": "1:18:51", "remaining_time": "0:19:02", "throughput": 4242.36, "total_tokens": 20073688} {"current_steps": 30745, "total_steps": 38160, "loss": 0.392, "lr": 0.000110702712769018, "epoch": 16.113731656184488, "percentage": 80.57, "elapsed_time": "1:18:52", "remaining_time": "0:19:01", "throughput": 4242.4, "total_tokens": 20077016} {"current_steps": 30750, "total_steps": 38160, "loss": 0.4363, "lr": 0.00011055924697758801, "epoch": 16.11635220125786, "percentage": 80.58, "elapsed_time": "1:18:53", "remaining_time": "0:19:00", "throughput": 4242.45, "total_tokens": 20080408} {"current_steps": 30755, "total_steps": 38160, "loss": 0.3639, "lr": 0.00011041586265272052, "epoch": 16.118972746331238, "percentage": 80.59, "elapsed_time": "1:18:53", "remaining_time": "0:18:59", "throughput": 4242.48, "total_tokens": 20083640} {"current_steps": 30760, "total_steps": 38160, "loss": 0.3944, "lr": 0.00011027255982441003, "epoch": 16.12159329140461, "percentage": 80.61, "elapsed_time": "1:18:54", "remaining_time": "0:18:59", "throughput": 4242.48, "total_tokens": 20086616} {"current_steps": 30765, "total_steps": 38160, "loss": 0.3927, "lr": 0.00011012933852263369, "epoch": 16.12421383647799, "percentage": 80.62, "elapsed_time": "1:18:55", "remaining_time": "0:18:58", "throughput": 4242.49, "total_tokens": 20089592} {"current_steps": 30770, "total_steps": 38160, "loss": 0.3446, "lr": 0.00010998619877735184, "epoch": 16.12683438155136, "percentage": 80.63, "elapsed_time": "1:18:56", "remaining_time": "0:18:57", "throughput": 4242.54, "total_tokens": 20092952} {"current_steps": 30775, "total_steps": 38160, "loss": 0.4131, "lr": 0.0001098431406185078, "epoch": 16.12945492662474, "percentage": 80.65, "elapsed_time": "1:18:56", "remaining_time": "0:18:56", "throughput": 4242.56, "total_tokens": 20096120} {"current_steps": 30780, "total_steps": 38160, "loss": 0.467, "lr": 0.00010970016407602751, "epoch": 16.132075471698112, "percentage": 80.66, "elapsed_time": "1:18:57", "remaining_time": "0:18:55", "throughput": 4242.7, "total_tokens": 20100376} {"current_steps": 30785, "total_steps": 38160, "loss": 0.5038, "lr": 0.00010955726917982023, "epoch": 16.13469601677149, "percentage": 80.67, "elapsed_time": "1:18:58", "remaining_time": "0:18:55", "throughput": 4242.79, "total_tokens": 20104184} {"current_steps": 30790, "total_steps": 38160, "loss": 0.3962, "lr": 0.00010941445595977767, "epoch": 16.137316561844862, "percentage": 80.69, "elapsed_time": "1:18:59", "remaining_time": "0:18:54", "throughput": 4242.8, "total_tokens": 20107224} {"current_steps": 30795, "total_steps": 38160, "loss": 0.436, "lr": 0.00010927172444577494, "epoch": 16.13993710691824, "percentage": 80.7, "elapsed_time": "1:18:59", "remaining_time": "0:18:53", "throughput": 4242.79, "total_tokens": 20110008} {"current_steps": 30800, "total_steps": 38160, "loss": 0.4086, "lr": 0.00010912907466766985, "epoch": 16.142557651991613, "percentage": 80.71, "elapsed_time": "1:19:00", "remaining_time": "0:18:52", "throughput": 4242.85, "total_tokens": 20113560} {"current_steps": 30805, "total_steps": 38160, "loss": 0.5696, "lr": 0.00010898650665530302, "epoch": 16.14517819706499, "percentage": 80.73, "elapsed_time": "1:19:01", "remaining_time": "0:18:52", "throughput": 4242.97, "total_tokens": 20117720} {"current_steps": 30810, "total_steps": 38160, "loss": 0.449, "lr": 0.000108844020438498, "epoch": 16.147798742138363, "percentage": 80.74, "elapsed_time": "1:19:02", "remaining_time": "0:18:51", "throughput": 4243.06, "total_tokens": 20121496} {"current_steps": 30815, "total_steps": 38160, "loss": 0.3677, "lr": 0.00010870161604706152, "epoch": 16.15041928721174, "percentage": 80.75, "elapsed_time": "1:19:02", "remaining_time": "0:18:50", "throughput": 4243.06, "total_tokens": 20124312} {"current_steps": 30820, "total_steps": 38160, "loss": 0.5221, "lr": 0.00010855929351078264, "epoch": 16.153039832285117, "percentage": 80.77, "elapsed_time": "1:19:03", "remaining_time": "0:18:49", "throughput": 4243.1, "total_tokens": 20127608} {"current_steps": 30825, "total_steps": 38160, "loss": 0.4725, "lr": 0.00010841705285943382, "epoch": 16.15566037735849, "percentage": 80.78, "elapsed_time": "1:19:04", "remaining_time": "0:18:48", "throughput": 4243.07, "total_tokens": 20130168} {"current_steps": 30830, "total_steps": 38160, "loss": 0.5515, "lr": 0.0001082748941227702, "epoch": 16.158280922431867, "percentage": 80.79, "elapsed_time": "1:19:04", "remaining_time": "0:18:48", "throughput": 4243.1, "total_tokens": 20133368} {"current_steps": 30835, "total_steps": 38160, "loss": 0.4323, "lr": 0.00010813281733052959, "epoch": 16.16090146750524, "percentage": 80.8, "elapsed_time": "1:19:05", "remaining_time": "0:18:47", "throughput": 4243.12, "total_tokens": 20136504} {"current_steps": 30840, "total_steps": 38160, "loss": 0.3363, "lr": 0.00010799082251243292, "epoch": 16.163522012578618, "percentage": 80.82, "elapsed_time": "1:19:06", "remaining_time": "0:18:46", "throughput": 4243.15, "total_tokens": 20139672} {"current_steps": 30845, "total_steps": 38160, "loss": 0.4943, "lr": 0.00010784890969818407, "epoch": 16.16614255765199, "percentage": 80.83, "elapsed_time": "1:19:07", "remaining_time": "0:18:45", "throughput": 4243.18, "total_tokens": 20142840} {"current_steps": 30850, "total_steps": 38160, "loss": 0.3931, "lr": 0.00010770707891746928, "epoch": 16.168763102725368, "percentage": 80.84, "elapsed_time": "1:19:07", "remaining_time": "0:18:45", "throughput": 4243.17, "total_tokens": 20145688} {"current_steps": 30855, "total_steps": 38160, "loss": 0.4667, "lr": 0.00010756533019995817, "epoch": 16.17138364779874, "percentage": 80.86, "elapsed_time": "1:19:08", "remaining_time": "0:18:44", "throughput": 4243.14, "total_tokens": 20148216} {"current_steps": 30860, "total_steps": 38160, "loss": 0.5211, "lr": 0.0001074236635753027, "epoch": 16.17400419287212, "percentage": 80.87, "elapsed_time": "1:19:09", "remaining_time": "0:18:43", "throughput": 4243.25, "total_tokens": 20152280} {"current_steps": 30865, "total_steps": 38160, "loss": 0.435, "lr": 0.00010728207907313809, "epoch": 16.17662473794549, "percentage": 80.88, "elapsed_time": "1:19:09", "remaining_time": "0:18:42", "throughput": 4243.23, "total_tokens": 20154968} {"current_steps": 30870, "total_steps": 38160, "loss": 0.3953, "lr": 0.0001071405767230822, "epoch": 16.17924528301887, "percentage": 80.9, "elapsed_time": "1:19:10", "remaining_time": "0:18:41", "throughput": 4243.29, "total_tokens": 20158680} {"current_steps": 30875, "total_steps": 38160, "loss": 0.4381, "lr": 0.0001069991565547358, "epoch": 16.181865828092242, "percentage": 80.91, "elapsed_time": "1:19:11", "remaining_time": "0:18:41", "throughput": 4243.28, "total_tokens": 20161528} {"current_steps": 30880, "total_steps": 38160, "loss": 0.3361, "lr": 0.00010685781859768223, "epoch": 16.18448637316562, "percentage": 80.92, "elapsed_time": "1:19:12", "remaining_time": "0:18:40", "throughput": 4243.5, "total_tokens": 20167000} {"current_steps": 30885, "total_steps": 38160, "loss": 0.4142, "lr": 0.00010671656288148768, "epoch": 16.187106918238992, "percentage": 80.94, "elapsed_time": "1:19:13", "remaining_time": "0:18:39", "throughput": 4243.53, "total_tokens": 20170168} {"current_steps": 30890, "total_steps": 38160, "loss": 0.3966, "lr": 0.00010657538943570138, "epoch": 16.18972746331237, "percentage": 80.95, "elapsed_time": "1:19:14", "remaining_time": "0:18:38", "throughput": 4243.76, "total_tokens": 20175608} {"current_steps": 30895, "total_steps": 38160, "loss": 0.5315, "lr": 0.00010643429828985518, "epoch": 16.192348008385743, "percentage": 80.96, "elapsed_time": "1:19:14", "remaining_time": "0:18:38", "throughput": 4243.76, "total_tokens": 20178520} {"current_steps": 30900, "total_steps": 38160, "loss": 0.4163, "lr": 0.0001062932894734639, "epoch": 16.19496855345912, "percentage": 80.97, "elapsed_time": "1:19:15", "remaining_time": "0:18:37", "throughput": 4243.78, "total_tokens": 20181624} {"current_steps": 30905, "total_steps": 38160, "loss": 0.4684, "lr": 0.00010615236301602476, "epoch": 16.197589098532493, "percentage": 80.99, "elapsed_time": "1:19:16", "remaining_time": "0:18:36", "throughput": 4243.81, "total_tokens": 20184728} {"current_steps": 30910, "total_steps": 38160, "loss": 0.3471, "lr": 0.00010601151894701794, "epoch": 16.20020964360587, "percentage": 81.0, "elapsed_time": "1:19:17", "remaining_time": "0:18:35", "throughput": 4243.85, "total_tokens": 20188120} {"current_steps": 30915, "total_steps": 38160, "loss": 0.421, "lr": 0.0001058707572959065, "epoch": 16.202830188679247, "percentage": 81.01, "elapsed_time": "1:19:17", "remaining_time": "0:18:34", "throughput": 4243.79, "total_tokens": 20190456} {"current_steps": 30920, "total_steps": 38160, "loss": 0.4898, "lr": 0.00010573007809213614, "epoch": 16.20545073375262, "percentage": 81.03, "elapsed_time": "1:19:18", "remaining_time": "0:18:34", "throughput": 4243.85, "total_tokens": 20193944} {"current_steps": 30925, "total_steps": 38160, "loss": 0.4091, "lr": 0.00010558948136513536, "epoch": 16.208071278825997, "percentage": 81.04, "elapsed_time": "1:19:19", "remaining_time": "0:18:33", "throughput": 4243.82, "total_tokens": 20196568} {"current_steps": 30930, "total_steps": 38160, "loss": 0.3422, "lr": 0.00010544896714431557, "epoch": 16.21069182389937, "percentage": 81.05, "elapsed_time": "1:19:19", "remaining_time": "0:18:32", "throughput": 4243.82, "total_tokens": 20199576} {"current_steps": 30935, "total_steps": 38160, "loss": 0.4593, "lr": 0.0001053085354590706, "epoch": 16.213312368972748, "percentage": 81.07, "elapsed_time": "1:19:20", "remaining_time": "0:18:31", "throughput": 4243.83, "total_tokens": 20202712} {"current_steps": 30940, "total_steps": 38160, "loss": 0.4985, "lr": 0.00010516818633877695, "epoch": 16.21593291404612, "percentage": 81.08, "elapsed_time": "1:19:21", "remaining_time": "0:18:31", "throughput": 4243.81, "total_tokens": 20205368} {"current_steps": 30945, "total_steps": 38160, "loss": 0.4723, "lr": 0.00010502791981279425, "epoch": 16.218553459119498, "percentage": 81.09, "elapsed_time": "1:19:21", "remaining_time": "0:18:30", "throughput": 4243.92, "total_tokens": 20209464} {"current_steps": 30950, "total_steps": 38160, "loss": 0.3963, "lr": 0.00010488773591046469, "epoch": 16.22117400419287, "percentage": 81.11, "elapsed_time": "1:19:22", "remaining_time": "0:18:29", "throughput": 4243.98, "total_tokens": 20213016} {"current_steps": 30955, "total_steps": 38160, "loss": 0.404, "lr": 0.0001047476346611132, "epoch": 16.22379454926625, "percentage": 81.12, "elapsed_time": "1:19:23", "remaining_time": "0:18:28", "throughput": 4243.95, "total_tokens": 20215640} {"current_steps": 30960, "total_steps": 38160, "loss": 0.3817, "lr": 0.00010460761609404724, "epoch": 16.22641509433962, "percentage": 81.13, "elapsed_time": "1:19:24", "remaining_time": "0:18:27", "throughput": 4243.96, "total_tokens": 20218648} {"current_steps": 30965, "total_steps": 38160, "loss": 0.326, "lr": 0.00010446768023855701, "epoch": 16.229035639413, "percentage": 81.15, "elapsed_time": "1:19:25", "remaining_time": "0:18:27", "throughput": 4244.15, "total_tokens": 20223576} {"current_steps": 30970, "total_steps": 38160, "loss": 0.3575, "lr": 0.00010432782712391559, "epoch": 16.231656184486372, "percentage": 81.16, "elapsed_time": "1:19:25", "remaining_time": "0:18:26", "throughput": 4244.19, "total_tokens": 20226808} {"current_steps": 30975, "total_steps": 38160, "loss": 0.3254, "lr": 0.00010418805677937871, "epoch": 16.23427672955975, "percentage": 81.17, "elapsed_time": "1:19:26", "remaining_time": "0:18:25", "throughput": 4244.21, "total_tokens": 20229944} {"current_steps": 30980, "total_steps": 38160, "loss": 0.5754, "lr": 0.00010404836923418465, "epoch": 16.236897274633122, "percentage": 81.18, "elapsed_time": "1:19:27", "remaining_time": "0:18:24", "throughput": 4244.25, "total_tokens": 20233304} {"current_steps": 30985, "total_steps": 38160, "loss": 0.4635, "lr": 0.00010390876451755477, "epoch": 16.2395178197065, "percentage": 81.2, "elapsed_time": "1:19:28", "remaining_time": "0:18:24", "throughput": 4244.34, "total_tokens": 20237112} {"current_steps": 30990, "total_steps": 38160, "loss": 0.4145, "lr": 0.0001037692426586922, "epoch": 16.242138364779873, "percentage": 81.21, "elapsed_time": "1:19:28", "remaining_time": "0:18:23", "throughput": 4244.33, "total_tokens": 20239992} {"current_steps": 30995, "total_steps": 38160, "loss": 0.3588, "lr": 0.0001036298036867837, "epoch": 16.24475890985325, "percentage": 81.22, "elapsed_time": "1:19:29", "remaining_time": "0:18:22", "throughput": 4244.36, "total_tokens": 20243320} {"current_steps": 31000, "total_steps": 38160, "loss": 0.3417, "lr": 0.00010349044763099819, "epoch": 16.247379454926623, "percentage": 81.24, "elapsed_time": "1:19:30", "remaining_time": "0:18:21", "throughput": 4244.47, "total_tokens": 20247512} {"current_steps": 31005, "total_steps": 38160, "loss": 0.2584, "lr": 0.00010335117452048742, "epoch": 16.25, "percentage": 81.25, "elapsed_time": "1:19:31", "remaining_time": "0:18:21", "throughput": 4244.79, "total_tokens": 20254168} {"current_steps": 31010, "total_steps": 38160, "loss": 0.4317, "lr": 0.00010321198438438589, "epoch": 16.252620545073377, "percentage": 81.26, "elapsed_time": "1:19:32", "remaining_time": "0:18:20", "throughput": 4244.96, "total_tokens": 20258872} {"current_steps": 31015, "total_steps": 38160, "loss": 0.411, "lr": 0.00010307287725181036, "epoch": 16.25524109014675, "percentage": 81.28, "elapsed_time": "1:19:33", "remaining_time": "0:18:19", "throughput": 4244.97, "total_tokens": 20261976} {"current_steps": 31020, "total_steps": 38160, "loss": 0.3702, "lr": 0.00010293385315186049, "epoch": 16.257861635220127, "percentage": 81.29, "elapsed_time": "1:19:33", "remaining_time": "0:18:18", "throughput": 4244.95, "total_tokens": 20264696} {"current_steps": 31025, "total_steps": 38160, "loss": 0.426, "lr": 0.00010279491211361853, "epoch": 16.2604821802935, "percentage": 81.3, "elapsed_time": "1:19:34", "remaining_time": "0:18:18", "throughput": 4244.99, "total_tokens": 20267992} {"current_steps": 31030, "total_steps": 38160, "loss": 0.5465, "lr": 0.00010265605416614938, "epoch": 16.263102725366878, "percentage": 81.32, "elapsed_time": "1:19:35", "remaining_time": "0:18:17", "throughput": 4245.06, "total_tokens": 20271736} {"current_steps": 31035, "total_steps": 38160, "loss": 0.3315, "lr": 0.00010251727933850069, "epoch": 16.26572327044025, "percentage": 81.33, "elapsed_time": "1:19:36", "remaining_time": "0:18:16", "throughput": 4245.09, "total_tokens": 20274968} {"current_steps": 31040, "total_steps": 38160, "loss": 0.3938, "lr": 0.00010237858765970231, "epoch": 16.268343815513628, "percentage": 81.34, "elapsed_time": "1:19:36", "remaining_time": "0:18:15", "throughput": 4245.2, "total_tokens": 20278936} {"current_steps": 31045, "total_steps": 38160, "loss": 0.348, "lr": 0.00010223997915876726, "epoch": 16.270964360587, "percentage": 81.35, "elapsed_time": "1:19:37", "remaining_time": "0:18:14", "throughput": 4245.25, "total_tokens": 20282296} {"current_steps": 31050, "total_steps": 38160, "loss": 0.3748, "lr": 0.00010210145386469049, "epoch": 16.27358490566038, "percentage": 81.37, "elapsed_time": "1:19:38", "remaining_time": "0:18:14", "throughput": 4245.28, "total_tokens": 20285464} {"current_steps": 31055, "total_steps": 38160, "loss": 0.4635, "lr": 0.00010196301180645012, "epoch": 16.27620545073375, "percentage": 81.38, "elapsed_time": "1:19:39", "remaining_time": "0:18:13", "throughput": 4245.34, "total_tokens": 20289176} {"current_steps": 31060, "total_steps": 38160, "loss": 0.4278, "lr": 0.0001018246530130067, "epoch": 16.27882599580713, "percentage": 81.39, "elapsed_time": "1:19:39", "remaining_time": "0:18:12", "throughput": 4245.38, "total_tokens": 20292504} {"current_steps": 31065, "total_steps": 38160, "loss": 0.5305, "lr": 0.00010168637751330328, "epoch": 16.281446540880502, "percentage": 81.41, "elapsed_time": "1:19:40", "remaining_time": "0:18:11", "throughput": 4245.44, "total_tokens": 20295992} {"current_steps": 31070, "total_steps": 38160, "loss": 0.4638, "lr": 0.00010154818533626552, "epoch": 16.28406708595388, "percentage": 81.42, "elapsed_time": "1:19:41", "remaining_time": "0:18:11", "throughput": 4245.52, "total_tokens": 20299672} {"current_steps": 31075, "total_steps": 38160, "loss": 0.3934, "lr": 0.00010141007651080153, "epoch": 16.286687631027252, "percentage": 81.43, "elapsed_time": "1:19:42", "remaining_time": "0:18:10", "throughput": 4245.51, "total_tokens": 20302520} {"current_steps": 31080, "total_steps": 38160, "loss": 0.4915, "lr": 0.00010127205106580212, "epoch": 16.28930817610063, "percentage": 81.45, "elapsed_time": "1:19:42", "remaining_time": "0:18:09", "throughput": 4245.49, "total_tokens": 20305272} {"current_steps": 31085, "total_steps": 38160, "loss": 0.428, "lr": 0.0001011341090301407, "epoch": 16.291928721174003, "percentage": 81.46, "elapsed_time": "1:19:43", "remaining_time": "0:18:08", "throughput": 4245.47, "total_tokens": 20307992} {"current_steps": 31090, "total_steps": 38160, "loss": 0.3305, "lr": 0.00010099625043267336, "epoch": 16.29454926624738, "percentage": 81.47, "elapsed_time": "1:19:44", "remaining_time": "0:18:07", "throughput": 4245.43, "total_tokens": 20310520} {"current_steps": 31095, "total_steps": 38160, "loss": 0.4228, "lr": 0.00010085847530223812, "epoch": 16.297169811320753, "percentage": 81.49, "elapsed_time": "1:19:44", "remaining_time": "0:18:07", "throughput": 4245.37, "total_tokens": 20312824} {"current_steps": 31100, "total_steps": 38160, "loss": 0.5431, "lr": 0.00010072078366765641, "epoch": 16.29979035639413, "percentage": 81.5, "elapsed_time": "1:19:45", "remaining_time": "0:18:06", "throughput": 4245.3, "total_tokens": 20315032} {"current_steps": 31105, "total_steps": 38160, "loss": 0.5125, "lr": 0.00010058317555773139, "epoch": 16.302410901467507, "percentage": 81.51, "elapsed_time": "1:19:46", "remaining_time": "0:18:05", "throughput": 4245.35, "total_tokens": 20318456} {"current_steps": 31110, "total_steps": 38160, "loss": 0.5032, "lr": 0.00010044565100124925, "epoch": 16.30503144654088, "percentage": 81.53, "elapsed_time": "1:19:46", "remaining_time": "0:18:04", "throughput": 4245.36, "total_tokens": 20321464} {"current_steps": 31115, "total_steps": 38160, "loss": 0.5014, "lr": 0.00010030821002697871, "epoch": 16.307651991614257, "percentage": 81.54, "elapsed_time": "1:19:47", "remaining_time": "0:18:03", "throughput": 4245.41, "total_tokens": 20324984} {"current_steps": 31120, "total_steps": 38160, "loss": 0.3957, "lr": 0.00010017085266367054, "epoch": 16.31027253668763, "percentage": 81.55, "elapsed_time": "1:19:48", "remaining_time": "0:18:03", "throughput": 4245.37, "total_tokens": 20327512} {"current_steps": 31125, "total_steps": 38160, "loss": 0.4305, "lr": 0.00010003357894005854, "epoch": 16.312893081761008, "percentage": 81.56, "elapsed_time": "1:19:48", "remaining_time": "0:18:02", "throughput": 4245.37, "total_tokens": 20330520} {"current_steps": 31130, "total_steps": 38160, "loss": 0.4554, "lr": 9.989638888485885e-05, "epoch": 16.31551362683438, "percentage": 81.58, "elapsed_time": "1:19:49", "remaining_time": "0:18:01", "throughput": 4245.37, "total_tokens": 20333368} {"current_steps": 31135, "total_steps": 38160, "loss": 0.3693, "lr": 9.975928252676991e-05, "epoch": 16.318134171907758, "percentage": 81.59, "elapsed_time": "1:19:50", "remaining_time": "0:18:00", "throughput": 4245.38, "total_tokens": 20336440} {"current_steps": 31140, "total_steps": 38160, "loss": 0.4137, "lr": 9.962225989447288e-05, "epoch": 16.32075471698113, "percentage": 81.6, "elapsed_time": "1:19:50", "remaining_time": "0:18:00", "throughput": 4245.37, "total_tokens": 20339160} {"current_steps": 31145, "total_steps": 38160, "loss": 0.3151, "lr": 9.948532101663144e-05, "epoch": 16.32337526205451, "percentage": 81.62, "elapsed_time": "1:19:51", "remaining_time": "0:17:59", "throughput": 4245.39, "total_tokens": 20342232} {"current_steps": 31150, "total_steps": 38160, "loss": 0.4747, "lr": 9.934846592189134e-05, "epoch": 16.32599580712788, "percentage": 81.63, "elapsed_time": "1:19:52", "remaining_time": "0:17:58", "throughput": 4245.41, "total_tokens": 20345304} {"current_steps": 31155, "total_steps": 38160, "loss": 0.4877, "lr": 9.921169463888153e-05, "epoch": 16.32861635220126, "percentage": 81.64, "elapsed_time": "1:19:52", "remaining_time": "0:17:57", "throughput": 4245.37, "total_tokens": 20347736} {"current_steps": 31160, "total_steps": 38160, "loss": 0.3365, "lr": 9.907500719621253e-05, "epoch": 16.331236897274632, "percentage": 81.66, "elapsed_time": "1:19:53", "remaining_time": "0:17:56", "throughput": 4245.35, "total_tokens": 20350552} {"current_steps": 31165, "total_steps": 38160, "loss": 0.2715, "lr": 9.893840362247809e-05, "epoch": 16.33385744234801, "percentage": 81.67, "elapsed_time": "1:19:54", "remaining_time": "0:17:56", "throughput": 4245.34, "total_tokens": 20353432} {"current_steps": 31170, "total_steps": 38160, "loss": 0.4209, "lr": 9.880188394625417e-05, "epoch": 16.336477987421382, "percentage": 81.68, "elapsed_time": "1:19:55", "remaining_time": "0:17:55", "throughput": 4245.37, "total_tokens": 20356664} {"current_steps": 31175, "total_steps": 38160, "loss": 0.4769, "lr": 9.86654481960989e-05, "epoch": 16.33909853249476, "percentage": 81.7, "elapsed_time": "1:19:55", "remaining_time": "0:17:54", "throughput": 4245.43, "total_tokens": 20360152} {"current_steps": 31180, "total_steps": 38160, "loss": 0.5343, "lr": 9.852909640055325e-05, "epoch": 16.341719077568133, "percentage": 81.71, "elapsed_time": "1:19:56", "remaining_time": "0:17:53", "throughput": 4245.43, "total_tokens": 20363128} {"current_steps": 31185, "total_steps": 38160, "loss": 0.3667, "lr": 9.839282858814047e-05, "epoch": 16.34433962264151, "percentage": 81.72, "elapsed_time": "1:19:57", "remaining_time": "0:17:52", "throughput": 4245.45, "total_tokens": 20366168} {"current_steps": 31190, "total_steps": 38160, "loss": 0.4018, "lr": 9.825664478736607e-05, "epoch": 16.346960167714883, "percentage": 81.73, "elapsed_time": "1:19:57", "remaining_time": "0:17:52", "throughput": 4245.4, "total_tokens": 20368664} {"current_steps": 31195, "total_steps": 38160, "loss": 0.5078, "lr": 9.812054502671835e-05, "epoch": 16.34958071278826, "percentage": 81.75, "elapsed_time": "1:19:58", "remaining_time": "0:17:51", "throughput": 4245.43, "total_tokens": 20371864} {"current_steps": 31200, "total_steps": 38160, "loss": 0.4199, "lr": 9.798452933466761e-05, "epoch": 16.352201257861637, "percentage": 81.76, "elapsed_time": "1:19:59", "remaining_time": "0:17:50", "throughput": 4245.36, "total_tokens": 20374136} {"current_steps": 31205, "total_steps": 38160, "loss": 0.4062, "lr": 9.784859773966693e-05, "epoch": 16.35482180293501, "percentage": 81.77, "elapsed_time": "1:19:59", "remaining_time": "0:17:49", "throughput": 4245.38, "total_tokens": 20377304} {"current_steps": 31210, "total_steps": 38160, "loss": 0.425, "lr": 9.771275027015159e-05, "epoch": 16.357442348008387, "percentage": 81.79, "elapsed_time": "1:20:00", "remaining_time": "0:17:49", "throughput": 4245.41, "total_tokens": 20380504} {"current_steps": 31215, "total_steps": 38160, "loss": 0.4106, "lr": 9.757698695453954e-05, "epoch": 16.36006289308176, "percentage": 81.8, "elapsed_time": "1:20:01", "remaining_time": "0:17:48", "throughput": 4245.51, "total_tokens": 20384536} {"current_steps": 31220, "total_steps": 38160, "loss": 0.3911, "lr": 9.74413078212305e-05, "epoch": 16.362683438155138, "percentage": 81.81, "elapsed_time": "1:20:02", "remaining_time": "0:17:47", "throughput": 4245.53, "total_tokens": 20387640} {"current_steps": 31225, "total_steps": 38160, "loss": 0.5446, "lr": 9.730571289860746e-05, "epoch": 16.36530398322851, "percentage": 81.83, "elapsed_time": "1:20:02", "remaining_time": "0:17:46", "throughput": 4245.52, "total_tokens": 20390456} {"current_steps": 31230, "total_steps": 38160, "loss": 0.4527, "lr": 9.717020221503493e-05, "epoch": 16.367924528301888, "percentage": 81.84, "elapsed_time": "1:20:03", "remaining_time": "0:17:45", "throughput": 4245.54, "total_tokens": 20393592} {"current_steps": 31235, "total_steps": 38160, "loss": 0.4604, "lr": 9.703477579886038e-05, "epoch": 16.37054507337526, "percentage": 81.85, "elapsed_time": "1:20:04", "remaining_time": "0:17:45", "throughput": 4245.56, "total_tokens": 20396760} {"current_steps": 31240, "total_steps": 38160, "loss": 0.4717, "lr": 9.689943367841347e-05, "epoch": 16.37316561844864, "percentage": 81.87, "elapsed_time": "1:20:05", "remaining_time": "0:17:44", "throughput": 4245.64, "total_tokens": 20400504} {"current_steps": 31245, "total_steps": 38160, "loss": 0.4483, "lr": 9.676417588200632e-05, "epoch": 16.37578616352201, "percentage": 81.88, "elapsed_time": "1:20:05", "remaining_time": "0:17:43", "throughput": 4245.81, "total_tokens": 20405176} {"current_steps": 31250, "total_steps": 38160, "loss": 0.454, "lr": 9.662900243793321e-05, "epoch": 16.37840670859539, "percentage": 81.89, "elapsed_time": "1:20:06", "remaining_time": "0:17:42", "throughput": 4245.88, "total_tokens": 20408888} {"current_steps": 31255, "total_steps": 38160, "loss": 0.6191, "lr": 9.649391337447084e-05, "epoch": 16.381027253668762, "percentage": 81.91, "elapsed_time": "1:20:07", "remaining_time": "0:17:42", "throughput": 4245.92, "total_tokens": 20412088} {"current_steps": 31260, "total_steps": 38160, "loss": 0.4773, "lr": 9.635890871987829e-05, "epoch": 16.38364779874214, "percentage": 81.92, "elapsed_time": "1:20:08", "remaining_time": "0:17:41", "throughput": 4246.03, "total_tokens": 20416120} {"current_steps": 31265, "total_steps": 38160, "loss": 0.4535, "lr": 9.622398850239705e-05, "epoch": 16.386268343815512, "percentage": 81.93, "elapsed_time": "1:20:09", "remaining_time": "0:17:40", "throughput": 4246.19, "total_tokens": 20420696} {"current_steps": 31270, "total_steps": 38160, "loss": 0.4544, "lr": 9.608915275025104e-05, "epoch": 16.38888888888889, "percentage": 81.94, "elapsed_time": "1:20:09", "remaining_time": "0:17:39", "throughput": 4246.25, "total_tokens": 20424248} {"current_steps": 31275, "total_steps": 38160, "loss": 0.3968, "lr": 9.595440149164619e-05, "epoch": 16.391509433962263, "percentage": 81.96, "elapsed_time": "1:20:10", "remaining_time": "0:17:39", "throughput": 4246.31, "total_tokens": 20427768} {"current_steps": 31280, "total_steps": 38160, "loss": 0.3874, "lr": 9.581973475477085e-05, "epoch": 16.39412997903564, "percentage": 81.97, "elapsed_time": "1:20:11", "remaining_time": "0:17:38", "throughput": 4246.36, "total_tokens": 20431224} {"current_steps": 31285, "total_steps": 38160, "loss": 0.3779, "lr": 9.568515256779587e-05, "epoch": 16.396750524109013, "percentage": 81.98, "elapsed_time": "1:20:12", "remaining_time": "0:17:37", "throughput": 4246.37, "total_tokens": 20434232} {"current_steps": 31290, "total_steps": 38160, "loss": 0.4816, "lr": 9.555065495887433e-05, "epoch": 16.39937106918239, "percentage": 82.0, "elapsed_time": "1:20:12", "remaining_time": "0:17:36", "throughput": 4246.41, "total_tokens": 20437720} {"current_steps": 31295, "total_steps": 38160, "loss": 0.4526, "lr": 9.541624195614152e-05, "epoch": 16.401991614255767, "percentage": 82.01, "elapsed_time": "1:20:13", "remaining_time": "0:17:35", "throughput": 4246.42, "total_tokens": 20440696} {"current_steps": 31300, "total_steps": 38160, "loss": 0.478, "lr": 9.528191358771532e-05, "epoch": 16.40461215932914, "percentage": 82.02, "elapsed_time": "1:20:14", "remaining_time": "0:17:35", "throughput": 4246.42, "total_tokens": 20443544} {"current_steps": 31305, "total_steps": 38160, "loss": 0.5983, "lr": 9.514766988169549e-05, "epoch": 16.407232704402517, "percentage": 82.04, "elapsed_time": "1:20:15", "remaining_time": "0:17:34", "throughput": 4246.6, "total_tokens": 20448280} {"current_steps": 31310, "total_steps": 38160, "loss": 0.4415, "lr": 9.501351086616422e-05, "epoch": 16.40985324947589, "percentage": 82.05, "elapsed_time": "1:20:16", "remaining_time": "0:17:33", "throughput": 4246.7, "total_tokens": 20452344} {"current_steps": 31315, "total_steps": 38160, "loss": 0.4138, "lr": 9.487943656918613e-05, "epoch": 16.412473794549268, "percentage": 82.06, "elapsed_time": "1:20:16", "remaining_time": "0:17:32", "throughput": 4246.73, "total_tokens": 20455480} {"current_steps": 31320, "total_steps": 38160, "loss": 0.401, "lr": 9.474544701880805e-05, "epoch": 16.41509433962264, "percentage": 82.08, "elapsed_time": "1:20:17", "remaining_time": "0:17:32", "throughput": 4246.71, "total_tokens": 20458168} {"current_steps": 31325, "total_steps": 38160, "loss": 0.2963, "lr": 9.461154224305923e-05, "epoch": 16.417714884696018, "percentage": 82.09, "elapsed_time": "1:20:18", "remaining_time": "0:17:31", "throughput": 4246.7, "total_tokens": 20460984} {"current_steps": 31330, "total_steps": 38160, "loss": 0.4983, "lr": 9.447772226995082e-05, "epoch": 16.42033542976939, "percentage": 82.1, "elapsed_time": "1:20:18", "remaining_time": "0:17:30", "throughput": 4246.72, "total_tokens": 20464056} {"current_steps": 31335, "total_steps": 38160, "loss": 0.4386, "lr": 9.434398712747639e-05, "epoch": 16.42295597484277, "percentage": 82.11, "elapsed_time": "1:20:19", "remaining_time": "0:17:29", "throughput": 4246.72, "total_tokens": 20467096} {"current_steps": 31340, "total_steps": 38160, "loss": 0.475, "lr": 9.421033684361185e-05, "epoch": 16.42557651991614, "percentage": 82.13, "elapsed_time": "1:20:20", "remaining_time": "0:17:28", "throughput": 4246.7, "total_tokens": 20469720} {"current_steps": 31345, "total_steps": 38160, "loss": 0.6117, "lr": 9.407677144631533e-05, "epoch": 16.42819706498952, "percentage": 82.14, "elapsed_time": "1:20:20", "remaining_time": "0:17:28", "throughput": 4246.76, "total_tokens": 20473240} {"current_steps": 31350, "total_steps": 38160, "loss": 0.4385, "lr": 9.394329096352732e-05, "epoch": 16.430817610062892, "percentage": 82.15, "elapsed_time": "1:20:21", "remaining_time": "0:17:27", "throughput": 4246.81, "total_tokens": 20476600} {"current_steps": 31355, "total_steps": 38160, "loss": 0.4447, "lr": 9.380989542317037e-05, "epoch": 16.43343815513627, "percentage": 82.17, "elapsed_time": "1:20:22", "remaining_time": "0:17:26", "throughput": 4246.8, "total_tokens": 20479448} {"current_steps": 31360, "total_steps": 38160, "loss": 0.4824, "lr": 9.367658485314907e-05, "epoch": 16.436058700209642, "percentage": 82.18, "elapsed_time": "1:20:23", "remaining_time": "0:17:25", "throughput": 4246.86, "total_tokens": 20483128} {"current_steps": 31365, "total_steps": 38160, "loss": 0.4798, "lr": 9.354335928135066e-05, "epoch": 16.43867924528302, "percentage": 82.19, "elapsed_time": "1:20:24", "remaining_time": "0:17:25", "throughput": 4247.05, "total_tokens": 20487896} {"current_steps": 31370, "total_steps": 38160, "loss": 0.3939, "lr": 9.341021873564432e-05, "epoch": 16.441299790356393, "percentage": 82.21, "elapsed_time": "1:20:24", "remaining_time": "0:17:24", "throughput": 4247.1, "total_tokens": 20491352} {"current_steps": 31375, "total_steps": 38160, "loss": 0.4775, "lr": 9.327716324388164e-05, "epoch": 16.44392033542977, "percentage": 82.22, "elapsed_time": "1:20:25", "remaining_time": "0:17:23", "throughput": 4247.07, "total_tokens": 20493912} {"current_steps": 31380, "total_steps": 38160, "loss": 0.3761, "lr": 9.314419283389641e-05, "epoch": 16.446540880503143, "percentage": 82.23, "elapsed_time": "1:20:26", "remaining_time": "0:17:22", "throughput": 4247.27, "total_tokens": 20499128} {"current_steps": 31385, "total_steps": 38160, "loss": 0.4519, "lr": 9.30113075335044e-05, "epoch": 16.44916142557652, "percentage": 82.25, "elapsed_time": "1:20:27", "remaining_time": "0:17:22", "throughput": 4247.34, "total_tokens": 20502648} {"current_steps": 31390, "total_steps": 38160, "loss": 0.4054, "lr": 9.287850737050352e-05, "epoch": 16.451781970649897, "percentage": 82.26, "elapsed_time": "1:20:27", "remaining_time": "0:17:21", "throughput": 4247.38, "total_tokens": 20506040} {"current_steps": 31395, "total_steps": 38160, "loss": 0.4216, "lr": 9.274579237267422e-05, "epoch": 16.45440251572327, "percentage": 82.27, "elapsed_time": "1:20:28", "remaining_time": "0:17:20", "throughput": 4247.39, "total_tokens": 20508984} {"current_steps": 31400, "total_steps": 38160, "loss": 0.4624, "lr": 9.261316256777897e-05, "epoch": 16.457023060796647, "percentage": 82.29, "elapsed_time": "1:20:29", "remaining_time": "0:17:19", "throughput": 4247.41, "total_tokens": 20512184} {"current_steps": 31405, "total_steps": 38160, "loss": 0.3987, "lr": 9.24806179835625e-05, "epoch": 16.45964360587002, "percentage": 82.3, "elapsed_time": "1:20:30", "remaining_time": "0:17:18", "throughput": 4247.42, "total_tokens": 20515128} {"current_steps": 31410, "total_steps": 38160, "loss": 0.5246, "lr": 9.234815864775137e-05, "epoch": 16.462264150943398, "percentage": 82.31, "elapsed_time": "1:20:30", "remaining_time": "0:17:18", "throughput": 4247.45, "total_tokens": 20518392} {"current_steps": 31415, "total_steps": 38160, "loss": 0.4279, "lr": 9.221578458805485e-05, "epoch": 16.46488469601677, "percentage": 82.32, "elapsed_time": "1:20:31", "remaining_time": "0:17:17", "throughput": 4247.4, "total_tokens": 20520952} {"current_steps": 31420, "total_steps": 38160, "loss": 0.4541, "lr": 9.208349583216385e-05, "epoch": 16.467505241090148, "percentage": 82.34, "elapsed_time": "1:20:32", "remaining_time": "0:17:16", "throughput": 4247.38, "total_tokens": 20523576} {"current_steps": 31425, "total_steps": 38160, "loss": 0.3765, "lr": 9.195129240775174e-05, "epoch": 16.47012578616352, "percentage": 82.35, "elapsed_time": "1:20:32", "remaining_time": "0:17:15", "throughput": 4247.43, "total_tokens": 20526872} {"current_steps": 31430, "total_steps": 38160, "loss": 0.4431, "lr": 9.181917434247417e-05, "epoch": 16.4727463312369, "percentage": 82.36, "elapsed_time": "1:20:33", "remaining_time": "0:17:15", "throughput": 4247.58, "total_tokens": 20531544} {"current_steps": 31435, "total_steps": 38160, "loss": 0.3918, "lr": 9.168714166396835e-05, "epoch": 16.47536687631027, "percentage": 82.38, "elapsed_time": "1:20:34", "remaining_time": "0:17:14", "throughput": 4247.58, "total_tokens": 20534392} {"current_steps": 31440, "total_steps": 38160, "loss": 0.4681, "lr": 9.155519439985438e-05, "epoch": 16.47798742138365, "percentage": 82.39, "elapsed_time": "1:20:35", "remaining_time": "0:17:13", "throughput": 4247.57, "total_tokens": 20537272} {"current_steps": 31445, "total_steps": 38160, "loss": 0.4035, "lr": 9.142333257773383e-05, "epoch": 16.480607966457022, "percentage": 82.4, "elapsed_time": "1:20:35", "remaining_time": "0:17:12", "throughput": 4247.61, "total_tokens": 20540568} {"current_steps": 31450, "total_steps": 38160, "loss": 0.4983, "lr": 9.12915562251908e-05, "epoch": 16.4832285115304, "percentage": 82.42, "elapsed_time": "1:20:36", "remaining_time": "0:17:11", "throughput": 4247.65, "total_tokens": 20543832} {"current_steps": 31455, "total_steps": 38160, "loss": 0.4368, "lr": 9.115986536979149e-05, "epoch": 16.485849056603772, "percentage": 82.43, "elapsed_time": "1:20:37", "remaining_time": "0:17:11", "throughput": 4247.65, "total_tokens": 20546808} {"current_steps": 31460, "total_steps": 38160, "loss": 0.4741, "lr": 9.10282600390841e-05, "epoch": 16.48846960167715, "percentage": 82.44, "elapsed_time": "1:20:37", "remaining_time": "0:17:10", "throughput": 4247.67, "total_tokens": 20549880} {"current_steps": 31465, "total_steps": 38160, "loss": 0.43, "lr": 9.08967402605988e-05, "epoch": 16.491090146750523, "percentage": 82.46, "elapsed_time": "1:20:38", "remaining_time": "0:17:09", "throughput": 4247.75, "total_tokens": 20553816} {"current_steps": 31470, "total_steps": 38160, "loss": 0.3954, "lr": 9.07653060618483e-05, "epoch": 16.4937106918239, "percentage": 82.47, "elapsed_time": "1:20:39", "remaining_time": "0:17:08", "throughput": 4247.88, "total_tokens": 20558072} {"current_steps": 31475, "total_steps": 38160, "loss": 0.5628, "lr": 9.063395747032676e-05, "epoch": 16.496331236897273, "percentage": 82.48, "elapsed_time": "1:20:40", "remaining_time": "0:17:08", "throughput": 4247.85, "total_tokens": 20560632} {"current_steps": 31480, "total_steps": 38160, "loss": 0.438, "lr": 9.050269451351112e-05, "epoch": 16.49895178197065, "percentage": 82.49, "elapsed_time": "1:20:40", "remaining_time": "0:17:07", "throughput": 4247.9, "total_tokens": 20563960} {"current_steps": 31485, "total_steps": 38160, "loss": 0.3332, "lr": 9.037151721886006e-05, "epoch": 16.501572327044027, "percentage": 82.51, "elapsed_time": "1:20:41", "remaining_time": "0:17:06", "throughput": 4247.89, "total_tokens": 20566776} {"current_steps": 31490, "total_steps": 38160, "loss": 0.4073, "lr": 9.024042561381424e-05, "epoch": 16.5041928721174, "percentage": 82.52, "elapsed_time": "1:20:42", "remaining_time": "0:17:05", "throughput": 4247.87, "total_tokens": 20569400} {"current_steps": 31495, "total_steps": 38160, "loss": 0.4043, "lr": 9.010941972579656e-05, "epoch": 16.506813417190777, "percentage": 82.53, "elapsed_time": "1:20:42", "remaining_time": "0:17:04", "throughput": 4247.79, "total_tokens": 20571480} {"current_steps": 31500, "total_steps": 38160, "loss": 0.5062, "lr": 8.99784995822121e-05, "epoch": 16.50943396226415, "percentage": 82.55, "elapsed_time": "1:20:43", "remaining_time": "0:17:04", "throughput": 4247.75, "total_tokens": 20574008} {"current_steps": 31505, "total_steps": 38160, "loss": 0.515, "lr": 8.984766521044769e-05, "epoch": 16.512054507337528, "percentage": 82.56, "elapsed_time": "1:20:44", "remaining_time": "0:17:03", "throughput": 4247.72, "total_tokens": 20576696} {"current_steps": 31510, "total_steps": 38160, "loss": 0.399, "lr": 8.971691663787252e-05, "epoch": 16.5146750524109, "percentage": 82.57, "elapsed_time": "1:20:44", "remaining_time": "0:17:02", "throughput": 4247.76, "total_tokens": 20579960} {"current_steps": 31515, "total_steps": 38160, "loss": 0.3897, "lr": 8.958625389183756e-05, "epoch": 16.517295597484278, "percentage": 82.59, "elapsed_time": "1:20:45", "remaining_time": "0:17:01", "throughput": 4247.77, "total_tokens": 20582936} {"current_steps": 31520, "total_steps": 38160, "loss": 0.5293, "lr": 8.9455676999676e-05, "epoch": 16.51991614255765, "percentage": 82.6, "elapsed_time": "1:20:46", "remaining_time": "0:17:00", "throughput": 4247.8, "total_tokens": 20586168} {"current_steps": 31525, "total_steps": 38160, "loss": 0.4298, "lr": 8.932518598870309e-05, "epoch": 16.52253668763103, "percentage": 82.61, "elapsed_time": "1:20:46", "remaining_time": "0:17:00", "throughput": 4247.81, "total_tokens": 20589112} {"current_steps": 31530, "total_steps": 38160, "loss": 0.3659, "lr": 8.919478088621614e-05, "epoch": 16.5251572327044, "percentage": 82.63, "elapsed_time": "1:20:47", "remaining_time": "0:16:59", "throughput": 4247.93, "total_tokens": 20593240} {"current_steps": 31535, "total_steps": 38160, "loss": 0.3958, "lr": 8.906446171949422e-05, "epoch": 16.52777777777778, "percentage": 82.64, "elapsed_time": "1:20:48", "remaining_time": "0:16:58", "throughput": 4247.93, "total_tokens": 20596152} {"current_steps": 31540, "total_steps": 38160, "loss": 0.4961, "lr": 8.893422851579885e-05, "epoch": 16.530398322851152, "percentage": 82.65, "elapsed_time": "1:20:49", "remaining_time": "0:16:57", "throughput": 4248.03, "total_tokens": 20600152} {"current_steps": 31545, "total_steps": 38160, "loss": 0.4173, "lr": 8.8804081302373e-05, "epoch": 16.53301886792453, "percentage": 82.67, "elapsed_time": "1:20:50", "remaining_time": "0:16:57", "throughput": 4248.09, "total_tokens": 20603672} {"current_steps": 31550, "total_steps": 38160, "loss": 0.3497, "lr": 8.867402010644221e-05, "epoch": 16.535639412997902, "percentage": 82.68, "elapsed_time": "1:20:50", "remaining_time": "0:16:56", "throughput": 4248.04, "total_tokens": 20606104} {"current_steps": 31555, "total_steps": 38160, "loss": 0.4215, "lr": 8.854404495521389e-05, "epoch": 16.53825995807128, "percentage": 82.69, "elapsed_time": "1:20:51", "remaining_time": "0:16:55", "throughput": 4248.09, "total_tokens": 20609688} {"current_steps": 31560, "total_steps": 38160, "loss": 0.2892, "lr": 8.841415587587709e-05, "epoch": 16.540880503144653, "percentage": 82.7, "elapsed_time": "1:20:52", "remaining_time": "0:16:54", "throughput": 4248.16, "total_tokens": 20613336} {"current_steps": 31565, "total_steps": 38160, "loss": 0.4255, "lr": 8.828435289560344e-05, "epoch": 16.54350104821803, "percentage": 82.72, "elapsed_time": "1:20:52", "remaining_time": "0:16:53", "throughput": 4248.14, "total_tokens": 20615992} {"current_steps": 31570, "total_steps": 38160, "loss": 0.4386, "lr": 8.815463604154588e-05, "epoch": 16.546121593291403, "percentage": 82.73, "elapsed_time": "1:20:53", "remaining_time": "0:16:53", "throughput": 4248.09, "total_tokens": 20618520} {"current_steps": 31575, "total_steps": 38160, "loss": 0.4901, "lr": 8.80250053408399e-05, "epoch": 16.54874213836478, "percentage": 82.74, "elapsed_time": "1:20:54", "remaining_time": "0:16:52", "throughput": 4248.13, "total_tokens": 20622008} {"current_steps": 31580, "total_steps": 38160, "loss": 0.6044, "lr": 8.789546082060273e-05, "epoch": 16.551362683438157, "percentage": 82.76, "elapsed_time": "1:20:55", "remaining_time": "0:16:51", "throughput": 4248.15, "total_tokens": 20625240} {"current_steps": 31585, "total_steps": 38160, "loss": 0.5157, "lr": 8.776600250793371e-05, "epoch": 16.55398322851153, "percentage": 82.77, "elapsed_time": "1:20:55", "remaining_time": "0:16:50", "throughput": 4248.15, "total_tokens": 20628056} {"current_steps": 31590, "total_steps": 38160, "loss": 0.4473, "lr": 8.763663042991399e-05, "epoch": 16.556603773584907, "percentage": 82.78, "elapsed_time": "1:20:56", "remaining_time": "0:16:50", "throughput": 4248.13, "total_tokens": 20630776} {"current_steps": 31595, "total_steps": 38160, "loss": 0.4038, "lr": 8.75073446136066e-05, "epoch": 16.55922431865828, "percentage": 82.8, "elapsed_time": "1:20:57", "remaining_time": "0:16:49", "throughput": 4248.23, "total_tokens": 20634776} {"current_steps": 31600, "total_steps": 38160, "loss": 0.3734, "lr": 8.737814508605674e-05, "epoch": 16.561844863731658, "percentage": 82.81, "elapsed_time": "1:20:57", "remaining_time": "0:16:48", "throughput": 4248.19, "total_tokens": 20637400} {"current_steps": 31605, "total_steps": 38160, "loss": 0.4265, "lr": 8.724903187429145e-05, "epoch": 16.56446540880503, "percentage": 82.82, "elapsed_time": "1:20:58", "remaining_time": "0:16:47", "throughput": 4248.29, "total_tokens": 20641432} {"current_steps": 31610, "total_steps": 38160, "loss": 0.3983, "lr": 8.71200050053198e-05, "epoch": 16.567085953878408, "percentage": 82.84, "elapsed_time": "1:20:59", "remaining_time": "0:16:46", "throughput": 4248.32, "total_tokens": 20644696} {"current_steps": 31615, "total_steps": 38160, "loss": 0.3515, "lr": 8.699106450613287e-05, "epoch": 16.56970649895178, "percentage": 82.85, "elapsed_time": "1:21:00", "remaining_time": "0:16:46", "throughput": 4248.37, "total_tokens": 20648088} {"current_steps": 31620, "total_steps": 38160, "loss": 0.4745, "lr": 8.686221040370334e-05, "epoch": 16.572327044025158, "percentage": 82.86, "elapsed_time": "1:21:01", "remaining_time": "0:16:45", "throughput": 4248.49, "total_tokens": 20652312} {"current_steps": 31625, "total_steps": 38160, "loss": 0.4208, "lr": 8.673344272498596e-05, "epoch": 16.57494758909853, "percentage": 82.87, "elapsed_time": "1:21:01", "remaining_time": "0:16:44", "throughput": 4248.49, "total_tokens": 20655288} {"current_steps": 31630, "total_steps": 38160, "loss": 0.4375, "lr": 8.660476149691759e-05, "epoch": 16.57756813417191, "percentage": 82.89, "elapsed_time": "1:21:02", "remaining_time": "0:16:43", "throughput": 4248.49, "total_tokens": 20658200} {"current_steps": 31635, "total_steps": 38160, "loss": 0.3402, "lr": 8.647616674641684e-05, "epoch": 16.580188679245282, "percentage": 82.9, "elapsed_time": "1:21:03", "remaining_time": "0:16:43", "throughput": 4248.45, "total_tokens": 20660696} {"current_steps": 31640, "total_steps": 38160, "loss": 0.4157, "lr": 8.63476585003844e-05, "epoch": 16.58280922431866, "percentage": 82.91, "elapsed_time": "1:21:03", "remaining_time": "0:16:42", "throughput": 4248.43, "total_tokens": 20663416} {"current_steps": 31645, "total_steps": 38160, "loss": 0.4663, "lr": 8.621923678570259e-05, "epoch": 16.585429769392032, "percentage": 82.93, "elapsed_time": "1:21:04", "remaining_time": "0:16:41", "throughput": 4248.52, "total_tokens": 20667352} {"current_steps": 31650, "total_steps": 38160, "loss": 0.454, "lr": 8.609090162923567e-05, "epoch": 16.58805031446541, "percentage": 82.94, "elapsed_time": "1:21:05", "remaining_time": "0:16:40", "throughput": 4248.47, "total_tokens": 20669752} {"current_steps": 31655, "total_steps": 38160, "loss": 0.3907, "lr": 8.596265305783002e-05, "epoch": 16.590670859538783, "percentage": 82.95, "elapsed_time": "1:21:05", "remaining_time": "0:16:39", "throughput": 4248.47, "total_tokens": 20672664} {"current_steps": 31660, "total_steps": 38160, "loss": 0.4124, "lr": 8.583449109831375e-05, "epoch": 16.59329140461216, "percentage": 82.97, "elapsed_time": "1:21:06", "remaining_time": "0:16:39", "throughput": 4248.47, "total_tokens": 20675672} {"current_steps": 31665, "total_steps": 38160, "loss": 0.4167, "lr": 8.570641577749705e-05, "epoch": 16.595911949685533, "percentage": 82.98, "elapsed_time": "1:21:07", "remaining_time": "0:16:38", "throughput": 4248.47, "total_tokens": 20678520} {"current_steps": 31670, "total_steps": 38160, "loss": 0.5169, "lr": 8.557842712217162e-05, "epoch": 16.59853249475891, "percentage": 82.99, "elapsed_time": "1:21:07", "remaining_time": "0:16:37", "throughput": 4248.42, "total_tokens": 20680984} {"current_steps": 31675, "total_steps": 38160, "loss": 0.5806, "lr": 8.545052515911112e-05, "epoch": 16.601153039832283, "percentage": 83.01, "elapsed_time": "1:21:08", "remaining_time": "0:16:36", "throughput": 4248.44, "total_tokens": 20684184} {"current_steps": 31680, "total_steps": 38160, "loss": 0.3641, "lr": 8.532270991507136e-05, "epoch": 16.60377358490566, "percentage": 83.02, "elapsed_time": "1:21:09", "remaining_time": "0:16:36", "throughput": 4248.5, "total_tokens": 20687640} {"current_steps": 31685, "total_steps": 38160, "loss": 0.3911, "lr": 8.519498141678983e-05, "epoch": 16.606394129979037, "percentage": 83.03, "elapsed_time": "1:21:10", "remaining_time": "0:16:35", "throughput": 4248.48, "total_tokens": 20690392} {"current_steps": 31690, "total_steps": 38160, "loss": 0.3647, "lr": 8.506733969098579e-05, "epoch": 16.60901467505241, "percentage": 83.05, "elapsed_time": "1:21:10", "remaining_time": "0:16:34", "throughput": 4248.57, "total_tokens": 20694264} {"current_steps": 31695, "total_steps": 38160, "loss": 0.3653, "lr": 8.49397847643606e-05, "epoch": 16.611635220125788, "percentage": 83.06, "elapsed_time": "1:21:11", "remaining_time": "0:16:33", "throughput": 4248.54, "total_tokens": 20696888} {"current_steps": 31700, "total_steps": 38160, "loss": 0.4857, "lr": 8.481231666359723e-05, "epoch": 16.61425576519916, "percentage": 83.07, "elapsed_time": "1:21:12", "remaining_time": "0:16:32", "throughput": 4248.56, "total_tokens": 20700056} {"current_steps": 31705, "total_steps": 38160, "loss": 0.4933, "lr": 8.468493541536031e-05, "epoch": 16.616876310272538, "percentage": 83.08, "elapsed_time": "1:21:12", "remaining_time": "0:16:32", "throughput": 4248.56, "total_tokens": 20703000} {"current_steps": 31710, "total_steps": 38160, "loss": 0.4268, "lr": 8.455764104629681e-05, "epoch": 16.61949685534591, "percentage": 83.1, "elapsed_time": "1:21:13", "remaining_time": "0:16:31", "throughput": 4248.6, "total_tokens": 20706360} {"current_steps": 31715, "total_steps": 38160, "loss": 0.3218, "lr": 8.443043358303515e-05, "epoch": 16.622117400419288, "percentage": 83.11, "elapsed_time": "1:21:14", "remaining_time": "0:16:30", "throughput": 4248.71, "total_tokens": 20710328} {"current_steps": 31720, "total_steps": 38160, "loss": 0.4794, "lr": 8.430331305218585e-05, "epoch": 16.62473794549266, "percentage": 83.12, "elapsed_time": "1:21:15", "remaining_time": "0:16:29", "throughput": 4248.73, "total_tokens": 20713496} {"current_steps": 31725, "total_steps": 38160, "loss": 0.2957, "lr": 8.417627948034096e-05, "epoch": 16.62735849056604, "percentage": 83.14, "elapsed_time": "1:21:16", "remaining_time": "0:16:29", "throughput": 4248.8, "total_tokens": 20717240} {"current_steps": 31730, "total_steps": 38160, "loss": 0.3756, "lr": 8.404933289407424e-05, "epoch": 16.629979035639412, "percentage": 83.15, "elapsed_time": "1:21:16", "remaining_time": "0:16:28", "throughput": 4248.85, "total_tokens": 20720696} {"current_steps": 31735, "total_steps": 38160, "loss": 0.5324, "lr": 8.392247331994174e-05, "epoch": 16.63259958071279, "percentage": 83.16, "elapsed_time": "1:21:18", "remaining_time": "0:16:27", "throughput": 4249.19, "total_tokens": 20727736} {"current_steps": 31740, "total_steps": 38160, "loss": 0.4282, "lr": 8.37957007844809e-05, "epoch": 16.635220125786162, "percentage": 83.18, "elapsed_time": "1:21:18", "remaining_time": "0:16:26", "throughput": 4249.19, "total_tokens": 20730584} {"current_steps": 31745, "total_steps": 38160, "loss": 0.467, "lr": 8.366901531421134e-05, "epoch": 16.63784067085954, "percentage": 83.19, "elapsed_time": "1:21:19", "remaining_time": "0:16:26", "throughput": 4249.13, "total_tokens": 20732984} {"current_steps": 31750, "total_steps": 38160, "loss": 0.3157, "lr": 8.354241693563385e-05, "epoch": 16.640461215932913, "percentage": 83.2, "elapsed_time": "1:21:20", "remaining_time": "0:16:25", "throughput": 4249.19, "total_tokens": 20736440} {"current_steps": 31755, "total_steps": 38160, "loss": 0.34, "lr": 8.341590567523166e-05, "epoch": 16.64308176100629, "percentage": 83.22, "elapsed_time": "1:21:21", "remaining_time": "0:16:24", "throughput": 4249.52, "total_tokens": 20743480} {"current_steps": 31760, "total_steps": 38160, "loss": 0.5033, "lr": 8.328948155946924e-05, "epoch": 16.645702306079663, "percentage": 83.23, "elapsed_time": "1:21:22", "remaining_time": "0:16:23", "throughput": 4249.51, "total_tokens": 20746360} {"current_steps": 31765, "total_steps": 38160, "loss": 0.4085, "lr": 8.316314461479318e-05, "epoch": 16.64832285115304, "percentage": 83.24, "elapsed_time": "1:21:22", "remaining_time": "0:16:23", "throughput": 4249.62, "total_tokens": 20750424} {"current_steps": 31770, "total_steps": 38160, "loss": 0.4839, "lr": 8.303689486763177e-05, "epoch": 16.650943396226417, "percentage": 83.25, "elapsed_time": "1:21:23", "remaining_time": "0:16:22", "throughput": 4249.6, "total_tokens": 20753112} {"current_steps": 31775, "total_steps": 38160, "loss": 0.4929, "lr": 8.291073234439512e-05, "epoch": 16.65356394129979, "percentage": 83.27, "elapsed_time": "1:21:24", "remaining_time": "0:16:21", "throughput": 4249.62, "total_tokens": 20756216} {"current_steps": 31780, "total_steps": 38160, "loss": 0.3799, "lr": 8.27846570714747e-05, "epoch": 16.656184486373167, "percentage": 83.28, "elapsed_time": "1:21:25", "remaining_time": "0:16:20", "throughput": 4249.79, "total_tokens": 20760792} {"current_steps": 31785, "total_steps": 38160, "loss": 0.4232, "lr": 8.265866907524427e-05, "epoch": 16.65880503144654, "percentage": 83.29, "elapsed_time": "1:21:25", "remaining_time": "0:16:19", "throughput": 4249.83, "total_tokens": 20764120} {"current_steps": 31790, "total_steps": 38160, "loss": 0.4013, "lr": 8.253276838205892e-05, "epoch": 16.661425576519918, "percentage": 83.31, "elapsed_time": "1:21:26", "remaining_time": "0:16:19", "throughput": 4249.87, "total_tokens": 20767384} {"current_steps": 31795, "total_steps": 38160, "loss": 0.4163, "lr": 8.240695501825568e-05, "epoch": 16.66404612159329, "percentage": 83.32, "elapsed_time": "1:21:27", "remaining_time": "0:16:18", "throughput": 4249.9, "total_tokens": 20770680} {"current_steps": 31800, "total_steps": 38160, "loss": 0.4215, "lr": 8.228122901015345e-05, "epoch": 16.666666666666668, "percentage": 83.33, "elapsed_time": "1:21:27", "remaining_time": "0:16:17", "throughput": 4249.85, "total_tokens": 20773080} {"current_steps": 31805, "total_steps": 38160, "loss": 0.4451, "lr": 8.21555903840524e-05, "epoch": 16.66928721174004, "percentage": 83.35, "elapsed_time": "1:21:28", "remaining_time": "0:16:16", "throughput": 4249.79, "total_tokens": 20775416} {"current_steps": 31810, "total_steps": 38160, "loss": 0.4002, "lr": 8.203003916623491e-05, "epoch": 16.671907756813418, "percentage": 83.36, "elapsed_time": "1:21:29", "remaining_time": "0:16:16", "throughput": 4249.83, "total_tokens": 20778840} {"current_steps": 31815, "total_steps": 38160, "loss": 0.4921, "lr": 8.190457538296464e-05, "epoch": 16.67452830188679, "percentage": 83.37, "elapsed_time": "1:21:29", "remaining_time": "0:16:15", "throughput": 4249.82, "total_tokens": 20781592} {"current_steps": 31820, "total_steps": 38160, "loss": 0.4129, "lr": 8.177919906048736e-05, "epoch": 16.67714884696017, "percentage": 83.39, "elapsed_time": "1:21:30", "remaining_time": "0:16:14", "throughput": 4249.86, "total_tokens": 20784856} {"current_steps": 31825, "total_steps": 38160, "loss": 0.3617, "lr": 8.165391022503044e-05, "epoch": 16.679769392033542, "percentage": 83.4, "elapsed_time": "1:21:31", "remaining_time": "0:16:13", "throughput": 4249.81, "total_tokens": 20787352} {"current_steps": 31830, "total_steps": 38160, "loss": 0.4109, "lr": 8.152870890280261e-05, "epoch": 16.68238993710692, "percentage": 83.41, "elapsed_time": "1:21:32", "remaining_time": "0:16:12", "throughput": 4249.91, "total_tokens": 20791416} {"current_steps": 31835, "total_steps": 38160, "loss": 0.3537, "lr": 8.140359511999473e-05, "epoch": 16.685010482180292, "percentage": 83.43, "elapsed_time": "1:21:32", "remaining_time": "0:16:12", "throughput": 4249.89, "total_tokens": 20794200} {"current_steps": 31840, "total_steps": 38160, "loss": 0.4487, "lr": 8.127856890277923e-05, "epoch": 16.68763102725367, "percentage": 83.44, "elapsed_time": "1:21:33", "remaining_time": "0:16:11", "throughput": 4249.95, "total_tokens": 20797720} {"current_steps": 31845, "total_steps": 38160, "loss": 0.4298, "lr": 8.115363027730998e-05, "epoch": 16.690251572327043, "percentage": 83.45, "elapsed_time": "1:21:34", "remaining_time": "0:16:10", "throughput": 4250.06, "total_tokens": 20801784} {"current_steps": 31850, "total_steps": 38160, "loss": 0.474, "lr": 8.102877926972286e-05, "epoch": 16.69287211740042, "percentage": 83.46, "elapsed_time": "1:21:35", "remaining_time": "0:16:09", "throughput": 4250.08, "total_tokens": 20804984} {"current_steps": 31855, "total_steps": 38160, "loss": 0.3478, "lr": 8.090401590613533e-05, "epoch": 16.695492662473793, "percentage": 83.48, "elapsed_time": "1:21:35", "remaining_time": "0:16:09", "throughput": 4250.12, "total_tokens": 20808280} {"current_steps": 31860, "total_steps": 38160, "loss": 0.3834, "lr": 8.077934021264627e-05, "epoch": 16.69811320754717, "percentage": 83.49, "elapsed_time": "1:21:36", "remaining_time": "0:16:08", "throughput": 4250.06, "total_tokens": 20810584} {"current_steps": 31865, "total_steps": 38160, "loss": 0.3618, "lr": 8.065475221533652e-05, "epoch": 16.700733752620543, "percentage": 83.5, "elapsed_time": "1:21:37", "remaining_time": "0:16:07", "throughput": 4250.07, "total_tokens": 20813624} {"current_steps": 31870, "total_steps": 38160, "loss": 0.5304, "lr": 8.053025194026858e-05, "epoch": 16.70335429769392, "percentage": 83.52, "elapsed_time": "1:21:37", "remaining_time": "0:16:06", "throughput": 4250.07, "total_tokens": 20816504} {"current_steps": 31875, "total_steps": 38160, "loss": 0.3997, "lr": 8.040583941348623e-05, "epoch": 16.705974842767297, "percentage": 83.53, "elapsed_time": "1:21:38", "remaining_time": "0:16:05", "throughput": 4250.2, "total_tokens": 20820952} {"current_steps": 31880, "total_steps": 38160, "loss": 0.3818, "lr": 8.028151466101541e-05, "epoch": 16.70859538784067, "percentage": 83.54, "elapsed_time": "1:21:39", "remaining_time": "0:16:05", "throughput": 4250.33, "total_tokens": 20825240} {"current_steps": 31885, "total_steps": 38160, "loss": 0.4828, "lr": 8.015727770886321e-05, "epoch": 16.711215932914047, "percentage": 83.56, "elapsed_time": "1:21:40", "remaining_time": "0:16:04", "throughput": 4250.38, "total_tokens": 20828856} {"current_steps": 31890, "total_steps": 38160, "loss": 0.3867, "lr": 8.00331285830187e-05, "epoch": 16.71383647798742, "percentage": 83.57, "elapsed_time": "1:21:41", "remaining_time": "0:16:03", "throughput": 4250.39, "total_tokens": 20831928} {"current_steps": 31895, "total_steps": 38160, "loss": 0.4806, "lr": 7.990906730945247e-05, "epoch": 16.716457023060798, "percentage": 83.58, "elapsed_time": "1:21:42", "remaining_time": "0:16:02", "throughput": 4250.51, "total_tokens": 20836184} {"current_steps": 31900, "total_steps": 38160, "loss": 0.48, "lr": 7.978509391411681e-05, "epoch": 16.71907756813417, "percentage": 83.6, "elapsed_time": "1:21:42", "remaining_time": "0:16:02", "throughput": 4250.56, "total_tokens": 20839544} {"current_steps": 31905, "total_steps": 38160, "loss": 0.3382, "lr": 7.966120842294544e-05, "epoch": 16.721698113207548, "percentage": 83.61, "elapsed_time": "1:21:43", "remaining_time": "0:16:01", "throughput": 4250.55, "total_tokens": 20842360} {"current_steps": 31910, "total_steps": 38160, "loss": 0.5303, "lr": 7.953741086185368e-05, "epoch": 16.72431865828092, "percentage": 83.62, "elapsed_time": "1:21:44", "remaining_time": "0:16:00", "throughput": 4250.63, "total_tokens": 20846040} {"current_steps": 31915, "total_steps": 38160, "loss": 0.3578, "lr": 7.941370125673864e-05, "epoch": 16.7269392033543, "percentage": 83.63, "elapsed_time": "1:21:44", "remaining_time": "0:15:59", "throughput": 4250.63, "total_tokens": 20848952} {"current_steps": 31920, "total_steps": 38160, "loss": 0.4083, "lr": 7.9290079633479e-05, "epoch": 16.729559748427672, "percentage": 83.65, "elapsed_time": "1:21:45", "remaining_time": "0:15:58", "throughput": 4250.67, "total_tokens": 20852184} {"current_steps": 31925, "total_steps": 38160, "loss": 0.3335, "lr": 7.916654601793516e-05, "epoch": 16.73218029350105, "percentage": 83.66, "elapsed_time": "1:21:46", "remaining_time": "0:15:58", "throughput": 4250.68, "total_tokens": 20855224} {"current_steps": 31930, "total_steps": 38160, "loss": 0.4006, "lr": 7.904310043594859e-05, "epoch": 16.734800838574422, "percentage": 83.67, "elapsed_time": "1:21:47", "remaining_time": "0:15:57", "throughput": 4250.74, "total_tokens": 20858808} {"current_steps": 31935, "total_steps": 38160, "loss": 0.37, "lr": 7.891974291334303e-05, "epoch": 16.7374213836478, "percentage": 83.69, "elapsed_time": "1:21:47", "remaining_time": "0:15:56", "throughput": 4250.75, "total_tokens": 20861784} {"current_steps": 31940, "total_steps": 38160, "loss": 0.3517, "lr": 7.879647347592322e-05, "epoch": 16.740041928721173, "percentage": 83.7, "elapsed_time": "1:21:48", "remaining_time": "0:15:55", "throughput": 4250.76, "total_tokens": 20864888} {"current_steps": 31945, "total_steps": 38160, "loss": 0.3183, "lr": 7.867329214947578e-05, "epoch": 16.74266247379455, "percentage": 83.71, "elapsed_time": "1:21:49", "remaining_time": "0:15:55", "throughput": 4250.76, "total_tokens": 20867768} {"current_steps": 31950, "total_steps": 38160, "loss": 0.4716, "lr": 7.855019895976889e-05, "epoch": 16.745283018867923, "percentage": 83.73, "elapsed_time": "1:21:49", "remaining_time": "0:15:54", "throughput": 4250.8, "total_tokens": 20871096} {"current_steps": 31955, "total_steps": 38160, "loss": 0.5398, "lr": 7.842719393255232e-05, "epoch": 16.7479035639413, "percentage": 83.74, "elapsed_time": "1:21:50", "remaining_time": "0:15:53", "throughput": 4250.85, "total_tokens": 20874424} {"current_steps": 31960, "total_steps": 38160, "loss": 0.4571, "lr": 7.830427709355725e-05, "epoch": 16.750524109014677, "percentage": 83.75, "elapsed_time": "1:21:51", "remaining_time": "0:15:52", "throughput": 4250.87, "total_tokens": 20877496} {"current_steps": 31965, "total_steps": 38160, "loss": 0.56, "lr": 7.818144846849634e-05, "epoch": 16.75314465408805, "percentage": 83.77, "elapsed_time": "1:21:52", "remaining_time": "0:15:51", "throughput": 4250.84, "total_tokens": 20880120} {"current_steps": 31970, "total_steps": 38160, "loss": 0.3455, "lr": 7.805870808306403e-05, "epoch": 16.755765199161427, "percentage": 83.78, "elapsed_time": "1:21:52", "remaining_time": "0:15:51", "throughput": 4250.83, "total_tokens": 20883128} {"current_steps": 31975, "total_steps": 38160, "loss": 0.3929, "lr": 7.793605596293618e-05, "epoch": 16.7583857442348, "percentage": 83.79, "elapsed_time": "1:21:53", "remaining_time": "0:15:50", "throughput": 4250.81, "total_tokens": 20885816} {"current_steps": 31980, "total_steps": 38160, "loss": 0.4653, "lr": 7.781349213377048e-05, "epoch": 16.761006289308177, "percentage": 83.81, "elapsed_time": "1:21:54", "remaining_time": "0:15:49", "throughput": 4250.84, "total_tokens": 20889016} {"current_steps": 31985, "total_steps": 38160, "loss": 0.4925, "lr": 7.769101662120559e-05, "epoch": 16.76362683438155, "percentage": 83.82, "elapsed_time": "1:21:54", "remaining_time": "0:15:48", "throughput": 4250.83, "total_tokens": 20891832} {"current_steps": 31990, "total_steps": 38160, "loss": 0.4105, "lr": 7.756862945086196e-05, "epoch": 16.766247379454928, "percentage": 83.83, "elapsed_time": "1:21:55", "remaining_time": "0:15:48", "throughput": 4250.87, "total_tokens": 20895128} {"current_steps": 31995, "total_steps": 38160, "loss": 0.6022, "lr": 7.744633064834172e-05, "epoch": 16.7688679245283, "percentage": 83.84, "elapsed_time": "1:21:56", "remaining_time": "0:15:47", "throughput": 4250.87, "total_tokens": 20897944} {"current_steps": 32000, "total_steps": 38160, "loss": 0.5209, "lr": 7.732412023922836e-05, "epoch": 16.771488469601678, "percentage": 83.86, "elapsed_time": "1:21:56", "remaining_time": "0:15:46", "throughput": 4250.88, "total_tokens": 20901112} {"current_steps": 32005, "total_steps": 38160, "loss": 0.4826, "lr": 7.720199824908692e-05, "epoch": 16.77410901467505, "percentage": 83.87, "elapsed_time": "1:21:57", "remaining_time": "0:15:45", "throughput": 4250.94, "total_tokens": 20904568} {"current_steps": 32010, "total_steps": 38160, "loss": 0.3572, "lr": 7.707996470346402e-05, "epoch": 16.77672955974843, "percentage": 83.88, "elapsed_time": "1:21:58", "remaining_time": "0:15:44", "throughput": 4251.01, "total_tokens": 20908184} {"current_steps": 32015, "total_steps": 38160, "loss": 0.4328, "lr": 7.695801962788756e-05, "epoch": 16.779350104821802, "percentage": 83.9, "elapsed_time": "1:21:59", "remaining_time": "0:15:44", "throughput": 4251.09, "total_tokens": 20911800} {"current_steps": 32020, "total_steps": 38160, "loss": 0.4367, "lr": 7.683616304786695e-05, "epoch": 16.78197064989518, "percentage": 83.91, "elapsed_time": "1:21:59", "remaining_time": "0:15:43", "throughput": 4251.02, "total_tokens": 20914040} {"current_steps": 32025, "total_steps": 38160, "loss": 0.4669, "lr": 7.671439498889332e-05, "epoch": 16.784591194968552, "percentage": 83.92, "elapsed_time": "1:22:00", "remaining_time": "0:15:42", "throughput": 4251.06, "total_tokens": 20917304} {"current_steps": 32030, "total_steps": 38160, "loss": 0.4741, "lr": 7.65927154764392e-05, "epoch": 16.78721174004193, "percentage": 83.94, "elapsed_time": "1:22:01", "remaining_time": "0:15:41", "throughput": 4251.07, "total_tokens": 20920344} {"current_steps": 32035, "total_steps": 38160, "loss": 0.4764, "lr": 7.647112453595862e-05, "epoch": 16.789832285115303, "percentage": 83.95, "elapsed_time": "1:22:01", "remaining_time": "0:15:41", "throughput": 4251.13, "total_tokens": 20923928} {"current_steps": 32040, "total_steps": 38160, "loss": 0.3448, "lr": 7.634962219288688e-05, "epoch": 16.79245283018868, "percentage": 83.96, "elapsed_time": "1:22:02", "remaining_time": "0:15:40", "throughput": 4251.1, "total_tokens": 20926584} {"current_steps": 32045, "total_steps": 38160, "loss": 0.4241, "lr": 7.622820847264083e-05, "epoch": 16.795073375262053, "percentage": 83.98, "elapsed_time": "1:22:03", "remaining_time": "0:15:39", "throughput": 4251.11, "total_tokens": 20929656} {"current_steps": 32050, "total_steps": 38160, "loss": 0.4474, "lr": 7.610688340061894e-05, "epoch": 16.79769392033543, "percentage": 83.99, "elapsed_time": "1:22:03", "remaining_time": "0:15:38", "throughput": 4251.09, "total_tokens": 20932344} {"current_steps": 32055, "total_steps": 38160, "loss": 0.4648, "lr": 7.598564700220101e-05, "epoch": 16.800314465408803, "percentage": 84.0, "elapsed_time": "1:22:04", "remaining_time": "0:15:37", "throughput": 4251.14, "total_tokens": 20935864} {"current_steps": 32060, "total_steps": 38160, "loss": 0.5036, "lr": 7.586449930274842e-05, "epoch": 16.80293501048218, "percentage": 84.01, "elapsed_time": "1:22:05", "remaining_time": "0:15:37", "throughput": 4251.16, "total_tokens": 20938936} {"current_steps": 32065, "total_steps": 38160, "loss": 0.4837, "lr": 7.574344032760367e-05, "epoch": 16.805555555555557, "percentage": 84.03, "elapsed_time": "1:22:06", "remaining_time": "0:15:36", "throughput": 4251.22, "total_tokens": 20942520} {"current_steps": 32070, "total_steps": 38160, "loss": 0.3562, "lr": 7.562247010209111e-05, "epoch": 16.80817610062893, "percentage": 84.04, "elapsed_time": "1:22:06", "remaining_time": "0:15:35", "throughput": 4251.2, "total_tokens": 20945208} {"current_steps": 32075, "total_steps": 38160, "loss": 0.4229, "lr": 7.550158865151618e-05, "epoch": 16.810796645702307, "percentage": 84.05, "elapsed_time": "1:22:07", "remaining_time": "0:15:34", "throughput": 4251.2, "total_tokens": 20948344} {"current_steps": 32080, "total_steps": 38160, "loss": 0.3563, "lr": 7.538079600116593e-05, "epoch": 16.81341719077568, "percentage": 84.07, "elapsed_time": "1:22:08", "remaining_time": "0:15:34", "throughput": 4251.21, "total_tokens": 20951352} {"current_steps": 32085, "total_steps": 38160, "loss": 0.62, "lr": 7.526009217630886e-05, "epoch": 16.816037735849058, "percentage": 84.08, "elapsed_time": "1:22:08", "remaining_time": "0:15:33", "throughput": 4251.17, "total_tokens": 20953848} {"current_steps": 32090, "total_steps": 38160, "loss": 0.445, "lr": 7.513947720219494e-05, "epoch": 16.81865828092243, "percentage": 84.09, "elapsed_time": "1:22:09", "remaining_time": "0:15:32", "throughput": 4251.2, "total_tokens": 20957080} {"current_steps": 32095, "total_steps": 38160, "loss": 0.4476, "lr": 7.501895110405533e-05, "epoch": 16.821278825995808, "percentage": 84.11, "elapsed_time": "1:22:10", "remaining_time": "0:15:31", "throughput": 4251.32, "total_tokens": 20961336} {"current_steps": 32100, "total_steps": 38160, "loss": 0.4258, "lr": 7.489851390710262e-05, "epoch": 16.82389937106918, "percentage": 84.12, "elapsed_time": "1:22:11", "remaining_time": "0:15:30", "throughput": 4251.28, "total_tokens": 20963864} {"current_steps": 32105, "total_steps": 38160, "loss": 0.3794, "lr": 7.477816563653095e-05, "epoch": 16.82651991614256, "percentage": 84.13, "elapsed_time": "1:22:11", "remaining_time": "0:15:30", "throughput": 4251.28, "total_tokens": 20966872} {"current_steps": 32110, "total_steps": 38160, "loss": 0.425, "lr": 7.465790631751584e-05, "epoch": 16.829140461215932, "percentage": 84.15, "elapsed_time": "1:22:12", "remaining_time": "0:15:29", "throughput": 4251.25, "total_tokens": 20969432} {"current_steps": 32115, "total_steps": 38160, "loss": 0.3885, "lr": 7.453773597521429e-05, "epoch": 16.83176100628931, "percentage": 84.16, "elapsed_time": "1:22:13", "remaining_time": "0:15:28", "throughput": 4251.25, "total_tokens": 20972312} {"current_steps": 32120, "total_steps": 38160, "loss": 0.3594, "lr": 7.44176546347643e-05, "epoch": 16.834381551362682, "percentage": 84.17, "elapsed_time": "1:22:14", "remaining_time": "0:15:27", "throughput": 4251.35, "total_tokens": 20976344} {"current_steps": 32125, "total_steps": 38160, "loss": 0.4198, "lr": 7.429766232128583e-05, "epoch": 16.83700209643606, "percentage": 84.19, "elapsed_time": "1:22:14", "remaining_time": "0:15:27", "throughput": 4251.47, "total_tokens": 20980408} {"current_steps": 32130, "total_steps": 38160, "loss": 0.3435, "lr": 7.417775905987956e-05, "epoch": 16.839622641509433, "percentage": 84.2, "elapsed_time": "1:22:15", "remaining_time": "0:15:26", "throughput": 4251.51, "total_tokens": 20983928} {"current_steps": 32135, "total_steps": 38160, "loss": 0.3455, "lr": 7.405794487562811e-05, "epoch": 16.84224318658281, "percentage": 84.21, "elapsed_time": "1:22:16", "remaining_time": "0:15:25", "throughput": 4251.52, "total_tokens": 20986936} {"current_steps": 32140, "total_steps": 38160, "loss": 0.3627, "lr": 7.393821979359528e-05, "epoch": 16.844863731656183, "percentage": 84.22, "elapsed_time": "1:22:17", "remaining_time": "0:15:24", "throughput": 4251.56, "total_tokens": 20990200} {"current_steps": 32145, "total_steps": 38160, "loss": 0.402, "lr": 7.3818583838826e-05, "epoch": 16.84748427672956, "percentage": 84.24, "elapsed_time": "1:22:17", "remaining_time": "0:15:23", "throughput": 4251.59, "total_tokens": 20993368} {"current_steps": 32150, "total_steps": 38160, "loss": 0.4436, "lr": 7.369903703634684e-05, "epoch": 16.850104821802937, "percentage": 84.25, "elapsed_time": "1:22:18", "remaining_time": "0:15:23", "throughput": 4251.65, "total_tokens": 20996888} {"current_steps": 32155, "total_steps": 38160, "loss": 0.4398, "lr": 7.357957941116572e-05, "epoch": 16.85272536687631, "percentage": 84.26, "elapsed_time": "1:22:19", "remaining_time": "0:15:22", "throughput": 4251.69, "total_tokens": 21000152} {"current_steps": 32160, "total_steps": 38160, "loss": 0.496, "lr": 7.346021098827166e-05, "epoch": 16.855345911949687, "percentage": 84.28, "elapsed_time": "1:22:20", "remaining_time": "0:15:21", "throughput": 4251.79, "total_tokens": 21004056} {"current_steps": 32165, "total_steps": 38160, "loss": 0.359, "lr": 7.334093179263518e-05, "epoch": 16.85796645702306, "percentage": 84.29, "elapsed_time": "1:22:20", "remaining_time": "0:15:20", "throughput": 4251.77, "total_tokens": 21006680} {"current_steps": 32170, "total_steps": 38160, "loss": 0.493, "lr": 7.322174184920837e-05, "epoch": 16.860587002096437, "percentage": 84.3, "elapsed_time": "1:22:21", "remaining_time": "0:15:20", "throughput": 4251.81, "total_tokens": 21010104} {"current_steps": 32175, "total_steps": 38160, "loss": 0.4922, "lr": 7.310264118292404e-05, "epoch": 16.86320754716981, "percentage": 84.32, "elapsed_time": "1:22:22", "remaining_time": "0:15:19", "throughput": 4251.92, "total_tokens": 21014072} {"current_steps": 32180, "total_steps": 38160, "loss": 0.3868, "lr": 7.298362981869705e-05, "epoch": 16.865828092243188, "percentage": 84.33, "elapsed_time": "1:22:23", "remaining_time": "0:15:18", "throughput": 4251.97, "total_tokens": 21017496} {"current_steps": 32185, "total_steps": 38160, "loss": 0.3216, "lr": 7.286470778142284e-05, "epoch": 16.86844863731656, "percentage": 84.34, "elapsed_time": "1:22:23", "remaining_time": "0:15:17", "throughput": 4251.98, "total_tokens": 21020472} {"current_steps": 32190, "total_steps": 38160, "loss": 0.3835, "lr": 7.274587509597886e-05, "epoch": 16.871069182389938, "percentage": 84.36, "elapsed_time": "1:22:24", "remaining_time": "0:15:17", "throughput": 4252.03, "total_tokens": 21023896} {"current_steps": 32195, "total_steps": 38160, "loss": 0.5965, "lr": 7.262713178722346e-05, "epoch": 16.87368972746331, "percentage": 84.37, "elapsed_time": "1:22:25", "remaining_time": "0:15:16", "throughput": 4252.04, "total_tokens": 21026904} {"current_steps": 32200, "total_steps": 38160, "loss": 0.3872, "lr": 7.250847787999625e-05, "epoch": 16.87631027253669, "percentage": 84.38, "elapsed_time": "1:22:25", "remaining_time": "0:15:15", "throughput": 4252.06, "total_tokens": 21029944} {"current_steps": 32205, "total_steps": 38160, "loss": 0.3471, "lr": 7.238991339911844e-05, "epoch": 16.878930817610062, "percentage": 84.39, "elapsed_time": "1:22:26", "remaining_time": "0:15:14", "throughput": 4252.02, "total_tokens": 21032504} {"current_steps": 32210, "total_steps": 38160, "loss": 0.5438, "lr": 7.227143836939237e-05, "epoch": 16.88155136268344, "percentage": 84.41, "elapsed_time": "1:22:27", "remaining_time": "0:15:13", "throughput": 4252.12, "total_tokens": 21036600} {"current_steps": 32215, "total_steps": 38160, "loss": 0.4454, "lr": 7.215305281560153e-05, "epoch": 16.884171907756812, "percentage": 84.42, "elapsed_time": "1:22:28", "remaining_time": "0:15:13", "throughput": 4252.14, "total_tokens": 21039768} {"current_steps": 32220, "total_steps": 38160, "loss": 0.404, "lr": 7.203475676251104e-05, "epoch": 16.88679245283019, "percentage": 84.43, "elapsed_time": "1:22:28", "remaining_time": "0:15:12", "throughput": 4252.19, "total_tokens": 21043256} {"current_steps": 32225, "total_steps": 38160, "loss": 0.4595, "lr": 7.191655023486682e-05, "epoch": 16.889412997903563, "percentage": 84.45, "elapsed_time": "1:22:29", "remaining_time": "0:15:11", "throughput": 4252.18, "total_tokens": 21046072} {"current_steps": 32230, "total_steps": 38160, "loss": 0.3845, "lr": 7.179843325739644e-05, "epoch": 16.89203354297694, "percentage": 84.46, "elapsed_time": "1:22:30", "remaining_time": "0:15:10", "throughput": 4252.32, "total_tokens": 21050424} {"current_steps": 32235, "total_steps": 38160, "loss": 0.4653, "lr": 7.168040585480861e-05, "epoch": 16.894654088050313, "percentage": 84.47, "elapsed_time": "1:22:30", "remaining_time": "0:15:10", "throughput": 4252.3, "total_tokens": 21053144} {"current_steps": 32240, "total_steps": 38160, "loss": 0.4821, "lr": 7.156246805179351e-05, "epoch": 16.89727463312369, "percentage": 84.49, "elapsed_time": "1:22:31", "remaining_time": "0:15:09", "throughput": 4252.38, "total_tokens": 21056856} {"current_steps": 32245, "total_steps": 38160, "loss": 0.4395, "lr": 7.144461987302208e-05, "epoch": 16.899895178197063, "percentage": 84.5, "elapsed_time": "1:22:32", "remaining_time": "0:15:08", "throughput": 4252.47, "total_tokens": 21060792} {"current_steps": 32250, "total_steps": 38160, "loss": 0.5068, "lr": 7.132686134314714e-05, "epoch": 16.90251572327044, "percentage": 84.51, "elapsed_time": "1:22:33", "remaining_time": "0:15:07", "throughput": 4252.47, "total_tokens": 21063768} {"current_steps": 32255, "total_steps": 38160, "loss": 0.3546, "lr": 7.120919248680208e-05, "epoch": 16.905136268343817, "percentage": 84.53, "elapsed_time": "1:22:33", "remaining_time": "0:15:06", "throughput": 4252.46, "total_tokens": 21066680} {"current_steps": 32260, "total_steps": 38160, "loss": 0.4782, "lr": 7.109161332860203e-05, "epoch": 16.90775681341719, "percentage": 84.54, "elapsed_time": "1:22:34", "remaining_time": "0:15:06", "throughput": 4252.58, "total_tokens": 21070968} {"current_steps": 32265, "total_steps": 38160, "loss": 0.4562, "lr": 7.097412389314322e-05, "epoch": 16.910377358490567, "percentage": 84.55, "elapsed_time": "1:22:35", "remaining_time": "0:15:05", "throughput": 4252.7, "total_tokens": 21075032} {"current_steps": 32270, "total_steps": 38160, "loss": 0.3584, "lr": 7.085672420500322e-05, "epoch": 16.91299790356394, "percentage": 84.56, "elapsed_time": "1:22:36", "remaining_time": "0:15:04", "throughput": 4252.77, "total_tokens": 21078712} {"current_steps": 32275, "total_steps": 38160, "loss": 0.4509, "lr": 7.073941428874064e-05, "epoch": 16.915618448637318, "percentage": 84.58, "elapsed_time": "1:22:37", "remaining_time": "0:15:03", "throughput": 4252.82, "total_tokens": 21082168} {"current_steps": 32280, "total_steps": 38160, "loss": 0.2289, "lr": 7.062219416889514e-05, "epoch": 16.91823899371069, "percentage": 84.59, "elapsed_time": "1:22:37", "remaining_time": "0:15:03", "throughput": 4252.84, "total_tokens": 21085304} {"current_steps": 32285, "total_steps": 38160, "loss": 0.4246, "lr": 7.050506386998806e-05, "epoch": 16.920859538784068, "percentage": 84.6, "elapsed_time": "1:22:38", "remaining_time": "0:15:02", "throughput": 4252.93, "total_tokens": 21089144} {"current_steps": 32290, "total_steps": 38160, "loss": 0.3959, "lr": 7.038802341652172e-05, "epoch": 16.92348008385744, "percentage": 84.62, "elapsed_time": "1:22:39", "remaining_time": "0:15:01", "throughput": 4252.97, "total_tokens": 21092504} {"current_steps": 32295, "total_steps": 38160, "loss": 0.4194, "lr": 7.027107283297967e-05, "epoch": 16.92610062893082, "percentage": 84.63, "elapsed_time": "1:22:40", "remaining_time": "0:15:00", "throughput": 4252.97, "total_tokens": 21095352} {"current_steps": 32300, "total_steps": 38160, "loss": 0.4128, "lr": 7.015421214382661e-05, "epoch": 16.928721174004192, "percentage": 84.64, "elapsed_time": "1:22:40", "remaining_time": "0:15:00", "throughput": 4252.95, "total_tokens": 21098104} {"current_steps": 32305, "total_steps": 38160, "loss": 0.2813, "lr": 7.003744137350827e-05, "epoch": 16.93134171907757, "percentage": 84.66, "elapsed_time": "1:22:41", "remaining_time": "0:14:59", "throughput": 4252.92, "total_tokens": 21100696} {"current_steps": 32310, "total_steps": 38160, "loss": 0.4066, "lr": 6.992076054645197e-05, "epoch": 16.933962264150942, "percentage": 84.67, "elapsed_time": "1:22:42", "remaining_time": "0:14:58", "throughput": 4252.93, "total_tokens": 21103736} {"current_steps": 32315, "total_steps": 38160, "loss": 0.3705, "lr": 6.980416968706594e-05, "epoch": 16.93658280922432, "percentage": 84.68, "elapsed_time": "1:22:42", "remaining_time": "0:14:57", "throughput": 4253.01, "total_tokens": 21107384} {"current_steps": 32320, "total_steps": 38160, "loss": 0.5959, "lr": 6.968766881973965e-05, "epoch": 16.939203354297693, "percentage": 84.7, "elapsed_time": "1:22:43", "remaining_time": "0:14:56", "throughput": 4253.08, "total_tokens": 21111096} {"current_steps": 32325, "total_steps": 38160, "loss": 0.4616, "lr": 6.957125796884395e-05, "epoch": 16.94182389937107, "percentage": 84.71, "elapsed_time": "1:22:44", "remaining_time": "0:14:56", "throughput": 4253.15, "total_tokens": 21114808} {"current_steps": 32330, "total_steps": 38160, "loss": 0.3746, "lr": 6.945493715873046e-05, "epoch": 16.944444444444443, "percentage": 84.72, "elapsed_time": "1:22:45", "remaining_time": "0:14:55", "throughput": 4253.13, "total_tokens": 21117560} {"current_steps": 32335, "total_steps": 38160, "loss": 0.2995, "lr": 6.933870641373208e-05, "epoch": 16.94706498951782, "percentage": 84.74, "elapsed_time": "1:22:45", "remaining_time": "0:14:54", "throughput": 4253.12, "total_tokens": 21120472} {"current_steps": 32340, "total_steps": 38160, "loss": 0.3987, "lr": 6.92225657581631e-05, "epoch": 16.949685534591197, "percentage": 84.75, "elapsed_time": "1:22:46", "remaining_time": "0:14:53", "throughput": 4253.07, "total_tokens": 21122840} {"current_steps": 32345, "total_steps": 38160, "loss": 0.5876, "lr": 6.910651521631877e-05, "epoch": 16.95230607966457, "percentage": 84.76, "elapsed_time": "1:22:47", "remaining_time": "0:14:53", "throughput": 4253.13, "total_tokens": 21126392} {"current_steps": 32350, "total_steps": 38160, "loss": 0.3724, "lr": 6.899055481247568e-05, "epoch": 16.954926624737947, "percentage": 84.77, "elapsed_time": "1:22:47", "remaining_time": "0:14:52", "throughput": 4253.14, "total_tokens": 21129336} {"current_steps": 32355, "total_steps": 38160, "loss": 0.3611, "lr": 6.88746845708913e-05, "epoch": 16.95754716981132, "percentage": 84.79, "elapsed_time": "1:22:48", "remaining_time": "0:14:51", "throughput": 4253.24, "total_tokens": 21133560} {"current_steps": 32360, "total_steps": 38160, "loss": 0.4078, "lr": 6.87589045158043e-05, "epoch": 16.960167714884697, "percentage": 84.8, "elapsed_time": "1:22:49", "remaining_time": "0:14:50", "throughput": 4253.24, "total_tokens": 21136408} {"current_steps": 32365, "total_steps": 38160, "loss": 0.4403, "lr": 6.864321467143459e-05, "epoch": 16.96278825995807, "percentage": 84.81, "elapsed_time": "1:22:50", "remaining_time": "0:14:49", "throughput": 4253.23, "total_tokens": 21139224} {"current_steps": 32370, "total_steps": 38160, "loss": 0.3988, "lr": 6.852761506198319e-05, "epoch": 16.965408805031448, "percentage": 84.83, "elapsed_time": "1:22:50", "remaining_time": "0:14:49", "throughput": 4253.2, "total_tokens": 21141848} {"current_steps": 32375, "total_steps": 38160, "loss": 0.3553, "lr": 6.841210571163231e-05, "epoch": 16.96802935010482, "percentage": 84.84, "elapsed_time": "1:22:51", "remaining_time": "0:14:48", "throughput": 4253.32, "total_tokens": 21146104} {"current_steps": 32380, "total_steps": 38160, "loss": 0.4669, "lr": 6.829668664454513e-05, "epoch": 16.970649895178198, "percentage": 84.85, "elapsed_time": "1:22:52", "remaining_time": "0:14:47", "throughput": 4253.4, "total_tokens": 21149816} {"current_steps": 32385, "total_steps": 38160, "loss": 0.3513, "lr": 6.818135788486584e-05, "epoch": 16.97327044025157, "percentage": 84.87, "elapsed_time": "1:22:53", "remaining_time": "0:14:46", "throughput": 4253.4, "total_tokens": 21152824} {"current_steps": 32390, "total_steps": 38160, "loss": 0.4401, "lr": 6.806611945672004e-05, "epoch": 16.97589098532495, "percentage": 84.88, "elapsed_time": "1:22:53", "remaining_time": "0:14:46", "throughput": 4253.47, "total_tokens": 21156472} {"current_steps": 32395, "total_steps": 38160, "loss": 0.4386, "lr": 6.79509713842143e-05, "epoch": 16.978511530398322, "percentage": 84.89, "elapsed_time": "1:22:54", "remaining_time": "0:14:45", "throughput": 4253.52, "total_tokens": 21159864} {"current_steps": 32400, "total_steps": 38160, "loss": 0.3775, "lr": 6.783591369143626e-05, "epoch": 16.9811320754717, "percentage": 84.91, "elapsed_time": "1:22:55", "remaining_time": "0:14:44", "throughput": 4253.47, "total_tokens": 21162264} {"current_steps": 32405, "total_steps": 38160, "loss": 0.4126, "lr": 6.77209464024548e-05, "epoch": 16.983752620545072, "percentage": 84.92, "elapsed_time": "1:22:56", "remaining_time": "0:14:43", "throughput": 4253.52, "total_tokens": 21165816} {"current_steps": 32410, "total_steps": 38160, "loss": 0.4874, "lr": 6.760606954131965e-05, "epoch": 16.98637316561845, "percentage": 84.93, "elapsed_time": "1:22:56", "remaining_time": "0:14:42", "throughput": 4253.51, "total_tokens": 21168536} {"current_steps": 32415, "total_steps": 38160, "loss": 0.4959, "lr": 6.749128313206165e-05, "epoch": 16.988993710691823, "percentage": 84.94, "elapsed_time": "1:22:57", "remaining_time": "0:14:42", "throughput": 4253.51, "total_tokens": 21171448} {"current_steps": 32420, "total_steps": 38160, "loss": 0.4046, "lr": 6.737658719869288e-05, "epoch": 16.9916142557652, "percentage": 84.96, "elapsed_time": "1:22:58", "remaining_time": "0:14:41", "throughput": 4253.53, "total_tokens": 21174552} {"current_steps": 32425, "total_steps": 38160, "loss": 0.3938, "lr": 6.726198176520642e-05, "epoch": 16.994234800838573, "percentage": 84.97, "elapsed_time": "1:22:58", "remaining_time": "0:14:40", "throughput": 4253.55, "total_tokens": 21177688} {"current_steps": 32430, "total_steps": 38160, "loss": 0.6919, "lr": 6.71474668555766e-05, "epoch": 16.99685534591195, "percentage": 84.98, "elapsed_time": "1:22:59", "remaining_time": "0:14:39", "throughput": 4253.59, "total_tokens": 21181112} {"current_steps": 32435, "total_steps": 38160, "loss": 0.3716, "lr": 6.703304249375836e-05, "epoch": 16.999475890985323, "percentage": 85.0, "elapsed_time": "1:23:00", "remaining_time": "0:14:39", "throughput": 4253.67, "total_tokens": 21184856} {"current_steps": 32436, "total_steps": 38160, "eval_loss": 0.4925762712955475, "epoch": 17.0, "percentage": 85.0, "elapsed_time": "1:23:14", "remaining_time": "0:14:41", "throughput": 4241.66, "total_tokens": 21184936} {"current_steps": 32440, "total_steps": 38160, "loss": 0.4272, "lr": 6.691870870368815e-05, "epoch": 17.0020964360587, "percentage": 85.01, "elapsed_time": "1:23:17", "remaining_time": "0:14:41", "throughput": 4239.96, "total_tokens": 21187656} {"current_steps": 32445, "total_steps": 38160, "loss": 0.3194, "lr": 6.680446550928316e-05, "epoch": 17.004716981132077, "percentage": 85.02, "elapsed_time": "1:23:18", "remaining_time": "0:14:40", "throughput": 4240.16, "total_tokens": 21192744} {"current_steps": 32450, "total_steps": 38160, "loss": 0.6774, "lr": 6.669031293444177e-05, "epoch": 17.00733752620545, "percentage": 85.04, "elapsed_time": "1:23:18", "remaining_time": "0:14:39", "throughput": 4240.13, "total_tokens": 21195368} {"current_steps": 32455, "total_steps": 38160, "loss": 0.3562, "lr": 6.65762510030436e-05, "epoch": 17.009958071278827, "percentage": 85.05, "elapsed_time": "1:23:19", "remaining_time": "0:14:38", "throughput": 4240.16, "total_tokens": 21198728} {"current_steps": 32460, "total_steps": 38160, "loss": 0.3275, "lr": 6.646227973894886e-05, "epoch": 17.0125786163522, "percentage": 85.06, "elapsed_time": "1:23:20", "remaining_time": "0:14:38", "throughput": 4240.17, "total_tokens": 21201768} {"current_steps": 32465, "total_steps": 38160, "loss": 0.3926, "lr": 6.634839916599921e-05, "epoch": 17.015199161425578, "percentage": 85.08, "elapsed_time": "1:23:20", "remaining_time": "0:14:37", "throughput": 4240.15, "total_tokens": 21204520} {"current_steps": 32470, "total_steps": 38160, "loss": 0.3435, "lr": 6.623460930801701e-05, "epoch": 17.01781970649895, "percentage": 85.09, "elapsed_time": "1:23:21", "remaining_time": "0:14:36", "throughput": 4240.17, "total_tokens": 21207560} {"current_steps": 32475, "total_steps": 38160, "loss": 0.3564, "lr": 6.61209101888059e-05, "epoch": 17.020440251572328, "percentage": 85.1, "elapsed_time": "1:23:22", "remaining_time": "0:14:35", "throughput": 4240.17, "total_tokens": 21210536} {"current_steps": 32480, "total_steps": 38160, "loss": 0.4546, "lr": 6.600730183215043e-05, "epoch": 17.0230607966457, "percentage": 85.12, "elapsed_time": "1:23:23", "remaining_time": "0:14:34", "throughput": 4240.27, "total_tokens": 21214440} {"current_steps": 32485, "total_steps": 38160, "loss": 0.4125, "lr": 6.589378426181624e-05, "epoch": 17.02568134171908, "percentage": 85.13, "elapsed_time": "1:23:23", "remaining_time": "0:14:34", "throughput": 4240.25, "total_tokens": 21217128} {"current_steps": 32490, "total_steps": 38160, "loss": 0.433, "lr": 6.578035750154976e-05, "epoch": 17.028301886792452, "percentage": 85.14, "elapsed_time": "1:23:24", "remaining_time": "0:14:33", "throughput": 4240.32, "total_tokens": 21220808} {"current_steps": 32495, "total_steps": 38160, "loss": 0.2838, "lr": 6.566702157507875e-05, "epoch": 17.03092243186583, "percentage": 85.15, "elapsed_time": "1:23:25", "remaining_time": "0:14:32", "throughput": 4240.38, "total_tokens": 21224456} {"current_steps": 32500, "total_steps": 38160, "loss": 0.3263, "lr": 6.555377650611155e-05, "epoch": 17.033542976939202, "percentage": 85.17, "elapsed_time": "1:23:25", "remaining_time": "0:14:31", "throughput": 4240.36, "total_tokens": 21227112} {"current_steps": 32505, "total_steps": 38160, "loss": 0.4074, "lr": 6.544062231833792e-05, "epoch": 17.03616352201258, "percentage": 85.18, "elapsed_time": "1:23:26", "remaining_time": "0:14:31", "throughput": 4240.37, "total_tokens": 21230152} {"current_steps": 32510, "total_steps": 38160, "loss": 0.4204, "lr": 6.532755903542847e-05, "epoch": 17.038784067085953, "percentage": 85.19, "elapsed_time": "1:23:27", "remaining_time": "0:14:30", "throughput": 4240.35, "total_tokens": 21232904} {"current_steps": 32515, "total_steps": 38160, "loss": 0.3618, "lr": 6.521458668103458e-05, "epoch": 17.04140461215933, "percentage": 85.21, "elapsed_time": "1:23:28", "remaining_time": "0:14:29", "throughput": 4240.35, "total_tokens": 21235816} {"current_steps": 32520, "total_steps": 38160, "loss": 0.3335, "lr": 6.510170527878889e-05, "epoch": 17.044025157232703, "percentage": 85.22, "elapsed_time": "1:23:28", "remaining_time": "0:14:28", "throughput": 4240.39, "total_tokens": 21239112} {"current_steps": 32525, "total_steps": 38160, "loss": 0.3879, "lr": 6.498891485230491e-05, "epoch": 17.04664570230608, "percentage": 85.23, "elapsed_time": "1:23:29", "remaining_time": "0:14:27", "throughput": 4240.39, "total_tokens": 21241928} {"current_steps": 32530, "total_steps": 38160, "loss": 0.3909, "lr": 6.487621542517703e-05, "epoch": 17.049266247379453, "percentage": 85.25, "elapsed_time": "1:23:30", "remaining_time": "0:14:27", "throughput": 4240.68, "total_tokens": 21248616} {"current_steps": 32535, "total_steps": 38160, "loss": 0.3991, "lr": 6.476360702098078e-05, "epoch": 17.05188679245283, "percentage": 85.26, "elapsed_time": "1:23:31", "remaining_time": "0:14:26", "throughput": 4240.67, "total_tokens": 21251464} {"current_steps": 32540, "total_steps": 38160, "loss": 0.4543, "lr": 6.465108966327243e-05, "epoch": 17.054507337526207, "percentage": 85.27, "elapsed_time": "1:23:32", "remaining_time": "0:14:25", "throughput": 4240.68, "total_tokens": 21254408} {"current_steps": 32545, "total_steps": 38160, "loss": 0.5574, "lr": 6.453866337558939e-05, "epoch": 17.05712788259958, "percentage": 85.29, "elapsed_time": "1:23:32", "remaining_time": "0:14:24", "throughput": 4240.71, "total_tokens": 21257704} {"current_steps": 32550, "total_steps": 38160, "loss": 0.3381, "lr": 6.442632818145011e-05, "epoch": 17.059748427672957, "percentage": 85.3, "elapsed_time": "1:23:33", "remaining_time": "0:14:24", "throughput": 4240.66, "total_tokens": 21260040} {"current_steps": 32555, "total_steps": 38160, "loss": 0.4617, "lr": 6.431408410435352e-05, "epoch": 17.06236897274633, "percentage": 85.31, "elapsed_time": "1:23:34", "remaining_time": "0:14:23", "throughput": 4240.63, "total_tokens": 21262664} {"current_steps": 32560, "total_steps": 38160, "loss": 0.3552, "lr": 6.420193116778e-05, "epoch": 17.064989517819708, "percentage": 85.32, "elapsed_time": "1:23:34", "remaining_time": "0:14:22", "throughput": 4240.73, "total_tokens": 21266728} {"current_steps": 32565, "total_steps": 38160, "loss": 0.3829, "lr": 6.408986939519074e-05, "epoch": 17.06761006289308, "percentage": 85.34, "elapsed_time": "1:23:35", "remaining_time": "0:14:21", "throughput": 4240.71, "total_tokens": 21269416} {"current_steps": 32570, "total_steps": 38160, "loss": 0.3185, "lr": 6.397789881002752e-05, "epoch": 17.070230607966458, "percentage": 85.35, "elapsed_time": "1:23:36", "remaining_time": "0:14:20", "throughput": 4240.68, "total_tokens": 21271944} {"current_steps": 32575, "total_steps": 38160, "loss": 0.4358, "lr": 6.386601943571352e-05, "epoch": 17.07285115303983, "percentage": 85.36, "elapsed_time": "1:23:36", "remaining_time": "0:14:20", "throughput": 4240.66, "total_tokens": 21274728} {"current_steps": 32580, "total_steps": 38160, "loss": 0.369, "lr": 6.375423129565266e-05, "epoch": 17.07547169811321, "percentage": 85.38, "elapsed_time": "1:23:37", "remaining_time": "0:14:19", "throughput": 4240.71, "total_tokens": 21278184} {"current_steps": 32585, "total_steps": 38160, "loss": 0.5166, "lr": 6.36425344132296e-05, "epoch": 17.078092243186582, "percentage": 85.39, "elapsed_time": "1:23:38", "remaining_time": "0:14:18", "throughput": 4240.73, "total_tokens": 21281288} {"current_steps": 32590, "total_steps": 38160, "loss": 0.4224, "lr": 6.353092881181016e-05, "epoch": 17.08071278825996, "percentage": 85.4, "elapsed_time": "1:23:39", "remaining_time": "0:14:17", "throughput": 4240.73, "total_tokens": 21284232} {"current_steps": 32595, "total_steps": 38160, "loss": 0.3881, "lr": 6.341941451474082e-05, "epoch": 17.083333333333332, "percentage": 85.42, "elapsed_time": "1:23:39", "remaining_time": "0:14:17", "throughput": 4240.67, "total_tokens": 21286472} {"current_steps": 32600, "total_steps": 38160, "loss": 0.4929, "lr": 6.330799154534921e-05, "epoch": 17.08595387840671, "percentage": 85.43, "elapsed_time": "1:23:40", "remaining_time": "0:14:16", "throughput": 4240.7, "total_tokens": 21289704} {"current_steps": 32605, "total_steps": 38160, "loss": 0.359, "lr": 6.319665992694368e-05, "epoch": 17.088574423480082, "percentage": 85.44, "elapsed_time": "1:23:40", "remaining_time": "0:14:15", "throughput": 4240.69, "total_tokens": 21292392} {"current_steps": 32610, "total_steps": 38160, "loss": 0.3671, "lr": 6.308541968281373e-05, "epoch": 17.09119496855346, "percentage": 85.46, "elapsed_time": "1:23:41", "remaining_time": "0:14:14", "throughput": 4240.72, "total_tokens": 21295624} {"current_steps": 32615, "total_steps": 38160, "loss": 0.3586, "lr": 6.297427083622936e-05, "epoch": 17.093815513626833, "percentage": 85.47, "elapsed_time": "1:23:42", "remaining_time": "0:14:13", "throughput": 4240.7, "total_tokens": 21298248} {"current_steps": 32620, "total_steps": 38160, "loss": 0.5544, "lr": 6.28632134104416e-05, "epoch": 17.09643605870021, "percentage": 85.48, "elapsed_time": "1:23:43", "remaining_time": "0:14:13", "throughput": 4240.79, "total_tokens": 21302120} {"current_steps": 32625, "total_steps": 38160, "loss": 0.4278, "lr": 6.275224742868247e-05, "epoch": 17.099056603773583, "percentage": 85.5, "elapsed_time": "1:23:43", "remaining_time": "0:14:12", "throughput": 4240.76, "total_tokens": 21304744} {"current_steps": 32630, "total_steps": 38160, "loss": 0.3604, "lr": 6.264137291416477e-05, "epoch": 17.10167714884696, "percentage": 85.51, "elapsed_time": "1:23:44", "remaining_time": "0:14:11", "throughput": 4240.87, "total_tokens": 21309000} {"current_steps": 32635, "total_steps": 38160, "loss": 0.4203, "lr": 6.253058989008226e-05, "epoch": 17.104297693920337, "percentage": 85.52, "elapsed_time": "1:23:45", "remaining_time": "0:14:10", "throughput": 4240.86, "total_tokens": 21311688} {"current_steps": 32640, "total_steps": 38160, "loss": 0.4185, "lr": 6.241989837960949e-05, "epoch": 17.10691823899371, "percentage": 85.53, "elapsed_time": "1:23:46", "remaining_time": "0:14:09", "throughput": 4240.86, "total_tokens": 21314568} {"current_steps": 32645, "total_steps": 38160, "loss": 0.339, "lr": 6.230929840590177e-05, "epoch": 17.109538784067087, "percentage": 85.55, "elapsed_time": "1:23:47", "remaining_time": "0:14:09", "throughput": 4241.2, "total_tokens": 21321512} {"current_steps": 32650, "total_steps": 38160, "loss": 0.4346, "lr": 6.219878999209533e-05, "epoch": 17.11215932914046, "percentage": 85.56, "elapsed_time": "1:23:47", "remaining_time": "0:14:08", "throughput": 4241.19, "total_tokens": 21324264} {"current_steps": 32655, "total_steps": 38160, "loss": 0.3439, "lr": 6.208837316130733e-05, "epoch": 17.114779874213838, "percentage": 85.57, "elapsed_time": "1:23:48", "remaining_time": "0:14:07", "throughput": 4241.25, "total_tokens": 21327944} {"current_steps": 32660, "total_steps": 38160, "loss": 0.4874, "lr": 6.197804793663564e-05, "epoch": 17.11740041928721, "percentage": 85.59, "elapsed_time": "1:23:49", "remaining_time": "0:14:06", "throughput": 4241.23, "total_tokens": 21330632} {"current_steps": 32665, "total_steps": 38160, "loss": 0.3761, "lr": 6.18678143411593e-05, "epoch": 17.120020964360588, "percentage": 85.6, "elapsed_time": "1:23:49", "remaining_time": "0:14:06", "throughput": 4241.15, "total_tokens": 21332712} {"current_steps": 32670, "total_steps": 38160, "loss": 0.4177, "lr": 6.175767239793767e-05, "epoch": 17.12264150943396, "percentage": 85.61, "elapsed_time": "1:23:50", "remaining_time": "0:14:05", "throughput": 4241.24, "total_tokens": 21336616} {"current_steps": 32675, "total_steps": 38160, "loss": 0.4011, "lr": 6.164762213001112e-05, "epoch": 17.12526205450734, "percentage": 85.63, "elapsed_time": "1:23:51", "remaining_time": "0:14:04", "throughput": 4241.27, "total_tokens": 21339848} {"current_steps": 32680, "total_steps": 38160, "loss": 0.4411, "lr": 6.153766356040107e-05, "epoch": 17.127882599580712, "percentage": 85.64, "elapsed_time": "1:23:52", "remaining_time": "0:14:03", "throughput": 4241.28, "total_tokens": 21342888} {"current_steps": 32685, "total_steps": 38160, "loss": 0.34, "lr": 6.142779671210951e-05, "epoch": 17.13050314465409, "percentage": 85.65, "elapsed_time": "1:23:52", "remaining_time": "0:14:03", "throughput": 4241.35, "total_tokens": 21346440} {"current_steps": 32690, "total_steps": 38160, "loss": 0.3653, "lr": 6.131802160811956e-05, "epoch": 17.133123689727462, "percentage": 85.67, "elapsed_time": "1:23:53", "remaining_time": "0:14:02", "throughput": 4241.3, "total_tokens": 21348808} {"current_steps": 32695, "total_steps": 38160, "loss": 0.3794, "lr": 6.120833827139466e-05, "epoch": 17.13574423480084, "percentage": 85.68, "elapsed_time": "1:23:54", "remaining_time": "0:14:01", "throughput": 4241.23, "total_tokens": 21350984} {"current_steps": 32700, "total_steps": 38160, "loss": 0.444, "lr": 6.109874672487936e-05, "epoch": 17.138364779874212, "percentage": 85.69, "elapsed_time": "1:23:54", "remaining_time": "0:14:00", "throughput": 4241.33, "total_tokens": 21354888} {"current_steps": 32705, "total_steps": 38160, "loss": 0.4297, "lr": 6.098924699149894e-05, "epoch": 17.14098532494759, "percentage": 85.7, "elapsed_time": "1:23:55", "remaining_time": "0:13:59", "throughput": 4241.28, "total_tokens": 21357352} {"current_steps": 32710, "total_steps": 38160, "loss": 0.6382, "lr": 6.087983909415962e-05, "epoch": 17.143605870020963, "percentage": 85.72, "elapsed_time": "1:23:56", "remaining_time": "0:13:59", "throughput": 4241.27, "total_tokens": 21360104} {"current_steps": 32715, "total_steps": 38160, "loss": 0.3397, "lr": 6.077052305574815e-05, "epoch": 17.14622641509434, "percentage": 85.73, "elapsed_time": "1:23:56", "remaining_time": "0:13:58", "throughput": 4241.29, "total_tokens": 21363144} {"current_steps": 32720, "total_steps": 38160, "loss": 0.4083, "lr": 6.066129889913241e-05, "epoch": 17.148846960167713, "percentage": 85.74, "elapsed_time": "1:23:57", "remaining_time": "0:13:57", "throughput": 4241.43, "total_tokens": 21367432} {"current_steps": 32725, "total_steps": 38160, "loss": 0.367, "lr": 6.0552166647160676e-05, "epoch": 17.15146750524109, "percentage": 85.76, "elapsed_time": "1:23:58", "remaining_time": "0:13:56", "throughput": 4241.49, "total_tokens": 21370984} {"current_steps": 32730, "total_steps": 38160, "loss": 0.441, "lr": 6.044312632266208e-05, "epoch": 17.154088050314467, "percentage": 85.77, "elapsed_time": "1:23:59", "remaining_time": "0:13:56", "throughput": 4241.5, "total_tokens": 21374024} {"current_steps": 32735, "total_steps": 38160, "loss": 0.4427, "lr": 6.03341779484467e-05, "epoch": 17.15670859538784, "percentage": 85.78, "elapsed_time": "1:23:59", "remaining_time": "0:13:55", "throughput": 4241.53, "total_tokens": 21377160} {"current_steps": 32740, "total_steps": 38160, "loss": 0.4794, "lr": 6.022532154730537e-05, "epoch": 17.159329140461217, "percentage": 85.8, "elapsed_time": "1:24:00", "remaining_time": "0:13:54", "throughput": 4241.6, "total_tokens": 21380904} {"current_steps": 32745, "total_steps": 38160, "loss": 0.4125, "lr": 6.011655714200964e-05, "epoch": 17.16194968553459, "percentage": 85.81, "elapsed_time": "1:24:01", "remaining_time": "0:13:53", "throughput": 4241.61, "total_tokens": 21383880} {"current_steps": 32750, "total_steps": 38160, "loss": 0.4567, "lr": 6.0007884755311715e-05, "epoch": 17.164570230607968, "percentage": 85.82, "elapsed_time": "1:24:02", "remaining_time": "0:13:52", "throughput": 4241.64, "total_tokens": 21387048} {"current_steps": 32755, "total_steps": 38160, "loss": 0.2713, "lr": 5.989930440994451e-05, "epoch": 17.16719077568134, "percentage": 85.84, "elapsed_time": "1:24:02", "remaining_time": "0:13:52", "throughput": 4241.69, "total_tokens": 21390568} {"current_steps": 32760, "total_steps": 38160, "loss": 0.3346, "lr": 5.979081612862186e-05, "epoch": 17.169811320754718, "percentage": 85.85, "elapsed_time": "1:24:03", "remaining_time": "0:13:51", "throughput": 4241.64, "total_tokens": 21392904} {"current_steps": 32765, "total_steps": 38160, "loss": 0.3125, "lr": 5.968241993403834e-05, "epoch": 17.17243186582809, "percentage": 85.86, "elapsed_time": "1:24:04", "remaining_time": "0:13:50", "throughput": 4241.67, "total_tokens": 21396072} {"current_steps": 32770, "total_steps": 38160, "loss": 0.4559, "lr": 5.957411584886924e-05, "epoch": 17.17505241090147, "percentage": 85.88, "elapsed_time": "1:24:04", "remaining_time": "0:13:49", "throughput": 4241.7, "total_tokens": 21399208} {"current_steps": 32775, "total_steps": 38160, "loss": 0.3161, "lr": 5.946590389577033e-05, "epoch": 17.177672955974842, "percentage": 85.89, "elapsed_time": "1:24:05", "remaining_time": "0:13:49", "throughput": 4241.71, "total_tokens": 21402248} {"current_steps": 32780, "total_steps": 38160, "loss": 0.4202, "lr": 5.935778409737857e-05, "epoch": 17.18029350104822, "percentage": 85.9, "elapsed_time": "1:24:06", "remaining_time": "0:13:48", "throughput": 4241.74, "total_tokens": 21405480} {"current_steps": 32785, "total_steps": 38160, "loss": 0.4314, "lr": 5.92497564763112e-05, "epoch": 17.182914046121592, "percentage": 85.91, "elapsed_time": "1:24:07", "remaining_time": "0:13:47", "throughput": 4241.72, "total_tokens": 21408168} {"current_steps": 32790, "total_steps": 38160, "loss": 0.3753, "lr": 5.914182105516641e-05, "epoch": 17.18553459119497, "percentage": 85.93, "elapsed_time": "1:24:07", "remaining_time": "0:13:46", "throughput": 4241.72, "total_tokens": 21411112} {"current_steps": 32795, "total_steps": 38160, "loss": 0.3872, "lr": 5.903397785652304e-05, "epoch": 17.188155136268342, "percentage": 85.94, "elapsed_time": "1:24:08", "remaining_time": "0:13:45", "throughput": 4241.8, "total_tokens": 21414856} {"current_steps": 32800, "total_steps": 38160, "loss": 0.4142, "lr": 5.8926226902940804e-05, "epoch": 17.19077568134172, "percentage": 85.95, "elapsed_time": "1:24:09", "remaining_time": "0:13:45", "throughput": 4241.8, "total_tokens": 21417736} {"current_steps": 32805, "total_steps": 38160, "loss": 0.373, "lr": 5.88185682169598e-05, "epoch": 17.193396226415093, "percentage": 85.97, "elapsed_time": "1:24:09", "remaining_time": "0:13:44", "throughput": 4241.86, "total_tokens": 21421352} {"current_steps": 32810, "total_steps": 38160, "loss": 0.4799, "lr": 5.871100182110117e-05, "epoch": 17.19601677148847, "percentage": 85.98, "elapsed_time": "1:24:10", "remaining_time": "0:13:43", "throughput": 4241.96, "total_tokens": 21425352} {"current_steps": 32815, "total_steps": 38160, "loss": 0.3505, "lr": 5.8603527737866314e-05, "epoch": 17.198637316561843, "percentage": 85.99, "elapsed_time": "1:24:11", "remaining_time": "0:13:42", "throughput": 4241.96, "total_tokens": 21428232} {"current_steps": 32820, "total_steps": 38160, "loss": 0.4042, "lr": 5.849614598973779e-05, "epoch": 17.20125786163522, "percentage": 86.01, "elapsed_time": "1:24:12", "remaining_time": "0:13:42", "throughput": 4241.94, "total_tokens": 21430984} {"current_steps": 32825, "total_steps": 38160, "loss": 0.4644, "lr": 5.8388856599178644e-05, "epoch": 17.203878406708597, "percentage": 86.02, "elapsed_time": "1:24:12", "remaining_time": "0:13:41", "throughput": 4241.97, "total_tokens": 21434152} {"current_steps": 32830, "total_steps": 38160, "loss": 0.4178, "lr": 5.8281659588632464e-05, "epoch": 17.20649895178197, "percentage": 86.03, "elapsed_time": "1:24:13", "remaining_time": "0:13:40", "throughput": 4242.06, "total_tokens": 21438088} {"current_steps": 32835, "total_steps": 38160, "loss": 0.4252, "lr": 5.817455498052382e-05, "epoch": 17.209119496855347, "percentage": 86.05, "elapsed_time": "1:24:14", "remaining_time": "0:13:39", "throughput": 4242.2, "total_tokens": 21442408} {"current_steps": 32840, "total_steps": 38160, "loss": 0.4348, "lr": 5.806754279725751e-05, "epoch": 17.21174004192872, "percentage": 86.06, "elapsed_time": "1:24:15", "remaining_time": "0:13:38", "throughput": 4242.14, "total_tokens": 21444680} {"current_steps": 32845, "total_steps": 38160, "loss": 0.4182, "lr": 5.796062306121947e-05, "epoch": 17.214360587002098, "percentage": 86.07, "elapsed_time": "1:24:15", "remaining_time": "0:13:38", "throughput": 4242.11, "total_tokens": 21447272} {"current_steps": 32850, "total_steps": 38160, "loss": 0.4094, "lr": 5.785379579477607e-05, "epoch": 17.21698113207547, "percentage": 86.08, "elapsed_time": "1:24:16", "remaining_time": "0:13:37", "throughput": 4242.1, "total_tokens": 21450120} {"current_steps": 32855, "total_steps": 38160, "loss": 0.3441, "lr": 5.774706102027427e-05, "epoch": 17.219601677148848, "percentage": 86.1, "elapsed_time": "1:24:17", "remaining_time": "0:13:36", "throughput": 4242.17, "total_tokens": 21453736} {"current_steps": 32860, "total_steps": 38160, "loss": 0.4729, "lr": 5.7640418760041776e-05, "epoch": 17.22222222222222, "percentage": 86.11, "elapsed_time": "1:24:18", "remaining_time": "0:13:35", "throughput": 4242.24, "total_tokens": 21457512} {"current_steps": 32865, "total_steps": 38160, "loss": 0.356, "lr": 5.753386903638713e-05, "epoch": 17.2248427672956, "percentage": 86.12, "elapsed_time": "1:24:18", "remaining_time": "0:13:35", "throughput": 4242.22, "total_tokens": 21460104} {"current_steps": 32870, "total_steps": 38160, "loss": 0.3935, "lr": 5.7427411871599e-05, "epoch": 17.22746331236897, "percentage": 86.14, "elapsed_time": "1:24:19", "remaining_time": "0:13:34", "throughput": 4242.22, "total_tokens": 21463048} {"current_steps": 32875, "total_steps": 38160, "loss": 0.5198, "lr": 5.7321047287947235e-05, "epoch": 17.23008385744235, "percentage": 86.15, "elapsed_time": "1:24:20", "remaining_time": "0:13:33", "throughput": 4242.15, "total_tokens": 21465288} {"current_steps": 32880, "total_steps": 38160, "loss": 0.6149, "lr": 5.72147753076821e-05, "epoch": 17.232704402515722, "percentage": 86.16, "elapsed_time": "1:24:20", "remaining_time": "0:13:32", "throughput": 4242.18, "total_tokens": 21468552} {"current_steps": 32885, "total_steps": 38160, "loss": 0.534, "lr": 5.7108595953034306e-05, "epoch": 17.2353249475891, "percentage": 86.18, "elapsed_time": "1:24:21", "remaining_time": "0:13:31", "throughput": 4242.22, "total_tokens": 21471784} {"current_steps": 32890, "total_steps": 38160, "loss": 0.5058, "lr": 5.7002509246215415e-05, "epoch": 17.237945492662472, "percentage": 86.19, "elapsed_time": "1:24:22", "remaining_time": "0:13:31", "throughput": 4242.18, "total_tokens": 21474312} {"current_steps": 32895, "total_steps": 38160, "loss": 0.3818, "lr": 5.68965152094178e-05, "epoch": 17.24056603773585, "percentage": 86.2, "elapsed_time": "1:24:22", "remaining_time": "0:13:30", "throughput": 4242.23, "total_tokens": 21477640} {"current_steps": 32900, "total_steps": 38160, "loss": 0.4534, "lr": 5.679061386481388e-05, "epoch": 17.243186582809223, "percentage": 86.22, "elapsed_time": "1:24:23", "remaining_time": "0:13:29", "throughput": 4242.25, "total_tokens": 21480744} {"current_steps": 32905, "total_steps": 38160, "loss": 0.4379, "lr": 5.6684805234557216e-05, "epoch": 17.2458071278826, "percentage": 86.23, "elapsed_time": "1:24:24", "remaining_time": "0:13:28", "throughput": 4242.27, "total_tokens": 21483816} {"current_steps": 32910, "total_steps": 38160, "loss": 0.3171, "lr": 5.65790893407816e-05, "epoch": 17.248427672955973, "percentage": 86.24, "elapsed_time": "1:24:24", "remaining_time": "0:13:27", "throughput": 4242.31, "total_tokens": 21487080} {"current_steps": 32915, "total_steps": 38160, "loss": 0.4353, "lr": 5.647346620560168e-05, "epoch": 17.25104821802935, "percentage": 86.26, "elapsed_time": "1:24:25", "remaining_time": "0:13:27", "throughput": 4242.32, "total_tokens": 21490088} {"current_steps": 32920, "total_steps": 38160, "loss": 0.3934, "lr": 5.6367935851112605e-05, "epoch": 17.253668763102727, "percentage": 86.27, "elapsed_time": "1:24:26", "remaining_time": "0:13:26", "throughput": 4242.38, "total_tokens": 21493672} {"current_steps": 32925, "total_steps": 38160, "loss": 0.3883, "lr": 5.626249829939023e-05, "epoch": 17.2562893081761, "percentage": 86.28, "elapsed_time": "1:24:27", "remaining_time": "0:13:25", "throughput": 4242.4, "total_tokens": 21496776} {"current_steps": 32930, "total_steps": 38160, "loss": 0.3174, "lr": 5.6157153572490795e-05, "epoch": 17.258909853249477, "percentage": 86.29, "elapsed_time": "1:24:27", "remaining_time": "0:13:24", "throughput": 4242.36, "total_tokens": 21499208} {"current_steps": 32935, "total_steps": 38160, "loss": 0.3048, "lr": 5.6051901692451115e-05, "epoch": 17.26153039832285, "percentage": 86.31, "elapsed_time": "1:24:28", "remaining_time": "0:13:24", "throughput": 4242.48, "total_tokens": 21503368} {"current_steps": 32940, "total_steps": 38160, "loss": 0.4418, "lr": 5.5946742681288744e-05, "epoch": 17.264150943396228, "percentage": 86.32, "elapsed_time": "1:24:29", "remaining_time": "0:13:23", "throughput": 4242.53, "total_tokens": 21506824} {"current_steps": 32945, "total_steps": 38160, "loss": 0.5296, "lr": 5.5841676561001805e-05, "epoch": 17.2667714884696, "percentage": 86.33, "elapsed_time": "1:24:29", "remaining_time": "0:13:22", "throughput": 4242.51, "total_tokens": 21509384} {"current_steps": 32950, "total_steps": 38160, "loss": 0.4273, "lr": 5.573670335356901e-05, "epoch": 17.269392033542978, "percentage": 86.35, "elapsed_time": "1:24:30", "remaining_time": "0:13:21", "throughput": 4242.57, "total_tokens": 21512872} {"current_steps": 32955, "total_steps": 38160, "loss": 0.51, "lr": 5.563182308094933e-05, "epoch": 17.27201257861635, "percentage": 86.36, "elapsed_time": "1:24:31", "remaining_time": "0:13:21", "throughput": 4242.69, "total_tokens": 21517000} {"current_steps": 32960, "total_steps": 38160, "loss": 0.4424, "lr": 5.552703576508272e-05, "epoch": 17.27463312368973, "percentage": 86.37, "elapsed_time": "1:24:32", "remaining_time": "0:13:20", "throughput": 4242.63, "total_tokens": 21519272} {"current_steps": 32965, "total_steps": 38160, "loss": 0.4671, "lr": 5.5422341427889324e-05, "epoch": 17.2772536687631, "percentage": 86.39, "elapsed_time": "1:24:32", "remaining_time": "0:13:19", "throughput": 4242.67, "total_tokens": 21522536} {"current_steps": 32970, "total_steps": 38160, "loss": 0.5942, "lr": 5.531774009127011e-05, "epoch": 17.27987421383648, "percentage": 86.4, "elapsed_time": "1:24:33", "remaining_time": "0:13:18", "throughput": 4242.84, "total_tokens": 21527240} {"current_steps": 32975, "total_steps": 38160, "loss": 0.4801, "lr": 5.521323177710647e-05, "epoch": 17.282494758909852, "percentage": 86.41, "elapsed_time": "1:24:34", "remaining_time": "0:13:17", "throughput": 4242.92, "total_tokens": 21530984} {"current_steps": 32980, "total_steps": 38160, "loss": 0.3953, "lr": 5.510881650726046e-05, "epoch": 17.28511530398323, "percentage": 86.43, "elapsed_time": "1:24:35", "remaining_time": "0:13:17", "throughput": 4242.97, "total_tokens": 21534344} {"current_steps": 32985, "total_steps": 38160, "loss": 0.4849, "lr": 5.50044943035744e-05, "epoch": 17.287735849056602, "percentage": 86.44, "elapsed_time": "1:24:36", "remaining_time": "0:13:16", "throughput": 4243.01, "total_tokens": 21537576} {"current_steps": 32990, "total_steps": 38160, "loss": 0.391, "lr": 5.490026518787128e-05, "epoch": 17.29035639412998, "percentage": 86.45, "elapsed_time": "1:24:36", "remaining_time": "0:13:15", "throughput": 4243.0, "total_tokens": 21540488} {"current_steps": 32995, "total_steps": 38160, "loss": 0.5393, "lr": 5.47961291819547e-05, "epoch": 17.292976939203353, "percentage": 86.46, "elapsed_time": "1:24:37", "remaining_time": "0:13:14", "throughput": 4243.01, "total_tokens": 21543592} {"current_steps": 33000, "total_steps": 38160, "loss": 0.3816, "lr": 5.46920863076088e-05, "epoch": 17.29559748427673, "percentage": 86.48, "elapsed_time": "1:24:38", "remaining_time": "0:13:14", "throughput": 4243.04, "total_tokens": 21546760} {"current_steps": 33005, "total_steps": 38160, "loss": 0.4333, "lr": 5.4588136586598056e-05, "epoch": 17.298218029350103, "percentage": 86.49, "elapsed_time": "1:24:38", "remaining_time": "0:13:13", "throughput": 4243.02, "total_tokens": 21549608} {"current_steps": 33010, "total_steps": 38160, "loss": 0.3234, "lr": 5.44842800406678e-05, "epoch": 17.30083857442348, "percentage": 86.5, "elapsed_time": "1:24:39", "remaining_time": "0:13:12", "throughput": 4243.14, "total_tokens": 21553736} {"current_steps": 33015, "total_steps": 38160, "loss": 0.3931, "lr": 5.438051669154326e-05, "epoch": 17.303459119496857, "percentage": 86.52, "elapsed_time": "1:24:40", "remaining_time": "0:13:11", "throughput": 4243.14, "total_tokens": 21556648} {"current_steps": 33020, "total_steps": 38160, "loss": 0.3193, "lr": 5.427684656093074e-05, "epoch": 17.30607966457023, "percentage": 86.53, "elapsed_time": "1:24:41", "remaining_time": "0:13:10", "throughput": 4243.17, "total_tokens": 21559912} {"current_steps": 33025, "total_steps": 38160, "loss": 0.3621, "lr": 5.417326967051683e-05, "epoch": 17.308700209643607, "percentage": 86.54, "elapsed_time": "1:24:41", "remaining_time": "0:13:10", "throughput": 4243.13, "total_tokens": 21562344} {"current_steps": 33030, "total_steps": 38160, "loss": 0.4479, "lr": 5.4069786041968663e-05, "epoch": 17.31132075471698, "percentage": 86.56, "elapsed_time": "1:24:42", "remaining_time": "0:13:09", "throughput": 4243.14, "total_tokens": 21565288} {"current_steps": 33035, "total_steps": 38160, "loss": 0.3989, "lr": 5.39663956969339e-05, "epoch": 17.313941299790358, "percentage": 86.57, "elapsed_time": "1:24:43", "remaining_time": "0:13:08", "throughput": 4243.1, "total_tokens": 21567816} {"current_steps": 33040, "total_steps": 38160, "loss": 0.6142, "lr": 5.3863098657040534e-05, "epoch": 17.31656184486373, "percentage": 86.58, "elapsed_time": "1:24:43", "remaining_time": "0:13:07", "throughput": 4243.21, "total_tokens": 21571912} {"current_steps": 33045, "total_steps": 38160, "loss": 0.4324, "lr": 5.375989494389705e-05, "epoch": 17.319182389937108, "percentage": 86.6, "elapsed_time": "1:24:44", "remaining_time": "0:13:07", "throughput": 4243.19, "total_tokens": 21574600} {"current_steps": 33050, "total_steps": 38160, "loss": 0.3541, "lr": 5.365678457909257e-05, "epoch": 17.32180293501048, "percentage": 86.61, "elapsed_time": "1:24:45", "remaining_time": "0:13:06", "throughput": 4243.23, "total_tokens": 21577864} {"current_steps": 33055, "total_steps": 38160, "loss": 0.7593, "lr": 5.3553767584196555e-05, "epoch": 17.32442348008386, "percentage": 86.62, "elapsed_time": "1:24:45", "remaining_time": "0:13:05", "throughput": 4243.21, "total_tokens": 21580552} {"current_steps": 33060, "total_steps": 38160, "loss": 0.451, "lr": 5.3450843980759166e-05, "epoch": 17.32704402515723, "percentage": 86.64, "elapsed_time": "1:24:46", "remaining_time": "0:13:04", "throughput": 4243.25, "total_tokens": 21583880} {"current_steps": 33065, "total_steps": 38160, "loss": 0.4087, "lr": 5.3348013790310736e-05, "epoch": 17.32966457023061, "percentage": 86.65, "elapsed_time": "1:24:47", "remaining_time": "0:13:03", "throughput": 4243.32, "total_tokens": 21587432} {"current_steps": 33070, "total_steps": 38160, "loss": 0.338, "lr": 5.324527703436199e-05, "epoch": 17.332285115303982, "percentage": 86.66, "elapsed_time": "1:24:48", "remaining_time": "0:13:03", "throughput": 4243.33, "total_tokens": 21590376} {"current_steps": 33075, "total_steps": 38160, "loss": 0.4804, "lr": 5.314263373440448e-05, "epoch": 17.33490566037736, "percentage": 86.67, "elapsed_time": "1:24:48", "remaining_time": "0:13:02", "throughput": 4243.31, "total_tokens": 21592936} {"current_steps": 33080, "total_steps": 38160, "loss": 0.6415, "lr": 5.304008391190995e-05, "epoch": 17.337526205450732, "percentage": 86.69, "elapsed_time": "1:24:49", "remaining_time": "0:13:01", "throughput": 4243.33, "total_tokens": 21596040} {"current_steps": 33085, "total_steps": 38160, "loss": 0.382, "lr": 5.293762758833071e-05, "epoch": 17.34014675052411, "percentage": 86.7, "elapsed_time": "1:24:50", "remaining_time": "0:13:00", "throughput": 4243.39, "total_tokens": 21599560} {"current_steps": 33090, "total_steps": 38160, "loss": 0.4042, "lr": 5.283526478509953e-05, "epoch": 17.342767295597483, "percentage": 86.71, "elapsed_time": "1:24:50", "remaining_time": "0:13:00", "throughput": 4243.38, "total_tokens": 21602344} {"current_steps": 33095, "total_steps": 38160, "loss": 0.3327, "lr": 5.273299552362942e-05, "epoch": 17.34538784067086, "percentage": 86.73, "elapsed_time": "1:24:51", "remaining_time": "0:12:59", "throughput": 4243.54, "total_tokens": 21607016} {"current_steps": 33100, "total_steps": 38160, "loss": 0.3649, "lr": 5.263081982531381e-05, "epoch": 17.348008385744233, "percentage": 86.74, "elapsed_time": "1:24:52", "remaining_time": "0:12:58", "throughput": 4243.59, "total_tokens": 21610344} {"current_steps": 33105, "total_steps": 38160, "loss": 0.3924, "lr": 5.2528737711526885e-05, "epoch": 17.35062893081761, "percentage": 86.75, "elapsed_time": "1:24:53", "remaining_time": "0:12:57", "throughput": 4243.58, "total_tokens": 21613288} {"current_steps": 33110, "total_steps": 38160, "loss": 0.4639, "lr": 5.2426749203623005e-05, "epoch": 17.353249475890987, "percentage": 86.77, "elapsed_time": "1:24:53", "remaining_time": "0:12:56", "throughput": 4243.62, "total_tokens": 21616456} {"current_steps": 33115, "total_steps": 38160, "loss": 0.6062, "lr": 5.23248543229371e-05, "epoch": 17.35587002096436, "percentage": 86.78, "elapsed_time": "1:24:54", "remaining_time": "0:12:56", "throughput": 4243.62, "total_tokens": 21619272} {"current_steps": 33120, "total_steps": 38160, "loss": 0.4353, "lr": 5.222305309078429e-05, "epoch": 17.358490566037737, "percentage": 86.79, "elapsed_time": "1:24:55", "remaining_time": "0:12:55", "throughput": 4243.62, "total_tokens": 21622216} {"current_steps": 33125, "total_steps": 38160, "loss": 0.5579, "lr": 5.2121345528460205e-05, "epoch": 17.36111111111111, "percentage": 86.81, "elapsed_time": "1:24:55", "remaining_time": "0:12:54", "throughput": 4243.68, "total_tokens": 21625704} {"current_steps": 33130, "total_steps": 38160, "loss": 0.4256, "lr": 5.201973165724094e-05, "epoch": 17.363731656184488, "percentage": 86.82, "elapsed_time": "1:24:56", "remaining_time": "0:12:53", "throughput": 4243.74, "total_tokens": 21629288} {"current_steps": 33135, "total_steps": 38160, "loss": 0.4079, "lr": 5.1918211498382996e-05, "epoch": 17.36635220125786, "percentage": 86.83, "elapsed_time": "1:24:57", "remaining_time": "0:12:53", "throughput": 4243.75, "total_tokens": 21632264} {"current_steps": 33140, "total_steps": 38160, "loss": 0.4724, "lr": 5.181678507312332e-05, "epoch": 17.368972746331238, "percentage": 86.84, "elapsed_time": "1:24:58", "remaining_time": "0:12:52", "throughput": 4243.87, "total_tokens": 21636584} {"current_steps": 33145, "total_steps": 38160, "loss": 0.513, "lr": 5.171545240267894e-05, "epoch": 17.37159329140461, "percentage": 86.86, "elapsed_time": "1:24:59", "remaining_time": "0:12:51", "throughput": 4243.93, "total_tokens": 21640168} {"current_steps": 33150, "total_steps": 38160, "loss": 0.4957, "lr": 5.161421350824774e-05, "epoch": 17.37421383647799, "percentage": 86.87, "elapsed_time": "1:24:59", "remaining_time": "0:12:50", "throughput": 4243.94, "total_tokens": 21643176} {"current_steps": 33155, "total_steps": 38160, "loss": 0.5282, "lr": 5.151306841100756e-05, "epoch": 17.37683438155136, "percentage": 86.88, "elapsed_time": "1:25:00", "remaining_time": "0:12:49", "throughput": 4244.04, "total_tokens": 21647112} {"current_steps": 33160, "total_steps": 38160, "loss": 0.3469, "lr": 5.141201713211679e-05, "epoch": 17.37945492662474, "percentage": 86.9, "elapsed_time": "1:25:01", "remaining_time": "0:12:49", "throughput": 4244.11, "total_tokens": 21650920} {"current_steps": 33165, "total_steps": 38160, "loss": 0.378, "lr": 5.1311059692714324e-05, "epoch": 17.382075471698112, "percentage": 86.91, "elapsed_time": "1:25:02", "remaining_time": "0:12:48", "throughput": 4244.12, "total_tokens": 21653864} {"current_steps": 33170, "total_steps": 38160, "loss": 0.4785, "lr": 5.1210196113919306e-05, "epoch": 17.38469601677149, "percentage": 86.92, "elapsed_time": "1:25:02", "remaining_time": "0:12:47", "throughput": 4244.08, "total_tokens": 21656296} {"current_steps": 33175, "total_steps": 38160, "loss": 0.3036, "lr": 5.110942641683114e-05, "epoch": 17.387316561844862, "percentage": 86.94, "elapsed_time": "1:25:03", "remaining_time": "0:12:46", "throughput": 4244.08, "total_tokens": 21659240} {"current_steps": 33180, "total_steps": 38160, "loss": 0.4431, "lr": 5.10087506225298e-05, "epoch": 17.38993710691824, "percentage": 86.95, "elapsed_time": "1:25:04", "remaining_time": "0:12:46", "throughput": 4244.05, "total_tokens": 21661768} {"current_steps": 33185, "total_steps": 38160, "loss": 0.3867, "lr": 5.090816875207543e-05, "epoch": 17.392557651991613, "percentage": 86.96, "elapsed_time": "1:25:04", "remaining_time": "0:12:45", "throughput": 4244.05, "total_tokens": 21664712} {"current_steps": 33190, "total_steps": 38160, "loss": 0.4376, "lr": 5.0807680826508604e-05, "epoch": 17.39517819706499, "percentage": 86.98, "elapsed_time": "1:25:05", "remaining_time": "0:12:44", "throughput": 4244.09, "total_tokens": 21668008} {"current_steps": 33195, "total_steps": 38160, "loss": 0.4341, "lr": 5.070728686685039e-05, "epoch": 17.397798742138363, "percentage": 86.99, "elapsed_time": "1:25:06", "remaining_time": "0:12:43", "throughput": 4244.08, "total_tokens": 21670792} {"current_steps": 33200, "total_steps": 38160, "loss": 0.3324, "lr": 5.0606986894101925e-05, "epoch": 17.40041928721174, "percentage": 87.0, "elapsed_time": "1:25:06", "remaining_time": "0:12:42", "throughput": 4244.03, "total_tokens": 21673160} {"current_steps": 33205, "total_steps": 38160, "loss": 0.3761, "lr": 5.0506780929244875e-05, "epoch": 17.403039832285117, "percentage": 87.02, "elapsed_time": "1:25:07", "remaining_time": "0:12:42", "throughput": 4244.13, "total_tokens": 21677000} {"current_steps": 33210, "total_steps": 38160, "loss": 0.4942, "lr": 5.040666899324109e-05, "epoch": 17.40566037735849, "percentage": 87.03, "elapsed_time": "1:25:08", "remaining_time": "0:12:41", "throughput": 4244.17, "total_tokens": 21680424} {"current_steps": 33215, "total_steps": 38160, "loss": 0.5108, "lr": 5.0306651107032916e-05, "epoch": 17.408280922431867, "percentage": 87.04, "elapsed_time": "1:25:09", "remaining_time": "0:12:40", "throughput": 4244.22, "total_tokens": 21683752} {"current_steps": 33220, "total_steps": 38160, "loss": 0.4343, "lr": 5.020672729154308e-05, "epoch": 17.41090146750524, "percentage": 87.05, "elapsed_time": "1:25:09", "remaining_time": "0:12:39", "throughput": 4244.18, "total_tokens": 21686280} {"current_steps": 33225, "total_steps": 38160, "loss": 0.3594, "lr": 5.010689756767428e-05, "epoch": 17.413522012578618, "percentage": 87.07, "elapsed_time": "1:25:10", "remaining_time": "0:12:39", "throughput": 4244.26, "total_tokens": 21689928} {"current_steps": 33230, "total_steps": 38160, "loss": 0.4042, "lr": 5.000716195630983e-05, "epoch": 17.41614255765199, "percentage": 87.08, "elapsed_time": "1:25:11", "remaining_time": "0:12:38", "throughput": 4244.23, "total_tokens": 21692456} {"current_steps": 33235, "total_steps": 38160, "loss": 0.3784, "lr": 4.990752047831343e-05, "epoch": 17.418763102725368, "percentage": 87.09, "elapsed_time": "1:25:11", "remaining_time": "0:12:37", "throughput": 4244.21, "total_tokens": 21695112} {"current_steps": 33240, "total_steps": 38160, "loss": 0.3503, "lr": 4.980797315452873e-05, "epoch": 17.42138364779874, "percentage": 87.11, "elapsed_time": "1:25:12", "remaining_time": "0:12:36", "throughput": 4244.26, "total_tokens": 21698696} {"current_steps": 33245, "total_steps": 38160, "loss": 0.4774, "lr": 4.9708520005779965e-05, "epoch": 17.42400419287212, "percentage": 87.12, "elapsed_time": "1:25:13", "remaining_time": "0:12:35", "throughput": 4244.35, "total_tokens": 21702664} {"current_steps": 33250, "total_steps": 38160, "loss": 0.5229, "lr": 4.960916105287172e-05, "epoch": 17.42662473794549, "percentage": 87.13, "elapsed_time": "1:25:14", "remaining_time": "0:12:35", "throughput": 4244.4, "total_tokens": 21705960} {"current_steps": 33255, "total_steps": 38160, "loss": 0.4973, "lr": 4.950989631658859e-05, "epoch": 17.42924528301887, "percentage": 87.15, "elapsed_time": "1:25:14", "remaining_time": "0:12:34", "throughput": 4244.55, "total_tokens": 21710472} {"current_steps": 33260, "total_steps": 38160, "loss": 0.39, "lr": 4.941072581769562e-05, "epoch": 17.431865828092242, "percentage": 87.16, "elapsed_time": "1:25:15", "remaining_time": "0:12:33", "throughput": 4244.54, "total_tokens": 21713288} {"current_steps": 33265, "total_steps": 38160, "loss": 0.3085, "lr": 4.931164957693834e-05, "epoch": 17.43448637316562, "percentage": 87.17, "elapsed_time": "1:25:16", "remaining_time": "0:12:32", "throughput": 4244.58, "total_tokens": 21716584} {"current_steps": 33270, "total_steps": 38160, "loss": 0.5123, "lr": 4.921266761504217e-05, "epoch": 17.437106918238992, "percentage": 87.19, "elapsed_time": "1:25:17", "remaining_time": "0:12:32", "throughput": 4244.61, "total_tokens": 21719752} {"current_steps": 33275, "total_steps": 38160, "loss": 0.4372, "lr": 4.9113779952713155e-05, "epoch": 17.43972746331237, "percentage": 87.2, "elapsed_time": "1:25:17", "remaining_time": "0:12:31", "throughput": 4244.65, "total_tokens": 21723112} {"current_steps": 33280, "total_steps": 38160, "loss": 0.4187, "lr": 4.90149866106373e-05, "epoch": 17.442348008385743, "percentage": 87.21, "elapsed_time": "1:25:18", "remaining_time": "0:12:30", "throughput": 4244.66, "total_tokens": 21726184} {"current_steps": 33285, "total_steps": 38160, "loss": 0.4788, "lr": 4.8916287609481137e-05, "epoch": 17.44496855345912, "percentage": 87.22, "elapsed_time": "1:25:19", "remaining_time": "0:12:29", "throughput": 4244.7, "total_tokens": 21729416} {"current_steps": 33290, "total_steps": 38160, "loss": 0.3623, "lr": 4.8817682969891366e-05, "epoch": 17.447589098532493, "percentage": 87.24, "elapsed_time": "1:25:19", "remaining_time": "0:12:28", "throughput": 4244.73, "total_tokens": 21732648} {"current_steps": 33295, "total_steps": 38160, "loss": 0.31, "lr": 4.8719172712495095e-05, "epoch": 17.45020964360587, "percentage": 87.25, "elapsed_time": "1:25:20", "remaining_time": "0:12:28", "throughput": 4244.82, "total_tokens": 21736520} {"current_steps": 33300, "total_steps": 38160, "loss": 0.4591, "lr": 4.862075685789935e-05, "epoch": 17.452830188679247, "percentage": 87.26, "elapsed_time": "1:25:21", "remaining_time": "0:12:27", "throughput": 4244.82, "total_tokens": 21739464} {"current_steps": 33305, "total_steps": 38160, "loss": 0.2975, "lr": 4.8522435426691604e-05, "epoch": 17.45545073375262, "percentage": 87.28, "elapsed_time": "1:25:22", "remaining_time": "0:12:26", "throughput": 4244.82, "total_tokens": 21742312} {"current_steps": 33310, "total_steps": 38160, "loss": 0.4681, "lr": 4.842420843943962e-05, "epoch": 17.458071278825997, "percentage": 87.29, "elapsed_time": "1:25:22", "remaining_time": "0:12:25", "throughput": 4244.79, "total_tokens": 21744936} {"current_steps": 33315, "total_steps": 38160, "loss": 0.4356, "lr": 4.8326075916691415e-05, "epoch": 17.46069182389937, "percentage": 87.3, "elapsed_time": "1:25:23", "remaining_time": "0:12:25", "throughput": 4244.89, "total_tokens": 21749032} {"current_steps": 33320, "total_steps": 38160, "loss": 0.4419, "lr": 4.822803787897523e-05, "epoch": 17.463312368972748, "percentage": 87.32, "elapsed_time": "1:25:24", "remaining_time": "0:12:24", "throughput": 4244.95, "total_tokens": 21752744} {"current_steps": 33325, "total_steps": 38160, "loss": 0.4745, "lr": 4.813009434679932e-05, "epoch": 17.46593291404612, "percentage": 87.33, "elapsed_time": "1:25:25", "remaining_time": "0:12:23", "throughput": 4245.03, "total_tokens": 21756552} {"current_steps": 33330, "total_steps": 38160, "loss": 0.332, "lr": 4.803224534065259e-05, "epoch": 17.468553459119498, "percentage": 87.34, "elapsed_time": "1:25:25", "remaining_time": "0:12:22", "throughput": 4244.98, "total_tokens": 21758984} {"current_steps": 33335, "total_steps": 38160, "loss": 0.4463, "lr": 4.793449088100371e-05, "epoch": 17.47117400419287, "percentage": 87.36, "elapsed_time": "1:25:26", "remaining_time": "0:12:22", "throughput": 4244.97, "total_tokens": 21761800} {"current_steps": 33340, "total_steps": 38160, "loss": 0.3706, "lr": 4.783683098830188e-05, "epoch": 17.47379454926625, "percentage": 87.37, "elapsed_time": "1:25:27", "remaining_time": "0:12:21", "throughput": 4245.01, "total_tokens": 21765096} {"current_steps": 33345, "total_steps": 38160, "loss": 0.5747, "lr": 4.7739265682976485e-05, "epoch": 17.47641509433962, "percentage": 87.38, "elapsed_time": "1:25:27", "remaining_time": "0:12:20", "throughput": 4245.06, "total_tokens": 21768552} {"current_steps": 33350, "total_steps": 38160, "loss": 0.4445, "lr": 4.764179498543714e-05, "epoch": 17.479035639413, "percentage": 87.4, "elapsed_time": "1:25:28", "remaining_time": "0:12:19", "throughput": 4245.15, "total_tokens": 21772424} {"current_steps": 33355, "total_steps": 38160, "loss": 0.4441, "lr": 4.754441891607347e-05, "epoch": 17.481656184486372, "percentage": 87.41, "elapsed_time": "1:25:29", "remaining_time": "0:12:18", "throughput": 4245.1, "total_tokens": 21774824} {"current_steps": 33360, "total_steps": 38160, "loss": 0.5559, "lr": 4.7447137495255424e-05, "epoch": 17.48427672955975, "percentage": 87.42, "elapsed_time": "1:25:30", "remaining_time": "0:12:18", "throughput": 4245.19, "total_tokens": 21778728} {"current_steps": 33365, "total_steps": 38160, "loss": 0.4758, "lr": 4.7349950743333206e-05, "epoch": 17.486897274633122, "percentage": 87.43, "elapsed_time": "1:25:30", "remaining_time": "0:12:17", "throughput": 4245.23, "total_tokens": 21782152} {"current_steps": 33370, "total_steps": 38160, "loss": 0.3946, "lr": 4.725285868063722e-05, "epoch": 17.4895178197065, "percentage": 87.45, "elapsed_time": "1:25:31", "remaining_time": "0:12:16", "throughput": 4245.28, "total_tokens": 21785608} {"current_steps": 33375, "total_steps": 38160, "loss": 0.5471, "lr": 4.715586132747801e-05, "epoch": 17.492138364779873, "percentage": 87.46, "elapsed_time": "1:25:32", "remaining_time": "0:12:15", "throughput": 4245.37, "total_tokens": 21789480} {"current_steps": 33380, "total_steps": 38160, "loss": 0.4354, "lr": 4.705895870414634e-05, "epoch": 17.49475890985325, "percentage": 87.47, "elapsed_time": "1:25:33", "remaining_time": "0:12:15", "throughput": 4245.44, "total_tokens": 21793192} {"current_steps": 33385, "total_steps": 38160, "loss": 0.4128, "lr": 4.696215083091299e-05, "epoch": 17.497379454926623, "percentage": 87.49, "elapsed_time": "1:25:33", "remaining_time": "0:12:14", "throughput": 4245.43, "total_tokens": 21795816} {"current_steps": 33390, "total_steps": 38160, "loss": 0.5148, "lr": 4.686543772802915e-05, "epoch": 17.5, "percentage": 87.5, "elapsed_time": "1:25:34", "remaining_time": "0:12:13", "throughput": 4245.48, "total_tokens": 21799240} {"current_steps": 33395, "total_steps": 38160, "loss": 0.3159, "lr": 4.6768819415726085e-05, "epoch": 17.502620545073377, "percentage": 87.51, "elapsed_time": "1:25:35", "remaining_time": "0:12:12", "throughput": 4245.48, "total_tokens": 21802184} {"current_steps": 33400, "total_steps": 38160, "loss": 0.4904, "lr": 4.667229591421529e-05, "epoch": 17.50524109014675, "percentage": 87.53, "elapsed_time": "1:25:36", "remaining_time": "0:12:11", "throughput": 4245.53, "total_tokens": 21805640} {"current_steps": 33405, "total_steps": 38160, "loss": 0.4231, "lr": 4.657586724368845e-05, "epoch": 17.507861635220127, "percentage": 87.54, "elapsed_time": "1:25:36", "remaining_time": "0:12:11", "throughput": 4245.54, "total_tokens": 21808648} {"current_steps": 33410, "total_steps": 38160, "loss": 0.3946, "lr": 4.647953342431726e-05, "epoch": 17.5104821802935, "percentage": 87.55, "elapsed_time": "1:25:37", "remaining_time": "0:12:10", "throughput": 4245.64, "total_tokens": 21812616} {"current_steps": 33415, "total_steps": 38160, "loss": 0.2877, "lr": 4.63832944762535e-05, "epoch": 17.513102725366878, "percentage": 87.57, "elapsed_time": "1:25:38", "remaining_time": "0:12:09", "throughput": 4245.65, "total_tokens": 21815624} {"current_steps": 33420, "total_steps": 38160, "loss": 0.3531, "lr": 4.628715041962944e-05, "epoch": 17.51572327044025, "percentage": 87.58, "elapsed_time": "1:25:39", "remaining_time": "0:12:08", "throughput": 4245.65, "total_tokens": 21818472} {"current_steps": 33425, "total_steps": 38160, "loss": 0.2614, "lr": 4.619110127455728e-05, "epoch": 17.518343815513628, "percentage": 87.59, "elapsed_time": "1:25:39", "remaining_time": "0:12:08", "throughput": 4245.81, "total_tokens": 21823208} {"current_steps": 33430, "total_steps": 38160, "loss": 0.315, "lr": 4.6095147061129494e-05, "epoch": 17.520964360587, "percentage": 87.6, "elapsed_time": "1:25:40", "remaining_time": "0:12:07", "throughput": 4245.81, "total_tokens": 21826120} {"current_steps": 33435, "total_steps": 38160, "loss": 0.4224, "lr": 4.599928779941853e-05, "epoch": 17.52358490566038, "percentage": 87.62, "elapsed_time": "1:25:41", "remaining_time": "0:12:06", "throughput": 4245.9, "total_tokens": 21829992} {"current_steps": 33440, "total_steps": 38160, "loss": 0.4586, "lr": 4.590352350947691e-05, "epoch": 17.52620545073375, "percentage": 87.63, "elapsed_time": "1:25:42", "remaining_time": "0:12:05", "throughput": 4245.91, "total_tokens": 21832968} {"current_steps": 33445, "total_steps": 38160, "loss": 0.3658, "lr": 4.580785421133759e-05, "epoch": 17.52882599580713, "percentage": 87.64, "elapsed_time": "1:25:42", "remaining_time": "0:12:05", "throughput": 4245.96, "total_tokens": 21836328} {"current_steps": 33450, "total_steps": 38160, "loss": 0.4009, "lr": 4.571227992501348e-05, "epoch": 17.531446540880502, "percentage": 87.66, "elapsed_time": "1:25:43", "remaining_time": "0:12:04", "throughput": 4245.93, "total_tokens": 21838856} {"current_steps": 33455, "total_steps": 38160, "loss": 0.4984, "lr": 4.561680067049773e-05, "epoch": 17.53406708595388, "percentage": 87.67, "elapsed_time": "1:25:44", "remaining_time": "0:12:03", "throughput": 4245.99, "total_tokens": 21842440} {"current_steps": 33460, "total_steps": 38160, "loss": 0.5756, "lr": 4.552141646776331e-05, "epoch": 17.536687631027252, "percentage": 87.68, "elapsed_time": "1:25:44", "remaining_time": "0:12:02", "throughput": 4245.98, "total_tokens": 21845128} {"current_steps": 33465, "total_steps": 38160, "loss": 0.4411, "lr": 4.542612733676365e-05, "epoch": 17.53930817610063, "percentage": 87.7, "elapsed_time": "1:25:45", "remaining_time": "0:12:01", "throughput": 4245.93, "total_tokens": 21847528} {"current_steps": 33470, "total_steps": 38160, "loss": 0.5609, "lr": 4.533093329743204e-05, "epoch": 17.541928721174003, "percentage": 87.71, "elapsed_time": "1:25:46", "remaining_time": "0:12:01", "throughput": 4246.0, "total_tokens": 21851240} {"current_steps": 33475, "total_steps": 38160, "loss": 0.4419, "lr": 4.523583436968204e-05, "epoch": 17.54454926624738, "percentage": 87.72, "elapsed_time": "1:25:46", "remaining_time": "0:12:00", "throughput": 4245.96, "total_tokens": 21853672} {"current_steps": 33480, "total_steps": 38160, "loss": 0.6426, "lr": 4.514083057340723e-05, "epoch": 17.547169811320753, "percentage": 87.74, "elapsed_time": "1:25:47", "remaining_time": "0:11:59", "throughput": 4246.07, "total_tokens": 21857736} {"current_steps": 33485, "total_steps": 38160, "loss": 0.3524, "lr": 4.504592192848151e-05, "epoch": 17.54979035639413, "percentage": 87.75, "elapsed_time": "1:25:48", "remaining_time": "0:11:58", "throughput": 4246.12, "total_tokens": 21861192} {"current_steps": 33490, "total_steps": 38160, "loss": 0.3888, "lr": 4.495110845475847e-05, "epoch": 17.552410901467507, "percentage": 87.76, "elapsed_time": "1:25:49", "remaining_time": "0:11:58", "throughput": 4246.17, "total_tokens": 21864584} {"current_steps": 33495, "total_steps": 38160, "loss": 0.5635, "lr": 4.4856390172072045e-05, "epoch": 17.55503144654088, "percentage": 87.78, "elapsed_time": "1:25:49", "remaining_time": "0:11:57", "throughput": 4246.18, "total_tokens": 21867560} {"current_steps": 33500, "total_steps": 38160, "loss": 0.3933, "lr": 4.476176710023622e-05, "epoch": 17.557651991614257, "percentage": 87.79, "elapsed_time": "1:25:50", "remaining_time": "0:11:56", "throughput": 4246.18, "total_tokens": 21870408} {"current_steps": 33505, "total_steps": 38160, "loss": 0.3847, "lr": 4.4667239259045035e-05, "epoch": 17.56027253668763, "percentage": 87.8, "elapsed_time": "1:25:51", "remaining_time": "0:11:55", "throughput": 4246.19, "total_tokens": 21873256} {"current_steps": 33510, "total_steps": 38160, "loss": 0.5071, "lr": 4.457280666827285e-05, "epoch": 17.562893081761008, "percentage": 87.81, "elapsed_time": "1:25:51", "remaining_time": "0:11:54", "throughput": 4246.2, "total_tokens": 21876328} {"current_steps": 33515, "total_steps": 38160, "loss": 0.3993, "lr": 4.447846934767358e-05, "epoch": 17.56551362683438, "percentage": 87.83, "elapsed_time": "1:25:52", "remaining_time": "0:11:54", "throughput": 4246.25, "total_tokens": 21879784} {"current_steps": 33520, "total_steps": 38160, "loss": 0.4661, "lr": 4.4384227316981774e-05, "epoch": 17.568134171907758, "percentage": 87.84, "elapsed_time": "1:25:53", "remaining_time": "0:11:53", "throughput": 4246.26, "total_tokens": 21882792} {"current_steps": 33525, "total_steps": 38160, "loss": 0.4427, "lr": 4.4290080595911555e-05, "epoch": 17.57075471698113, "percentage": 87.85, "elapsed_time": "1:25:54", "remaining_time": "0:11:52", "throughput": 4246.34, "total_tokens": 21886632} {"current_steps": 33530, "total_steps": 38160, "loss": 0.5154, "lr": 4.419602920415749e-05, "epoch": 17.57337526205451, "percentage": 87.87, "elapsed_time": "1:25:54", "remaining_time": "0:11:51", "throughput": 4246.35, "total_tokens": 21889544} {"current_steps": 33535, "total_steps": 38160, "loss": 0.4283, "lr": 4.410207316139408e-05, "epoch": 17.57599580712788, "percentage": 87.88, "elapsed_time": "1:25:55", "remaining_time": "0:11:51", "throughput": 4246.42, "total_tokens": 21893192} {"current_steps": 33540, "total_steps": 38160, "loss": 0.4764, "lr": 4.400821248727577e-05, "epoch": 17.57861635220126, "percentage": 87.89, "elapsed_time": "1:25:56", "remaining_time": "0:11:50", "throughput": 4246.47, "total_tokens": 21896584} {"current_steps": 33545, "total_steps": 38160, "loss": 0.3781, "lr": 4.391444720143717e-05, "epoch": 17.581236897274632, "percentage": 87.91, "elapsed_time": "1:25:57", "remaining_time": "0:11:49", "throughput": 4246.5, "total_tokens": 21899656} {"current_steps": 33550, "total_steps": 38160, "loss": 0.4706, "lr": 4.382077732349299e-05, "epoch": 17.58385744234801, "percentage": 87.92, "elapsed_time": "1:25:57", "remaining_time": "0:11:48", "throughput": 4246.59, "total_tokens": 21903688} {"current_steps": 33555, "total_steps": 38160, "loss": 0.5068, "lr": 4.372720287303772e-05, "epoch": 17.586477987421382, "percentage": 87.93, "elapsed_time": "1:25:58", "remaining_time": "0:11:47", "throughput": 4246.61, "total_tokens": 21906760} {"current_steps": 33560, "total_steps": 38160, "loss": 0.3705, "lr": 4.3633723869646204e-05, "epoch": 17.58909853249476, "percentage": 87.95, "elapsed_time": "1:25:59", "remaining_time": "0:11:47", "throughput": 4246.61, "total_tokens": 21909864} {"current_steps": 33565, "total_steps": 38160, "loss": 0.3519, "lr": 4.3540340332873184e-05, "epoch": 17.591719077568133, "percentage": 87.96, "elapsed_time": "1:26:00", "remaining_time": "0:11:46", "throughput": 4246.62, "total_tokens": 21912808} {"current_steps": 33570, "total_steps": 38160, "loss": 0.3074, "lr": 4.3447052282253375e-05, "epoch": 17.59433962264151, "percentage": 87.97, "elapsed_time": "1:26:00", "remaining_time": "0:11:45", "throughput": 4246.64, "total_tokens": 21916040} {"current_steps": 33575, "total_steps": 38160, "loss": 0.455, "lr": 4.335385973730166e-05, "epoch": 17.596960167714883, "percentage": 87.98, "elapsed_time": "1:26:01", "remaining_time": "0:11:44", "throughput": 4246.84, "total_tokens": 21921064} {"current_steps": 33580, "total_steps": 38160, "loss": 0.4504, "lr": 4.3260762717512726e-05, "epoch": 17.59958071278826, "percentage": 88.0, "elapsed_time": "1:26:02", "remaining_time": "0:11:44", "throughput": 4246.8, "total_tokens": 21923624} {"current_steps": 33585, "total_steps": 38160, "loss": 0.378, "lr": 4.316776124236144e-05, "epoch": 17.602201257861637, "percentage": 88.01, "elapsed_time": "1:26:03", "remaining_time": "0:11:43", "throughput": 4246.9, "total_tokens": 21927688} {"current_steps": 33590, "total_steps": 38160, "loss": 0.5056, "lr": 4.307485533130279e-05, "epoch": 17.60482180293501, "percentage": 88.02, "elapsed_time": "1:26:03", "remaining_time": "0:11:42", "throughput": 4246.86, "total_tokens": 21930248} {"current_steps": 33595, "total_steps": 38160, "loss": 0.3746, "lr": 4.298204500377145e-05, "epoch": 17.607442348008387, "percentage": 88.04, "elapsed_time": "1:26:04", "remaining_time": "0:11:41", "throughput": 4246.92, "total_tokens": 21933736} {"current_steps": 33600, "total_steps": 38160, "loss": 0.3658, "lr": 4.288933027918235e-05, "epoch": 17.61006289308176, "percentage": 88.05, "elapsed_time": "1:26:05", "remaining_time": "0:11:41", "throughput": 4246.98, "total_tokens": 21937256} {"current_steps": 33605, "total_steps": 38160, "loss": 0.3596, "lr": 4.279671117693046e-05, "epoch": 17.612683438155138, "percentage": 88.06, "elapsed_time": "1:26:06", "remaining_time": "0:11:40", "throughput": 4246.98, "total_tokens": 21940136} {"current_steps": 33610, "total_steps": 38160, "loss": 0.4942, "lr": 4.270418771639045e-05, "epoch": 17.61530398322851, "percentage": 88.08, "elapsed_time": "1:26:06", "remaining_time": "0:11:39", "throughput": 4246.97, "total_tokens": 21942888} {"current_steps": 33615, "total_steps": 38160, "loss": 0.38, "lr": 4.2611759916917345e-05, "epoch": 17.617924528301888, "percentage": 88.09, "elapsed_time": "1:26:07", "remaining_time": "0:11:38", "throughput": 4247.13, "total_tokens": 21947752} {"current_steps": 33620, "total_steps": 38160, "loss": 0.52, "lr": 4.251942779784579e-05, "epoch": 17.62054507337526, "percentage": 88.1, "elapsed_time": "1:26:08", "remaining_time": "0:11:37", "throughput": 4247.21, "total_tokens": 21951496} {"current_steps": 33625, "total_steps": 38160, "loss": 0.3588, "lr": 4.242719137849077e-05, "epoch": 17.62316561844864, "percentage": 88.12, "elapsed_time": "1:26:09", "remaining_time": "0:11:37", "throughput": 4247.27, "total_tokens": 21955048} {"current_steps": 33630, "total_steps": 38160, "loss": 0.4233, "lr": 4.233505067814702e-05, "epoch": 17.62578616352201, "percentage": 88.13, "elapsed_time": "1:26:09", "remaining_time": "0:11:36", "throughput": 4247.32, "total_tokens": 21958408} {"current_steps": 33635, "total_steps": 38160, "loss": 0.4471, "lr": 4.224300571608947e-05, "epoch": 17.62840670859539, "percentage": 88.14, "elapsed_time": "1:26:10", "remaining_time": "0:11:35", "throughput": 4247.29, "total_tokens": 21961000} {"current_steps": 33640, "total_steps": 38160, "loss": 0.4536, "lr": 4.215105651157264e-05, "epoch": 17.631027253668762, "percentage": 88.16, "elapsed_time": "1:26:11", "remaining_time": "0:11:34", "throughput": 4247.35, "total_tokens": 21964552} {"current_steps": 33645, "total_steps": 38160, "loss": 0.4291, "lr": 4.2059203083831434e-05, "epoch": 17.63364779874214, "percentage": 88.17, "elapsed_time": "1:26:12", "remaining_time": "0:11:34", "throughput": 4247.34, "total_tokens": 21967272} {"current_steps": 33650, "total_steps": 38160, "loss": 0.4964, "lr": 4.196744545208042e-05, "epoch": 17.636268343815512, "percentage": 88.18, "elapsed_time": "1:26:12", "remaining_time": "0:11:33", "throughput": 4247.4, "total_tokens": 21970824} {"current_steps": 33655, "total_steps": 38160, "loss": 0.4281, "lr": 4.187578363551431e-05, "epoch": 17.63888888888889, "percentage": 88.19, "elapsed_time": "1:26:13", "remaining_time": "0:11:32", "throughput": 4247.4, "total_tokens": 21973768} {"current_steps": 33660, "total_steps": 38160, "loss": 0.4761, "lr": 4.17842176533077e-05, "epoch": 17.641509433962263, "percentage": 88.21, "elapsed_time": "1:26:14", "remaining_time": "0:11:31", "throughput": 4247.41, "total_tokens": 21976712} {"current_steps": 33665, "total_steps": 38160, "loss": 0.3849, "lr": 4.1692747524615274e-05, "epoch": 17.64412997903564, "percentage": 88.22, "elapsed_time": "1:26:14", "remaining_time": "0:11:30", "throughput": 4247.43, "total_tokens": 21979848} {"current_steps": 33670, "total_steps": 38160, "loss": 0.4988, "lr": 4.160137326857138e-05, "epoch": 17.646750524109013, "percentage": 88.23, "elapsed_time": "1:26:15", "remaining_time": "0:11:30", "throughput": 4247.45, "total_tokens": 21983048} {"current_steps": 33675, "total_steps": 38160, "loss": 0.4903, "lr": 4.151009490429042e-05, "epoch": 17.64937106918239, "percentage": 88.25, "elapsed_time": "1:26:16", "remaining_time": "0:11:29", "throughput": 4247.56, "total_tokens": 21987176} {"current_steps": 33680, "total_steps": 38160, "loss": 0.4138, "lr": 4.141891245086687e-05, "epoch": 17.651991614255767, "percentage": 88.26, "elapsed_time": "1:26:17", "remaining_time": "0:11:28", "throughput": 4247.56, "total_tokens": 21990088} {"current_steps": 33685, "total_steps": 38160, "loss": 0.5188, "lr": 4.132782592737511e-05, "epoch": 17.65461215932914, "percentage": 88.27, "elapsed_time": "1:26:17", "remaining_time": "0:11:27", "throughput": 4247.64, "total_tokens": 21993928} {"current_steps": 33690, "total_steps": 38160, "loss": 0.4011, "lr": 4.123683535286943e-05, "epoch": 17.657232704402517, "percentage": 88.29, "elapsed_time": "1:26:18", "remaining_time": "0:11:27", "throughput": 4247.79, "total_tokens": 21998536} {"current_steps": 33695, "total_steps": 38160, "loss": 0.518, "lr": 4.114594074638395e-05, "epoch": 17.65985324947589, "percentage": 88.3, "elapsed_time": "1:26:19", "remaining_time": "0:11:26", "throughput": 4247.86, "total_tokens": 22002184} {"current_steps": 33700, "total_steps": 38160, "loss": 0.4829, "lr": 4.105514212693268e-05, "epoch": 17.662473794549268, "percentage": 88.31, "elapsed_time": "1:26:20", "remaining_time": "0:11:25", "throughput": 4247.97, "total_tokens": 22006504} {"current_steps": 33705, "total_steps": 38160, "loss": 0.3711, "lr": 4.096443951350976e-05, "epoch": 17.66509433962264, "percentage": 88.33, "elapsed_time": "1:26:21", "remaining_time": "0:11:24", "throughput": 4247.93, "total_tokens": 22009000} {"current_steps": 33710, "total_steps": 38160, "loss": 0.4951, "lr": 4.0873832925089116e-05, "epoch": 17.667714884696018, "percentage": 88.34, "elapsed_time": "1:26:21", "remaining_time": "0:11:24", "throughput": 4247.99, "total_tokens": 22012456} {"current_steps": 33715, "total_steps": 38160, "loss": 0.3254, "lr": 4.0783322380624656e-05, "epoch": 17.67033542976939, "percentage": 88.35, "elapsed_time": "1:26:22", "remaining_time": "0:11:23", "throughput": 4247.98, "total_tokens": 22015272} {"current_steps": 33720, "total_steps": 38160, "loss": 0.5068, "lr": 4.069290789905023e-05, "epoch": 17.67295597484277, "percentage": 88.36, "elapsed_time": "1:26:23", "remaining_time": "0:11:22", "throughput": 4247.97, "total_tokens": 22018088} {"current_steps": 33725, "total_steps": 38160, "loss": 0.4833, "lr": 4.060258949927942e-05, "epoch": 17.67557651991614, "percentage": 88.38, "elapsed_time": "1:26:23", "remaining_time": "0:11:21", "throughput": 4248.0, "total_tokens": 22021224} {"current_steps": 33730, "total_steps": 38160, "loss": 0.335, "lr": 4.051236720020568e-05, "epoch": 17.67819706498952, "percentage": 88.39, "elapsed_time": "1:26:24", "remaining_time": "0:11:20", "throughput": 4247.97, "total_tokens": 22023848} {"current_steps": 33735, "total_steps": 38160, "loss": 0.6032, "lr": 4.042224102070263e-05, "epoch": 17.680817610062892, "percentage": 88.4, "elapsed_time": "1:26:25", "remaining_time": "0:11:20", "throughput": 4247.95, "total_tokens": 22026568} {"current_steps": 33740, "total_steps": 38160, "loss": 0.4114, "lr": 4.033221097962364e-05, "epoch": 17.68343815513627, "percentage": 88.42, "elapsed_time": "1:26:25", "remaining_time": "0:11:19", "throughput": 4247.95, "total_tokens": 22029448} {"current_steps": 33745, "total_steps": 38160, "loss": 0.3916, "lr": 4.0242277095802025e-05, "epoch": 17.686058700209642, "percentage": 88.43, "elapsed_time": "1:26:26", "remaining_time": "0:11:18", "throughput": 4247.96, "total_tokens": 22032392} {"current_steps": 33750, "total_steps": 38160, "loss": 0.4406, "lr": 4.015243938805086e-05, "epoch": 17.68867924528302, "percentage": 88.44, "elapsed_time": "1:26:27", "remaining_time": "0:11:17", "throughput": 4247.95, "total_tokens": 22035208} {"current_steps": 33755, "total_steps": 38160, "loss": 0.3546, "lr": 4.006269787516304e-05, "epoch": 17.691299790356393, "percentage": 88.46, "elapsed_time": "1:26:28", "remaining_time": "0:11:17", "throughput": 4248.0, "total_tokens": 22038696} {"current_steps": 33760, "total_steps": 38160, "loss": 0.4178, "lr": 3.9973052575911606e-05, "epoch": 17.69392033542977, "percentage": 88.47, "elapsed_time": "1:26:28", "remaining_time": "0:11:16", "throughput": 4248.05, "total_tokens": 22042088} {"current_steps": 33765, "total_steps": 38160, "loss": 0.3502, "lr": 3.988350350904929e-05, "epoch": 17.696540880503143, "percentage": 88.48, "elapsed_time": "1:26:29", "remaining_time": "0:11:15", "throughput": 4248.05, "total_tokens": 22045064} {"current_steps": 33770, "total_steps": 38160, "loss": 0.3936, "lr": 3.979405069330882e-05, "epoch": 17.69916142557652, "percentage": 88.5, "elapsed_time": "1:26:30", "remaining_time": "0:11:14", "throughput": 4248.16, "total_tokens": 22049128} {"current_steps": 33775, "total_steps": 38160, "loss": 0.3811, "lr": 3.970469414740269e-05, "epoch": 17.701781970649897, "percentage": 88.51, "elapsed_time": "1:26:31", "remaining_time": "0:11:13", "throughput": 4248.26, "total_tokens": 22053128} {"current_steps": 33780, "total_steps": 38160, "loss": 0.4064, "lr": 3.961543389002309e-05, "epoch": 17.70440251572327, "percentage": 88.52, "elapsed_time": "1:26:31", "remaining_time": "0:11:13", "throughput": 4248.31, "total_tokens": 22056616} {"current_steps": 33785, "total_steps": 38160, "loss": 0.5818, "lr": 3.952626993984243e-05, "epoch": 17.707023060796647, "percentage": 88.54, "elapsed_time": "1:26:32", "remaining_time": "0:11:12", "throughput": 4248.33, "total_tokens": 22059816} {"current_steps": 33790, "total_steps": 38160, "loss": 0.5638, "lr": 3.943720231551268e-05, "epoch": 17.70964360587002, "percentage": 88.55, "elapsed_time": "1:26:33", "remaining_time": "0:11:11", "throughput": 4248.32, "total_tokens": 22062504} {"current_steps": 33795, "total_steps": 38160, "loss": 0.3241, "lr": 3.934823103566587e-05, "epoch": 17.712264150943398, "percentage": 88.56, "elapsed_time": "1:26:33", "remaining_time": "0:11:10", "throughput": 4248.33, "total_tokens": 22065448} {"current_steps": 33800, "total_steps": 38160, "loss": 0.5076, "lr": 3.925935611891379e-05, "epoch": 17.71488469601677, "percentage": 88.57, "elapsed_time": "1:26:34", "remaining_time": "0:11:10", "throughput": 4248.37, "total_tokens": 22068840} {"current_steps": 33805, "total_steps": 38160, "loss": 0.4205, "lr": 3.917057758384801e-05, "epoch": 17.717505241090148, "percentage": 88.59, "elapsed_time": "1:26:35", "remaining_time": "0:11:09", "throughput": 4248.36, "total_tokens": 22071688} {"current_steps": 33810, "total_steps": 38160, "loss": 0.3837, "lr": 3.9081895449039896e-05, "epoch": 17.72012578616352, "percentage": 88.6, "elapsed_time": "1:26:36", "remaining_time": "0:11:08", "throughput": 4248.36, "total_tokens": 22074568} {"current_steps": 33815, "total_steps": 38160, "loss": 0.4087, "lr": 3.899330973304083e-05, "epoch": 17.7227463312369, "percentage": 88.61, "elapsed_time": "1:26:36", "remaining_time": "0:11:07", "throughput": 4248.38, "total_tokens": 22077640} {"current_steps": 33820, "total_steps": 38160, "loss": 0.566, "lr": 3.8904820454381875e-05, "epoch": 17.72536687631027, "percentage": 88.63, "elapsed_time": "1:26:37", "remaining_time": "0:11:06", "throughput": 4248.4, "total_tokens": 22080712} {"current_steps": 33825, "total_steps": 38160, "loss": 0.3976, "lr": 3.881642763157417e-05, "epoch": 17.72798742138365, "percentage": 88.64, "elapsed_time": "1:26:38", "remaining_time": "0:11:06", "throughput": 4248.46, "total_tokens": 22084360} {"current_steps": 33830, "total_steps": 38160, "loss": 0.3075, "lr": 3.872813128310826e-05, "epoch": 17.730607966457022, "percentage": 88.65, "elapsed_time": "1:26:38", "remaining_time": "0:11:05", "throughput": 4248.45, "total_tokens": 22087176} {"current_steps": 33835, "total_steps": 38160, "loss": 0.5672, "lr": 3.8639931427454866e-05, "epoch": 17.7332285115304, "percentage": 88.67, "elapsed_time": "1:26:39", "remaining_time": "0:11:04", "throughput": 4248.47, "total_tokens": 22090248} {"current_steps": 33840, "total_steps": 38160, "loss": 0.392, "lr": 3.855182808306429e-05, "epoch": 17.735849056603772, "percentage": 88.68, "elapsed_time": "1:26:40", "remaining_time": "0:11:03", "throughput": 4248.52, "total_tokens": 22093672} {"current_steps": 33845, "total_steps": 38160, "loss": 0.4337, "lr": 3.8463821268366784e-05, "epoch": 17.73846960167715, "percentage": 88.69, "elapsed_time": "1:26:41", "remaining_time": "0:11:03", "throughput": 4248.57, "total_tokens": 22097128} {"current_steps": 33850, "total_steps": 38160, "loss": 0.3945, "lr": 3.837591100177246e-05, "epoch": 17.741090146750523, "percentage": 88.71, "elapsed_time": "1:26:41", "remaining_time": "0:11:02", "throughput": 4248.56, "total_tokens": 22099976} {"current_steps": 33855, "total_steps": 38160, "loss": 0.4159, "lr": 3.828809730167099e-05, "epoch": 17.7437106918239, "percentage": 88.72, "elapsed_time": "1:26:42", "remaining_time": "0:11:01", "throughput": 4248.66, "total_tokens": 22103880} {"current_steps": 33860, "total_steps": 38160, "loss": 0.4508, "lr": 3.820038018643218e-05, "epoch": 17.746331236897273, "percentage": 88.73, "elapsed_time": "1:26:43", "remaining_time": "0:11:00", "throughput": 4248.71, "total_tokens": 22107400} {"current_steps": 33865, "total_steps": 38160, "loss": 0.4176, "lr": 3.8112759674405254e-05, "epoch": 17.74895178197065, "percentage": 88.74, "elapsed_time": "1:26:43", "remaining_time": "0:11:00", "throughput": 4248.7, "total_tokens": 22110184} {"current_steps": 33870, "total_steps": 38160, "loss": 0.3599, "lr": 3.802523578391953e-05, "epoch": 17.751572327044027, "percentage": 88.76, "elapsed_time": "1:26:44", "remaining_time": "0:10:59", "throughput": 4248.66, "total_tokens": 22112520} {"current_steps": 33875, "total_steps": 38160, "loss": 0.4371, "lr": 3.793780853328399e-05, "epoch": 17.7541928721174, "percentage": 88.77, "elapsed_time": "1:26:45", "remaining_time": "0:10:58", "throughput": 4248.68, "total_tokens": 22115752} {"current_steps": 33880, "total_steps": 38160, "loss": 0.3152, "lr": 3.785047794078744e-05, "epoch": 17.756813417190777, "percentage": 88.78, "elapsed_time": "1:26:46", "remaining_time": "0:10:57", "throughput": 4248.8, "total_tokens": 22120072} {"current_steps": 33885, "total_steps": 38160, "loss": 0.4108, "lr": 3.776324402469844e-05, "epoch": 17.75943396226415, "percentage": 88.8, "elapsed_time": "1:26:46", "remaining_time": "0:10:56", "throughput": 4248.84, "total_tokens": 22123400} {"current_steps": 33890, "total_steps": 38160, "loss": 0.5531, "lr": 3.767610680326533e-05, "epoch": 17.762054507337528, "percentage": 88.81, "elapsed_time": "1:26:47", "remaining_time": "0:10:56", "throughput": 4248.92, "total_tokens": 22127144} {"current_steps": 33895, "total_steps": 38160, "loss": 0.3327, "lr": 3.7589066294716145e-05, "epoch": 17.7646750524109, "percentage": 88.82, "elapsed_time": "1:26:48", "remaining_time": "0:10:55", "throughput": 4248.91, "total_tokens": 22129928} {"current_steps": 33900, "total_steps": 38160, "loss": 0.5119, "lr": 3.750212251725882e-05, "epoch": 17.767295597484278, "percentage": 88.84, "elapsed_time": "1:26:49", "remaining_time": "0:10:54", "throughput": 4248.9, "total_tokens": 22132776} {"current_steps": 33905, "total_steps": 38160, "loss": 0.3629, "lr": 3.741527548908113e-05, "epoch": 17.76991614255765, "percentage": 88.85, "elapsed_time": "1:26:49", "remaining_time": "0:10:53", "throughput": 4248.95, "total_tokens": 22136232} {"current_steps": 33910, "total_steps": 38160, "loss": 0.477, "lr": 3.732852522835023e-05, "epoch": 17.77253668763103, "percentage": 88.86, "elapsed_time": "1:26:50", "remaining_time": "0:10:53", "throughput": 4249.05, "total_tokens": 22140168} {"current_steps": 33915, "total_steps": 38160, "loss": 0.5419, "lr": 3.724187175321342e-05, "epoch": 17.7751572327044, "percentage": 88.88, "elapsed_time": "1:26:51", "remaining_time": "0:10:52", "throughput": 4249.07, "total_tokens": 22143368} {"current_steps": 33920, "total_steps": 38160, "loss": 0.3912, "lr": 3.71553150817977e-05, "epoch": 17.77777777777778, "percentage": 88.89, "elapsed_time": "1:26:52", "remaining_time": "0:10:51", "throughput": 4249.12, "total_tokens": 22146824} {"current_steps": 33925, "total_steps": 38160, "loss": 0.3569, "lr": 3.70688552322096e-05, "epoch": 17.780398322851152, "percentage": 88.9, "elapsed_time": "1:26:52", "remaining_time": "0:10:50", "throughput": 4249.13, "total_tokens": 22149928} {"current_steps": 33930, "total_steps": 38160, "loss": 0.4186, "lr": 3.698249222253569e-05, "epoch": 17.78301886792453, "percentage": 88.92, "elapsed_time": "1:26:53", "remaining_time": "0:10:49", "throughput": 4249.21, "total_tokens": 22153768} {"current_steps": 33935, "total_steps": 38160, "loss": 0.4188, "lr": 3.6896226070841863e-05, "epoch": 17.785639412997902, "percentage": 88.93, "elapsed_time": "1:26:54", "remaining_time": "0:10:49", "throughput": 4249.21, "total_tokens": 22156744} {"current_steps": 33940, "total_steps": 38160, "loss": 0.3622, "lr": 3.681005679517424e-05, "epoch": 17.78825995807128, "percentage": 88.94, "elapsed_time": "1:26:54", "remaining_time": "0:10:48", "throughput": 4249.17, "total_tokens": 22159240} {"current_steps": 33945, "total_steps": 38160, "loss": 0.4033, "lr": 3.6723984413558455e-05, "epoch": 17.790880503144653, "percentage": 88.95, "elapsed_time": "1:26:55", "remaining_time": "0:10:47", "throughput": 4249.24, "total_tokens": 22162856} {"current_steps": 33950, "total_steps": 38160, "loss": 0.3508, "lr": 3.663800894399971e-05, "epoch": 17.79350104821803, "percentage": 88.97, "elapsed_time": "1:26:56", "remaining_time": "0:10:46", "throughput": 4249.23, "total_tokens": 22165736} {"current_steps": 33955, "total_steps": 38160, "loss": 0.3195, "lr": 3.655213040448318e-05, "epoch": 17.796121593291403, "percentage": 88.98, "elapsed_time": "1:26:57", "remaining_time": "0:10:46", "throughput": 4249.22, "total_tokens": 22168488} {"current_steps": 33960, "total_steps": 38160, "loss": 0.4099, "lr": 3.6466348812973723e-05, "epoch": 17.79874213836478, "percentage": 88.99, "elapsed_time": "1:26:58", "remaining_time": "0:10:45", "throughput": 4249.39, "total_tokens": 22173448} {"current_steps": 33965, "total_steps": 38160, "loss": 0.429, "lr": 3.6380664187415815e-05, "epoch": 17.801362683438157, "percentage": 89.01, "elapsed_time": "1:26:58", "remaining_time": "0:10:44", "throughput": 4249.46, "total_tokens": 22177096} {"current_steps": 33970, "total_steps": 38160, "loss": 0.4348, "lr": 3.6295076545733663e-05, "epoch": 17.80398322851153, "percentage": 89.02, "elapsed_time": "1:26:59", "remaining_time": "0:10:43", "throughput": 4249.47, "total_tokens": 22180168} {"current_steps": 33975, "total_steps": 38160, "loss": 0.5291, "lr": 3.6209585905831344e-05, "epoch": 17.806603773584907, "percentage": 89.03, "elapsed_time": "1:27:00", "remaining_time": "0:10:43", "throughput": 4249.45, "total_tokens": 22182920} {"current_steps": 33980, "total_steps": 38160, "loss": 0.343, "lr": 3.6124192285592385e-05, "epoch": 17.80922431865828, "percentage": 89.05, "elapsed_time": "1:27:00", "remaining_time": "0:10:42", "throughput": 4249.4, "total_tokens": 22185288} {"current_steps": 33985, "total_steps": 38160, "loss": 0.3763, "lr": 3.6038895702880324e-05, "epoch": 17.811844863731658, "percentage": 89.06, "elapsed_time": "1:27:01", "remaining_time": "0:10:41", "throughput": 4249.59, "total_tokens": 22190472} {"current_steps": 33990, "total_steps": 38160, "loss": 0.5482, "lr": 3.595369617553806e-05, "epoch": 17.81446540880503, "percentage": 89.07, "elapsed_time": "1:27:02", "remaining_time": "0:10:40", "throughput": 4249.64, "total_tokens": 22193960} {"current_steps": 33995, "total_steps": 38160, "loss": 0.3226, "lr": 3.58685937213884e-05, "epoch": 17.817085953878408, "percentage": 89.09, "elapsed_time": "1:27:03", "remaining_time": "0:10:39", "throughput": 4249.6, "total_tokens": 22196392} {"current_steps": 34000, "total_steps": 38160, "loss": 0.3541, "lr": 3.5783588358233863e-05, "epoch": 17.81970649895178, "percentage": 89.1, "elapsed_time": "1:27:03", "remaining_time": "0:10:39", "throughput": 4249.59, "total_tokens": 22199272} {"current_steps": 34005, "total_steps": 38160, "loss": 0.4702, "lr": 3.569868010385663e-05, "epoch": 17.822327044025158, "percentage": 89.11, "elapsed_time": "1:27:04", "remaining_time": "0:10:38", "throughput": 4249.63, "total_tokens": 22202536} {"current_steps": 34010, "total_steps": 38160, "loss": 0.5079, "lr": 3.5613868976018535e-05, "epoch": 17.82494758909853, "percentage": 89.12, "elapsed_time": "1:27:05", "remaining_time": "0:10:37", "throughput": 4249.67, "total_tokens": 22205864} {"current_steps": 34015, "total_steps": 38160, "loss": 0.3926, "lr": 3.5529154992460955e-05, "epoch": 17.82756813417191, "percentage": 89.14, "elapsed_time": "1:27:05", "remaining_time": "0:10:36", "throughput": 4249.65, "total_tokens": 22208520} {"current_steps": 34020, "total_steps": 38160, "loss": 0.3922, "lr": 3.544453817090521e-05, "epoch": 17.830188679245282, "percentage": 89.15, "elapsed_time": "1:27:06", "remaining_time": "0:10:36", "throughput": 4249.64, "total_tokens": 22211336} {"current_steps": 34025, "total_steps": 38160, "loss": 0.5102, "lr": 3.536001852905207e-05, "epoch": 17.83280922431866, "percentage": 89.16, "elapsed_time": "1:27:07", "remaining_time": "0:10:35", "throughput": 4249.69, "total_tokens": 22214888} {"current_steps": 34030, "total_steps": 38160, "loss": 0.4068, "lr": 3.527559608458225e-05, "epoch": 17.835429769392032, "percentage": 89.18, "elapsed_time": "1:27:08", "remaining_time": "0:10:34", "throughput": 4249.73, "total_tokens": 22218216} {"current_steps": 34035, "total_steps": 38160, "loss": 0.4952, "lr": 3.5191270855155886e-05, "epoch": 17.83805031446541, "percentage": 89.19, "elapsed_time": "1:27:08", "remaining_time": "0:10:33", "throughput": 4249.74, "total_tokens": 22221224} {"current_steps": 34040, "total_steps": 38160, "loss": 0.3843, "lr": 3.510704285841293e-05, "epoch": 17.840670859538783, "percentage": 89.2, "elapsed_time": "1:27:09", "remaining_time": "0:10:32", "throughput": 4249.72, "total_tokens": 22223912} {"current_steps": 34045, "total_steps": 38160, "loss": 0.4584, "lr": 3.502291211197267e-05, "epoch": 17.84329140461216, "percentage": 89.22, "elapsed_time": "1:27:10", "remaining_time": "0:10:32", "throughput": 4249.81, "total_tokens": 22227784} {"current_steps": 34050, "total_steps": 38160, "loss": 0.4071, "lr": 3.493887863343448e-05, "epoch": 17.845911949685533, "percentage": 89.23, "elapsed_time": "1:27:10", "remaining_time": "0:10:31", "throughput": 4249.77, "total_tokens": 22230280} {"current_steps": 34055, "total_steps": 38160, "loss": 0.4839, "lr": 3.485494244037718e-05, "epoch": 17.84853249475891, "percentage": 89.24, "elapsed_time": "1:27:11", "remaining_time": "0:10:30", "throughput": 4249.74, "total_tokens": 22232744} {"current_steps": 34060, "total_steps": 38160, "loss": 0.3208, "lr": 3.477110355035934e-05, "epoch": 17.851153039832283, "percentage": 89.26, "elapsed_time": "1:27:12", "remaining_time": "0:10:29", "throughput": 4249.75, "total_tokens": 22235784} {"current_steps": 34065, "total_steps": 38160, "loss": 0.4883, "lr": 3.468736198091904e-05, "epoch": 17.85377358490566, "percentage": 89.27, "elapsed_time": "1:27:13", "remaining_time": "0:10:29", "throughput": 4249.86, "total_tokens": 22239912} {"current_steps": 34070, "total_steps": 38160, "loss": 0.5504, "lr": 3.4603717749573935e-05, "epoch": 17.856394129979037, "percentage": 89.28, "elapsed_time": "1:27:13", "remaining_time": "0:10:28", "throughput": 4249.97, "total_tokens": 22244104} {"current_steps": 34075, "total_steps": 38160, "loss": 0.3797, "lr": 3.452017087382159e-05, "epoch": 17.85901467505241, "percentage": 89.3, "elapsed_time": "1:27:14", "remaining_time": "0:10:27", "throughput": 4250.04, "total_tokens": 22247816} {"current_steps": 34080, "total_steps": 38160, "loss": 0.3848, "lr": 3.443672137113901e-05, "epoch": 17.861635220125788, "percentage": 89.31, "elapsed_time": "1:27:15", "remaining_time": "0:10:26", "throughput": 4250.13, "total_tokens": 22251688} {"current_steps": 34085, "total_steps": 38160, "loss": 0.4418, "lr": 3.4353369258983025e-05, "epoch": 17.86425576519916, "percentage": 89.32, "elapsed_time": "1:27:16", "remaining_time": "0:10:26", "throughput": 4250.18, "total_tokens": 22255144} {"current_steps": 34090, "total_steps": 38160, "loss": 0.705, "lr": 3.4270114554789735e-05, "epoch": 17.866876310272538, "percentage": 89.33, "elapsed_time": "1:27:17", "remaining_time": "0:10:25", "throughput": 4250.23, "total_tokens": 22258536} {"current_steps": 34095, "total_steps": 38160, "loss": 0.3681, "lr": 3.41869572759751e-05, "epoch": 17.86949685534591, "percentage": 89.35, "elapsed_time": "1:27:18", "remaining_time": "0:10:24", "throughput": 4250.45, "total_tokens": 22264104} {"current_steps": 34100, "total_steps": 38160, "loss": 0.3085, "lr": 3.410389743993475e-05, "epoch": 17.872117400419288, "percentage": 89.36, "elapsed_time": "1:27:18", "remaining_time": "0:10:23", "throughput": 4250.45, "total_tokens": 22266952} {"current_steps": 34105, "total_steps": 38160, "loss": 0.397, "lr": 3.40209350640438e-05, "epoch": 17.87473794549266, "percentage": 89.37, "elapsed_time": "1:27:19", "remaining_time": "0:10:22", "throughput": 4250.47, "total_tokens": 22270088} {"current_steps": 34110, "total_steps": 38160, "loss": 0.4399, "lr": 3.3938070165657084e-05, "epoch": 17.87735849056604, "percentage": 89.39, "elapsed_time": "1:27:20", "remaining_time": "0:10:22", "throughput": 4250.45, "total_tokens": 22272680} {"current_steps": 34115, "total_steps": 38160, "loss": 0.3354, "lr": 3.385530276210902e-05, "epoch": 17.879979035639412, "percentage": 89.4, "elapsed_time": "1:27:20", "remaining_time": "0:10:21", "throughput": 4250.52, "total_tokens": 22276456} {"current_steps": 34120, "total_steps": 38160, "loss": 0.3929, "lr": 3.377263287071358e-05, "epoch": 17.88259958071279, "percentage": 89.41, "elapsed_time": "1:27:21", "remaining_time": "0:10:20", "throughput": 4250.56, "total_tokens": 22279784} {"current_steps": 34125, "total_steps": 38160, "loss": 0.5002, "lr": 3.369006050876428e-05, "epoch": 17.885220125786162, "percentage": 89.43, "elapsed_time": "1:27:22", "remaining_time": "0:10:19", "throughput": 4250.57, "total_tokens": 22282760} {"current_steps": 34130, "total_steps": 38160, "loss": 0.4841, "lr": 3.3607585693534394e-05, "epoch": 17.88784067085954, "percentage": 89.44, "elapsed_time": "1:27:23", "remaining_time": "0:10:19", "throughput": 4250.6, "total_tokens": 22286088} {"current_steps": 34135, "total_steps": 38160, "loss": 0.35, "lr": 3.352520844227663e-05, "epoch": 17.890461215932913, "percentage": 89.45, "elapsed_time": "1:27:23", "remaining_time": "0:10:18", "throughput": 4250.75, "total_tokens": 22290632} {"current_steps": 34140, "total_steps": 38160, "loss": 0.344, "lr": 3.344292877222355e-05, "epoch": 17.89308176100629, "percentage": 89.47, "elapsed_time": "1:27:24", "remaining_time": "0:10:17", "throughput": 4250.75, "total_tokens": 22293448} {"current_steps": 34145, "total_steps": 38160, "loss": 0.5803, "lr": 3.336074670058703e-05, "epoch": 17.895702306079663, "percentage": 89.48, "elapsed_time": "1:27:25", "remaining_time": "0:10:16", "throughput": 4250.86, "total_tokens": 22297704} {"current_steps": 34150, "total_steps": 38160, "loss": 0.3612, "lr": 3.327866224455844e-05, "epoch": 17.89832285115304, "percentage": 89.49, "elapsed_time": "1:27:26", "remaining_time": "0:10:16", "throughput": 4250.85, "total_tokens": 22300488} {"current_steps": 34155, "total_steps": 38160, "loss": 0.4938, "lr": 3.3196675421309165e-05, "epoch": 17.900943396226417, "percentage": 89.5, "elapsed_time": "1:27:26", "remaining_time": "0:10:15", "throughput": 4250.87, "total_tokens": 22303656} {"current_steps": 34160, "total_steps": 38160, "loss": 0.3437, "lr": 3.3114786247989744e-05, "epoch": 17.90356394129979, "percentage": 89.52, "elapsed_time": "1:27:27", "remaining_time": "0:10:14", "throughput": 4250.88, "total_tokens": 22306664} {"current_steps": 34165, "total_steps": 38160, "loss": 0.3511, "lr": 3.303299474173066e-05, "epoch": 17.906184486373167, "percentage": 89.53, "elapsed_time": "1:27:28", "remaining_time": "0:10:13", "throughput": 4250.88, "total_tokens": 22309512} {"current_steps": 34170, "total_steps": 38160, "loss": 0.43, "lr": 3.2951300919641544e-05, "epoch": 17.90880503144654, "percentage": 89.54, "elapsed_time": "1:27:28", "remaining_time": "0:10:12", "throughput": 4250.87, "total_tokens": 22312424} {"current_steps": 34175, "total_steps": 38160, "loss": 0.5088, "lr": 3.2869704798811964e-05, "epoch": 17.911425576519918, "percentage": 89.56, "elapsed_time": "1:27:29", "remaining_time": "0:10:12", "throughput": 4250.93, "total_tokens": 22316136} {"current_steps": 34180, "total_steps": 38160, "loss": 0.4723, "lr": 3.2788206396310746e-05, "epoch": 17.91404612159329, "percentage": 89.57, "elapsed_time": "1:27:30", "remaining_time": "0:10:11", "throughput": 4250.93, "total_tokens": 22319112} {"current_steps": 34185, "total_steps": 38160, "loss": 0.447, "lr": 3.270680572918655e-05, "epoch": 17.916666666666668, "percentage": 89.58, "elapsed_time": "1:27:31", "remaining_time": "0:10:10", "throughput": 4250.98, "total_tokens": 22322504} {"current_steps": 34190, "total_steps": 38160, "loss": 0.4467, "lr": 3.262550281446741e-05, "epoch": 17.91928721174004, "percentage": 89.6, "elapsed_time": "1:27:32", "remaining_time": "0:10:09", "throughput": 4251.25, "total_tokens": 22328744} {"current_steps": 34195, "total_steps": 38160, "loss": 0.462, "lr": 3.2544297669161115e-05, "epoch": 17.921907756813418, "percentage": 89.61, "elapsed_time": "1:27:33", "remaining_time": "0:10:09", "throughput": 4251.36, "total_tokens": 22332936} {"current_steps": 34200, "total_steps": 38160, "loss": 0.6511, "lr": 3.2463190310254633e-05, "epoch": 17.92452830188679, "percentage": 89.62, "elapsed_time": "1:27:33", "remaining_time": "0:10:08", "throughput": 4251.42, "total_tokens": 22336552} {"current_steps": 34205, "total_steps": 38160, "loss": 0.4118, "lr": 3.238218075471483e-05, "epoch": 17.92714884696017, "percentage": 89.64, "elapsed_time": "1:27:34", "remaining_time": "0:10:07", "throughput": 4251.42, "total_tokens": 22339496} {"current_steps": 34210, "total_steps": 38160, "loss": 0.4329, "lr": 3.230126901948788e-05, "epoch": 17.929769392033542, "percentage": 89.65, "elapsed_time": "1:27:35", "remaining_time": "0:10:06", "throughput": 4251.44, "total_tokens": 22342696} {"current_steps": 34215, "total_steps": 38160, "loss": 0.4225, "lr": 3.222045512149968e-05, "epoch": 17.93238993710692, "percentage": 89.66, "elapsed_time": "1:27:36", "remaining_time": "0:10:06", "throughput": 4251.48, "total_tokens": 22346024} {"current_steps": 34220, "total_steps": 38160, "loss": 0.3569, "lr": 3.213973907765566e-05, "epoch": 17.935010482180292, "percentage": 89.68, "elapsed_time": "1:27:36", "remaining_time": "0:10:05", "throughput": 4251.46, "total_tokens": 22348808} {"current_steps": 34225, "total_steps": 38160, "loss": 0.4033, "lr": 3.205912090484048e-05, "epoch": 17.93763102725367, "percentage": 89.69, "elapsed_time": "1:27:37", "remaining_time": "0:10:04", "throughput": 4251.54, "total_tokens": 22352584} {"current_steps": 34230, "total_steps": 38160, "loss": 0.7423, "lr": 3.1978600619918754e-05, "epoch": 17.940251572327043, "percentage": 89.7, "elapsed_time": "1:27:38", "remaining_time": "0:10:03", "throughput": 4251.53, "total_tokens": 22355336} {"current_steps": 34235, "total_steps": 38160, "loss": 0.4311, "lr": 3.189817823973423e-05, "epoch": 17.94287211740042, "percentage": 89.71, "elapsed_time": "1:27:39", "remaining_time": "0:10:02", "throughput": 4251.87, "total_tokens": 22362664} {"current_steps": 34240, "total_steps": 38160, "loss": 0.5155, "lr": 3.18178537811104e-05, "epoch": 17.945492662473793, "percentage": 89.73, "elapsed_time": "1:27:40", "remaining_time": "0:10:02", "throughput": 4251.87, "total_tokens": 22365736} {"current_steps": 34245, "total_steps": 38160, "loss": 0.3555, "lr": 3.1737627260850335e-05, "epoch": 17.94811320754717, "percentage": 89.74, "elapsed_time": "1:27:40", "remaining_time": "0:10:01", "throughput": 4251.88, "total_tokens": 22368744} {"current_steps": 34250, "total_steps": 38160, "loss": 0.7972, "lr": 3.1657498695736364e-05, "epoch": 17.950733752620543, "percentage": 89.75, "elapsed_time": "1:27:41", "remaining_time": "0:10:00", "throughput": 4251.84, "total_tokens": 22371176} {"current_steps": 34255, "total_steps": 38160, "loss": 0.4022, "lr": 3.157746810253054e-05, "epoch": 17.95335429769392, "percentage": 89.77, "elapsed_time": "1:27:42", "remaining_time": "0:09:59", "throughput": 4251.98, "total_tokens": 22375592} {"current_steps": 34260, "total_steps": 38160, "loss": 0.4093, "lr": 3.149753549797446e-05, "epoch": 17.955974842767297, "percentage": 89.78, "elapsed_time": "1:27:43", "remaining_time": "0:09:59", "throughput": 4252.04, "total_tokens": 22379112} {"current_steps": 34265, "total_steps": 38160, "loss": 0.3368, "lr": 3.141770089878887e-05, "epoch": 17.95859538784067, "percentage": 89.79, "elapsed_time": "1:27:43", "remaining_time": "0:09:58", "throughput": 4252.12, "total_tokens": 22382824} {"current_steps": 34270, "total_steps": 38160, "loss": 0.5237, "lr": 3.1337964321674354e-05, "epoch": 17.961215932914047, "percentage": 89.81, "elapsed_time": "1:27:44", "remaining_time": "0:09:57", "throughput": 4252.17, "total_tokens": 22386408} {"current_steps": 34275, "total_steps": 38160, "loss": 0.3316, "lr": 3.125832578331106e-05, "epoch": 17.96383647798742, "percentage": 89.82, "elapsed_time": "1:27:45", "remaining_time": "0:09:56", "throughput": 4252.18, "total_tokens": 22389320} {"current_steps": 34280, "total_steps": 38160, "loss": 0.3448, "lr": 3.117878530035823e-05, "epoch": 17.966457023060798, "percentage": 89.83, "elapsed_time": "1:27:46", "remaining_time": "0:09:56", "throughput": 4252.15, "total_tokens": 22391848} {"current_steps": 34285, "total_steps": 38160, "loss": 0.4584, "lr": 3.1099342889454875e-05, "epoch": 17.96907756813417, "percentage": 89.85, "elapsed_time": "1:27:46", "remaining_time": "0:09:55", "throughput": 4252.2, "total_tokens": 22395304} {"current_steps": 34290, "total_steps": 38160, "loss": 0.4161, "lr": 3.1019998567219597e-05, "epoch": 17.971698113207548, "percentage": 89.86, "elapsed_time": "1:27:47", "remaining_time": "0:09:54", "throughput": 4252.19, "total_tokens": 22397960} {"current_steps": 34295, "total_steps": 38160, "loss": 0.3121, "lr": 3.0940752350250125e-05, "epoch": 17.97431865828092, "percentage": 89.87, "elapsed_time": "1:27:48", "remaining_time": "0:09:53", "throughput": 4252.14, "total_tokens": 22400296} {"current_steps": 34300, "total_steps": 38160, "loss": 0.4023, "lr": 3.0861604255124074e-05, "epoch": 17.9769392033543, "percentage": 89.88, "elapsed_time": "1:27:48", "remaining_time": "0:09:52", "throughput": 4252.15, "total_tokens": 22403432} {"current_steps": 34305, "total_steps": 38160, "loss": 0.5485, "lr": 3.0782554298398045e-05, "epoch": 17.979559748427672, "percentage": 89.9, "elapsed_time": "1:27:49", "remaining_time": "0:09:52", "throughput": 4252.2, "total_tokens": 22406952} {"current_steps": 34310, "total_steps": 38160, "loss": 0.3258, "lr": 3.070360249660859e-05, "epoch": 17.98218029350105, "percentage": 89.91, "elapsed_time": "1:27:50", "remaining_time": "0:09:51", "throughput": 4252.28, "total_tokens": 22410568} {"current_steps": 34315, "total_steps": 38160, "loss": 0.4456, "lr": 3.0624748866271535e-05, "epoch": 17.984800838574422, "percentage": 89.92, "elapsed_time": "1:27:50", "remaining_time": "0:09:50", "throughput": 4252.32, "total_tokens": 22413832} {"current_steps": 34320, "total_steps": 38160, "loss": 0.5389, "lr": 3.0545993423882036e-05, "epoch": 17.9874213836478, "percentage": 89.94, "elapsed_time": "1:27:51", "remaining_time": "0:09:49", "throughput": 4252.39, "total_tokens": 22417576} {"current_steps": 34325, "total_steps": 38160, "loss": 0.5246, "lr": 3.046733618591496e-05, "epoch": 17.990041928721173, "percentage": 89.95, "elapsed_time": "1:27:52", "remaining_time": "0:09:49", "throughput": 4252.39, "total_tokens": 22420456} {"current_steps": 34330, "total_steps": 38160, "loss": 0.3725, "lr": 3.0388777168824434e-05, "epoch": 17.99266247379455, "percentage": 89.96, "elapsed_time": "1:27:53", "remaining_time": "0:09:48", "throughput": 4252.35, "total_tokens": 22423016} {"current_steps": 34335, "total_steps": 38160, "loss": 0.393, "lr": 3.0310316389044022e-05, "epoch": 17.995283018867923, "percentage": 89.98, "elapsed_time": "1:27:53", "remaining_time": "0:09:47", "throughput": 4252.32, "total_tokens": 22425544} {"current_steps": 34340, "total_steps": 38160, "loss": 0.3937, "lr": 3.0231953862986995e-05, "epoch": 17.9979035639413, "percentage": 89.99, "elapsed_time": "1:27:54", "remaining_time": "0:09:46", "throughput": 4252.31, "total_tokens": 22428392} {"current_steps": 34344, "total_steps": 38160, "eval_loss": 0.4931029677391052, "epoch": 18.0, "percentage": 90.0, "elapsed_time": "1:28:08", "remaining_time": "0:09:47", "throughput": 4240.97, "total_tokens": 22429992} {"current_steps": 34345, "total_steps": 38160, "loss": 0.4668, "lr": 3.0153689607045842e-05, "epoch": 18.000524109014677, "percentage": 90.0, "elapsed_time": "1:28:11", "remaining_time": "0:09:47", "throughput": 4239.34, "total_tokens": 22430632} {"current_steps": 34350, "total_steps": 38160, "loss": 0.4538, "lr": 3.0075523637592474e-05, "epoch": 18.00314465408805, "percentage": 90.02, "elapsed_time": "1:28:11", "remaining_time": "0:09:46", "throughput": 4239.36, "total_tokens": 22433864} {"current_steps": 34355, "total_steps": 38160, "loss": 0.4578, "lr": 2.999745597097847e-05, "epoch": 18.005765199161427, "percentage": 90.03, "elapsed_time": "1:28:12", "remaining_time": "0:09:46", "throughput": 4239.39, "total_tokens": 22437128} {"current_steps": 34360, "total_steps": 38160, "loss": 0.4516, "lr": 2.9919486623534497e-05, "epoch": 18.0083857442348, "percentage": 90.04, "elapsed_time": "1:28:13", "remaining_time": "0:09:45", "throughput": 4239.38, "total_tokens": 22439912} {"current_steps": 34365, "total_steps": 38160, "loss": 0.567, "lr": 2.9841615611571005e-05, "epoch": 18.011006289308177, "percentage": 90.06, "elapsed_time": "1:28:13", "remaining_time": "0:09:44", "throughput": 4239.36, "total_tokens": 22442760} {"current_steps": 34370, "total_steps": 38160, "loss": 0.3037, "lr": 2.9763842951377628e-05, "epoch": 18.01362683438155, "percentage": 90.07, "elapsed_time": "1:28:14", "remaining_time": "0:09:43", "throughput": 4239.36, "total_tokens": 22445704} {"current_steps": 34375, "total_steps": 38160, "loss": 0.5975, "lr": 2.968616865922369e-05, "epoch": 18.016247379454928, "percentage": 90.08, "elapsed_time": "1:28:15", "remaining_time": "0:09:43", "throughput": 4239.37, "total_tokens": 22448808} {"current_steps": 34380, "total_steps": 38160, "loss": 0.3181, "lr": 2.960859275135758e-05, "epoch": 18.0188679245283, "percentage": 90.09, "elapsed_time": "1:28:15", "remaining_time": "0:09:42", "throughput": 4239.37, "total_tokens": 22451688} {"current_steps": 34385, "total_steps": 38160, "loss": 0.3975, "lr": 2.9531115244007367e-05, "epoch": 18.021488469601678, "percentage": 90.11, "elapsed_time": "1:28:16", "remaining_time": "0:09:41", "throughput": 4239.37, "total_tokens": 22454472} {"current_steps": 34390, "total_steps": 38160, "loss": 0.5466, "lr": 2.945373615338037e-05, "epoch": 18.02410901467505, "percentage": 90.12, "elapsed_time": "1:28:17", "remaining_time": "0:09:40", "throughput": 4239.36, "total_tokens": 22457224} {"current_steps": 34395, "total_steps": 38160, "loss": 0.358, "lr": 2.9376455495663534e-05, "epoch": 18.02672955974843, "percentage": 90.13, "elapsed_time": "1:28:17", "remaining_time": "0:09:39", "throughput": 4239.33, "total_tokens": 22459784} {"current_steps": 34400, "total_steps": 38160, "loss": 0.3704, "lr": 2.9299273287023144e-05, "epoch": 18.029350104821802, "percentage": 90.15, "elapsed_time": "1:28:18", "remaining_time": "0:09:39", "throughput": 4239.31, "total_tokens": 22462408} {"current_steps": 34405, "total_steps": 38160, "loss": 0.4337, "lr": 2.922218954360473e-05, "epoch": 18.03197064989518, "percentage": 90.16, "elapsed_time": "1:28:19", "remaining_time": "0:09:38", "throughput": 4239.37, "total_tokens": 22466152} {"current_steps": 34410, "total_steps": 38160, "loss": 0.4662, "lr": 2.9145204281533278e-05, "epoch": 18.034591194968552, "percentage": 90.17, "elapsed_time": "1:28:20", "remaining_time": "0:09:37", "throughput": 4239.4, "total_tokens": 22469352} {"current_steps": 34415, "total_steps": 38160, "loss": 0.3545, "lr": 2.9068317516913244e-05, "epoch": 18.03721174004193, "percentage": 90.19, "elapsed_time": "1:28:20", "remaining_time": "0:09:36", "throughput": 4239.42, "total_tokens": 22472488} {"current_steps": 34420, "total_steps": 38160, "loss": 0.4371, "lr": 2.8991529265828542e-05, "epoch": 18.039832285115303, "percentage": 90.2, "elapsed_time": "1:28:21", "remaining_time": "0:09:36", "throughput": 4239.41, "total_tokens": 22475272} {"current_steps": 34425, "total_steps": 38160, "loss": 0.2379, "lr": 2.891483954434243e-05, "epoch": 18.04245283018868, "percentage": 90.21, "elapsed_time": "1:28:22", "remaining_time": "0:09:35", "throughput": 4239.43, "total_tokens": 22478312} {"current_steps": 34430, "total_steps": 38160, "loss": 0.3584, "lr": 2.8838248368497465e-05, "epoch": 18.045073375262053, "percentage": 90.23, "elapsed_time": "1:28:22", "remaining_time": "0:09:34", "throughput": 4239.39, "total_tokens": 22480712} {"current_steps": 34435, "total_steps": 38160, "loss": 0.3827, "lr": 2.8761755754315667e-05, "epoch": 18.04769392033543, "percentage": 90.24, "elapsed_time": "1:28:23", "remaining_time": "0:09:33", "throughput": 4239.5, "total_tokens": 22485064} {"current_steps": 34440, "total_steps": 38160, "loss": 0.392, "lr": 2.8685361717798286e-05, "epoch": 18.050314465408807, "percentage": 90.25, "elapsed_time": "1:28:24", "remaining_time": "0:09:32", "throughput": 4239.51, "total_tokens": 22488040} {"current_steps": 34445, "total_steps": 38160, "loss": 0.3815, "lr": 2.8609066274926265e-05, "epoch": 18.05293501048218, "percentage": 90.26, "elapsed_time": "1:28:25", "remaining_time": "0:09:32", "throughput": 4239.56, "total_tokens": 22491560} {"current_steps": 34450, "total_steps": 38160, "loss": 0.4399, "lr": 2.8532869441659615e-05, "epoch": 18.055555555555557, "percentage": 90.28, "elapsed_time": "1:28:25", "remaining_time": "0:09:31", "throughput": 4239.53, "total_tokens": 22494088} {"current_steps": 34455, "total_steps": 38160, "loss": 0.6348, "lr": 2.8456771233937973e-05, "epoch": 18.05817610062893, "percentage": 90.29, "elapsed_time": "1:28:26", "remaining_time": "0:09:30", "throughput": 4239.61, "total_tokens": 22497864} {"current_steps": 34460, "total_steps": 38160, "loss": 0.39, "lr": 2.838077166768016e-05, "epoch": 18.060796645702307, "percentage": 90.3, "elapsed_time": "1:28:27", "remaining_time": "0:09:29", "throughput": 4239.66, "total_tokens": 22501320} {"current_steps": 34465, "total_steps": 38160, "loss": 0.3042, "lr": 2.8304870758784296e-05, "epoch": 18.06341719077568, "percentage": 90.32, "elapsed_time": "1:28:27", "remaining_time": "0:09:29", "throughput": 4239.62, "total_tokens": 22503816} {"current_steps": 34470, "total_steps": 38160, "loss": 0.5057, "lr": 2.822906852312812e-05, "epoch": 18.066037735849058, "percentage": 90.33, "elapsed_time": "1:28:28", "remaining_time": "0:09:28", "throughput": 4239.69, "total_tokens": 22507432} {"current_steps": 34475, "total_steps": 38160, "loss": 0.3934, "lr": 2.8153364976568563e-05, "epoch": 18.06865828092243, "percentage": 90.34, "elapsed_time": "1:28:30", "remaining_time": "0:09:27", "throughput": 4240.0, "total_tokens": 22514472} {"current_steps": 34480, "total_steps": 38160, "loss": 0.414, "lr": 2.8077760134941955e-05, "epoch": 18.071278825995808, "percentage": 90.36, "elapsed_time": "1:28:30", "remaining_time": "0:09:26", "throughput": 4240.04, "total_tokens": 22517864} {"current_steps": 34485, "total_steps": 38160, "loss": 0.3262, "lr": 2.800225401406392e-05, "epoch": 18.07389937106918, "percentage": 90.37, "elapsed_time": "1:28:31", "remaining_time": "0:09:26", "throughput": 4240.07, "total_tokens": 22521256} {"current_steps": 34490, "total_steps": 38160, "loss": 0.4446, "lr": 2.7926846629729607e-05, "epoch": 18.07651991614256, "percentage": 90.38, "elapsed_time": "1:28:32", "remaining_time": "0:09:25", "throughput": 4240.03, "total_tokens": 22523624} {"current_steps": 34495, "total_steps": 38160, "loss": 0.4398, "lr": 2.7851537997713174e-05, "epoch": 18.079140461215932, "percentage": 90.4, "elapsed_time": "1:28:32", "remaining_time": "0:09:24", "throughput": 4240.06, "total_tokens": 22526984} {"current_steps": 34500, "total_steps": 38160, "loss": 0.4029, "lr": 2.7776328133768458e-05, "epoch": 18.08176100628931, "percentage": 90.41, "elapsed_time": "1:28:33", "remaining_time": "0:09:23", "throughput": 4240.06, "total_tokens": 22529960} {"current_steps": 34505, "total_steps": 38160, "loss": 0.4681, "lr": 2.770121705362849e-05, "epoch": 18.084381551362682, "percentage": 90.42, "elapsed_time": "1:28:34", "remaining_time": "0:09:22", "throughput": 4240.02, "total_tokens": 22532456} {"current_steps": 34510, "total_steps": 38160, "loss": 0.4136, "lr": 2.7626204773005704e-05, "epoch": 18.08700209643606, "percentage": 90.44, "elapsed_time": "1:28:35", "remaining_time": "0:09:22", "throughput": 4240.08, "total_tokens": 22536040} {"current_steps": 34515, "total_steps": 38160, "loss": 0.4426, "lr": 2.7551291307591765e-05, "epoch": 18.089622641509433, "percentage": 90.45, "elapsed_time": "1:28:35", "remaining_time": "0:09:21", "throughput": 4240.09, "total_tokens": 22539144} {"current_steps": 34520, "total_steps": 38160, "loss": 0.5041, "lr": 2.7476476673057636e-05, "epoch": 18.09224318658281, "percentage": 90.46, "elapsed_time": "1:28:36", "remaining_time": "0:09:20", "throughput": 4240.09, "total_tokens": 22541960} {"current_steps": 34525, "total_steps": 38160, "loss": 0.5335, "lr": 2.740176088505375e-05, "epoch": 18.094863731656183, "percentage": 90.47, "elapsed_time": "1:28:37", "remaining_time": "0:09:19", "throughput": 4240.09, "total_tokens": 22544968} {"current_steps": 34530, "total_steps": 38160, "loss": 0.3261, "lr": 2.7327143959209765e-05, "epoch": 18.09748427672956, "percentage": 90.49, "elapsed_time": "1:28:37", "remaining_time": "0:09:19", "throughput": 4240.12, "total_tokens": 22548232} {"current_steps": 34535, "total_steps": 38160, "loss": 0.3872, "lr": 2.725262591113481e-05, "epoch": 18.100104821802937, "percentage": 90.5, "elapsed_time": "1:28:38", "remaining_time": "0:09:18", "throughput": 4240.1, "total_tokens": 22550824} {"current_steps": 34540, "total_steps": 38160, "loss": 0.5089, "lr": 2.7178206756417078e-05, "epoch": 18.10272536687631, "percentage": 90.51, "elapsed_time": "1:28:39", "remaining_time": "0:09:17", "throughput": 4240.1, "total_tokens": 22553736} {"current_steps": 34545, "total_steps": 38160, "loss": 0.4184, "lr": 2.7103886510624344e-05, "epoch": 18.105345911949687, "percentage": 90.53, "elapsed_time": "1:28:39", "remaining_time": "0:09:16", "throughput": 4240.11, "total_tokens": 22556936} {"current_steps": 34550, "total_steps": 38160, "loss": 0.5173, "lr": 2.7029665189303387e-05, "epoch": 18.10796645702306, "percentage": 90.54, "elapsed_time": "1:28:40", "remaining_time": "0:09:15", "throughput": 4240.12, "total_tokens": 22560008} {"current_steps": 34555, "total_steps": 38160, "loss": 0.4967, "lr": 2.6955542807980515e-05, "epoch": 18.110587002096437, "percentage": 90.55, "elapsed_time": "1:28:41", "remaining_time": "0:09:15", "throughput": 4240.12, "total_tokens": 22562824} {"current_steps": 34560, "total_steps": 38160, "loss": 0.3872, "lr": 2.688151938216138e-05, "epoch": 18.11320754716981, "percentage": 90.57, "elapsed_time": "1:28:42", "remaining_time": "0:09:14", "throughput": 4240.22, "total_tokens": 22566856} {"current_steps": 34565, "total_steps": 38160, "loss": 0.3757, "lr": 2.6807594927330703e-05, "epoch": 18.115828092243188, "percentage": 90.58, "elapsed_time": "1:28:43", "remaining_time": "0:09:13", "throughput": 4240.37, "total_tokens": 22571528} {"current_steps": 34570, "total_steps": 38160, "loss": 0.4818, "lr": 2.6733769458952727e-05, "epoch": 18.11844863731656, "percentage": 90.59, "elapsed_time": "1:28:43", "remaining_time": "0:09:12", "throughput": 4240.42, "total_tokens": 22575016} {"current_steps": 34575, "total_steps": 38160, "loss": 0.496, "lr": 2.6660042992470934e-05, "epoch": 18.121069182389938, "percentage": 90.61, "elapsed_time": "1:28:44", "remaining_time": "0:09:12", "throughput": 4240.51, "total_tokens": 22578920} {"current_steps": 34580, "total_steps": 38160, "loss": 0.3479, "lr": 2.658641554330793e-05, "epoch": 18.12368972746331, "percentage": 90.62, "elapsed_time": "1:28:45", "remaining_time": "0:09:11", "throughput": 4240.78, "total_tokens": 22585256} {"current_steps": 34585, "total_steps": 38160, "loss": 0.3437, "lr": 2.6512887126865782e-05, "epoch": 18.12631027253669, "percentage": 90.63, "elapsed_time": "1:28:46", "remaining_time": "0:09:10", "throughput": 4240.82, "total_tokens": 22588648} {"current_steps": 34590, "total_steps": 38160, "loss": 0.4297, "lr": 2.6439457758525908e-05, "epoch": 18.128930817610062, "percentage": 90.64, "elapsed_time": "1:28:47", "remaining_time": "0:09:09", "throughput": 4240.79, "total_tokens": 22591176} {"current_steps": 34595, "total_steps": 38160, "loss": 0.4569, "lr": 2.6366127453648748e-05, "epoch": 18.13155136268344, "percentage": 90.66, "elapsed_time": "1:28:47", "remaining_time": "0:09:09", "throughput": 4240.92, "total_tokens": 22595592} {"current_steps": 34600, "total_steps": 38160, "loss": 0.4127, "lr": 2.6292896227574303e-05, "epoch": 18.134171907756812, "percentage": 90.67, "elapsed_time": "1:28:48", "remaining_time": "0:09:08", "throughput": 4240.87, "total_tokens": 22597928} {"current_steps": 34605, "total_steps": 38160, "loss": 0.639, "lr": 2.6219764095621547e-05, "epoch": 18.13679245283019, "percentage": 90.68, "elapsed_time": "1:28:49", "remaining_time": "0:09:07", "throughput": 4240.88, "total_tokens": 22600840} {"current_steps": 34610, "total_steps": 38160, "loss": 0.3415, "lr": 2.6146731073088958e-05, "epoch": 18.139412997903563, "percentage": 90.7, "elapsed_time": "1:28:49", "remaining_time": "0:09:06", "throughput": 4240.87, "total_tokens": 22603624} {"current_steps": 34615, "total_steps": 38160, "loss": 0.5868, "lr": 2.607379717525432e-05, "epoch": 18.14203354297694, "percentage": 90.71, "elapsed_time": "1:28:50", "remaining_time": "0:09:05", "throughput": 4240.81, "total_tokens": 22605928} {"current_steps": 34620, "total_steps": 38160, "loss": 0.3883, "lr": 2.6000962417374373e-05, "epoch": 18.144654088050313, "percentage": 90.72, "elapsed_time": "1:28:51", "remaining_time": "0:09:05", "throughput": 4240.91, "total_tokens": 22609960} {"current_steps": 34625, "total_steps": 38160, "loss": 0.4606, "lr": 2.5928226814685485e-05, "epoch": 18.14727463312369, "percentage": 90.74, "elapsed_time": "1:28:52", "remaining_time": "0:09:04", "throughput": 4240.99, "total_tokens": 22613672} {"current_steps": 34630, "total_steps": 38160, "loss": 0.5347, "lr": 2.585559038240304e-05, "epoch": 18.149895178197063, "percentage": 90.75, "elapsed_time": "1:28:52", "remaining_time": "0:09:03", "throughput": 4240.99, "total_tokens": 22616552} {"current_steps": 34635, "total_steps": 38160, "loss": 0.4598, "lr": 2.5783053135721714e-05, "epoch": 18.15251572327044, "percentage": 90.76, "elapsed_time": "1:28:53", "remaining_time": "0:09:02", "throughput": 4241.07, "total_tokens": 22620392} {"current_steps": 34640, "total_steps": 38160, "loss": 0.4188, "lr": 2.571061508981565e-05, "epoch": 18.155136268343817, "percentage": 90.78, "elapsed_time": "1:28:54", "remaining_time": "0:09:02", "throughput": 4241.06, "total_tokens": 22623208} {"current_steps": 34645, "total_steps": 38160, "loss": 0.537, "lr": 2.5638276259837778e-05, "epoch": 18.15775681341719, "percentage": 90.79, "elapsed_time": "1:28:55", "remaining_time": "0:09:01", "throughput": 4241.08, "total_tokens": 22626248} {"current_steps": 34650, "total_steps": 38160, "loss": 0.4926, "lr": 2.5566036660920778e-05, "epoch": 18.160377358490567, "percentage": 90.8, "elapsed_time": "1:28:55", "remaining_time": "0:09:00", "throughput": 4241.09, "total_tokens": 22629352} {"current_steps": 34655, "total_steps": 38160, "loss": 0.3422, "lr": 2.5493896308176223e-05, "epoch": 18.16299790356394, "percentage": 90.81, "elapsed_time": "1:28:56", "remaining_time": "0:08:59", "throughput": 4241.14, "total_tokens": 22632712} {"current_steps": 34660, "total_steps": 38160, "loss": 0.5038, "lr": 2.542185521669521e-05, "epoch": 18.165618448637318, "percentage": 90.83, "elapsed_time": "1:28:57", "remaining_time": "0:08:58", "throughput": 4241.24, "total_tokens": 22636648} {"current_steps": 34665, "total_steps": 38160, "loss": 0.4071, "lr": 2.534991340154774e-05, "epoch": 18.16823899371069, "percentage": 90.84, "elapsed_time": "1:28:58", "remaining_time": "0:08:58", "throughput": 4241.56, "total_tokens": 22643752} {"current_steps": 34670, "total_steps": 38160, "loss": 0.4675, "lr": 2.5278070877783332e-05, "epoch": 18.170859538784068, "percentage": 90.85, "elapsed_time": "1:28:59", "remaining_time": "0:08:57", "throughput": 4241.62, "total_tokens": 22647336} {"current_steps": 34675, "total_steps": 38160, "loss": 0.352, "lr": 2.520632766043052e-05, "epoch": 18.17348008385744, "percentage": 90.87, "elapsed_time": "1:28:59", "remaining_time": "0:08:56", "throughput": 4241.6, "total_tokens": 22650024} {"current_steps": 34680, "total_steps": 38160, "loss": 0.403, "lr": 2.513468376449729e-05, "epoch": 18.17610062893082, "percentage": 90.88, "elapsed_time": "1:29:00", "remaining_time": "0:08:55", "throughput": 4241.59, "total_tokens": 22652840} {"current_steps": 34685, "total_steps": 38160, "loss": 0.434, "lr": 2.506313920497061e-05, "epoch": 18.178721174004192, "percentage": 90.89, "elapsed_time": "1:29:01", "remaining_time": "0:08:55", "throughput": 4241.58, "total_tokens": 22655560} {"current_steps": 34690, "total_steps": 38160, "loss": 0.3528, "lr": 2.4991693996816888e-05, "epoch": 18.18134171907757, "percentage": 90.91, "elapsed_time": "1:29:02", "remaining_time": "0:08:54", "throughput": 4241.61, "total_tokens": 22658920} {"current_steps": 34695, "total_steps": 38160, "loss": 0.3299, "lr": 2.4920348154981677e-05, "epoch": 18.183962264150942, "percentage": 90.92, "elapsed_time": "1:29:02", "remaining_time": "0:08:53", "throughput": 4241.62, "total_tokens": 22661960} {"current_steps": 34700, "total_steps": 38160, "loss": 0.3435, "lr": 2.4849101694389477e-05, "epoch": 18.18658280922432, "percentage": 90.93, "elapsed_time": "1:29:03", "remaining_time": "0:08:52", "throughput": 4241.62, "total_tokens": 22664840} {"current_steps": 34705, "total_steps": 38160, "loss": 0.4995, "lr": 2.4777954629944478e-05, "epoch": 18.189203354297693, "percentage": 90.95, "elapsed_time": "1:29:04", "remaining_time": "0:08:52", "throughput": 4241.6, "total_tokens": 22667464} {"current_steps": 34710, "total_steps": 38160, "loss": 0.4764, "lr": 2.4706906976529718e-05, "epoch": 18.19182389937107, "percentage": 90.96, "elapsed_time": "1:29:04", "remaining_time": "0:08:51", "throughput": 4241.67, "total_tokens": 22671176} {"current_steps": 34715, "total_steps": 38160, "loss": 0.3581, "lr": 2.4635958749007648e-05, "epoch": 18.194444444444443, "percentage": 90.97, "elapsed_time": "1:29:05", "remaining_time": "0:08:50", "throughput": 4241.75, "total_tokens": 22674888} {"current_steps": 34720, "total_steps": 38160, "loss": 0.4505, "lr": 2.456510996221978e-05, "epoch": 18.19706498951782, "percentage": 90.99, "elapsed_time": "1:29:06", "remaining_time": "0:08:49", "throughput": 4241.8, "total_tokens": 22678408} {"current_steps": 34725, "total_steps": 38160, "loss": 0.6222, "lr": 2.4494360630986756e-05, "epoch": 18.199685534591197, "percentage": 91.0, "elapsed_time": "1:29:07", "remaining_time": "0:08:48", "throughput": 4241.86, "total_tokens": 22682056} {"current_steps": 34730, "total_steps": 38160, "loss": 0.517, "lr": 2.4423710770108687e-05, "epoch": 18.20230607966457, "percentage": 91.01, "elapsed_time": "1:29:07", "remaining_time": "0:08:48", "throughput": 4241.89, "total_tokens": 22685320} {"current_steps": 34735, "total_steps": 38160, "loss": 0.3386, "lr": 2.435316039436464e-05, "epoch": 18.204926624737947, "percentage": 91.02, "elapsed_time": "1:29:08", "remaining_time": "0:08:47", "throughput": 4241.93, "total_tokens": 22688616} {"current_steps": 34740, "total_steps": 38160, "loss": 0.3327, "lr": 2.428270951851297e-05, "epoch": 18.20754716981132, "percentage": 91.04, "elapsed_time": "1:29:09", "remaining_time": "0:08:46", "throughput": 4241.88, "total_tokens": 22690952} {"current_steps": 34745, "total_steps": 38160, "loss": 0.349, "lr": 2.421235815729128e-05, "epoch": 18.210167714884697, "percentage": 91.05, "elapsed_time": "1:29:10", "remaining_time": "0:08:45", "throughput": 4241.93, "total_tokens": 22694472} {"current_steps": 34750, "total_steps": 38160, "loss": 0.4491, "lr": 2.414210632541619e-05, "epoch": 18.21278825995807, "percentage": 91.06, "elapsed_time": "1:29:10", "remaining_time": "0:08:45", "throughput": 4241.97, "total_tokens": 22697832} {"current_steps": 34755, "total_steps": 38160, "loss": 0.4205, "lr": 2.40719540375835e-05, "epoch": 18.215408805031448, "percentage": 91.08, "elapsed_time": "1:29:11", "remaining_time": "0:08:44", "throughput": 4242.07, "total_tokens": 22701992} {"current_steps": 34760, "total_steps": 38160, "loss": 0.4454, "lr": 2.4001901308468353e-05, "epoch": 18.21802935010482, "percentage": 91.09, "elapsed_time": "1:29:12", "remaining_time": "0:08:43", "throughput": 4242.06, "total_tokens": 22704808} {"current_steps": 34765, "total_steps": 38160, "loss": 0.3735, "lr": 2.3931948152724982e-05, "epoch": 18.220649895178198, "percentage": 91.1, "elapsed_time": "1:29:13", "remaining_time": "0:08:42", "throughput": 4242.09, "total_tokens": 22708008} {"current_steps": 34770, "total_steps": 38160, "loss": 0.3788, "lr": 2.386209458498684e-05, "epoch": 18.22327044025157, "percentage": 91.12, "elapsed_time": "1:29:13", "remaining_time": "0:08:41", "throughput": 4242.14, "total_tokens": 22711496} {"current_steps": 34775, "total_steps": 38160, "loss": 0.3022, "lr": 2.3792340619866458e-05, "epoch": 18.22589098532495, "percentage": 91.13, "elapsed_time": "1:29:14", "remaining_time": "0:08:41", "throughput": 4242.22, "total_tokens": 22715400} {"current_steps": 34780, "total_steps": 38160, "loss": 0.5922, "lr": 2.3722686271955507e-05, "epoch": 18.228511530398322, "percentage": 91.14, "elapsed_time": "1:29:15", "remaining_time": "0:08:40", "throughput": 4242.27, "total_tokens": 22718728} {"current_steps": 34785, "total_steps": 38160, "loss": 0.446, "lr": 2.365313155582488e-05, "epoch": 18.2311320754717, "percentage": 91.16, "elapsed_time": "1:29:16", "remaining_time": "0:08:39", "throughput": 4242.29, "total_tokens": 22721928} {"current_steps": 34790, "total_steps": 38160, "loss": 0.4364, "lr": 2.358367648602472e-05, "epoch": 18.233752620545072, "percentage": 91.17, "elapsed_time": "1:29:16", "remaining_time": "0:08:38", "throughput": 4242.33, "total_tokens": 22725128} {"current_steps": 34795, "total_steps": 38160, "loss": 0.2987, "lr": 2.3514321077084234e-05, "epoch": 18.23637316561845, "percentage": 91.18, "elapsed_time": "1:29:17", "remaining_time": "0:08:38", "throughput": 4242.43, "total_tokens": 22729224} {"current_steps": 34800, "total_steps": 38160, "loss": 0.3802, "lr": 2.3445065343511763e-05, "epoch": 18.238993710691823, "percentage": 91.19, "elapsed_time": "1:29:18", "remaining_time": "0:08:37", "throughput": 4242.41, "total_tokens": 22731880} {"current_steps": 34805, "total_steps": 38160, "loss": 0.3214, "lr": 2.3375909299794717e-05, "epoch": 18.2416142557652, "percentage": 91.21, "elapsed_time": "1:29:18", "remaining_time": "0:08:36", "throughput": 4242.45, "total_tokens": 22735272} {"current_steps": 34810, "total_steps": 38160, "loss": 0.4846, "lr": 2.330685296039986e-05, "epoch": 18.244234800838573, "percentage": 91.22, "elapsed_time": "1:29:19", "remaining_time": "0:08:35", "throughput": 4242.51, "total_tokens": 22738824} {"current_steps": 34815, "total_steps": 38160, "loss": 0.3431, "lr": 2.3237896339772914e-05, "epoch": 18.24685534591195, "percentage": 91.23, "elapsed_time": "1:29:20", "remaining_time": "0:08:35", "throughput": 4242.48, "total_tokens": 22741384} {"current_steps": 34820, "total_steps": 38160, "loss": 0.4638, "lr": 2.3169039452338892e-05, "epoch": 18.249475890985323, "percentage": 91.25, "elapsed_time": "1:29:21", "remaining_time": "0:08:34", "throughput": 4242.53, "total_tokens": 22744840} {"current_steps": 34825, "total_steps": 38160, "loss": 0.5875, "lr": 2.3100282312501886e-05, "epoch": 18.2520964360587, "percentage": 91.26, "elapsed_time": "1:29:22", "remaining_time": "0:08:33", "throughput": 4242.71, "total_tokens": 22750024} {"current_steps": 34830, "total_steps": 38160, "loss": 0.5071, "lr": 2.3031624934645113e-05, "epoch": 18.254716981132077, "percentage": 91.27, "elapsed_time": "1:29:22", "remaining_time": "0:08:32", "throughput": 4242.72, "total_tokens": 22752904} {"current_steps": 34835, "total_steps": 38160, "loss": 0.4209, "lr": 2.296306733313075e-05, "epoch": 18.25733752620545, "percentage": 91.29, "elapsed_time": "1:29:23", "remaining_time": "0:08:31", "throughput": 4242.7, "total_tokens": 22755624} {"current_steps": 34840, "total_steps": 38160, "loss": 0.4538, "lr": 2.289460952230038e-05, "epoch": 18.259958071278827, "percentage": 91.3, "elapsed_time": "1:29:24", "remaining_time": "0:08:31", "throughput": 4242.72, "total_tokens": 22758664} {"current_steps": 34845, "total_steps": 38160, "loss": 0.5177, "lr": 2.2826251516474604e-05, "epoch": 18.2625786163522, "percentage": 91.31, "elapsed_time": "1:29:24", "remaining_time": "0:08:30", "throughput": 4242.69, "total_tokens": 22761288} {"current_steps": 34850, "total_steps": 38160, "loss": 0.4266, "lr": 2.2757993329953152e-05, "epoch": 18.265199161425578, "percentage": 91.33, "elapsed_time": "1:29:25", "remaining_time": "0:08:29", "throughput": 4242.65, "total_tokens": 22763688} {"current_steps": 34855, "total_steps": 38160, "loss": 0.4399, "lr": 2.2689834977014822e-05, "epoch": 18.26781970649895, "percentage": 91.34, "elapsed_time": "1:29:26", "remaining_time": "0:08:28", "throughput": 4242.63, "total_tokens": 22766280} {"current_steps": 34860, "total_steps": 38160, "loss": 0.4827, "lr": 2.2621776471917598e-05, "epoch": 18.270440251572328, "percentage": 91.35, "elapsed_time": "1:29:26", "remaining_time": "0:08:28", "throughput": 4242.68, "total_tokens": 22769800} {"current_steps": 34865, "total_steps": 38160, "loss": 0.4067, "lr": 2.255381782889848e-05, "epoch": 18.2730607966457, "percentage": 91.37, "elapsed_time": "1:29:27", "remaining_time": "0:08:27", "throughput": 4242.72, "total_tokens": 22773128} {"current_steps": 34870, "total_steps": 38160, "loss": 0.4955, "lr": 2.2485959062173654e-05, "epoch": 18.27568134171908, "percentage": 91.38, "elapsed_time": "1:29:28", "remaining_time": "0:08:26", "throughput": 4242.72, "total_tokens": 22776072} {"current_steps": 34875, "total_steps": 38160, "loss": 0.4746, "lr": 2.2418200185938485e-05, "epoch": 18.278301886792452, "percentage": 91.39, "elapsed_time": "1:29:29", "remaining_time": "0:08:25", "throughput": 4242.79, "total_tokens": 22779976} {"current_steps": 34880, "total_steps": 38160, "loss": 0.3495, "lr": 2.235054121436725e-05, "epoch": 18.28092243186583, "percentage": 91.4, "elapsed_time": "1:29:29", "remaining_time": "0:08:24", "throughput": 4242.77, "total_tokens": 22782600} {"current_steps": 34885, "total_steps": 38160, "loss": 0.3807, "lr": 2.2282982161613562e-05, "epoch": 18.283542976939202, "percentage": 91.42, "elapsed_time": "1:29:30", "remaining_time": "0:08:24", "throughput": 4242.75, "total_tokens": 22785224} {"current_steps": 34890, "total_steps": 38160, "loss": 0.3952, "lr": 2.221552304180985e-05, "epoch": 18.28616352201258, "percentage": 91.43, "elapsed_time": "1:29:31", "remaining_time": "0:08:23", "throughput": 4242.75, "total_tokens": 22788168} {"current_steps": 34895, "total_steps": 38160, "loss": 0.591, "lr": 2.2148163869067816e-05, "epoch": 18.288784067085953, "percentage": 91.44, "elapsed_time": "1:29:31", "remaining_time": "0:08:22", "throughput": 4242.78, "total_tokens": 22791464} {"current_steps": 34900, "total_steps": 38160, "loss": 0.5386, "lr": 2.2080904657478305e-05, "epoch": 18.29140461215933, "percentage": 91.46, "elapsed_time": "1:29:32", "remaining_time": "0:08:21", "throughput": 4242.83, "total_tokens": 22794952} {"current_steps": 34905, "total_steps": 38160, "loss": 0.4751, "lr": 2.201374542111123e-05, "epoch": 18.294025157232703, "percentage": 91.47, "elapsed_time": "1:29:33", "remaining_time": "0:08:21", "throughput": 4242.83, "total_tokens": 22797896} {"current_steps": 34910, "total_steps": 38160, "loss": 0.3644, "lr": 2.1946686174015407e-05, "epoch": 18.29664570230608, "percentage": 91.48, "elapsed_time": "1:29:33", "remaining_time": "0:08:20", "throughput": 4242.85, "total_tokens": 22801000} {"current_steps": 34915, "total_steps": 38160, "loss": 0.3936, "lr": 2.1879726930218946e-05, "epoch": 18.299266247379457, "percentage": 91.5, "elapsed_time": "1:29:34", "remaining_time": "0:08:19", "throughput": 4242.92, "total_tokens": 22804712} {"current_steps": 34920, "total_steps": 38160, "loss": 0.4102, "lr": 2.1812867703728866e-05, "epoch": 18.30188679245283, "percentage": 91.51, "elapsed_time": "1:29:35", "remaining_time": "0:08:18", "throughput": 4243.01, "total_tokens": 22808936} {"current_steps": 34925, "total_steps": 38160, "loss": 0.4788, "lr": 2.1746108508531426e-05, "epoch": 18.304507337526207, "percentage": 91.52, "elapsed_time": "1:29:36", "remaining_time": "0:08:17", "throughput": 4242.96, "total_tokens": 22811272} {"current_steps": 34930, "total_steps": 38160, "loss": 0.4336, "lr": 2.1679449358591952e-05, "epoch": 18.30712788259958, "percentage": 91.54, "elapsed_time": "1:29:36", "remaining_time": "0:08:17", "throughput": 4242.97, "total_tokens": 22814280} {"current_steps": 34935, "total_steps": 38160, "loss": 0.3861, "lr": 2.1612890267854624e-05, "epoch": 18.309748427672957, "percentage": 91.55, "elapsed_time": "1:29:37", "remaining_time": "0:08:16", "throughput": 4243.12, "total_tokens": 22818888} {"current_steps": 34940, "total_steps": 38160, "loss": 0.4978, "lr": 2.1546431250242914e-05, "epoch": 18.31236897274633, "percentage": 91.56, "elapsed_time": "1:29:38", "remaining_time": "0:08:15", "throughput": 4243.08, "total_tokens": 22821352} {"current_steps": 34945, "total_steps": 38160, "loss": 0.4562, "lr": 2.1480072319659427e-05, "epoch": 18.314989517819708, "percentage": 91.57, "elapsed_time": "1:29:39", "remaining_time": "0:08:14", "throughput": 4243.18, "total_tokens": 22825448} {"current_steps": 34950, "total_steps": 38160, "loss": 0.3248, "lr": 2.1413813489985447e-05, "epoch": 18.31761006289308, "percentage": 91.59, "elapsed_time": "1:29:40", "remaining_time": "0:08:14", "throughput": 4243.23, "total_tokens": 22828936} {"current_steps": 34955, "total_steps": 38160, "loss": 0.2779, "lr": 2.1347654775081716e-05, "epoch": 18.320230607966458, "percentage": 91.6, "elapsed_time": "1:29:40", "remaining_time": "0:08:13", "throughput": 4243.22, "total_tokens": 22831752} {"current_steps": 34960, "total_steps": 38160, "loss": 0.3797, "lr": 2.1281596188787834e-05, "epoch": 18.32285115303983, "percentage": 91.61, "elapsed_time": "1:29:41", "remaining_time": "0:08:12", "throughput": 4243.22, "total_tokens": 22834760} {"current_steps": 34965, "total_steps": 38160, "loss": 0.5098, "lr": 2.121563774492252e-05, "epoch": 18.32547169811321, "percentage": 91.63, "elapsed_time": "1:29:42", "remaining_time": "0:08:11", "throughput": 4243.17, "total_tokens": 22837064} {"current_steps": 34970, "total_steps": 38160, "loss": 0.4986, "lr": 2.114977945728358e-05, "epoch": 18.328092243186582, "percentage": 91.64, "elapsed_time": "1:29:42", "remaining_time": "0:08:11", "throughput": 4243.2, "total_tokens": 22840232} {"current_steps": 34975, "total_steps": 38160, "loss": 0.4722, "lr": 2.1084021339647707e-05, "epoch": 18.33071278825996, "percentage": 91.65, "elapsed_time": "1:29:43", "remaining_time": "0:08:10", "throughput": 4243.25, "total_tokens": 22843752} {"current_steps": 34980, "total_steps": 38160, "loss": 0.4721, "lr": 2.1018363405770792e-05, "epoch": 18.333333333333332, "percentage": 91.67, "elapsed_time": "1:29:44", "remaining_time": "0:08:09", "throughput": 4243.31, "total_tokens": 22847336} {"current_steps": 34985, "total_steps": 38160, "loss": 0.4346, "lr": 2.095280566938784e-05, "epoch": 18.33595387840671, "percentage": 91.68, "elapsed_time": "1:29:45", "remaining_time": "0:08:08", "throughput": 4243.36, "total_tokens": 22850792} {"current_steps": 34990, "total_steps": 38160, "loss": 0.3535, "lr": 2.0887348144212615e-05, "epoch": 18.338574423480082, "percentage": 91.69, "elapsed_time": "1:29:45", "remaining_time": "0:08:07", "throughput": 4243.36, "total_tokens": 22853768} {"current_steps": 34995, "total_steps": 38160, "loss": 0.5255, "lr": 2.08219908439381e-05, "epoch": 18.34119496855346, "percentage": 91.71, "elapsed_time": "1:29:46", "remaining_time": "0:08:07", "throughput": 4243.48, "total_tokens": 22858024} {"current_steps": 35000, "total_steps": 38160, "loss": 0.5257, "lr": 2.075673378223647e-05, "epoch": 18.343815513626833, "percentage": 91.72, "elapsed_time": "1:29:47", "remaining_time": "0:08:06", "throughput": 4243.53, "total_tokens": 22861416} {"current_steps": 35005, "total_steps": 38160, "loss": 0.45, "lr": 2.069157697275853e-05, "epoch": 18.34643605870021, "percentage": 91.73, "elapsed_time": "1:29:48", "remaining_time": "0:08:05", "throughput": 4243.57, "total_tokens": 22864712} {"current_steps": 35010, "total_steps": 38160, "loss": 0.536, "lr": 2.0626520429134543e-05, "epoch": 18.349056603773583, "percentage": 91.75, "elapsed_time": "1:29:48", "remaining_time": "0:08:04", "throughput": 4243.54, "total_tokens": 22867272} {"current_steps": 35015, "total_steps": 38160, "loss": 0.3924, "lr": 2.0561564164973458e-05, "epoch": 18.35167714884696, "percentage": 91.76, "elapsed_time": "1:29:49", "remaining_time": "0:08:04", "throughput": 4243.49, "total_tokens": 22869640} {"current_steps": 35020, "total_steps": 38160, "loss": 0.3797, "lr": 2.04967081938634e-05, "epoch": 18.354297693920337, "percentage": 91.77, "elapsed_time": "1:29:50", "remaining_time": "0:08:03", "throughput": 4243.63, "total_tokens": 22874152} {"current_steps": 35025, "total_steps": 38160, "loss": 0.3661, "lr": 2.043195252937152e-05, "epoch": 18.35691823899371, "percentage": 91.78, "elapsed_time": "1:29:51", "remaining_time": "0:08:02", "throughput": 4243.68, "total_tokens": 22877736} {"current_steps": 35030, "total_steps": 38160, "loss": 0.5159, "lr": 2.0367297185044043e-05, "epoch": 18.359538784067087, "percentage": 91.8, "elapsed_time": "1:29:51", "remaining_time": "0:08:01", "throughput": 4243.65, "total_tokens": 22880264} {"current_steps": 35035, "total_steps": 38160, "loss": 0.414, "lr": 2.030274217440603e-05, "epoch": 18.36215932914046, "percentage": 91.81, "elapsed_time": "1:29:52", "remaining_time": "0:08:00", "throughput": 4243.76, "total_tokens": 22884520} {"current_steps": 35040, "total_steps": 38160, "loss": 0.4476, "lr": 2.0238287510961628e-05, "epoch": 18.364779874213838, "percentage": 91.82, "elapsed_time": "1:29:53", "remaining_time": "0:08:00", "throughput": 4243.78, "total_tokens": 22887624} {"current_steps": 35045, "total_steps": 38160, "loss": 0.3581, "lr": 2.017393320819405e-05, "epoch": 18.36740041928721, "percentage": 91.84, "elapsed_time": "1:29:54", "remaining_time": "0:07:59", "throughput": 4243.88, "total_tokens": 22891752} {"current_steps": 35050, "total_steps": 38160, "loss": 0.3966, "lr": 2.010967927956553e-05, "epoch": 18.370020964360588, "percentage": 91.85, "elapsed_time": "1:29:54", "remaining_time": "0:07:58", "throughput": 4243.84, "total_tokens": 22894184} {"current_steps": 35055, "total_steps": 38160, "loss": 0.5207, "lr": 2.00455257385172e-05, "epoch": 18.37264150943396, "percentage": 91.86, "elapsed_time": "1:29:55", "remaining_time": "0:07:57", "throughput": 4243.84, "total_tokens": 22896968} {"current_steps": 35060, "total_steps": 38160, "loss": 0.3566, "lr": 1.9981472598469386e-05, "epoch": 18.37526205450734, "percentage": 91.88, "elapsed_time": "1:29:56", "remaining_time": "0:07:57", "throughput": 4243.84, "total_tokens": 22899848} {"current_steps": 35065, "total_steps": 38160, "loss": 0.3934, "lr": 1.9917519872821142e-05, "epoch": 18.377882599580712, "percentage": 91.89, "elapsed_time": "1:29:56", "remaining_time": "0:07:56", "throughput": 4243.79, "total_tokens": 22902312} {"current_steps": 35070, "total_steps": 38160, "loss": 0.4631, "lr": 1.9853667574950605e-05, "epoch": 18.38050314465409, "percentage": 91.9, "elapsed_time": "1:29:57", "remaining_time": "0:07:55", "throughput": 4243.79, "total_tokens": 22905128} {"current_steps": 35075, "total_steps": 38160, "loss": 0.3504, "lr": 1.978991571821498e-05, "epoch": 18.383123689727462, "percentage": 91.92, "elapsed_time": "1:29:58", "remaining_time": "0:07:54", "throughput": 4243.82, "total_tokens": 22908488} {"current_steps": 35080, "total_steps": 38160, "loss": 0.4363, "lr": 1.972626431595048e-05, "epoch": 18.38574423480084, "percentage": 91.93, "elapsed_time": "1:29:58", "remaining_time": "0:07:54", "throughput": 4243.85, "total_tokens": 22911592} {"current_steps": 35085, "total_steps": 38160, "loss": 0.4554, "lr": 1.9662713381472295e-05, "epoch": 18.388364779874212, "percentage": 91.94, "elapsed_time": "1:29:59", "remaining_time": "0:07:53", "throughput": 4243.83, "total_tokens": 22914376} {"current_steps": 35090, "total_steps": 38160, "loss": 0.5246, "lr": 1.959926292807451e-05, "epoch": 18.39098532494759, "percentage": 91.95, "elapsed_time": "1:30:00", "remaining_time": "0:07:52", "throughput": 4243.89, "total_tokens": 22918056} {"current_steps": 35095, "total_steps": 38160, "loss": 0.4918, "lr": 1.9535912969030178e-05, "epoch": 18.393605870020963, "percentage": 91.97, "elapsed_time": "1:30:01", "remaining_time": "0:07:51", "throughput": 4243.98, "total_tokens": 22921992} {"current_steps": 35100, "total_steps": 38160, "loss": 0.3444, "lr": 1.947266351759136e-05, "epoch": 18.39622641509434, "percentage": 91.98, "elapsed_time": "1:30:01", "remaining_time": "0:07:50", "throughput": 4244.08, "total_tokens": 22926024} {"current_steps": 35105, "total_steps": 38160, "loss": 0.334, "lr": 1.940951458698925e-05, "epoch": 18.398846960167713, "percentage": 91.99, "elapsed_time": "1:30:02", "remaining_time": "0:07:50", "throughput": 4244.08, "total_tokens": 22928936} {"current_steps": 35110, "total_steps": 38160, "loss": 0.3597, "lr": 1.9346466190433842e-05, "epoch": 18.40146750524109, "percentage": 92.01, "elapsed_time": "1:30:03", "remaining_time": "0:07:49", "throughput": 4244.1, "total_tokens": 22932168} {"current_steps": 35115, "total_steps": 38160, "loss": 0.4468, "lr": 1.9283518341114136e-05, "epoch": 18.404088050314467, "percentage": 92.02, "elapsed_time": "1:30:03", "remaining_time": "0:07:48", "throughput": 4244.08, "total_tokens": 22934728} {"current_steps": 35120, "total_steps": 38160, "loss": 0.4823, "lr": 1.9220671052198047e-05, "epoch": 18.40670859538784, "percentage": 92.03, "elapsed_time": "1:30:04", "remaining_time": "0:07:47", "throughput": 4244.08, "total_tokens": 22937736} {"current_steps": 35125, "total_steps": 38160, "loss": 0.4711, "lr": 1.9157924336832556e-05, "epoch": 18.409329140461217, "percentage": 92.05, "elapsed_time": "1:30:05", "remaining_time": "0:07:47", "throughput": 4244.13, "total_tokens": 22941256} {"current_steps": 35130, "total_steps": 38160, "loss": 0.3922, "lr": 1.909527820814355e-05, "epoch": 18.41194968553459, "percentage": 92.06, "elapsed_time": "1:30:06", "remaining_time": "0:07:46", "throughput": 4244.1, "total_tokens": 22943784} {"current_steps": 35135, "total_steps": 38160, "loss": 0.4194, "lr": 1.9032732679235886e-05, "epoch": 18.414570230607968, "percentage": 92.07, "elapsed_time": "1:30:06", "remaining_time": "0:07:45", "throughput": 4244.07, "total_tokens": 22946312} {"current_steps": 35140, "total_steps": 38160, "loss": 0.3723, "lr": 1.8970287763193428e-05, "epoch": 18.41719077568134, "percentage": 92.09, "elapsed_time": "1:30:07", "remaining_time": "0:07:44", "throughput": 4244.1, "total_tokens": 22949576} {"current_steps": 35145, "total_steps": 38160, "loss": 0.3545, "lr": 1.8907943473078892e-05, "epoch": 18.419811320754718, "percentage": 92.1, "elapsed_time": "1:30:08", "remaining_time": "0:07:43", "throughput": 4244.12, "total_tokens": 22952712} {"current_steps": 35150, "total_steps": 38160, "loss": 0.4938, "lr": 1.884569982193396e-05, "epoch": 18.42243186582809, "percentage": 92.11, "elapsed_time": "1:30:08", "remaining_time": "0:07:43", "throughput": 4244.1, "total_tokens": 22955400} {"current_steps": 35155, "total_steps": 38160, "loss": 0.5579, "lr": 1.8783556822779267e-05, "epoch": 18.42505241090147, "percentage": 92.13, "elapsed_time": "1:30:09", "remaining_time": "0:07:42", "throughput": 4244.09, "total_tokens": 22958312} {"current_steps": 35160, "total_steps": 38160, "loss": 0.4006, "lr": 1.8721514488614532e-05, "epoch": 18.427672955974842, "percentage": 92.14, "elapsed_time": "1:30:10", "remaining_time": "0:07:41", "throughput": 4244.09, "total_tokens": 22961192} {"current_steps": 35165, "total_steps": 38160, "loss": 0.4003, "lr": 1.8659572832418315e-05, "epoch": 18.43029350104822, "percentage": 92.15, "elapsed_time": "1:30:10", "remaining_time": "0:07:40", "throughput": 4244.09, "total_tokens": 22964040} {"current_steps": 35170, "total_steps": 38160, "loss": 0.4448, "lr": 1.8597731867148026e-05, "epoch": 18.432914046121592, "percentage": 92.16, "elapsed_time": "1:30:11", "remaining_time": "0:07:40", "throughput": 4244.05, "total_tokens": 22966440} {"current_steps": 35175, "total_steps": 38160, "loss": 0.5075, "lr": 1.8535991605740043e-05, "epoch": 18.43553459119497, "percentage": 92.18, "elapsed_time": "1:30:12", "remaining_time": "0:07:39", "throughput": 4244.13, "total_tokens": 22970344} {"current_steps": 35180, "total_steps": 38160, "loss": 0.3346, "lr": 1.8474352061109757e-05, "epoch": 18.438155136268342, "percentage": 92.19, "elapsed_time": "1:30:13", "remaining_time": "0:07:38", "throughput": 4244.18, "total_tokens": 22973896} {"current_steps": 35185, "total_steps": 38160, "loss": 0.3076, "lr": 1.8412813246151515e-05, "epoch": 18.44077568134172, "percentage": 92.2, "elapsed_time": "1:30:13", "remaining_time": "0:07:37", "throughput": 4244.24, "total_tokens": 22977352} {"current_steps": 35190, "total_steps": 38160, "loss": 0.4564, "lr": 1.8351375173738584e-05, "epoch": 18.443396226415093, "percentage": 92.22, "elapsed_time": "1:30:14", "remaining_time": "0:07:36", "throughput": 4244.3, "total_tokens": 22981064} {"current_steps": 35195, "total_steps": 38160, "loss": 0.3342, "lr": 1.829003785672295e-05, "epoch": 18.44601677148847, "percentage": 92.23, "elapsed_time": "1:30:15", "remaining_time": "0:07:36", "throughput": 4244.3, "total_tokens": 22984040} {"current_steps": 35200, "total_steps": 38160, "loss": 0.3396, "lr": 1.8228801307935806e-05, "epoch": 18.448637316561843, "percentage": 92.24, "elapsed_time": "1:30:15", "remaining_time": "0:07:35", "throughput": 4244.31, "total_tokens": 22987080} {"current_steps": 35205, "total_steps": 38160, "loss": 0.4481, "lr": 1.8167665540187063e-05, "epoch": 18.45125786163522, "percentage": 92.26, "elapsed_time": "1:30:16", "remaining_time": "0:07:34", "throughput": 4244.31, "total_tokens": 22989992} {"current_steps": 35210, "total_steps": 38160, "loss": 0.304, "lr": 1.8106630566265604e-05, "epoch": 18.453878406708597, "percentage": 92.27, "elapsed_time": "1:30:17", "remaining_time": "0:07:33", "throughput": 4244.37, "total_tokens": 22993512} {"current_steps": 35215, "total_steps": 38160, "loss": 0.5464, "lr": 1.8045696398939326e-05, "epoch": 18.45649895178197, "percentage": 92.28, "elapsed_time": "1:30:18", "remaining_time": "0:07:33", "throughput": 4244.34, "total_tokens": 22996232} {"current_steps": 35220, "total_steps": 38160, "loss": 0.5528, "lr": 1.7984863050955036e-05, "epoch": 18.459119496855347, "percentage": 92.3, "elapsed_time": "1:30:18", "remaining_time": "0:07:32", "throughput": 4244.32, "total_tokens": 22998856} {"current_steps": 35225, "total_steps": 38160, "loss": 0.5102, "lr": 1.7924130535038162e-05, "epoch": 18.46174004192872, "percentage": 92.31, "elapsed_time": "1:30:19", "remaining_time": "0:07:31", "throughput": 4244.38, "total_tokens": 23002312} {"current_steps": 35230, "total_steps": 38160, "loss": 0.3674, "lr": 1.7863498863893433e-05, "epoch": 18.464360587002098, "percentage": 92.32, "elapsed_time": "1:30:20", "remaining_time": "0:07:30", "throughput": 4244.34, "total_tokens": 23004808} {"current_steps": 35235, "total_steps": 38160, "loss": 0.4322, "lr": 1.7802968050204203e-05, "epoch": 18.46698113207547, "percentage": 92.33, "elapsed_time": "1:30:20", "remaining_time": "0:07:30", "throughput": 4244.39, "total_tokens": 23008328} {"current_steps": 35240, "total_steps": 38160, "loss": 0.5788, "lr": 1.7742538106632844e-05, "epoch": 18.469601677148848, "percentage": 92.35, "elapsed_time": "1:30:21", "remaining_time": "0:07:29", "throughput": 4244.39, "total_tokens": 23011176} {"current_steps": 35245, "total_steps": 38160, "loss": 0.459, "lr": 1.7682209045820684e-05, "epoch": 18.47222222222222, "percentage": 92.36, "elapsed_time": "1:30:22", "remaining_time": "0:07:28", "throughput": 4244.45, "total_tokens": 23014792} {"current_steps": 35250, "total_steps": 38160, "loss": 0.299, "lr": 1.76219808803878e-05, "epoch": 18.4748427672956, "percentage": 92.37, "elapsed_time": "1:30:23", "remaining_time": "0:07:27", "throughput": 4244.44, "total_tokens": 23017640} {"current_steps": 35255, "total_steps": 38160, "loss": 0.3247, "lr": 1.7561853622933278e-05, "epoch": 18.47746331236897, "percentage": 92.39, "elapsed_time": "1:30:23", "remaining_time": "0:07:26", "throughput": 4244.48, "total_tokens": 23021128} {"current_steps": 35260, "total_steps": 38160, "loss": 0.4082, "lr": 1.7501827286035e-05, "epoch": 18.48008385744235, "percentage": 92.4, "elapsed_time": "1:30:24", "remaining_time": "0:07:26", "throughput": 4244.66, "total_tokens": 23026184} {"current_steps": 35265, "total_steps": 38160, "loss": 0.4513, "lr": 1.7441901882249754e-05, "epoch": 18.482704402515722, "percentage": 92.41, "elapsed_time": "1:30:25", "remaining_time": "0:07:25", "throughput": 4244.71, "total_tokens": 23029768} {"current_steps": 35270, "total_steps": 38160, "loss": 0.3845, "lr": 1.7382077424113464e-05, "epoch": 18.4853249475891, "percentage": 92.43, "elapsed_time": "1:30:26", "remaining_time": "0:07:24", "throughput": 4244.76, "total_tokens": 23033096} {"current_steps": 35275, "total_steps": 38160, "loss": 0.2512, "lr": 1.7322353924140498e-05, "epoch": 18.487945492662472, "percentage": 92.44, "elapsed_time": "1:30:26", "remaining_time": "0:07:23", "throughput": 4244.72, "total_tokens": 23035528} {"current_steps": 35280, "total_steps": 38160, "loss": 0.4216, "lr": 1.7262731394824372e-05, "epoch": 18.49056603773585, "percentage": 92.45, "elapsed_time": "1:30:27", "remaining_time": "0:07:23", "throughput": 4244.72, "total_tokens": 23038536} {"current_steps": 35285, "total_steps": 38160, "loss": 0.3562, "lr": 1.7203209848637603e-05, "epoch": 18.493186582809223, "percentage": 92.47, "elapsed_time": "1:30:28", "remaining_time": "0:07:22", "throughput": 4244.74, "total_tokens": 23041672} {"current_steps": 35290, "total_steps": 38160, "loss": 0.41, "lr": 1.7143789298031175e-05, "epoch": 18.4958071278826, "percentage": 92.48, "elapsed_time": "1:30:29", "remaining_time": "0:07:21", "throughput": 4244.86, "total_tokens": 23045928} {"current_steps": 35295, "total_steps": 38160, "loss": 0.4492, "lr": 1.708446975543537e-05, "epoch": 18.498427672955973, "percentage": 92.49, "elapsed_time": "1:30:29", "remaining_time": "0:07:20", "throughput": 4244.91, "total_tokens": 23049448} {"current_steps": 35300, "total_steps": 38160, "loss": 0.4189, "lr": 1.7025251233259098e-05, "epoch": 18.50104821802935, "percentage": 92.51, "elapsed_time": "1:30:30", "remaining_time": "0:07:19", "throughput": 4244.9, "total_tokens": 23052200} {"current_steps": 35305, "total_steps": 38160, "loss": 0.4741, "lr": 1.6966133743890166e-05, "epoch": 18.503668763102727, "percentage": 92.52, "elapsed_time": "1:30:31", "remaining_time": "0:07:19", "throughput": 4244.98, "total_tokens": 23056072} {"current_steps": 35310, "total_steps": 38160, "loss": 0.6121, "lr": 1.690711729969535e-05, "epoch": 18.5062893081761, "percentage": 92.53, "elapsed_time": "1:30:32", "remaining_time": "0:07:18", "throughput": 4245.0, "total_tokens": 23059208} {"current_steps": 35315, "total_steps": 38160, "loss": 0.4435, "lr": 1.684820191302022e-05, "epoch": 18.508909853249477, "percentage": 92.54, "elapsed_time": "1:30:32", "remaining_time": "0:07:17", "throughput": 4244.98, "total_tokens": 23061928} {"current_steps": 35320, "total_steps": 38160, "loss": 0.5125, "lr": 1.6789387596189087e-05, "epoch": 18.51153039832285, "percentage": 92.56, "elapsed_time": "1:30:33", "remaining_time": "0:07:16", "throughput": 4244.99, "total_tokens": 23064904} {"current_steps": 35325, "total_steps": 38160, "loss": 0.3247, "lr": 1.6730674361505382e-05, "epoch": 18.514150943396228, "percentage": 92.57, "elapsed_time": "1:30:34", "remaining_time": "0:07:16", "throughput": 4245.05, "total_tokens": 23068552} {"current_steps": 35330, "total_steps": 38160, "loss": 0.4098, "lr": 1.6672062221251117e-05, "epoch": 18.5167714884696, "percentage": 92.58, "elapsed_time": "1:30:34", "remaining_time": "0:07:15", "throughput": 4245.03, "total_tokens": 23071240} {"current_steps": 35335, "total_steps": 38160, "loss": 0.4825, "lr": 1.6613551187687314e-05, "epoch": 18.519392033542978, "percentage": 92.6, "elapsed_time": "1:30:35", "remaining_time": "0:07:14", "throughput": 4245.11, "total_tokens": 23075016} {"current_steps": 35340, "total_steps": 38160, "loss": 0.3201, "lr": 1.6555141273053907e-05, "epoch": 18.52201257861635, "percentage": 92.61, "elapsed_time": "1:30:36", "remaining_time": "0:07:13", "throughput": 4245.13, "total_tokens": 23078152} {"current_steps": 35345, "total_steps": 38160, "loss": 0.432, "lr": 1.6496832489569457e-05, "epoch": 18.52463312368973, "percentage": 92.62, "elapsed_time": "1:30:37", "remaining_time": "0:07:13", "throughput": 4245.14, "total_tokens": 23081128} {"current_steps": 35350, "total_steps": 38160, "loss": 0.3665, "lr": 1.643862484943165e-05, "epoch": 18.5272536687631, "percentage": 92.64, "elapsed_time": "1:30:37", "remaining_time": "0:07:12", "throughput": 4245.18, "total_tokens": 23084488} {"current_steps": 35355, "total_steps": 38160, "loss": 0.4169, "lr": 1.6380518364816687e-05, "epoch": 18.52987421383648, "percentage": 92.65, "elapsed_time": "1:30:38", "remaining_time": "0:07:11", "throughput": 4245.15, "total_tokens": 23087144} {"current_steps": 35360, "total_steps": 38160, "loss": 0.3585, "lr": 1.632251304787985e-05, "epoch": 18.532494758909852, "percentage": 92.66, "elapsed_time": "1:30:39", "remaining_time": "0:07:10", "throughput": 4245.16, "total_tokens": 23090152} {"current_steps": 35365, "total_steps": 38160, "loss": 0.4719, "lr": 1.6264608910755153e-05, "epoch": 18.53511530398323, "percentage": 92.68, "elapsed_time": "1:30:39", "remaining_time": "0:07:09", "throughput": 4245.23, "total_tokens": 23093992} {"current_steps": 35370, "total_steps": 38160, "loss": 0.3441, "lr": 1.6206805965555627e-05, "epoch": 18.537735849056602, "percentage": 92.69, "elapsed_time": "1:30:40", "remaining_time": "0:07:09", "throughput": 4245.22, "total_tokens": 23096808} {"current_steps": 35375, "total_steps": 38160, "loss": 0.3792, "lr": 1.614910422437288e-05, "epoch": 18.54035639412998, "percentage": 92.7, "elapsed_time": "1:30:41", "remaining_time": "0:07:08", "throughput": 4245.17, "total_tokens": 23099144} {"current_steps": 35380, "total_steps": 38160, "loss": 0.2904, "lr": 1.6091503699277477e-05, "epoch": 18.542976939203353, "percentage": 92.71, "elapsed_time": "1:30:42", "remaining_time": "0:07:07", "throughput": 4245.21, "total_tokens": 23102440} {"current_steps": 35385, "total_steps": 38160, "loss": 0.429, "lr": 1.6034004402318726e-05, "epoch": 18.54559748427673, "percentage": 92.73, "elapsed_time": "1:30:42", "remaining_time": "0:07:06", "throughput": 4245.3, "total_tokens": 23106376} {"current_steps": 35390, "total_steps": 38160, "loss": 0.4631, "lr": 1.5976606345524836e-05, "epoch": 18.548218029350103, "percentage": 92.74, "elapsed_time": "1:30:43", "remaining_time": "0:07:06", "throughput": 4245.31, "total_tokens": 23109448} {"current_steps": 35395, "total_steps": 38160, "loss": 0.4018, "lr": 1.5919309540902927e-05, "epoch": 18.55083857442348, "percentage": 92.75, "elapsed_time": "1:30:44", "remaining_time": "0:07:05", "throughput": 4245.37, "total_tokens": 23113160} {"current_steps": 35400, "total_steps": 38160, "loss": 0.4059, "lr": 1.5862114000438797e-05, "epoch": 18.553459119496857, "percentage": 92.77, "elapsed_time": "1:30:45", "remaining_time": "0:07:04", "throughput": 4245.38, "total_tokens": 23116136} {"current_steps": 35405, "total_steps": 38160, "loss": 0.4015, "lr": 1.5805019736097104e-05, "epoch": 18.55607966457023, "percentage": 92.78, "elapsed_time": "1:30:45", "remaining_time": "0:07:03", "throughput": 4245.4, "total_tokens": 23119112} {"current_steps": 35410, "total_steps": 38160, "loss": 0.3732, "lr": 1.5748026759821232e-05, "epoch": 18.558700209643607, "percentage": 92.79, "elapsed_time": "1:30:46", "remaining_time": "0:07:02", "throughput": 4245.38, "total_tokens": 23121704} {"current_steps": 35415, "total_steps": 38160, "loss": 0.3488, "lr": 1.5691135083533537e-05, "epoch": 18.56132075471698, "percentage": 92.81, "elapsed_time": "1:30:47", "remaining_time": "0:07:02", "throughput": 4245.43, "total_tokens": 23125256} {"current_steps": 35420, "total_steps": 38160, "loss": 0.4962, "lr": 1.5634344719135052e-05, "epoch": 18.563941299790358, "percentage": 92.82, "elapsed_time": "1:30:47", "remaining_time": "0:07:01", "throughput": 4245.46, "total_tokens": 23128360} {"current_steps": 35425, "total_steps": 38160, "loss": 0.3522, "lr": 1.5577655678505776e-05, "epoch": 18.56656184486373, "percentage": 92.83, "elapsed_time": "1:30:48", "remaining_time": "0:07:00", "throughput": 4245.57, "total_tokens": 23132648} {"current_steps": 35430, "total_steps": 38160, "loss": 0.3089, "lr": 1.5521067973504442e-05, "epoch": 18.569182389937108, "percentage": 92.85, "elapsed_time": "1:30:49", "remaining_time": "0:06:59", "throughput": 4245.53, "total_tokens": 23135112} {"current_steps": 35435, "total_steps": 38160, "loss": 0.3726, "lr": 1.546458161596831e-05, "epoch": 18.57180293501048, "percentage": 92.86, "elapsed_time": "1:30:49", "remaining_time": "0:06:59", "throughput": 4245.53, "total_tokens": 23138088} {"current_steps": 35440, "total_steps": 38160, "loss": 0.592, "lr": 1.5408196617713866e-05, "epoch": 18.57442348008386, "percentage": 92.87, "elapsed_time": "1:30:50", "remaining_time": "0:06:58", "throughput": 4245.5, "total_tokens": 23140616} {"current_steps": 35445, "total_steps": 38160, "loss": 0.4618, "lr": 1.5351912990536175e-05, "epoch": 18.57704402515723, "percentage": 92.89, "elapsed_time": "1:30:51", "remaining_time": "0:06:57", "throughput": 4245.5, "total_tokens": 23143624} {"current_steps": 35450, "total_steps": 38160, "loss": 0.5514, "lr": 1.5295730746209103e-05, "epoch": 18.57966457023061, "percentage": 92.9, "elapsed_time": "1:30:52", "remaining_time": "0:06:56", "throughput": 4245.51, "total_tokens": 23146568} {"current_steps": 35455, "total_steps": 38160, "loss": 0.4835, "lr": 1.5239649896485463e-05, "epoch": 18.582285115303982, "percentage": 92.91, "elapsed_time": "1:30:52", "remaining_time": "0:06:56", "throughput": 4245.5, "total_tokens": 23149352} {"current_steps": 35460, "total_steps": 38160, "loss": 0.4817, "lr": 1.5183670453096598e-05, "epoch": 18.58490566037736, "percentage": 92.92, "elapsed_time": "1:30:53", "remaining_time": "0:06:55", "throughput": 4245.46, "total_tokens": 23151944} {"current_steps": 35465, "total_steps": 38160, "loss": 0.4136, "lr": 1.5127792427752696e-05, "epoch": 18.587526205450732, "percentage": 92.94, "elapsed_time": "1:30:54", "remaining_time": "0:06:54", "throughput": 4245.53, "total_tokens": 23155496} {"current_steps": 35470, "total_steps": 38160, "loss": 0.4193, "lr": 1.507201583214296e-05, "epoch": 18.59014675052411, "percentage": 92.95, "elapsed_time": "1:30:54", "remaining_time": "0:06:53", "throughput": 4245.53, "total_tokens": 23158440} {"current_steps": 35475, "total_steps": 38160, "loss": 0.3198, "lr": 1.5016340677935169e-05, "epoch": 18.592767295597483, "percentage": 92.96, "elapsed_time": "1:30:55", "remaining_time": "0:06:52", "throughput": 4245.6, "total_tokens": 23162120} {"current_steps": 35480, "total_steps": 38160, "loss": 0.5483, "lr": 1.4960766976775953e-05, "epoch": 18.59538784067086, "percentage": 92.98, "elapsed_time": "1:30:56", "remaining_time": "0:06:52", "throughput": 4245.6, "total_tokens": 23165128} {"current_steps": 35485, "total_steps": 38160, "loss": 0.4179, "lr": 1.4905294740290677e-05, "epoch": 18.598008385744233, "percentage": 92.99, "elapsed_time": "1:30:57", "remaining_time": "0:06:51", "throughput": 4245.64, "total_tokens": 23168456} {"current_steps": 35490, "total_steps": 38160, "loss": 0.3768, "lr": 1.4849923980083391e-05, "epoch": 18.60062893081761, "percentage": 93.0, "elapsed_time": "1:30:57", "remaining_time": "0:06:50", "throughput": 4245.74, "total_tokens": 23172520} {"current_steps": 35495, "total_steps": 38160, "loss": 0.4581, "lr": 1.4794654707737164e-05, "epoch": 18.603249475890987, "percentage": 93.02, "elapsed_time": "1:30:58", "remaining_time": "0:06:49", "throughput": 4245.78, "total_tokens": 23175816} {"current_steps": 35500, "total_steps": 38160, "loss": 0.4163, "lr": 1.4739486934813696e-05, "epoch": 18.60587002096436, "percentage": 93.03, "elapsed_time": "1:30:59", "remaining_time": "0:06:49", "throughput": 4245.81, "total_tokens": 23179048} {"current_steps": 35505, "total_steps": 38160, "loss": 0.3457, "lr": 1.468442067285336e-05, "epoch": 18.608490566037737, "percentage": 93.04, "elapsed_time": "1:30:59", "remaining_time": "0:06:48", "throughput": 4245.83, "total_tokens": 23182248} {"current_steps": 35510, "total_steps": 38160, "loss": 0.3437, "lr": 1.4629455933375501e-05, "epoch": 18.61111111111111, "percentage": 93.06, "elapsed_time": "1:31:00", "remaining_time": "0:06:47", "throughput": 4245.84, "total_tokens": 23185224} {"current_steps": 35515, "total_steps": 38160, "loss": 0.5319, "lr": 1.4574592727878089e-05, "epoch": 18.613731656184488, "percentage": 93.07, "elapsed_time": "1:31:01", "remaining_time": "0:06:46", "throughput": 4245.88, "total_tokens": 23188552} {"current_steps": 35520, "total_steps": 38160, "loss": 0.4253, "lr": 1.4519831067837774e-05, "epoch": 18.61635220125786, "percentage": 93.08, "elapsed_time": "1:31:02", "remaining_time": "0:06:45", "throughput": 4245.96, "total_tokens": 23192392} {"current_steps": 35525, "total_steps": 38160, "loss": 0.4223, "lr": 1.4465170964710172e-05, "epoch": 18.618972746331238, "percentage": 93.09, "elapsed_time": "1:31:02", "remaining_time": "0:06:45", "throughput": 4245.99, "total_tokens": 23195656} {"current_steps": 35530, "total_steps": 38160, "loss": 0.3607, "lr": 1.441061242992947e-05, "epoch": 18.62159329140461, "percentage": 93.11, "elapsed_time": "1:31:03", "remaining_time": "0:06:44", "throughput": 4245.99, "total_tokens": 23198568} {"current_steps": 35535, "total_steps": 38160, "loss": 0.4092, "lr": 1.4356155474908871e-05, "epoch": 18.62421383647799, "percentage": 93.12, "elapsed_time": "1:31:04", "remaining_time": "0:06:43", "throughput": 4246.01, "total_tokens": 23201768} {"current_steps": 35540, "total_steps": 38160, "loss": 0.3823, "lr": 1.4301800111039986e-05, "epoch": 18.62683438155136, "percentage": 93.13, "elapsed_time": "1:31:05", "remaining_time": "0:06:42", "throughput": 4246.05, "total_tokens": 23205064} {"current_steps": 35545, "total_steps": 38160, "loss": 0.4904, "lr": 1.4247546349693386e-05, "epoch": 18.62945492662474, "percentage": 93.15, "elapsed_time": "1:31:05", "remaining_time": "0:06:42", "throughput": 4246.18, "total_tokens": 23209512} {"current_steps": 35550, "total_steps": 38160, "loss": 0.4002, "lr": 1.4193394202218268e-05, "epoch": 18.632075471698112, "percentage": 93.16, "elapsed_time": "1:31:06", "remaining_time": "0:06:41", "throughput": 4246.27, "total_tokens": 23213544} {"current_steps": 35555, "total_steps": 38160, "loss": 0.3434, "lr": 1.413934367994274e-05, "epoch": 18.63469601677149, "percentage": 93.17, "elapsed_time": "1:31:07", "remaining_time": "0:06:40", "throughput": 4246.31, "total_tokens": 23216904} {"current_steps": 35560, "total_steps": 38160, "loss": 0.4534, "lr": 1.408539479417359e-05, "epoch": 18.637316561844862, "percentage": 93.19, "elapsed_time": "1:31:08", "remaining_time": "0:06:39", "throughput": 4246.3, "total_tokens": 23219624} {"current_steps": 35565, "total_steps": 38160, "loss": 0.4274, "lr": 1.4031547556196178e-05, "epoch": 18.63993710691824, "percentage": 93.2, "elapsed_time": "1:31:08", "remaining_time": "0:06:39", "throughput": 4246.31, "total_tokens": 23222568} {"current_steps": 35570, "total_steps": 38160, "loss": 0.3822, "lr": 1.3977801977274828e-05, "epoch": 18.642557651991613, "percentage": 93.21, "elapsed_time": "1:31:09", "remaining_time": "0:06:38", "throughput": 4246.41, "total_tokens": 23226600} {"current_steps": 35575, "total_steps": 38160, "loss": 0.5309, "lr": 1.3924158068652437e-05, "epoch": 18.64517819706499, "percentage": 93.23, "elapsed_time": "1:31:10", "remaining_time": "0:06:37", "throughput": 4246.47, "total_tokens": 23230216} {"current_steps": 35580, "total_steps": 38160, "loss": 0.4685, "lr": 1.3870615841550693e-05, "epoch": 18.647798742138363, "percentage": 93.24, "elapsed_time": "1:31:11", "remaining_time": "0:06:36", "throughput": 4246.46, "total_tokens": 23232968} {"current_steps": 35585, "total_steps": 38160, "loss": 0.4021, "lr": 1.3817175307170138e-05, "epoch": 18.65041928721174, "percentage": 93.25, "elapsed_time": "1:31:11", "remaining_time": "0:06:35", "throughput": 4246.5, "total_tokens": 23236264} {"current_steps": 35590, "total_steps": 38160, "loss": 0.3239, "lr": 1.3763836476689828e-05, "epoch": 18.653039832285117, "percentage": 93.27, "elapsed_time": "1:31:12", "remaining_time": "0:06:35", "throughput": 4246.69, "total_tokens": 23241896} {"current_steps": 35595, "total_steps": 38160, "loss": 0.3905, "lr": 1.3710599361267617e-05, "epoch": 18.65566037735849, "percentage": 93.28, "elapsed_time": "1:31:13", "remaining_time": "0:06:34", "throughput": 4246.68, "total_tokens": 23244616} {"current_steps": 35600, "total_steps": 38160, "loss": 0.4046, "lr": 1.3657463972040207e-05, "epoch": 18.658280922431867, "percentage": 93.29, "elapsed_time": "1:31:14", "remaining_time": "0:06:33", "throughput": 4246.76, "total_tokens": 23248520} {"current_steps": 35605, "total_steps": 38160, "loss": 0.4484, "lr": 1.3604430320122762e-05, "epoch": 18.66090146750524, "percentage": 93.3, "elapsed_time": "1:31:15", "remaining_time": "0:06:32", "throughput": 4246.78, "total_tokens": 23251720} {"current_steps": 35610, "total_steps": 38160, "loss": 0.3427, "lr": 1.355149841660941e-05, "epoch": 18.663522012578618, "percentage": 93.32, "elapsed_time": "1:31:15", "remaining_time": "0:06:32", "throughput": 4246.8, "total_tokens": 23254760} {"current_steps": 35615, "total_steps": 38160, "loss": 0.4308, "lr": 1.3498668272572955e-05, "epoch": 18.66614255765199, "percentage": 93.33, "elapsed_time": "1:31:16", "remaining_time": "0:06:31", "throughput": 4246.83, "total_tokens": 23258056} {"current_steps": 35620, "total_steps": 38160, "loss": 0.3914, "lr": 1.3445939899064729e-05, "epoch": 18.668763102725368, "percentage": 93.34, "elapsed_time": "1:31:17", "remaining_time": "0:06:30", "throughput": 4246.81, "total_tokens": 23260776} {"current_steps": 35625, "total_steps": 38160, "loss": 0.4443, "lr": 1.3393313307115019e-05, "epoch": 18.67138364779874, "percentage": 93.36, "elapsed_time": "1:31:17", "remaining_time": "0:06:29", "throughput": 4246.85, "total_tokens": 23263976} {"current_steps": 35630, "total_steps": 38160, "loss": 0.4227, "lr": 1.3340788507732626e-05, "epoch": 18.67400419287212, "percentage": 93.37, "elapsed_time": "1:31:18", "remaining_time": "0:06:29", "throughput": 4246.89, "total_tokens": 23267400} {"current_steps": 35635, "total_steps": 38160, "loss": 0.3783, "lr": 1.328836551190521e-05, "epoch": 18.67662473794549, "percentage": 93.38, "elapsed_time": "1:31:19", "remaining_time": "0:06:28", "throughput": 4246.97, "total_tokens": 23271240} {"current_steps": 35640, "total_steps": 38160, "loss": 0.3679, "lr": 1.323604433059905e-05, "epoch": 18.67924528301887, "percentage": 93.4, "elapsed_time": "1:31:20", "remaining_time": "0:06:27", "throughput": 4246.98, "total_tokens": 23274248} {"current_steps": 35645, "total_steps": 38160, "loss": 0.5202, "lr": 1.3183824974759063e-05, "epoch": 18.681865828092242, "percentage": 93.41, "elapsed_time": "1:31:20", "remaining_time": "0:06:26", "throughput": 4247.07, "total_tokens": 23278152} {"current_steps": 35650, "total_steps": 38160, "loss": 0.5904, "lr": 1.3131707455309006e-05, "epoch": 18.68448637316562, "percentage": 93.42, "elapsed_time": "1:31:21", "remaining_time": "0:06:25", "throughput": 4247.12, "total_tokens": 23281640} {"current_steps": 35655, "total_steps": 38160, "loss": 0.492, "lr": 1.307969178315127e-05, "epoch": 18.687106918238992, "percentage": 93.44, "elapsed_time": "1:31:22", "remaining_time": "0:06:25", "throughput": 4247.14, "total_tokens": 23284680} {"current_steps": 35660, "total_steps": 38160, "loss": 0.4403, "lr": 1.3027777969166932e-05, "epoch": 18.68972746331237, "percentage": 93.45, "elapsed_time": "1:31:23", "remaining_time": "0:06:24", "throughput": 4247.14, "total_tokens": 23287496} {"current_steps": 35665, "total_steps": 38160, "loss": 0.3745, "lr": 1.2975966024215746e-05, "epoch": 18.692348008385743, "percentage": 93.46, "elapsed_time": "1:31:23", "remaining_time": "0:06:23", "throughput": 4247.12, "total_tokens": 23290248} {"current_steps": 35670, "total_steps": 38160, "loss": 0.5048, "lr": 1.2924255959136267e-05, "epoch": 18.69496855345912, "percentage": 93.47, "elapsed_time": "1:31:24", "remaining_time": "0:06:22", "throughput": 4247.23, "total_tokens": 23294440} {"current_steps": 35675, "total_steps": 38160, "loss": 0.4634, "lr": 1.2872647784745561e-05, "epoch": 18.697589098532493, "percentage": 93.49, "elapsed_time": "1:31:25", "remaining_time": "0:06:22", "throughput": 4247.34, "total_tokens": 23298536} {"current_steps": 35680, "total_steps": 38160, "loss": 0.5258, "lr": 1.282114151183944e-05, "epoch": 18.70020964360587, "percentage": 93.5, "elapsed_time": "1:31:26", "remaining_time": "0:06:21", "throughput": 4247.32, "total_tokens": 23301224} {"current_steps": 35685, "total_steps": 38160, "loss": 0.5909, "lr": 1.2769737151192562e-05, "epoch": 18.702830188679247, "percentage": 93.51, "elapsed_time": "1:31:26", "remaining_time": "0:06:20", "throughput": 4247.42, "total_tokens": 23305384} {"current_steps": 35690, "total_steps": 38160, "loss": 0.423, "lr": 1.2718434713558047e-05, "epoch": 18.70545073375262, "percentage": 93.53, "elapsed_time": "1:31:27", "remaining_time": "0:06:19", "throughput": 4247.43, "total_tokens": 23308488} {"current_steps": 35695, "total_steps": 38160, "loss": 0.6777, "lr": 1.2667234209667755e-05, "epoch": 18.708071278825997, "percentage": 93.54, "elapsed_time": "1:31:28", "remaining_time": "0:06:19", "throughput": 4247.45, "total_tokens": 23311528} {"current_steps": 35700, "total_steps": 38160, "loss": 0.399, "lr": 1.2616135650232286e-05, "epoch": 18.71069182389937, "percentage": 93.55, "elapsed_time": "1:31:29", "remaining_time": "0:06:18", "throughput": 4247.47, "total_tokens": 23314568} {"current_steps": 35705, "total_steps": 38160, "loss": 0.4205, "lr": 1.2565139045940866e-05, "epoch": 18.713312368972748, "percentage": 93.57, "elapsed_time": "1:31:29", "remaining_time": "0:06:17", "throughput": 4247.45, "total_tokens": 23317288} {"current_steps": 35710, "total_steps": 38160, "loss": 0.2819, "lr": 1.2514244407461462e-05, "epoch": 18.71593291404612, "percentage": 93.58, "elapsed_time": "1:31:30", "remaining_time": "0:06:16", "throughput": 4247.46, "total_tokens": 23320200} {"current_steps": 35715, "total_steps": 38160, "loss": 0.4534, "lr": 1.2463451745440501e-05, "epoch": 18.718553459119498, "percentage": 93.59, "elapsed_time": "1:31:31", "remaining_time": "0:06:15", "throughput": 4247.51, "total_tokens": 23323816} {"current_steps": 35720, "total_steps": 38160, "loss": 0.4856, "lr": 1.241276107050343e-05, "epoch": 18.72117400419287, "percentage": 93.61, "elapsed_time": "1:31:31", "remaining_time": "0:06:15", "throughput": 4247.56, "total_tokens": 23327432} {"current_steps": 35725, "total_steps": 38160, "loss": 0.397, "lr": 1.236217239325399e-05, "epoch": 18.72379454926625, "percentage": 93.62, "elapsed_time": "1:31:32", "remaining_time": "0:06:14", "throughput": 4247.56, "total_tokens": 23330408} {"current_steps": 35730, "total_steps": 38160, "loss": 0.3104, "lr": 1.2311685724274768e-05, "epoch": 18.72641509433962, "percentage": 93.63, "elapsed_time": "1:31:33", "remaining_time": "0:06:13", "throughput": 4247.55, "total_tokens": 23333224} {"current_steps": 35735, "total_steps": 38160, "loss": 0.4232, "lr": 1.2261301074127096e-05, "epoch": 18.729035639413, "percentage": 93.65, "elapsed_time": "1:31:34", "remaining_time": "0:06:12", "throughput": 4247.72, "total_tokens": 23338248} {"current_steps": 35740, "total_steps": 38160, "loss": 0.4247, "lr": 1.2211018453350874e-05, "epoch": 18.731656184486372, "percentage": 93.66, "elapsed_time": "1:31:34", "remaining_time": "0:06:12", "throughput": 4247.68, "total_tokens": 23340648} {"current_steps": 35745, "total_steps": 38160, "loss": 0.406, "lr": 1.2160837872464581e-05, "epoch": 18.73427672955975, "percentage": 93.67, "elapsed_time": "1:31:35", "remaining_time": "0:06:11", "throughput": 4247.72, "total_tokens": 23344072} {"current_steps": 35750, "total_steps": 38160, "loss": 0.3814, "lr": 1.2110759341965428e-05, "epoch": 18.736897274633122, "percentage": 93.68, "elapsed_time": "1:31:36", "remaining_time": "0:06:10", "throughput": 4247.7, "total_tokens": 23346760} {"current_steps": 35755, "total_steps": 38160, "loss": 0.4434, "lr": 1.2060782872329256e-05, "epoch": 18.7395178197065, "percentage": 93.7, "elapsed_time": "1:31:37", "remaining_time": "0:06:09", "throughput": 4247.71, "total_tokens": 23349768} {"current_steps": 35760, "total_steps": 38160, "loss": 0.4331, "lr": 1.2010908474010595e-05, "epoch": 18.742138364779873, "percentage": 93.71, "elapsed_time": "1:31:37", "remaining_time": "0:06:08", "throughput": 4247.8, "total_tokens": 23353608} {"current_steps": 35765, "total_steps": 38160, "loss": 0.3847, "lr": 1.1961136157442654e-05, "epoch": 18.74475890985325, "percentage": 93.72, "elapsed_time": "1:31:38", "remaining_time": "0:06:08", "throughput": 4247.82, "total_tokens": 23356776} {"current_steps": 35770, "total_steps": 38160, "loss": 0.3723, "lr": 1.1911465933037214e-05, "epoch": 18.747379454926623, "percentage": 93.74, "elapsed_time": "1:31:39", "remaining_time": "0:06:07", "throughput": 4247.9, "total_tokens": 23360552} {"current_steps": 35775, "total_steps": 38160, "loss": 0.4912, "lr": 1.1861897811184686e-05, "epoch": 18.75, "percentage": 93.75, "elapsed_time": "1:31:40", "remaining_time": "0:06:06", "throughput": 4247.97, "total_tokens": 23364264} {"current_steps": 35780, "total_steps": 38160, "loss": 0.4425, "lr": 1.1812431802254109e-05, "epoch": 18.752620545073377, "percentage": 93.76, "elapsed_time": "1:31:40", "remaining_time": "0:06:05", "throughput": 4247.98, "total_tokens": 23367176} {"current_steps": 35785, "total_steps": 38160, "loss": 0.362, "lr": 1.1763067916593262e-05, "epoch": 18.75524109014675, "percentage": 93.78, "elapsed_time": "1:31:41", "remaining_time": "0:06:05", "throughput": 4248.09, "total_tokens": 23371464} {"current_steps": 35790, "total_steps": 38160, "loss": 0.404, "lr": 1.1713806164528496e-05, "epoch": 18.757861635220127, "percentage": 93.79, "elapsed_time": "1:31:42", "remaining_time": "0:06:04", "throughput": 4248.1, "total_tokens": 23374504} {"current_steps": 35795, "total_steps": 38160, "loss": 0.4072, "lr": 1.1664646556364844e-05, "epoch": 18.7604821802935, "percentage": 93.8, "elapsed_time": "1:31:43", "remaining_time": "0:06:03", "throughput": 4248.09, "total_tokens": 23377352} {"current_steps": 35800, "total_steps": 38160, "loss": 0.4208, "lr": 1.161558910238597e-05, "epoch": 18.763102725366878, "percentage": 93.82, "elapsed_time": "1:31:43", "remaining_time": "0:06:02", "throughput": 4248.18, "total_tokens": 23381288} {"current_steps": 35805, "total_steps": 38160, "loss": 0.453, "lr": 1.1566633812854e-05, "epoch": 18.76572327044025, "percentage": 93.83, "elapsed_time": "1:31:44", "remaining_time": "0:06:02", "throughput": 4248.21, "total_tokens": 23384456} {"current_steps": 35810, "total_steps": 38160, "loss": 0.4775, "lr": 1.151778069800985e-05, "epoch": 18.768343815513628, "percentage": 93.84, "elapsed_time": "1:31:45", "remaining_time": "0:06:01", "throughput": 4248.29, "total_tokens": 23388232} {"current_steps": 35815, "total_steps": 38160, "loss": 0.4228, "lr": 1.1469029768073125e-05, "epoch": 18.770964360587, "percentage": 93.85, "elapsed_time": "1:31:46", "remaining_time": "0:06:00", "throughput": 4248.29, "total_tokens": 23391240} {"current_steps": 35820, "total_steps": 38160, "loss": 0.3704, "lr": 1.1420381033241889e-05, "epoch": 18.77358490566038, "percentage": 93.87, "elapsed_time": "1:31:46", "remaining_time": "0:05:59", "throughput": 4248.36, "total_tokens": 23394856} {"current_steps": 35825, "total_steps": 38160, "loss": 0.3837, "lr": 1.1371834503693002e-05, "epoch": 18.77620545073375, "percentage": 93.88, "elapsed_time": "1:31:47", "remaining_time": "0:05:58", "throughput": 4248.42, "total_tokens": 23398472} {"current_steps": 35830, "total_steps": 38160, "loss": 0.3616, "lr": 1.1323390189581784e-05, "epoch": 18.77882599580713, "percentage": 93.89, "elapsed_time": "1:31:48", "remaining_time": "0:05:58", "throughput": 4248.45, "total_tokens": 23401640} {"current_steps": 35835, "total_steps": 38160, "loss": 0.3258, "lr": 1.127504810104213e-05, "epoch": 18.781446540880502, "percentage": 93.91, "elapsed_time": "1:31:48", "remaining_time": "0:05:57", "throughput": 4248.47, "total_tokens": 23404776} {"current_steps": 35840, "total_steps": 38160, "loss": 0.4185, "lr": 1.1226808248186782e-05, "epoch": 18.78406708595388, "percentage": 93.92, "elapsed_time": "1:31:49", "remaining_time": "0:05:56", "throughput": 4248.48, "total_tokens": 23407944} {"current_steps": 35845, "total_steps": 38160, "loss": 0.4702, "lr": 1.1178670641106891e-05, "epoch": 18.786687631027252, "percentage": 93.93, "elapsed_time": "1:31:50", "remaining_time": "0:05:55", "throughput": 4248.53, "total_tokens": 23411496} {"current_steps": 35850, "total_steps": 38160, "loss": 0.4299, "lr": 1.1130635289872403e-05, "epoch": 18.78930817610063, "percentage": 93.95, "elapsed_time": "1:31:51", "remaining_time": "0:05:55", "throughput": 4248.54, "total_tokens": 23414440} {"current_steps": 35855, "total_steps": 38160, "loss": 0.3915, "lr": 1.1082702204531725e-05, "epoch": 18.791928721174003, "percentage": 93.96, "elapsed_time": "1:31:51", "remaining_time": "0:05:54", "throughput": 4248.61, "total_tokens": 23418152} {"current_steps": 35860, "total_steps": 38160, "loss": 0.379, "lr": 1.1034871395111778e-05, "epoch": 18.79454926624738, "percentage": 93.97, "elapsed_time": "1:31:52", "remaining_time": "0:05:53", "throughput": 4248.63, "total_tokens": 23421320} {"current_steps": 35865, "total_steps": 38160, "loss": 0.4942, "lr": 1.0987142871618394e-05, "epoch": 18.797169811320753, "percentage": 93.99, "elapsed_time": "1:31:53", "remaining_time": "0:05:52", "throughput": 4248.69, "total_tokens": 23424968} {"current_steps": 35870, "total_steps": 38160, "loss": 0.4305, "lr": 1.0939516644035696e-05, "epoch": 18.79979035639413, "percentage": 94.0, "elapsed_time": "1:31:54", "remaining_time": "0:05:52", "throughput": 4248.67, "total_tokens": 23427592} {"current_steps": 35875, "total_steps": 38160, "loss": 0.5272, "lr": 1.0891992722326716e-05, "epoch": 18.802410901467507, "percentage": 94.01, "elapsed_time": "1:31:54", "remaining_time": "0:05:51", "throughput": 4248.72, "total_tokens": 23431080} {"current_steps": 35880, "total_steps": 38160, "loss": 0.403, "lr": 1.0844571116432778e-05, "epoch": 18.80503144654088, "percentage": 94.03, "elapsed_time": "1:31:55", "remaining_time": "0:05:50", "throughput": 4248.79, "total_tokens": 23434728} {"current_steps": 35885, "total_steps": 38160, "loss": 0.5253, "lr": 1.0797251836274003e-05, "epoch": 18.807651991614257, "percentage": 94.04, "elapsed_time": "1:31:56", "remaining_time": "0:05:49", "throughput": 4248.91, "total_tokens": 23439112} {"current_steps": 35890, "total_steps": 38160, "loss": 0.3594, "lr": 1.0750034891748972e-05, "epoch": 18.81027253668763, "percentage": 94.05, "elapsed_time": "1:31:57", "remaining_time": "0:05:48", "throughput": 4248.93, "total_tokens": 23442344} {"current_steps": 35895, "total_steps": 38160, "loss": 0.4431, "lr": 1.0702920292735009e-05, "epoch": 18.812893081761008, "percentage": 94.06, "elapsed_time": "1:31:57", "remaining_time": "0:05:48", "throughput": 4248.97, "total_tokens": 23445640} {"current_steps": 35900, "total_steps": 38160, "loss": 0.3342, "lr": 1.0655908049087893e-05, "epoch": 18.81551362683438, "percentage": 94.08, "elapsed_time": "1:31:58", "remaining_time": "0:05:47", "throughput": 4248.95, "total_tokens": 23448264} {"current_steps": 35905, "total_steps": 38160, "loss": 0.429, "lr": 1.0608998170642149e-05, "epoch": 18.818134171907758, "percentage": 94.09, "elapsed_time": "1:31:59", "remaining_time": "0:05:46", "throughput": 4248.95, "total_tokens": 23451272} {"current_steps": 35910, "total_steps": 38160, "loss": 0.3879, "lr": 1.0562190667210703e-05, "epoch": 18.82075471698113, "percentage": 94.1, "elapsed_time": "1:31:59", "remaining_time": "0:05:45", "throughput": 4248.93, "total_tokens": 23453832} {"current_steps": 35915, "total_steps": 38160, "loss": 0.432, "lr": 1.0515485548585113e-05, "epoch": 18.82337526205451, "percentage": 94.12, "elapsed_time": "1:32:00", "remaining_time": "0:05:45", "throughput": 4248.91, "total_tokens": 23456520} {"current_steps": 35920, "total_steps": 38160, "loss": 0.3608, "lr": 1.0468882824535676e-05, "epoch": 18.82599580712788, "percentage": 94.13, "elapsed_time": "1:32:01", "remaining_time": "0:05:44", "throughput": 4248.93, "total_tokens": 23459624} {"current_steps": 35925, "total_steps": 38160, "loss": 0.3168, "lr": 1.0422382504811034e-05, "epoch": 18.82861635220126, "percentage": 94.14, "elapsed_time": "1:32:02", "remaining_time": "0:05:43", "throughput": 4249.02, "total_tokens": 23463720} {"current_steps": 35930, "total_steps": 38160, "loss": 0.456, "lr": 1.0375984599138633e-05, "epoch": 18.831236897274632, "percentage": 94.16, "elapsed_time": "1:32:02", "remaining_time": "0:05:42", "throughput": 4249.1, "total_tokens": 23467592} {"current_steps": 35935, "total_steps": 38160, "loss": 0.4399, "lr": 1.0329689117224261e-05, "epoch": 18.83385744234801, "percentage": 94.17, "elapsed_time": "1:32:03", "remaining_time": "0:05:42", "throughput": 4249.06, "total_tokens": 23470024} {"current_steps": 35940, "total_steps": 38160, "loss": 0.5086, "lr": 1.0283496068752507e-05, "epoch": 18.836477987421382, "percentage": 94.18, "elapsed_time": "1:32:04", "remaining_time": "0:05:41", "throughput": 4249.01, "total_tokens": 23472264} {"current_steps": 35945, "total_steps": 38160, "loss": 0.4993, "lr": 1.0237405463386418e-05, "epoch": 18.83909853249476, "percentage": 94.2, "elapsed_time": "1:32:04", "remaining_time": "0:05:40", "throughput": 4249.02, "total_tokens": 23475208} {"current_steps": 35950, "total_steps": 38160, "loss": 0.4042, "lr": 1.0191417310767503e-05, "epoch": 18.841719077568133, "percentage": 94.21, "elapsed_time": "1:32:05", "remaining_time": "0:05:39", "throughput": 4249.05, "total_tokens": 23478472} {"current_steps": 35955, "total_steps": 38160, "loss": 0.2936, "lr": 1.0145531620516179e-05, "epoch": 18.84433962264151, "percentage": 94.22, "elapsed_time": "1:32:06", "remaining_time": "0:05:38", "throughput": 4249.1, "total_tokens": 23482056} {"current_steps": 35960, "total_steps": 38160, "loss": 0.3089, "lr": 1.009974840223099e-05, "epoch": 18.846960167714883, "percentage": 94.23, "elapsed_time": "1:32:06", "remaining_time": "0:05:38", "throughput": 4249.03, "total_tokens": 23484200} {"current_steps": 35965, "total_steps": 38160, "loss": 0.4413, "lr": 1.0054067665489386e-05, "epoch": 18.84958071278826, "percentage": 94.25, "elapsed_time": "1:32:07", "remaining_time": "0:05:37", "throughput": 4249.17, "total_tokens": 23488616} {"current_steps": 35970, "total_steps": 38160, "loss": 0.4013, "lr": 1.0008489419847278e-05, "epoch": 18.852201257861637, "percentage": 94.26, "elapsed_time": "1:32:08", "remaining_time": "0:05:36", "throughput": 4249.21, "total_tokens": 23491944} {"current_steps": 35975, "total_steps": 38160, "loss": 0.3365, "lr": 9.963013674839038e-06, "epoch": 18.85482180293501, "percentage": 94.27, "elapsed_time": "1:32:09", "remaining_time": "0:05:35", "throughput": 4249.3, "total_tokens": 23496008} {"current_steps": 35980, "total_steps": 38160, "loss": 0.4354, "lr": 9.91764043997767e-06, "epoch": 18.857442348008387, "percentage": 94.29, "elapsed_time": "1:32:10", "remaining_time": "0:05:35", "throughput": 4249.3, "total_tokens": 23498888} {"current_steps": 35985, "total_steps": 38160, "loss": 0.3288, "lr": 9.872369724754804e-06, "epoch": 18.86006289308176, "percentage": 94.3, "elapsed_time": "1:32:10", "remaining_time": "0:05:34", "throughput": 4249.31, "total_tokens": 23501896} {"current_steps": 35990, "total_steps": 38160, "loss": 0.4085, "lr": 9.827201538640473e-06, "epoch": 18.862683438155138, "percentage": 94.31, "elapsed_time": "1:32:11", "remaining_time": "0:05:33", "throughput": 4249.31, "total_tokens": 23504840} {"current_steps": 35995, "total_steps": 38160, "loss": 0.3839, "lr": 9.782135891083455e-06, "epoch": 18.86530398322851, "percentage": 94.33, "elapsed_time": "1:32:12", "remaining_time": "0:05:32", "throughput": 4249.28, "total_tokens": 23507336} {"current_steps": 36000, "total_steps": 38160, "loss": 0.4209, "lr": 9.737172791510873e-06, "epoch": 18.867924528301888, "percentage": 94.34, "elapsed_time": "1:32:12", "remaining_time": "0:05:31", "throughput": 4249.3, "total_tokens": 23510536} {"current_steps": 36005, "total_steps": 38160, "loss": 0.4583, "lr": 9.692312249328483e-06, "epoch": 18.87054507337526, "percentage": 94.35, "elapsed_time": "1:32:13", "remaining_time": "0:05:31", "throughput": 4249.31, "total_tokens": 23513576} {"current_steps": 36010, "total_steps": 38160, "loss": 0.6944, "lr": 9.647554273920722e-06, "epoch": 18.87316561844864, "percentage": 94.37, "elapsed_time": "1:32:14", "remaining_time": "0:05:30", "throughput": 4249.33, "total_tokens": 23516744} {"current_steps": 36015, "total_steps": 38160, "loss": 0.4171, "lr": 9.602898874650323e-06, "epoch": 18.87578616352201, "percentage": 94.38, "elapsed_time": "1:32:14", "remaining_time": "0:05:29", "throughput": 4249.33, "total_tokens": 23519720} {"current_steps": 36020, "total_steps": 38160, "loss": 0.6306, "lr": 9.558346060858759e-06, "epoch": 18.87840670859539, "percentage": 94.39, "elapsed_time": "1:32:15", "remaining_time": "0:05:28", "throughput": 4249.35, "total_tokens": 23522696} {"current_steps": 36025, "total_steps": 38160, "loss": 0.3042, "lr": 9.51389584186596e-06, "epoch": 18.881027253668762, "percentage": 94.41, "elapsed_time": "1:32:16", "remaining_time": "0:05:28", "throughput": 4249.31, "total_tokens": 23525160} {"current_steps": 36030, "total_steps": 38160, "loss": 0.3373, "lr": 9.469548226970326e-06, "epoch": 18.88364779874214, "percentage": 94.42, "elapsed_time": "1:32:16", "remaining_time": "0:05:27", "throughput": 4249.29, "total_tokens": 23527848} {"current_steps": 36035, "total_steps": 38160, "loss": 0.4171, "lr": 9.425303225448989e-06, "epoch": 18.886268343815512, "percentage": 94.43, "elapsed_time": "1:32:17", "remaining_time": "0:05:26", "throughput": 4249.29, "total_tokens": 23530824} {"current_steps": 36040, "total_steps": 38160, "loss": 0.4235, "lr": 9.381160846557435e-06, "epoch": 18.88888888888889, "percentage": 94.44, "elapsed_time": "1:32:18", "remaining_time": "0:05:25", "throughput": 4249.27, "total_tokens": 23533480} {"current_steps": 36045, "total_steps": 38160, "loss": 0.4301, "lr": 9.337121099529722e-06, "epoch": 18.891509433962263, "percentage": 94.46, "elapsed_time": "1:32:18", "remaining_time": "0:05:25", "throughput": 4249.21, "total_tokens": 23535688} {"current_steps": 36050, "total_steps": 38160, "loss": 0.3491, "lr": 9.293183993578535e-06, "epoch": 18.89412997903564, "percentage": 94.47, "elapsed_time": "1:32:19", "remaining_time": "0:05:24", "throughput": 4249.24, "total_tokens": 23539016} {"current_steps": 36055, "total_steps": 38160, "loss": 0.3561, "lr": 9.249349537894968e-06, "epoch": 18.896750524109013, "percentage": 94.48, "elapsed_time": "1:32:20", "remaining_time": "0:05:23", "throughput": 4249.26, "total_tokens": 23542152} {"current_steps": 36060, "total_steps": 38160, "loss": 0.3724, "lr": 9.205617741648686e-06, "epoch": 18.89937106918239, "percentage": 94.5, "elapsed_time": "1:32:20", "remaining_time": "0:05:22", "throughput": 4249.26, "total_tokens": 23545096} {"current_steps": 36065, "total_steps": 38160, "loss": 0.259, "lr": 9.161988613987982e-06, "epoch": 18.901991614255767, "percentage": 94.51, "elapsed_time": "1:32:21", "remaining_time": "0:05:21", "throughput": 4249.3, "total_tokens": 23548392} {"current_steps": 36070, "total_steps": 38160, "loss": 0.421, "lr": 9.118462164039387e-06, "epoch": 18.90461215932914, "percentage": 94.52, "elapsed_time": "1:32:22", "remaining_time": "0:05:21", "throughput": 4249.27, "total_tokens": 23550984} {"current_steps": 36075, "total_steps": 38160, "loss": 0.4814, "lr": 9.07503840090823e-06, "epoch": 18.907232704402517, "percentage": 94.54, "elapsed_time": "1:32:23", "remaining_time": "0:05:20", "throughput": 4249.25, "total_tokens": 23553608} {"current_steps": 36080, "total_steps": 38160, "loss": 0.4779, "lr": 9.031717333678303e-06, "epoch": 18.90985324947589, "percentage": 94.55, "elapsed_time": "1:32:23", "remaining_time": "0:05:19", "throughput": 4249.24, "total_tokens": 23556360} {"current_steps": 36085, "total_steps": 38160, "loss": 0.4063, "lr": 8.988498971411851e-06, "epoch": 18.912473794549268, "percentage": 94.56, "elapsed_time": "1:32:24", "remaining_time": "0:05:18", "throughput": 4249.27, "total_tokens": 23559656} {"current_steps": 36090, "total_steps": 38160, "loss": 0.4668, "lr": 8.945383323149647e-06, "epoch": 18.91509433962264, "percentage": 94.58, "elapsed_time": "1:32:25", "remaining_time": "0:05:18", "throughput": 4249.31, "total_tokens": 23563080} {"current_steps": 36095, "total_steps": 38160, "loss": 0.557, "lr": 8.902370397911031e-06, "epoch": 18.917714884696018, "percentage": 94.59, "elapsed_time": "1:32:25", "remaining_time": "0:05:17", "throughput": 4249.32, "total_tokens": 23566056} {"current_steps": 36100, "total_steps": 38160, "loss": 0.3365, "lr": 8.859460204693748e-06, "epoch": 18.92033542976939, "percentage": 94.6, "elapsed_time": "1:32:26", "remaining_time": "0:05:16", "throughput": 4249.37, "total_tokens": 23569480} {"current_steps": 36105, "total_steps": 38160, "loss": 0.4278, "lr": 8.816652752474175e-06, "epoch": 18.92295597484277, "percentage": 94.61, "elapsed_time": "1:32:27", "remaining_time": "0:05:15", "throughput": 4249.48, "total_tokens": 23573704} {"current_steps": 36110, "total_steps": 38160, "loss": 0.4292, "lr": 8.773948050207148e-06, "epoch": 18.92557651991614, "percentage": 94.63, "elapsed_time": "1:32:28", "remaining_time": "0:05:14", "throughput": 4249.51, "total_tokens": 23577032} {"current_steps": 36115, "total_steps": 38160, "loss": 0.4622, "lr": 8.731346106826021e-06, "epoch": 18.92819706498952, "percentage": 94.64, "elapsed_time": "1:32:28", "remaining_time": "0:05:14", "throughput": 4249.54, "total_tokens": 23580232} {"current_steps": 36120, "total_steps": 38160, "loss": 0.3879, "lr": 8.6888469312425e-06, "epoch": 18.930817610062892, "percentage": 94.65, "elapsed_time": "1:32:29", "remaining_time": "0:05:13", "throughput": 4249.59, "total_tokens": 23583816} {"current_steps": 36125, "total_steps": 38160, "loss": 0.4356, "lr": 8.646450532347083e-06, "epoch": 18.93343815513627, "percentage": 94.67, "elapsed_time": "1:32:30", "remaining_time": "0:05:12", "throughput": 4249.63, "total_tokens": 23587208} {"current_steps": 36130, "total_steps": 38160, "loss": 0.5228, "lr": 8.604156919008565e-06, "epoch": 18.936058700209642, "percentage": 94.68, "elapsed_time": "1:32:31", "remaining_time": "0:05:11", "throughput": 4249.69, "total_tokens": 23590920} {"current_steps": 36135, "total_steps": 38160, "loss": 0.6584, "lr": 8.561966100074258e-06, "epoch": 18.93867924528302, "percentage": 94.69, "elapsed_time": "1:32:31", "remaining_time": "0:05:11", "throughput": 4249.71, "total_tokens": 23593992} {"current_steps": 36140, "total_steps": 38160, "loss": 0.441, "lr": 8.519878084370048e-06, "epoch": 18.941299790356393, "percentage": 94.71, "elapsed_time": "1:32:32", "remaining_time": "0:05:10", "throughput": 4249.75, "total_tokens": 23597512} {"current_steps": 36145, "total_steps": 38160, "loss": 0.4015, "lr": 8.477892880700222e-06, "epoch": 18.94392033542977, "percentage": 94.72, "elapsed_time": "1:32:33", "remaining_time": "0:05:09", "throughput": 4249.74, "total_tokens": 23600232} {"current_steps": 36150, "total_steps": 38160, "loss": 0.3695, "lr": 8.436010497847646e-06, "epoch": 18.946540880503143, "percentage": 94.73, "elapsed_time": "1:32:33", "remaining_time": "0:05:08", "throughput": 4249.72, "total_tokens": 23602920} {"current_steps": 36155, "total_steps": 38160, "loss": 0.458, "lr": 8.39423094457359e-06, "epoch": 18.94916142557652, "percentage": 94.75, "elapsed_time": "1:32:34", "remaining_time": "0:05:08", "throughput": 4249.73, "total_tokens": 23605960} {"current_steps": 36160, "total_steps": 38160, "loss": 0.3562, "lr": 8.352554229617892e-06, "epoch": 18.951781970649897, "percentage": 94.76, "elapsed_time": "1:32:35", "remaining_time": "0:05:07", "throughput": 4249.78, "total_tokens": 23609384} {"current_steps": 36165, "total_steps": 38160, "loss": 0.4169, "lr": 8.310980361698861e-06, "epoch": 18.95440251572327, "percentage": 94.77, "elapsed_time": "1:32:36", "remaining_time": "0:05:06", "throughput": 4249.79, "total_tokens": 23612520} {"current_steps": 36170, "total_steps": 38160, "loss": 0.4879, "lr": 8.26950934951326e-06, "epoch": 18.957023060796647, "percentage": 94.79, "elapsed_time": "1:32:36", "remaining_time": "0:05:05", "throughput": 4249.82, "total_tokens": 23615784} {"current_steps": 36175, "total_steps": 38160, "loss": 0.4344, "lr": 8.22814120173626e-06, "epoch": 18.95964360587002, "percentage": 94.8, "elapsed_time": "1:32:37", "remaining_time": "0:05:04", "throughput": 4249.85, "total_tokens": 23619144} {"current_steps": 36180, "total_steps": 38160, "loss": 0.4591, "lr": 8.186875927021775e-06, "epoch": 18.962264150943398, "percentage": 94.81, "elapsed_time": "1:32:38", "remaining_time": "0:05:04", "throughput": 4249.84, "total_tokens": 23621992} {"current_steps": 36185, "total_steps": 38160, "loss": 0.5596, "lr": 8.145713534001897e-06, "epoch": 18.96488469601677, "percentage": 94.82, "elapsed_time": "1:32:39", "remaining_time": "0:05:03", "throughput": 4249.88, "total_tokens": 23625416} {"current_steps": 36190, "total_steps": 38160, "loss": 0.3983, "lr": 8.104654031287406e-06, "epoch": 18.967505241090148, "percentage": 94.84, "elapsed_time": "1:32:39", "remaining_time": "0:05:02", "throughput": 4249.98, "total_tokens": 23629448} {"current_steps": 36195, "total_steps": 38160, "loss": 0.3531, "lr": 8.063697427467486e-06, "epoch": 18.97012578616352, "percentage": 94.85, "elapsed_time": "1:32:40", "remaining_time": "0:05:01", "throughput": 4249.97, "total_tokens": 23632232} {"current_steps": 36200, "total_steps": 38160, "loss": 0.36, "lr": 8.022843731109675e-06, "epoch": 18.9727463312369, "percentage": 94.86, "elapsed_time": "1:32:41", "remaining_time": "0:05:01", "throughput": 4250.03, "total_tokens": 23635880} {"current_steps": 36205, "total_steps": 38160, "loss": 0.3629, "lr": 7.982092950760245e-06, "epoch": 18.97536687631027, "percentage": 94.88, "elapsed_time": "1:32:42", "remaining_time": "0:05:00", "throughput": 4250.05, "total_tokens": 23639016} {"current_steps": 36210, "total_steps": 38160, "loss": 0.3947, "lr": 7.941445094943711e-06, "epoch": 18.97798742138365, "percentage": 94.89, "elapsed_time": "1:32:42", "remaining_time": "0:04:59", "throughput": 4250.08, "total_tokens": 23642376} {"current_steps": 36215, "total_steps": 38160, "loss": 0.3904, "lr": 7.900900172163107e-06, "epoch": 18.980607966457022, "percentage": 94.9, "elapsed_time": "1:32:43", "remaining_time": "0:04:58", "throughput": 4250.13, "total_tokens": 23645896} {"current_steps": 36220, "total_steps": 38160, "loss": 0.505, "lr": 7.860458190900144e-06, "epoch": 18.9832285115304, "percentage": 94.92, "elapsed_time": "1:32:44", "remaining_time": "0:04:58", "throughput": 4250.19, "total_tokens": 23649608} {"current_steps": 36225, "total_steps": 38160, "loss": 0.4933, "lr": 7.820119159614669e-06, "epoch": 18.985849056603772, "percentage": 94.93, "elapsed_time": "1:32:45", "remaining_time": "0:04:57", "throughput": 4250.23, "total_tokens": 23652808} {"current_steps": 36230, "total_steps": 38160, "loss": 0.3067, "lr": 7.779883086745098e-06, "epoch": 18.98846960167715, "percentage": 94.94, "elapsed_time": "1:32:45", "remaining_time": "0:04:56", "throughput": 4250.32, "total_tokens": 23656776} {"current_steps": 36235, "total_steps": 38160, "loss": 0.4872, "lr": 7.739749980708533e-06, "epoch": 18.991090146750523, "percentage": 94.96, "elapsed_time": "1:32:46", "remaining_time": "0:04:55", "throughput": 4250.39, "total_tokens": 23660584} {"current_steps": 36240, "total_steps": 38160, "loss": 0.4612, "lr": 7.6997198499002e-06, "epoch": 18.9937106918239, "percentage": 94.97, "elapsed_time": "1:32:47", "remaining_time": "0:04:54", "throughput": 4250.46, "total_tokens": 23664296} {"current_steps": 36245, "total_steps": 38160, "loss": 0.429, "lr": 7.659792702694068e-06, "epoch": 18.996331236897273, "percentage": 94.98, "elapsed_time": "1:32:48", "remaining_time": "0:04:54", "throughput": 4250.44, "total_tokens": 23667048} {"current_steps": 36250, "total_steps": 38160, "loss": 0.3256, "lr": 7.619968547442346e-06, "epoch": 18.99895178197065, "percentage": 94.99, "elapsed_time": "1:32:48", "remaining_time": "0:04:53", "throughput": 4250.49, "total_tokens": 23670536} {"current_steps": 36252, "total_steps": 38160, "eval_loss": 0.49396204948425293, "epoch": 19.0, "percentage": 95.0, "elapsed_time": "1:33:02", "remaining_time": "0:04:53", "throughput": 4239.89, "total_tokens": 23671264} {"current_steps": 36255, "total_steps": 38160, "loss": 0.4478, "lr": 7.580247392475926e-06, "epoch": 19.001572327044027, "percentage": 95.01, "elapsed_time": "1:33:05", "remaining_time": "0:04:53", "throughput": 4238.63, "total_tokens": 23673120} {"current_steps": 36260, "total_steps": 38160, "loss": 0.3871, "lr": 7.540629246103825e-06, "epoch": 19.0041928721174, "percentage": 95.02, "elapsed_time": "1:33:05", "remaining_time": "0:04:52", "throughput": 4238.62, "total_tokens": 23675872} {"current_steps": 36265, "total_steps": 38160, "loss": 0.3479, "lr": 7.501114116613861e-06, "epoch": 19.006813417190777, "percentage": 95.03, "elapsed_time": "1:33:06", "remaining_time": "0:04:51", "throughput": 4238.61, "total_tokens": 23678560} {"current_steps": 36270, "total_steps": 38160, "loss": 0.3988, "lr": 7.461702012272087e-06, "epoch": 19.00943396226415, "percentage": 95.05, "elapsed_time": "1:33:07", "remaining_time": "0:04:51", "throughput": 4238.67, "total_tokens": 23682208} {"current_steps": 36275, "total_steps": 38160, "loss": 0.5508, "lr": 7.422392941323075e-06, "epoch": 19.012054507337528, "percentage": 95.06, "elapsed_time": "1:33:07", "remaining_time": "0:04:50", "throughput": 4238.69, "total_tokens": 23685472} {"current_steps": 36280, "total_steps": 38160, "loss": 0.3214, "lr": 7.383186911989858e-06, "epoch": 19.0146750524109, "percentage": 95.07, "elapsed_time": "1:33:08", "remaining_time": "0:04:49", "throughput": 4238.67, "total_tokens": 23688064} {"current_steps": 36285, "total_steps": 38160, "loss": 0.3515, "lr": 7.344083932473822e-06, "epoch": 19.017295597484278, "percentage": 95.09, "elapsed_time": "1:33:09", "remaining_time": "0:04:48", "throughput": 4238.66, "total_tokens": 23690848} {"current_steps": 36290, "total_steps": 38160, "loss": 0.4146, "lr": 7.305084010954976e-06, "epoch": 19.01991614255765, "percentage": 95.1, "elapsed_time": "1:33:09", "remaining_time": "0:04:48", "throughput": 4238.67, "total_tokens": 23693952} {"current_steps": 36295, "total_steps": 38160, "loss": 0.3597, "lr": 7.26618715559152e-06, "epoch": 19.02253668763103, "percentage": 95.11, "elapsed_time": "1:33:10", "remaining_time": "0:04:47", "throughput": 4238.77, "total_tokens": 23698016} {"current_steps": 36300, "total_steps": 38160, "loss": 0.3754, "lr": 7.227393374520386e-06, "epoch": 19.0251572327044, "percentage": 95.13, "elapsed_time": "1:33:11", "remaining_time": "0:04:46", "throughput": 4238.93, "total_tokens": 23702976} {"current_steps": 36305, "total_steps": 38160, "loss": 0.3987, "lr": 7.18870267585664e-06, "epoch": 19.02777777777778, "percentage": 95.14, "elapsed_time": "1:33:12", "remaining_time": "0:04:45", "throughput": 4238.99, "total_tokens": 23706464} {"current_steps": 36310, "total_steps": 38160, "loss": 0.4307, "lr": 7.150115067694085e-06, "epoch": 19.030398322851152, "percentage": 95.15, "elapsed_time": "1:33:13", "remaining_time": "0:04:44", "throughput": 4239.07, "total_tokens": 23710464} {"current_steps": 36315, "total_steps": 38160, "loss": 0.5145, "lr": 7.111630558104653e-06, "epoch": 19.03301886792453, "percentage": 95.17, "elapsed_time": "1:33:14", "remaining_time": "0:04:44", "throughput": 4239.09, "total_tokens": 23713632} {"current_steps": 36320, "total_steps": 38160, "loss": 0.6009, "lr": 7.073249155138961e-06, "epoch": 19.035639412997902, "percentage": 95.18, "elapsed_time": "1:33:14", "remaining_time": "0:04:43", "throughput": 4239.06, "total_tokens": 23716192} {"current_steps": 36325, "total_steps": 38160, "loss": 0.4203, "lr": 7.0349708668259736e-06, "epoch": 19.03825995807128, "percentage": 95.19, "elapsed_time": "1:33:15", "remaining_time": "0:04:42", "throughput": 4239.08, "total_tokens": 23719424} {"current_steps": 36330, "total_steps": 38160, "loss": 0.4108, "lr": 6.996795701173009e-06, "epoch": 19.040880503144653, "percentage": 95.2, "elapsed_time": "1:33:16", "remaining_time": "0:04:41", "throughput": 4239.09, "total_tokens": 23722400} {"current_steps": 36335, "total_steps": 38160, "loss": 0.5132, "lr": 6.958723666165901e-06, "epoch": 19.04350104821803, "percentage": 95.22, "elapsed_time": "1:33:16", "remaining_time": "0:04:41", "throughput": 4239.13, "total_tokens": 23725792} {"current_steps": 36340, "total_steps": 38160, "loss": 0.4346, "lr": 6.9207547697689446e-06, "epoch": 19.046121593291403, "percentage": 95.23, "elapsed_time": "1:33:17", "remaining_time": "0:04:40", "throughput": 4239.14, "total_tokens": 23728800} {"current_steps": 36345, "total_steps": 38160, "loss": 0.4009, "lr": 6.882889019924676e-06, "epoch": 19.04874213836478, "percentage": 95.24, "elapsed_time": "1:33:18", "remaining_time": "0:04:39", "throughput": 4239.17, "total_tokens": 23732192} {"current_steps": 36350, "total_steps": 38160, "loss": 0.2999, "lr": 6.84512642455426e-06, "epoch": 19.051362683438157, "percentage": 95.26, "elapsed_time": "1:33:19", "remaining_time": "0:04:38", "throughput": 4239.15, "total_tokens": 23735072} {"current_steps": 36355, "total_steps": 38160, "loss": 0.4537, "lr": 6.8074669915572095e-06, "epoch": 19.05398322851153, "percentage": 95.27, "elapsed_time": "1:33:19", "remaining_time": "0:04:38", "throughput": 4239.16, "total_tokens": 23738144} {"current_steps": 36360, "total_steps": 38160, "loss": 0.4329, "lr": 6.769910728811391e-06, "epoch": 19.056603773584907, "percentage": 95.28, "elapsed_time": "1:33:20", "remaining_time": "0:04:37", "throughput": 4239.14, "total_tokens": 23740768} {"current_steps": 36365, "total_steps": 38160, "loss": 0.4834, "lr": 6.73245764417324e-06, "epoch": 19.05922431865828, "percentage": 95.3, "elapsed_time": "1:33:21", "remaining_time": "0:04:36", "throughput": 4239.11, "total_tokens": 23743456} {"current_steps": 36370, "total_steps": 38160, "loss": 0.3959, "lr": 6.695107745477435e-06, "epoch": 19.061844863731658, "percentage": 95.31, "elapsed_time": "1:33:21", "remaining_time": "0:04:35", "throughput": 4239.12, "total_tokens": 23746528} {"current_steps": 36375, "total_steps": 38160, "loss": 0.5694, "lr": 6.657861040537117e-06, "epoch": 19.06446540880503, "percentage": 95.32, "elapsed_time": "1:33:22", "remaining_time": "0:04:34", "throughput": 4239.09, "total_tokens": 23749024} {"current_steps": 36380, "total_steps": 38160, "loss": 0.3962, "lr": 6.620717537143994e-06, "epoch": 19.067085953878408, "percentage": 95.34, "elapsed_time": "1:33:23", "remaining_time": "0:04:34", "throughput": 4239.06, "total_tokens": 23751552} {"current_steps": 36385, "total_steps": 38160, "loss": 0.4066, "lr": 6.583677243067965e-06, "epoch": 19.06970649895178, "percentage": 95.35, "elapsed_time": "1:33:23", "remaining_time": "0:04:33", "throughput": 4239.08, "total_tokens": 23754784} {"current_steps": 36390, "total_steps": 38160, "loss": 0.3393, "lr": 6.546740166057441e-06, "epoch": 19.072327044025158, "percentage": 95.36, "elapsed_time": "1:33:25", "remaining_time": "0:04:32", "throughput": 4239.4, "total_tokens": 23761888} {"current_steps": 36395, "total_steps": 38160, "loss": 0.5157, "lr": 6.5099063138392975e-06, "epoch": 19.07494758909853, "percentage": 95.37, "elapsed_time": "1:33:25", "remaining_time": "0:04:31", "throughput": 4239.48, "total_tokens": 23765728} {"current_steps": 36400, "total_steps": 38160, "loss": 0.3735, "lr": 6.473175694118705e-06, "epoch": 19.07756813417191, "percentage": 95.39, "elapsed_time": "1:33:26", "remaining_time": "0:04:31", "throughput": 4239.56, "total_tokens": 23769536} {"current_steps": 36405, "total_steps": 38160, "loss": 0.453, "lr": 6.436548314579349e-06, "epoch": 19.080188679245282, "percentage": 95.4, "elapsed_time": "1:33:27", "remaining_time": "0:04:30", "throughput": 4239.56, "total_tokens": 23772512} {"current_steps": 36410, "total_steps": 38160, "loss": 0.3682, "lr": 6.400024182883158e-06, "epoch": 19.08280922431866, "percentage": 95.41, "elapsed_time": "1:33:28", "remaining_time": "0:04:29", "throughput": 4239.62, "total_tokens": 23776128} {"current_steps": 36415, "total_steps": 38160, "loss": 0.4551, "lr": 6.363603306670629e-06, "epoch": 19.085429769392032, "percentage": 95.43, "elapsed_time": "1:33:28", "remaining_time": "0:04:28", "throughput": 4239.69, "total_tokens": 23779936} {"current_steps": 36420, "total_steps": 38160, "loss": 0.3535, "lr": 6.327285693560614e-06, "epoch": 19.08805031446541, "percentage": 95.44, "elapsed_time": "1:33:29", "remaining_time": "0:04:28", "throughput": 4239.77, "total_tokens": 23783808} {"current_steps": 36425, "total_steps": 38160, "loss": 0.3823, "lr": 6.2910713511503125e-06, "epoch": 19.090670859538783, "percentage": 95.45, "elapsed_time": "1:33:30", "remaining_time": "0:04:27", "throughput": 4239.86, "total_tokens": 23787872} {"current_steps": 36430, "total_steps": 38160, "loss": 0.337, "lr": 6.254960287015332e-06, "epoch": 19.09329140461216, "percentage": 95.47, "elapsed_time": "1:33:31", "remaining_time": "0:04:26", "throughput": 4239.9, "total_tokens": 23791296} {"current_steps": 36435, "total_steps": 38160, "loss": 0.5059, "lr": 6.218952508709741e-06, "epoch": 19.095911949685533, "percentage": 95.48, "elapsed_time": "1:33:32", "remaining_time": "0:04:25", "throughput": 4240.0, "total_tokens": 23795456} {"current_steps": 36440, "total_steps": 38160, "loss": 0.9545, "lr": 6.183048023765903e-06, "epoch": 19.09853249475891, "percentage": 95.49, "elapsed_time": "1:33:32", "remaining_time": "0:04:24", "throughput": 4239.98, "total_tokens": 23798080} {"current_steps": 36445, "total_steps": 38160, "loss": 0.4968, "lr": 6.147246839694698e-06, "epoch": 19.101153039832287, "percentage": 95.51, "elapsed_time": "1:33:33", "remaining_time": "0:04:24", "throughput": 4239.99, "total_tokens": 23801216} {"current_steps": 36450, "total_steps": 38160, "loss": 0.4717, "lr": 6.111548963985247e-06, "epoch": 19.10377358490566, "percentage": 95.52, "elapsed_time": "1:33:34", "remaining_time": "0:04:23", "throughput": 4240.02, "total_tokens": 23804320} {"current_steps": 36455, "total_steps": 38160, "loss": 0.4067, "lr": 6.075954404105188e-06, "epoch": 19.106394129979037, "percentage": 95.53, "elapsed_time": "1:33:34", "remaining_time": "0:04:22", "throughput": 4240.04, "total_tokens": 23807584} {"current_steps": 36460, "total_steps": 38160, "loss": 0.5556, "lr": 6.040463167500509e-06, "epoch": 19.10901467505241, "percentage": 95.55, "elapsed_time": "1:33:35", "remaining_time": "0:04:21", "throughput": 4240.19, "total_tokens": 23812320} {"current_steps": 36465, "total_steps": 38160, "loss": 0.4501, "lr": 6.005075261595494e-06, "epoch": 19.111635220125788, "percentage": 95.56, "elapsed_time": "1:33:36", "remaining_time": "0:04:21", "throughput": 4240.2, "total_tokens": 23815296} {"current_steps": 36470, "total_steps": 38160, "loss": 0.4178, "lr": 5.969790693792998e-06, "epoch": 19.11425576519916, "percentage": 95.57, "elapsed_time": "1:33:37", "remaining_time": "0:04:20", "throughput": 4240.26, "total_tokens": 23818880} {"current_steps": 36475, "total_steps": 38160, "loss": 0.3856, "lr": 5.9346094714740615e-06, "epoch": 19.116876310272538, "percentage": 95.58, "elapsed_time": "1:33:38", "remaining_time": "0:04:19", "throughput": 4240.28, "total_tokens": 23822112} {"current_steps": 36480, "total_steps": 38160, "loss": 0.3513, "lr": 5.8995316019982425e-06, "epoch": 19.11949685534591, "percentage": 95.6, "elapsed_time": "1:33:38", "remaining_time": "0:04:18", "throughput": 4240.27, "total_tokens": 23824928} {"current_steps": 36485, "total_steps": 38160, "loss": 0.395, "lr": 5.8645570927034485e-06, "epoch": 19.122117400419288, "percentage": 95.61, "elapsed_time": "1:33:39", "remaining_time": "0:04:17", "throughput": 4240.33, "total_tokens": 23828512} {"current_steps": 36490, "total_steps": 38160, "loss": 0.4061, "lr": 5.8296859509058275e-06, "epoch": 19.12473794549266, "percentage": 95.62, "elapsed_time": "1:33:40", "remaining_time": "0:04:17", "throughput": 4240.35, "total_tokens": 23831616} {"current_steps": 36495, "total_steps": 38160, "loss": 0.4517, "lr": 5.794918183900155e-06, "epoch": 19.12735849056604, "percentage": 95.64, "elapsed_time": "1:33:41", "remaining_time": "0:04:16", "throughput": 4240.44, "total_tokens": 23835648} {"current_steps": 36500, "total_steps": 38160, "loss": 0.3552, "lr": 5.760253798959447e-06, "epoch": 19.129979035639412, "percentage": 95.65, "elapsed_time": "1:33:41", "remaining_time": "0:04:15", "throughput": 4240.52, "total_tokens": 23839424} {"current_steps": 36505, "total_steps": 38160, "loss": 0.5238, "lr": 5.725692803335015e-06, "epoch": 19.13259958071279, "percentage": 95.66, "elapsed_time": "1:33:42", "remaining_time": "0:04:14", "throughput": 4240.52, "total_tokens": 23842432} {"current_steps": 36510, "total_steps": 38160, "loss": 0.403, "lr": 5.691235204256739e-06, "epoch": 19.135220125786162, "percentage": 95.68, "elapsed_time": "1:33:43", "remaining_time": "0:04:14", "throughput": 4240.59, "total_tokens": 23846016} {"current_steps": 36515, "total_steps": 38160, "loss": 0.448, "lr": 5.65688100893258e-06, "epoch": 19.13784067085954, "percentage": 95.69, "elapsed_time": "1:33:44", "remaining_time": "0:04:13", "throughput": 4240.69, "total_tokens": 23850144} {"current_steps": 36520, "total_steps": 38160, "loss": 0.4274, "lr": 5.622630224549174e-06, "epoch": 19.140461215932913, "percentage": 95.7, "elapsed_time": "1:33:44", "remaining_time": "0:04:12", "throughput": 4240.7, "total_tokens": 23853216} {"current_steps": 36525, "total_steps": 38160, "loss": 0.3836, "lr": 5.588482858271404e-06, "epoch": 19.14308176100629, "percentage": 95.72, "elapsed_time": "1:33:45", "remaining_time": "0:04:11", "throughput": 4240.76, "total_tokens": 23856864} {"current_steps": 36530, "total_steps": 38160, "loss": 0.3228, "lr": 5.554438917242444e-06, "epoch": 19.145702306079663, "percentage": 95.73, "elapsed_time": "1:33:46", "remaining_time": "0:04:11", "throughput": 4240.8, "total_tokens": 23860192} {"current_steps": 36535, "total_steps": 38160, "loss": 0.4384, "lr": 5.520498408583985e-06, "epoch": 19.14832285115304, "percentage": 95.74, "elapsed_time": "1:33:47", "remaining_time": "0:04:10", "throughput": 4240.83, "total_tokens": 23863456} {"current_steps": 36540, "total_steps": 38160, "loss": 0.3376, "lr": 5.486661339395904e-06, "epoch": 19.150943396226417, "percentage": 95.75, "elapsed_time": "1:33:47", "remaining_time": "0:04:09", "throughput": 4240.84, "total_tokens": 23866432} {"current_steps": 36545, "total_steps": 38160, "loss": 0.4694, "lr": 5.452927716756595e-06, "epoch": 19.15356394129979, "percentage": 95.77, "elapsed_time": "1:33:48", "remaining_time": "0:04:08", "throughput": 4240.86, "total_tokens": 23869632} {"current_steps": 36550, "total_steps": 38160, "loss": 0.4495, "lr": 5.419297547722635e-06, "epoch": 19.156184486373167, "percentage": 95.78, "elapsed_time": "1:33:49", "remaining_time": "0:04:07", "throughput": 4240.87, "total_tokens": 23872864} {"current_steps": 36555, "total_steps": 38160, "loss": 0.4027, "lr": 5.385770839329229e-06, "epoch": 19.15880503144654, "percentage": 95.79, "elapsed_time": "1:33:49", "remaining_time": "0:04:07", "throughput": 4240.9, "total_tokens": 23876000} {"current_steps": 36560, "total_steps": 38160, "loss": 0.4504, "lr": 5.352347598589713e-06, "epoch": 19.161425576519918, "percentage": 95.81, "elapsed_time": "1:33:50", "remaining_time": "0:04:06", "throughput": 4240.96, "total_tokens": 23879616} {"current_steps": 36565, "total_steps": 38160, "loss": 0.4456, "lr": 5.319027832495826e-06, "epoch": 19.16404612159329, "percentage": 95.82, "elapsed_time": "1:33:51", "remaining_time": "0:04:05", "throughput": 4240.97, "total_tokens": 23882624} {"current_steps": 36570, "total_steps": 38160, "loss": 0.4198, "lr": 5.285811548017661e-06, "epoch": 19.166666666666668, "percentage": 95.83, "elapsed_time": "1:33:52", "remaining_time": "0:04:04", "throughput": 4241.04, "total_tokens": 23886304} {"current_steps": 36575, "total_steps": 38160, "loss": 0.397, "lr": 5.252698752103713e-06, "epoch": 19.16928721174004, "percentage": 95.85, "elapsed_time": "1:33:53", "remaining_time": "0:04:04", "throughput": 4241.15, "total_tokens": 23890624} {"current_steps": 36580, "total_steps": 38160, "loss": 0.4618, "lr": 5.219689451680832e-06, "epoch": 19.171907756813418, "percentage": 95.86, "elapsed_time": "1:33:53", "remaining_time": "0:04:03", "throughput": 4241.14, "total_tokens": 23893376} {"current_steps": 36585, "total_steps": 38160, "loss": 0.4258, "lr": 5.186783653654214e-06, "epoch": 19.17452830188679, "percentage": 95.87, "elapsed_time": "1:33:54", "remaining_time": "0:04:02", "throughput": 4241.17, "total_tokens": 23896608} {"current_steps": 36590, "total_steps": 38160, "loss": 0.3835, "lr": 5.153981364907245e-06, "epoch": 19.17714884696017, "percentage": 95.89, "elapsed_time": "1:33:55", "remaining_time": "0:04:01", "throughput": 4241.47, "total_tokens": 23903872} {"current_steps": 36595, "total_steps": 38160, "loss": 0.3508, "lr": 5.121282592301935e-06, "epoch": 19.179769392033542, "percentage": 95.9, "elapsed_time": "1:33:56", "remaining_time": "0:04:01", "throughput": 4241.49, "total_tokens": 23906912} {"current_steps": 36600, "total_steps": 38160, "loss": 0.4343, "lr": 5.088687342678422e-06, "epoch": 19.18238993710692, "percentage": 95.91, "elapsed_time": "1:33:57", "remaining_time": "0:04:00", "throughput": 4241.49, "total_tokens": 23909888} {"current_steps": 36605, "total_steps": 38160, "loss": 0.3698, "lr": 5.056195622855253e-06, "epoch": 19.185010482180292, "percentage": 95.93, "elapsed_time": "1:33:57", "remaining_time": "0:03:59", "throughput": 4241.56, "total_tokens": 23913568} {"current_steps": 36610, "total_steps": 38160, "loss": 0.4421, "lr": 5.023807439629324e-06, "epoch": 19.18763102725367, "percentage": 95.94, "elapsed_time": "1:33:58", "remaining_time": "0:03:58", "throughput": 4241.59, "total_tokens": 23916928} {"current_steps": 36615, "total_steps": 38160, "loss": 0.3717, "lr": 4.991522799775938e-06, "epoch": 19.190251572327043, "percentage": 95.95, "elapsed_time": "1:33:59", "remaining_time": "0:03:57", "throughput": 4241.59, "total_tokens": 23919840} {"current_steps": 36620, "total_steps": 38160, "loss": 0.4377, "lr": 4.9593417100485816e-06, "epoch": 19.19287211740042, "percentage": 95.96, "elapsed_time": "1:34:00", "remaining_time": "0:03:57", "throughput": 4241.6, "total_tokens": 23922944} {"current_steps": 36625, "total_steps": 38160, "loss": 0.4592, "lr": 4.927264177179258e-06, "epoch": 19.195492662473793, "percentage": 95.98, "elapsed_time": "1:34:00", "remaining_time": "0:03:56", "throughput": 4241.66, "total_tokens": 23926592} {"current_steps": 36630, "total_steps": 38160, "loss": 0.3532, "lr": 4.895290207878156e-06, "epoch": 19.19811320754717, "percentage": 95.99, "elapsed_time": "1:34:01", "remaining_time": "0:03:55", "throughput": 4241.67, "total_tokens": 23929632} {"current_steps": 36635, "total_steps": 38160, "loss": 0.496, "lr": 4.863419808833924e-06, "epoch": 19.200733752620547, "percentage": 96.0, "elapsed_time": "1:34:02", "remaining_time": "0:03:54", "throughput": 4241.73, "total_tokens": 23933216} {"current_steps": 36640, "total_steps": 38160, "loss": 0.3379, "lr": 4.831652986713453e-06, "epoch": 19.20335429769392, "percentage": 96.02, "elapsed_time": "1:34:03", "remaining_time": "0:03:54", "throughput": 4241.76, "total_tokens": 23936416} {"current_steps": 36645, "total_steps": 38160, "loss": 0.4801, "lr": 4.799989748161926e-06, "epoch": 19.205974842767297, "percentage": 96.03, "elapsed_time": "1:34:03", "remaining_time": "0:03:53", "throughput": 4241.75, "total_tokens": 23939264} {"current_steps": 36650, "total_steps": 38160, "loss": 0.3326, "lr": 4.768430099803101e-06, "epoch": 19.20859538784067, "percentage": 96.04, "elapsed_time": "1:34:04", "remaining_time": "0:03:52", "throughput": 4241.92, "total_tokens": 23944192} {"current_steps": 36655, "total_steps": 38160, "loss": 0.4397, "lr": 4.736974048238696e-06, "epoch": 19.211215932914047, "percentage": 96.06, "elapsed_time": "1:34:05", "remaining_time": "0:03:51", "throughput": 4241.9, "total_tokens": 23946880} {"current_steps": 36660, "total_steps": 38160, "loss": 0.5137, "lr": 4.705621600049115e-06, "epoch": 19.21383647798742, "percentage": 96.07, "elapsed_time": "1:34:05", "remaining_time": "0:03:51", "throughput": 4241.85, "total_tokens": 23949184} {"current_steps": 36665, "total_steps": 38160, "loss": 0.3407, "lr": 4.674372761792889e-06, "epoch": 19.216457023060798, "percentage": 96.08, "elapsed_time": "1:34:06", "remaining_time": "0:03:50", "throughput": 4241.86, "total_tokens": 23952256} {"current_steps": 36670, "total_steps": 38160, "loss": 0.3997, "lr": 4.6432275400069e-06, "epoch": 19.21907756813417, "percentage": 96.1, "elapsed_time": "1:34:07", "remaining_time": "0:03:49", "throughput": 4241.84, "total_tokens": 23954912} {"current_steps": 36675, "total_steps": 38160, "loss": 0.4271, "lr": 4.6121859412063264e-06, "epoch": 19.221698113207548, "percentage": 96.11, "elapsed_time": "1:34:08", "remaining_time": "0:03:48", "throughput": 4241.9, "total_tokens": 23958496} {"current_steps": 36680, "total_steps": 38160, "loss": 0.4178, "lr": 4.581247971884861e-06, "epoch": 19.22431865828092, "percentage": 96.12, "elapsed_time": "1:34:08", "remaining_time": "0:03:47", "throughput": 4241.89, "total_tokens": 23961408} {"current_steps": 36685, "total_steps": 38160, "loss": 0.3836, "lr": 4.550413638514217e-06, "epoch": 19.2269392033543, "percentage": 96.13, "elapsed_time": "1:34:09", "remaining_time": "0:03:47", "throughput": 4241.88, "total_tokens": 23964160} {"current_steps": 36690, "total_steps": 38160, "loss": 0.5501, "lr": 4.519682947544679e-06, "epoch": 19.229559748427672, "percentage": 96.15, "elapsed_time": "1:34:10", "remaining_time": "0:03:46", "throughput": 4241.87, "total_tokens": 23966784} {"current_steps": 36695, "total_steps": 38160, "loss": 0.5166, "lr": 4.489055905404715e-06, "epoch": 19.23218029350105, "percentage": 96.16, "elapsed_time": "1:34:10", "remaining_time": "0:03:45", "throughput": 4241.86, "total_tokens": 23969664} {"current_steps": 36700, "total_steps": 38160, "loss": 0.3685, "lr": 4.4585325185012014e-06, "epoch": 19.234800838574422, "percentage": 96.17, "elapsed_time": "1:34:11", "remaining_time": "0:03:44", "throughput": 4241.88, "total_tokens": 23972736} {"current_steps": 36705, "total_steps": 38160, "loss": 0.3192, "lr": 4.428112793219197e-06, "epoch": 19.2374213836478, "percentage": 96.19, "elapsed_time": "1:34:12", "remaining_time": "0:03:44", "throughput": 4241.91, "total_tokens": 23976064} {"current_steps": 36710, "total_steps": 38160, "loss": 0.5054, "lr": 4.397796735922277e-06, "epoch": 19.240041928721173, "percentage": 96.2, "elapsed_time": "1:34:12", "remaining_time": "0:03:43", "throughput": 4241.92, "total_tokens": 23978976} {"current_steps": 36715, "total_steps": 38160, "loss": 0.4896, "lr": 4.367584352952092e-06, "epoch": 19.24266247379455, "percentage": 96.21, "elapsed_time": "1:34:13", "remaining_time": "0:03:42", "throughput": 4241.93, "total_tokens": 23981984} {"current_steps": 36720, "total_steps": 38160, "loss": 0.4702, "lr": 4.337475650628808e-06, "epoch": 19.245283018867923, "percentage": 96.23, "elapsed_time": "1:34:14", "remaining_time": "0:03:41", "throughput": 4241.92, "total_tokens": 23984864} {"current_steps": 36725, "total_steps": 38160, "loss": 0.5824, "lr": 4.307470635250832e-06, "epoch": 19.2479035639413, "percentage": 96.24, "elapsed_time": "1:34:14", "remaining_time": "0:03:40", "throughput": 4241.97, "total_tokens": 23988288} {"current_steps": 36730, "total_steps": 38160, "loss": 0.3417, "lr": 4.277569313094809e-06, "epoch": 19.250524109014677, "percentage": 96.25, "elapsed_time": "1:34:15", "remaining_time": "0:03:40", "throughput": 4242.03, "total_tokens": 23991808} {"current_steps": 36735, "total_steps": 38160, "loss": 0.4659, "lr": 4.247771690415791e-06, "epoch": 19.25314465408805, "percentage": 96.27, "elapsed_time": "1:34:16", "remaining_time": "0:03:39", "throughput": 4242.13, "total_tokens": 23995840} {"current_steps": 36740, "total_steps": 38160, "loss": 0.4566, "lr": 4.218077773447071e-06, "epoch": 19.255765199161427, "percentage": 96.28, "elapsed_time": "1:34:17", "remaining_time": "0:03:38", "throughput": 4242.09, "total_tokens": 23998304} {"current_steps": 36745, "total_steps": 38160, "loss": 0.4139, "lr": 4.1884875684003455e-06, "epoch": 19.2583857442348, "percentage": 96.29, "elapsed_time": "1:34:17", "remaining_time": "0:03:37", "throughput": 4242.05, "total_tokens": 24000608} {"current_steps": 36750, "total_steps": 38160, "loss": 0.4733, "lr": 4.159001081465497e-06, "epoch": 19.261006289308177, "percentage": 96.31, "elapsed_time": "1:34:18", "remaining_time": "0:03:37", "throughput": 4242.08, "total_tokens": 24003808} {"current_steps": 36755, "total_steps": 38160, "loss": 0.3815, "lr": 4.129618318810702e-06, "epoch": 19.26362683438155, "percentage": 96.32, "elapsed_time": "1:34:19", "remaining_time": "0:03:36", "throughput": 4242.09, "total_tokens": 24006784} {"current_steps": 36760, "total_steps": 38160, "loss": 0.4085, "lr": 4.100339286582655e-06, "epoch": 19.266247379454928, "percentage": 96.33, "elapsed_time": "1:34:19", "remaining_time": "0:03:35", "throughput": 4242.07, "total_tokens": 24009376} {"current_steps": 36765, "total_steps": 38160, "loss": 0.3946, "lr": 4.071163990906068e-06, "epoch": 19.2688679245283, "percentage": 96.34, "elapsed_time": "1:34:20", "remaining_time": "0:03:34", "throughput": 4242.14, "total_tokens": 24013120} {"current_steps": 36770, "total_steps": 38160, "loss": 0.4732, "lr": 4.042092437884115e-06, "epoch": 19.271488469601678, "percentage": 96.36, "elapsed_time": "1:34:21", "remaining_time": "0:03:34", "throughput": 4242.17, "total_tokens": 24016384} {"current_steps": 36775, "total_steps": 38160, "loss": 0.383, "lr": 4.013124633598264e-06, "epoch": 19.27410901467505, "percentage": 96.37, "elapsed_time": "1:34:22", "remaining_time": "0:03:33", "throughput": 4242.27, "total_tokens": 24020416} {"current_steps": 36780, "total_steps": 38160, "loss": 0.3604, "lr": 3.984260584108168e-06, "epoch": 19.27672955974843, "percentage": 96.38, "elapsed_time": "1:34:22", "remaining_time": "0:03:32", "throughput": 4242.33, "total_tokens": 24024096} {"current_steps": 36785, "total_steps": 38160, "loss": 0.3077, "lr": 3.955500295451942e-06, "epoch": 19.279350104821802, "percentage": 96.4, "elapsed_time": "1:34:23", "remaining_time": "0:03:31", "throughput": 4242.27, "total_tokens": 24026336} {"current_steps": 36790, "total_steps": 38160, "loss": 0.2307, "lr": 3.926843773645883e-06, "epoch": 19.28197064989518, "percentage": 96.41, "elapsed_time": "1:34:24", "remaining_time": "0:03:30", "throughput": 4242.23, "total_tokens": 24028736} {"current_steps": 36795, "total_steps": 38160, "loss": 0.4735, "lr": 3.8982910246846415e-06, "epoch": 19.284591194968552, "percentage": 96.42, "elapsed_time": "1:34:24", "remaining_time": "0:03:30", "throughput": 4242.25, "total_tokens": 24031936} {"current_steps": 36800, "total_steps": 38160, "loss": 0.3575, "lr": 3.869842054541051e-06, "epoch": 19.28721174004193, "percentage": 96.44, "elapsed_time": "1:34:25", "remaining_time": "0:03:29", "throughput": 4242.25, "total_tokens": 24034752} {"current_steps": 36805, "total_steps": 38160, "loss": 0.4016, "lr": 3.84149686916635e-06, "epoch": 19.289832285115303, "percentage": 96.45, "elapsed_time": "1:34:26", "remaining_time": "0:03:28", "throughput": 4242.3, "total_tokens": 24038208} {"current_steps": 36810, "total_steps": 38160, "loss": 0.4909, "lr": 3.8132554744900183e-06, "epoch": 19.29245283018868, "percentage": 96.46, "elapsed_time": "1:34:27", "remaining_time": "0:03:27", "throughput": 4242.31, "total_tokens": 24041312} {"current_steps": 36815, "total_steps": 38160, "loss": 0.3829, "lr": 3.7851178764198302e-06, "epoch": 19.295073375262053, "percentage": 96.48, "elapsed_time": "1:34:27", "remaining_time": "0:03:27", "throughput": 4242.32, "total_tokens": 24044160} {"current_steps": 36820, "total_steps": 38160, "loss": 0.3412, "lr": 3.7570840808419104e-06, "epoch": 19.29769392033543, "percentage": 96.49, "elapsed_time": "1:34:28", "remaining_time": "0:03:26", "throughput": 4242.32, "total_tokens": 24047040} {"current_steps": 36825, "total_steps": 38160, "loss": 0.4637, "lr": 3.729154093620568e-06, "epoch": 19.300314465408803, "percentage": 96.5, "elapsed_time": "1:34:29", "remaining_time": "0:03:25", "throughput": 4242.38, "total_tokens": 24050720} {"current_steps": 36830, "total_steps": 38160, "loss": 0.3157, "lr": 3.7013279205984073e-06, "epoch": 19.30293501048218, "percentage": 96.51, "elapsed_time": "1:34:29", "remaining_time": "0:03:24", "throughput": 4242.42, "total_tokens": 24054048} {"current_steps": 36835, "total_steps": 38160, "loss": 0.4594, "lr": 3.6736055675963275e-06, "epoch": 19.305555555555557, "percentage": 96.53, "elapsed_time": "1:34:30", "remaining_time": "0:03:23", "throughput": 4242.44, "total_tokens": 24057152} {"current_steps": 36840, "total_steps": 38160, "loss": 0.3191, "lr": 3.645987040413634e-06, "epoch": 19.30817610062893, "percentage": 96.54, "elapsed_time": "1:34:31", "remaining_time": "0:03:23", "throughput": 4242.5, "total_tokens": 24060800} {"current_steps": 36845, "total_steps": 38160, "loss": 0.3416, "lr": 3.6184723448277056e-06, "epoch": 19.310796645702307, "percentage": 96.55, "elapsed_time": "1:34:32", "remaining_time": "0:03:22", "throughput": 4242.53, "total_tokens": 24064032} {"current_steps": 36850, "total_steps": 38160, "loss": 0.3831, "lr": 3.5910614865943826e-06, "epoch": 19.31341719077568, "percentage": 96.57, "elapsed_time": "1:34:32", "remaining_time": "0:03:21", "throughput": 4242.61, "total_tokens": 24067808} {"current_steps": 36855, "total_steps": 38160, "loss": 0.4656, "lr": 3.563754471447689e-06, "epoch": 19.316037735849058, "percentage": 96.58, "elapsed_time": "1:34:33", "remaining_time": "0:03:20", "throughput": 4242.69, "total_tokens": 24071680} {"current_steps": 36860, "total_steps": 38160, "loss": 0.4139, "lr": 3.5365513050998334e-06, "epoch": 19.31865828092243, "percentage": 96.59, "elapsed_time": "1:34:34", "remaining_time": "0:03:20", "throughput": 4242.67, "total_tokens": 24074336} {"current_steps": 36865, "total_steps": 38160, "loss": 0.6446, "lr": 3.5094519932415414e-06, "epoch": 19.321278825995808, "percentage": 96.61, "elapsed_time": "1:34:34", "remaining_time": "0:03:19", "throughput": 4242.67, "total_tokens": 24077152} {"current_steps": 36870, "total_steps": 38160, "loss": 0.3744, "lr": 3.4824565415416123e-06, "epoch": 19.32389937106918, "percentage": 96.62, "elapsed_time": "1:34:35", "remaining_time": "0:03:18", "throughput": 4242.64, "total_tokens": 24079744} {"current_steps": 36875, "total_steps": 38160, "loss": 0.5341, "lr": 3.4555649556471946e-06, "epoch": 19.32651991614256, "percentage": 96.63, "elapsed_time": "1:34:36", "remaining_time": "0:03:17", "throughput": 4242.67, "total_tokens": 24083008} {"current_steps": 36880, "total_steps": 38160, "loss": 0.3709, "lr": 3.4287772411837338e-06, "epoch": 19.329140461215932, "percentage": 96.65, "elapsed_time": "1:34:37", "remaining_time": "0:03:17", "throughput": 4242.67, "total_tokens": 24085984} {"current_steps": 36885, "total_steps": 38160, "loss": 0.4106, "lr": 3.402093403754858e-06, "epoch": 19.33176100628931, "percentage": 96.66, "elapsed_time": "1:34:37", "remaining_time": "0:03:16", "throughput": 4242.69, "total_tokens": 24089024} {"current_steps": 36890, "total_steps": 38160, "loss": 0.3902, "lr": 3.375513448942602e-06, "epoch": 19.334381551362682, "percentage": 96.67, "elapsed_time": "1:34:38", "remaining_time": "0:03:15", "throughput": 4242.78, "total_tokens": 24093056} {"current_steps": 36895, "total_steps": 38160, "loss": 0.4232, "lr": 3.349037382307074e-06, "epoch": 19.33700209643606, "percentage": 96.69, "elapsed_time": "1:34:39", "remaining_time": "0:03:14", "throughput": 4242.82, "total_tokens": 24096448} {"current_steps": 36900, "total_steps": 38160, "loss": 0.4204, "lr": 3.322665209386899e-06, "epoch": 19.339622641509433, "percentage": 96.7, "elapsed_time": "1:34:39", "remaining_time": "0:03:13", "throughput": 4242.76, "total_tokens": 24098592} {"current_steps": 36905, "total_steps": 38160, "loss": 0.4133, "lr": 3.29639693569872e-06, "epoch": 19.34224318658281, "percentage": 96.71, "elapsed_time": "1:34:40", "remaining_time": "0:03:13", "throughput": 4242.71, "total_tokens": 24100864} {"current_steps": 36910, "total_steps": 38160, "loss": 0.428, "lr": 3.270232566737641e-06, "epoch": 19.344863731656183, "percentage": 96.72, "elapsed_time": "1:34:41", "remaining_time": "0:03:12", "throughput": 4242.71, "total_tokens": 24103680} {"current_steps": 36915, "total_steps": 38160, "loss": 0.4766, "lr": 3.244172107976895e-06, "epoch": 19.34748427672956, "percentage": 96.74, "elapsed_time": "1:34:41", "remaining_time": "0:03:11", "throughput": 4242.73, "total_tokens": 24106784} {"current_steps": 36920, "total_steps": 38160, "loss": 0.3937, "lr": 3.2182155648680657e-06, "epoch": 19.350104821802937, "percentage": 96.75, "elapsed_time": "1:34:42", "remaining_time": "0:03:10", "throughput": 4242.78, "total_tokens": 24110208} {"current_steps": 36925, "total_steps": 38160, "loss": 0.4333, "lr": 3.1923629428409205e-06, "epoch": 19.35272536687631, "percentage": 96.76, "elapsed_time": "1:34:43", "remaining_time": "0:03:10", "throughput": 4242.78, "total_tokens": 24113216} {"current_steps": 36930, "total_steps": 38160, "loss": 0.4586, "lr": 3.166614247303634e-06, "epoch": 19.355345911949687, "percentage": 96.78, "elapsed_time": "1:34:44", "remaining_time": "0:03:09", "throughput": 4242.79, "total_tokens": 24116192} {"current_steps": 36935, "total_steps": 38160, "loss": 0.3862, "lr": 3.140969483642453e-06, "epoch": 19.35796645702306, "percentage": 96.79, "elapsed_time": "1:34:44", "remaining_time": "0:03:08", "throughput": 4242.8, "total_tokens": 24119200} {"current_steps": 36940, "total_steps": 38160, "loss": 0.5045, "lr": 3.1154286572219747e-06, "epoch": 19.360587002096437, "percentage": 96.8, "elapsed_time": "1:34:45", "remaining_time": "0:03:07", "throughput": 4242.87, "total_tokens": 24122912} {"current_steps": 36945, "total_steps": 38160, "loss": 0.5067, "lr": 3.089991773385037e-06, "epoch": 19.36320754716981, "percentage": 96.82, "elapsed_time": "1:34:46", "remaining_time": "0:03:07", "throughput": 4242.87, "total_tokens": 24125760} {"current_steps": 36950, "total_steps": 38160, "loss": 0.3394, "lr": 3.064658837452772e-06, "epoch": 19.365828092243188, "percentage": 96.83, "elapsed_time": "1:34:46", "remaining_time": "0:03:06", "throughput": 4242.92, "total_tokens": 24129280} {"current_steps": 36955, "total_steps": 38160, "loss": 0.331, "lr": 3.0394298547246068e-06, "epoch": 19.36844863731656, "percentage": 96.84, "elapsed_time": "1:34:47", "remaining_time": "0:03:05", "throughput": 4242.91, "total_tokens": 24132000} {"current_steps": 36960, "total_steps": 38160, "loss": 0.3204, "lr": 3.0143048304779875e-06, "epoch": 19.371069182389938, "percentage": 96.86, "elapsed_time": "1:34:48", "remaining_time": "0:03:04", "throughput": 4242.97, "total_tokens": 24135808} {"current_steps": 36965, "total_steps": 38160, "loss": 0.5266, "lr": 2.989283769968987e-06, "epoch": 19.37368972746331, "percentage": 96.87, "elapsed_time": "1:34:49", "remaining_time": "0:03:03", "throughput": 4243.01, "total_tokens": 24139040} {"current_steps": 36970, "total_steps": 38160, "loss": 0.4234, "lr": 2.964366678431585e-06, "epoch": 19.37631027253669, "percentage": 96.88, "elapsed_time": "1:34:49", "remaining_time": "0:03:03", "throughput": 4242.99, "total_tokens": 24141760} {"current_steps": 36975, "total_steps": 38160, "loss": 0.4753, "lr": 2.9395535610781678e-06, "epoch": 19.378930817610062, "percentage": 96.89, "elapsed_time": "1:34:50", "remaining_time": "0:03:02", "throughput": 4243.05, "total_tokens": 24145216} {"current_steps": 36980, "total_steps": 38160, "loss": 0.4416, "lr": 2.9148444230994166e-06, "epoch": 19.38155136268344, "percentage": 96.91, "elapsed_time": "1:34:51", "remaining_time": "0:03:01", "throughput": 4243.07, "total_tokens": 24148320} {"current_steps": 36985, "total_steps": 38160, "loss": 0.3754, "lr": 2.890239269664141e-06, "epoch": 19.384171907756812, "percentage": 96.92, "elapsed_time": "1:34:51", "remaining_time": "0:03:00", "throughput": 4243.04, "total_tokens": 24150816} {"current_steps": 36990, "total_steps": 38160, "loss": 0.4326, "lr": 2.8657381059194466e-06, "epoch": 19.38679245283019, "percentage": 96.93, "elapsed_time": "1:34:52", "remaining_time": "0:03:00", "throughput": 4243.05, "total_tokens": 24153760} {"current_steps": 36995, "total_steps": 38160, "loss": 0.5218, "lr": 2.8413409369907885e-06, "epoch": 19.389412997903563, "percentage": 96.95, "elapsed_time": "1:34:53", "remaining_time": "0:02:59", "throughput": 4243.05, "total_tokens": 24156800} {"current_steps": 37000, "total_steps": 38160, "loss": 0.464, "lr": 2.817047767981695e-06, "epoch": 19.39203354297694, "percentage": 96.96, "elapsed_time": "1:34:54", "remaining_time": "0:02:58", "throughput": 4243.13, "total_tokens": 24160736} {"current_steps": 37005, "total_steps": 38160, "loss": 0.3649, "lr": 2.7928586039740466e-06, "epoch": 19.394654088050313, "percentage": 96.97, "elapsed_time": "1:34:54", "remaining_time": "0:02:57", "throughput": 4243.11, "total_tokens": 24163424} {"current_steps": 37010, "total_steps": 38160, "loss": 0.3874, "lr": 2.7687734500279615e-06, "epoch": 19.39727463312369, "percentage": 96.99, "elapsed_time": "1:34:55", "remaining_time": "0:02:56", "throughput": 4243.16, "total_tokens": 24166880} {"current_steps": 37015, "total_steps": 38160, "loss": 0.4761, "lr": 2.744792311181743e-06, "epoch": 19.399895178197063, "percentage": 97.0, "elapsed_time": "1:34:56", "remaining_time": "0:02:56", "throughput": 4243.18, "total_tokens": 24169984} {"current_steps": 37020, "total_steps": 38160, "loss": 0.5184, "lr": 2.720915192451989e-06, "epoch": 19.40251572327044, "percentage": 97.01, "elapsed_time": "1:34:56", "remaining_time": "0:02:55", "throughput": 4243.21, "total_tokens": 24173248} {"current_steps": 37025, "total_steps": 38160, "loss": 0.3636, "lr": 2.697142098833538e-06, "epoch": 19.405136268343817, "percentage": 97.03, "elapsed_time": "1:34:57", "remaining_time": "0:02:54", "throughput": 4243.24, "total_tokens": 24176512} {"current_steps": 37030, "total_steps": 38160, "loss": 0.4628, "lr": 2.6734730352993563e-06, "epoch": 19.40775681341719, "percentage": 97.04, "elapsed_time": "1:34:58", "remaining_time": "0:02:53", "throughput": 4243.23, "total_tokens": 24179296} {"current_steps": 37035, "total_steps": 38160, "loss": 0.4756, "lr": 2.649908006800872e-06, "epoch": 19.410377358490567, "percentage": 97.05, "elapsed_time": "1:34:59", "remaining_time": "0:02:53", "throughput": 4243.31, "total_tokens": 24183008} {"current_steps": 37040, "total_steps": 38160, "loss": 0.4671, "lr": 2.626447018267586e-06, "epoch": 19.41299790356394, "percentage": 97.06, "elapsed_time": "1:34:59", "remaining_time": "0:02:52", "throughput": 4243.32, "total_tokens": 24186048} {"current_steps": 37045, "total_steps": 38160, "loss": 0.3539, "lr": 2.603090074607184e-06, "epoch": 19.415618448637318, "percentage": 97.08, "elapsed_time": "1:35:00", "remaining_time": "0:02:51", "throughput": 4243.29, "total_tokens": 24188640} {"current_steps": 37050, "total_steps": 38160, "loss": 0.3424, "lr": 2.579837180705813e-06, "epoch": 19.41823899371069, "percentage": 97.09, "elapsed_time": "1:35:01", "remaining_time": "0:02:50", "throughput": 4243.25, "total_tokens": 24191040} {"current_steps": 37055, "total_steps": 38160, "loss": 0.4477, "lr": 2.556688341427582e-06, "epoch": 19.420859538784068, "percentage": 97.1, "elapsed_time": "1:35:01", "remaining_time": "0:02:50", "throughput": 4243.26, "total_tokens": 24194016} {"current_steps": 37060, "total_steps": 38160, "loss": 0.3842, "lr": 2.5336435616150066e-06, "epoch": 19.42348008385744, "percentage": 97.12, "elapsed_time": "1:35:02", "remaining_time": "0:02:49", "throughput": 4243.21, "total_tokens": 24196320} {"current_steps": 37065, "total_steps": 38160, "loss": 0.478, "lr": 2.510702846088786e-06, "epoch": 19.42610062893082, "percentage": 97.13, "elapsed_time": "1:35:03", "remaining_time": "0:02:48", "throughput": 4243.23, "total_tokens": 24199456} {"current_steps": 37070, "total_steps": 38160, "loss": 0.4243, "lr": 2.487866199647915e-06, "epoch": 19.428721174004192, "percentage": 97.14, "elapsed_time": "1:35:03", "remaining_time": "0:02:47", "throughput": 4243.27, "total_tokens": 24202848} {"current_steps": 37075, "total_steps": 38160, "loss": 0.4631, "lr": 2.4651336270695156e-06, "epoch": 19.43134171907757, "percentage": 97.16, "elapsed_time": "1:35:04", "remaining_time": "0:02:46", "throughput": 4243.3, "total_tokens": 24206016} {"current_steps": 37080, "total_steps": 38160, "loss": 0.5147, "lr": 2.442505133108952e-06, "epoch": 19.433962264150942, "percentage": 97.17, "elapsed_time": "1:35:05", "remaining_time": "0:02:46", "throughput": 4243.28, "total_tokens": 24208768} {"current_steps": 37085, "total_steps": 38160, "loss": 0.4506, "lr": 2.419980722499937e-06, "epoch": 19.43658280922432, "percentage": 97.18, "elapsed_time": "1:35:05", "remaining_time": "0:02:45", "throughput": 4243.33, "total_tokens": 24212320} {"current_steps": 37090, "total_steps": 38160, "loss": 0.3342, "lr": 2.397560399954202e-06, "epoch": 19.439203354297693, "percentage": 97.2, "elapsed_time": "1:35:06", "remaining_time": "0:02:44", "throughput": 4243.33, "total_tokens": 24215232} {"current_steps": 37095, "total_steps": 38160, "loss": 0.4464, "lr": 2.3752441701618833e-06, "epoch": 19.44182389937107, "percentage": 97.21, "elapsed_time": "1:35:07", "remaining_time": "0:02:43", "throughput": 4243.36, "total_tokens": 24218336} {"current_steps": 37100, "total_steps": 38160, "loss": 0.3813, "lr": 2.3530320377913027e-06, "epoch": 19.444444444444443, "percentage": 97.22, "elapsed_time": "1:35:08", "remaining_time": "0:02:43", "throughput": 4243.43, "total_tokens": 24222176} {"current_steps": 37105, "total_steps": 38160, "loss": 0.5679, "lr": 2.3309240074890213e-06, "epoch": 19.44706498951782, "percentage": 97.24, "elapsed_time": "1:35:08", "remaining_time": "0:02:42", "throughput": 4243.47, "total_tokens": 24225536} {"current_steps": 37110, "total_steps": 38160, "loss": 0.5769, "lr": 2.3089200838796176e-06, "epoch": 19.449685534591197, "percentage": 97.25, "elapsed_time": "1:35:09", "remaining_time": "0:02:41", "throughput": 4243.46, "total_tokens": 24228352} {"current_steps": 37115, "total_steps": 38160, "loss": 0.5192, "lr": 2.2870202715662426e-06, "epoch": 19.45230607966457, "percentage": 97.26, "elapsed_time": "1:35:10", "remaining_time": "0:02:40", "throughput": 4243.45, "total_tokens": 24231168} {"current_steps": 37120, "total_steps": 38160, "loss": 0.3147, "lr": 2.265224575130009e-06, "epoch": 19.454926624737947, "percentage": 97.27, "elapsed_time": "1:35:11", "remaining_time": "0:02:40", "throughput": 4243.69, "total_tokens": 24237184} {"current_steps": 37125, "total_steps": 38160, "loss": 0.4688, "lr": 2.2435329991303268e-06, "epoch": 19.45754716981132, "percentage": 97.29, "elapsed_time": "1:35:12", "remaining_time": "0:02:39", "throughput": 4243.74, "total_tokens": 24240672} {"current_steps": 37130, "total_steps": 38160, "loss": 0.4493, "lr": 2.2219455481047868e-06, "epoch": 19.460167714884697, "percentage": 97.3, "elapsed_time": "1:35:12", "remaining_time": "0:02:38", "throughput": 4243.77, "total_tokens": 24244032} {"current_steps": 37135, "total_steps": 38160, "loss": 0.3415, "lr": 2.2004622265693886e-06, "epoch": 19.46278825995807, "percentage": 97.31, "elapsed_time": "1:35:13", "remaining_time": "0:02:37", "throughput": 4243.73, "total_tokens": 24246496} {"current_steps": 37140, "total_steps": 38160, "loss": 0.3599, "lr": 2.179083039018037e-06, "epoch": 19.465408805031448, "percentage": 97.33, "elapsed_time": "1:35:14", "remaining_time": "0:02:36", "throughput": 4243.73, "total_tokens": 24249376} {"current_steps": 37145, "total_steps": 38160, "loss": 0.3681, "lr": 2.157807989923044e-06, "epoch": 19.46802935010482, "percentage": 97.34, "elapsed_time": "1:35:14", "remaining_time": "0:02:36", "throughput": 4243.73, "total_tokens": 24252288} {"current_steps": 37150, "total_steps": 38160, "loss": 0.3715, "lr": 2.1366370837349603e-06, "epoch": 19.470649895178198, "percentage": 97.35, "elapsed_time": "1:35:15", "remaining_time": "0:02:35", "throughput": 4243.66, "total_tokens": 24254432} {"current_steps": 37155, "total_steps": 38160, "loss": 0.5126, "lr": 2.1155703248825207e-06, "epoch": 19.47327044025157, "percentage": 97.37, "elapsed_time": "1:35:16", "remaining_time": "0:02:34", "throughput": 4243.66, "total_tokens": 24257408} {"current_steps": 37160, "total_steps": 38160, "loss": 0.4013, "lr": 2.094607717772534e-06, "epoch": 19.47589098532495, "percentage": 97.38, "elapsed_time": "1:35:16", "remaining_time": "0:02:33", "throughput": 4243.66, "total_tokens": 24260224} {"current_steps": 37165, "total_steps": 38160, "loss": 0.4835, "lr": 2.0737492667902702e-06, "epoch": 19.478511530398322, "percentage": 97.39, "elapsed_time": "1:35:17", "remaining_time": "0:02:33", "throughput": 4243.67, "total_tokens": 24263200} {"current_steps": 37170, "total_steps": 38160, "loss": 0.4686, "lr": 2.0529949762989608e-06, "epoch": 19.4811320754717, "percentage": 97.41, "elapsed_time": "1:35:18", "remaining_time": "0:02:32", "throughput": 4243.68, "total_tokens": 24266240} {"current_steps": 37175, "total_steps": 38160, "loss": 0.3473, "lr": 2.032344850640244e-06, "epoch": 19.483752620545072, "percentage": 97.42, "elapsed_time": "1:35:19", "remaining_time": "0:02:31", "throughput": 4243.81, "total_tokens": 24270656} {"current_steps": 37180, "total_steps": 38160, "loss": 0.4146, "lr": 2.011798894133887e-06, "epoch": 19.48637316561845, "percentage": 97.43, "elapsed_time": "1:35:19", "remaining_time": "0:02:30", "throughput": 4243.85, "total_tokens": 24274016} {"current_steps": 37185, "total_steps": 38160, "loss": 0.4573, "lr": 1.9913571110777852e-06, "epoch": 19.488993710691823, "percentage": 97.44, "elapsed_time": "1:35:20", "remaining_time": "0:02:29", "throughput": 4243.89, "total_tokens": 24277536} {"current_steps": 37190, "total_steps": 38160, "loss": 0.4199, "lr": 1.971019505748295e-06, "epoch": 19.4916142557652, "percentage": 97.46, "elapsed_time": "1:35:21", "remaining_time": "0:02:29", "throughput": 4243.87, "total_tokens": 24280192} {"current_steps": 37195, "total_steps": 38160, "loss": 0.4423, "lr": 1.9507860823996803e-06, "epoch": 19.494234800838573, "percentage": 97.47, "elapsed_time": "1:35:21", "remaining_time": "0:02:28", "throughput": 4243.88, "total_tokens": 24283232} {"current_steps": 37200, "total_steps": 38160, "loss": 0.4548, "lr": 1.9306568452645e-06, "epoch": 19.49685534591195, "percentage": 97.48, "elapsed_time": "1:35:22", "remaining_time": "0:02:27", "throughput": 4243.9, "total_tokens": 24286368} {"current_steps": 37205, "total_steps": 38160, "loss": 0.404, "lr": 1.910631798553664e-06, "epoch": 19.499475890985323, "percentage": 97.5, "elapsed_time": "1:35:23", "remaining_time": "0:02:26", "throughput": 4243.97, "total_tokens": 24289952} {"current_steps": 37210, "total_steps": 38160, "loss": 0.362, "lr": 1.8907109464562088e-06, "epoch": 19.5020964360587, "percentage": 97.51, "elapsed_time": "1:35:24", "remaining_time": "0:02:26", "throughput": 4244.05, "total_tokens": 24293952} {"current_steps": 37215, "total_steps": 38160, "loss": 0.397, "lr": 1.870894293139247e-06, "epoch": 19.504716981132077, "percentage": 97.52, "elapsed_time": "1:35:24", "remaining_time": "0:02:25", "throughput": 4244.09, "total_tokens": 24297216} {"current_steps": 37220, "total_steps": 38160, "loss": 0.3342, "lr": 1.8511818427482396e-06, "epoch": 19.50733752620545, "percentage": 97.54, "elapsed_time": "1:35:25", "remaining_time": "0:02:24", "throughput": 4244.1, "total_tokens": 24300288} {"current_steps": 37225, "total_steps": 38160, "loss": 0.4321, "lr": 1.8315735994068327e-06, "epoch": 19.509958071278827, "percentage": 97.55, "elapsed_time": "1:35:26", "remaining_time": "0:02:23", "throughput": 4244.12, "total_tokens": 24303328} {"current_steps": 37230, "total_steps": 38160, "loss": 0.6623, "lr": 1.8120695672168009e-06, "epoch": 19.5125786163522, "percentage": 97.56, "elapsed_time": "1:35:27", "remaining_time": "0:02:23", "throughput": 4244.15, "total_tokens": 24306560} {"current_steps": 37235, "total_steps": 38160, "loss": 0.4198, "lr": 1.792669750258158e-06, "epoch": 19.515199161425578, "percentage": 97.58, "elapsed_time": "1:35:27", "remaining_time": "0:02:22", "throughput": 4244.18, "total_tokens": 24309760} {"current_steps": 37240, "total_steps": 38160, "loss": 0.5406, "lr": 1.7733741525892134e-06, "epoch": 19.51781970649895, "percentage": 97.59, "elapsed_time": "1:35:28", "remaining_time": "0:02:21", "throughput": 4244.25, "total_tokens": 24313504} {"current_steps": 37245, "total_steps": 38160, "loss": 0.4763, "lr": 1.7541827782462937e-06, "epoch": 19.520440251572328, "percentage": 97.6, "elapsed_time": "1:35:29", "remaining_time": "0:02:20", "throughput": 4244.27, "total_tokens": 24316800} {"current_steps": 37250, "total_steps": 38160, "loss": 0.412, "lr": 1.7350956312440768e-06, "epoch": 19.5230607966457, "percentage": 97.62, "elapsed_time": "1:35:29", "remaining_time": "0:02:19", "throughput": 4244.27, "total_tokens": 24319616} {"current_steps": 37255, "total_steps": 38160, "loss": 0.4011, "lr": 1.716112715575313e-06, "epoch": 19.52568134171908, "percentage": 97.63, "elapsed_time": "1:35:30", "remaining_time": "0:02:19", "throughput": 4244.37, "total_tokens": 24323744} {"current_steps": 37260, "total_steps": 38160, "loss": 0.375, "lr": 1.6972340352110481e-06, "epoch": 19.528301886792452, "percentage": 97.64, "elapsed_time": "1:35:31", "remaining_time": "0:02:18", "throughput": 4244.44, "total_tokens": 24327456} {"current_steps": 37265, "total_steps": 38160, "loss": 0.4771, "lr": 1.6784595941004565e-06, "epoch": 19.53092243186583, "percentage": 97.65, "elapsed_time": "1:35:32", "remaining_time": "0:02:17", "throughput": 4244.44, "total_tokens": 24330400} {"current_steps": 37270, "total_steps": 38160, "loss": 0.4735, "lr": 1.659789396171063e-06, "epoch": 19.533542976939202, "percentage": 97.67, "elapsed_time": "1:35:33", "remaining_time": "0:02:16", "throughput": 4244.48, "total_tokens": 24333696} {"current_steps": 37275, "total_steps": 38160, "loss": 0.587, "lr": 1.6412234453282993e-06, "epoch": 19.53616352201258, "percentage": 97.68, "elapsed_time": "1:35:33", "remaining_time": "0:02:16", "throughput": 4244.53, "total_tokens": 24337216} {"current_steps": 37280, "total_steps": 38160, "loss": 0.3825, "lr": 1.622761745456003e-06, "epoch": 19.538784067085953, "percentage": 97.69, "elapsed_time": "1:35:34", "remaining_time": "0:02:15", "throughput": 4244.56, "total_tokens": 24340384} {"current_steps": 37285, "total_steps": 38160, "loss": 0.3711, "lr": 1.6044043004161958e-06, "epoch": 19.54140461215933, "percentage": 97.71, "elapsed_time": "1:35:35", "remaining_time": "0:02:14", "throughput": 4244.53, "total_tokens": 24343008} {"current_steps": 37290, "total_steps": 38160, "loss": 0.2716, "lr": 1.5861511140489725e-06, "epoch": 19.544025157232703, "percentage": 97.72, "elapsed_time": "1:35:35", "remaining_time": "0:02:13", "throughput": 4244.46, "total_tokens": 24345088} {"current_steps": 37295, "total_steps": 38160, "loss": 0.6099, "lr": 1.5680021901727237e-06, "epoch": 19.54664570230608, "percentage": 97.73, "elapsed_time": "1:35:36", "remaining_time": "0:02:13", "throughput": 4244.5, "total_tokens": 24348384} {"current_steps": 37300, "total_steps": 38160, "loss": 0.4093, "lr": 1.5499575325840232e-06, "epoch": 19.549266247379457, "percentage": 97.75, "elapsed_time": "1:35:37", "remaining_time": "0:02:12", "throughput": 4244.55, "total_tokens": 24351840} {"current_steps": 37305, "total_steps": 38160, "loss": 0.4665, "lr": 1.5320171450576293e-06, "epoch": 19.55188679245283, "percentage": 97.76, "elapsed_time": "1:35:37", "remaining_time": "0:02:11", "throughput": 4244.59, "total_tokens": 24355232} {"current_steps": 37310, "total_steps": 38160, "loss": 0.4018, "lr": 1.5141810313463733e-06, "epoch": 19.554507337526207, "percentage": 97.77, "elapsed_time": "1:35:38", "remaining_time": "0:02:10", "throughput": 4244.67, "total_tokens": 24359200} {"current_steps": 37315, "total_steps": 38160, "loss": 0.5261, "lr": 1.4964491951814374e-06, "epoch": 19.55712788259958, "percentage": 97.79, "elapsed_time": "1:35:39", "remaining_time": "0:02:09", "throughput": 4244.69, "total_tokens": 24362272} {"current_steps": 37320, "total_steps": 38160, "loss": 0.5016, "lr": 1.4788216402720766e-06, "epoch": 19.559748427672957, "percentage": 97.8, "elapsed_time": "1:35:40", "remaining_time": "0:02:09", "throughput": 4244.73, "total_tokens": 24365632} {"current_steps": 37325, "total_steps": 38160, "loss": 0.4437, "lr": 1.4612983703058413e-06, "epoch": 19.56236897274633, "percentage": 97.81, "elapsed_time": "1:35:40", "remaining_time": "0:02:08", "throughput": 4244.71, "total_tokens": 24368256} {"current_steps": 37330, "total_steps": 38160, "loss": 0.3994, "lr": 1.4438793889483549e-06, "epoch": 19.564989517819708, "percentage": 97.82, "elapsed_time": "1:35:41", "remaining_time": "0:02:07", "throughput": 4244.76, "total_tokens": 24371904} {"current_steps": 37335, "total_steps": 38160, "loss": 0.3898, "lr": 1.4265646998434246e-06, "epoch": 19.56761006289308, "percentage": 97.84, "elapsed_time": "1:35:42", "remaining_time": "0:02:06", "throughput": 4244.89, "total_tokens": 24376640} {"current_steps": 37340, "total_steps": 38160, "loss": 0.3659, "lr": 1.409354306613153e-06, "epoch": 19.570230607966458, "percentage": 97.85, "elapsed_time": "1:35:43", "remaining_time": "0:02:06", "throughput": 4244.95, "total_tokens": 24380288} {"current_steps": 37345, "total_steps": 38160, "loss": 0.4975, "lr": 1.3922482128577718e-06, "epoch": 19.57285115303983, "percentage": 97.86, "elapsed_time": "1:35:44", "remaining_time": "0:02:05", "throughput": 4244.97, "total_tokens": 24383328} {"current_steps": 37350, "total_steps": 38160, "loss": 0.4636, "lr": 1.3752464221556404e-06, "epoch": 19.57547169811321, "percentage": 97.88, "elapsed_time": "1:35:44", "remaining_time": "0:02:04", "throughput": 4244.99, "total_tokens": 24386464} {"current_steps": 37355, "total_steps": 38160, "loss": 0.3508, "lr": 1.358348938063303e-06, "epoch": 19.578092243186582, "percentage": 97.89, "elapsed_time": "1:35:45", "remaining_time": "0:02:03", "throughput": 4245.0, "total_tokens": 24389440} {"current_steps": 37360, "total_steps": 38160, "loss": 0.369, "lr": 1.341555764115543e-06, "epoch": 19.58071278825996, "percentage": 97.9, "elapsed_time": "1:35:46", "remaining_time": "0:02:03", "throughput": 4245.06, "total_tokens": 24393088} {"current_steps": 37365, "total_steps": 38160, "loss": 0.4432, "lr": 1.3248669038253835e-06, "epoch": 19.583333333333332, "percentage": 97.92, "elapsed_time": "1:35:46", "remaining_time": "0:02:02", "throughput": 4245.09, "total_tokens": 24396224} {"current_steps": 37370, "total_steps": 38160, "loss": 0.3967, "lr": 1.3082823606838656e-06, "epoch": 19.58595387840671, "percentage": 97.93, "elapsed_time": "1:35:47", "remaining_time": "0:02:01", "throughput": 4245.05, "total_tokens": 24398592} {"current_steps": 37375, "total_steps": 38160, "loss": 0.5375, "lr": 1.2918021381603251e-06, "epoch": 19.588574423480082, "percentage": 97.94, "elapsed_time": "1:35:48", "remaining_time": "0:02:00", "throughput": 4245.17, "total_tokens": 24403136} {"current_steps": 37380, "total_steps": 38160, "loss": 0.3107, "lr": 1.275426239702171e-06, "epoch": 19.59119496855346, "percentage": 97.96, "elapsed_time": "1:35:49", "remaining_time": "0:01:59", "throughput": 4245.17, "total_tokens": 24406048} {"current_steps": 37385, "total_steps": 38160, "loss": 0.303, "lr": 1.2591546687351073e-06, "epoch": 19.593815513626833, "percentage": 97.97, "elapsed_time": "1:35:49", "remaining_time": "0:01:59", "throughput": 4245.16, "total_tokens": 24408864} {"current_steps": 37390, "total_steps": 38160, "loss": 0.4596, "lr": 1.2429874286629673e-06, "epoch": 19.59643605870021, "percentage": 97.98, "elapsed_time": "1:35:50", "remaining_time": "0:01:58", "throughput": 4245.19, "total_tokens": 24412128} {"current_steps": 37395, "total_steps": 38160, "loss": 0.3363, "lr": 1.2269245228677116e-06, "epoch": 19.599056603773583, "percentage": 98.0, "elapsed_time": "1:35:51", "remaining_time": "0:01:57", "throughput": 4245.22, "total_tokens": 24415488} {"current_steps": 37400, "total_steps": 38160, "loss": 0.4132, "lr": 1.210965954709542e-06, "epoch": 19.60167714884696, "percentage": 98.01, "elapsed_time": "1:35:51", "remaining_time": "0:01:56", "throughput": 4245.2, "total_tokens": 24418080} {"current_steps": 37405, "total_steps": 38160, "loss": 0.5161, "lr": 1.1951117275268431e-06, "epoch": 19.604297693920337, "percentage": 98.02, "elapsed_time": "1:35:52", "remaining_time": "0:01:56", "throughput": 4245.23, "total_tokens": 24421280} {"current_steps": 37410, "total_steps": 38160, "loss": 0.3868, "lr": 1.1793618446360732e-06, "epoch": 19.60691823899371, "percentage": 98.03, "elapsed_time": "1:35:53", "remaining_time": "0:01:55", "throughput": 4245.21, "total_tokens": 24424032} {"current_steps": 37415, "total_steps": 38160, "loss": 0.3507, "lr": 1.1637163093319303e-06, "epoch": 19.609538784067087, "percentage": 98.05, "elapsed_time": "1:35:53", "remaining_time": "0:01:54", "throughput": 4245.18, "total_tokens": 24426528} {"current_steps": 37420, "total_steps": 38160, "loss": 0.234, "lr": 1.1481751248874072e-06, "epoch": 19.61215932914046, "percentage": 98.06, "elapsed_time": "1:35:54", "remaining_time": "0:01:53", "throughput": 4245.2, "total_tokens": 24429632} {"current_steps": 37425, "total_steps": 38160, "loss": 0.4158, "lr": 1.1327382945533482e-06, "epoch": 19.614779874213838, "percentage": 98.07, "elapsed_time": "1:35:55", "remaining_time": "0:01:53", "throughput": 4245.21, "total_tokens": 24432832} {"current_steps": 37430, "total_steps": 38160, "loss": 0.5055, "lr": 1.1174058215591143e-06, "epoch": 19.61740041928721, "percentage": 98.09, "elapsed_time": "1:35:56", "remaining_time": "0:01:52", "throughput": 4245.21, "total_tokens": 24435712} {"current_steps": 37435, "total_steps": 38160, "loss": 0.652, "lr": 1.1021777091119732e-06, "epoch": 19.620020964360588, "percentage": 98.1, "elapsed_time": "1:35:56", "remaining_time": "0:01:51", "throughput": 4245.2, "total_tokens": 24438496} {"current_steps": 37440, "total_steps": 38160, "loss": 0.5132, "lr": 1.0870539603975994e-06, "epoch": 19.62264150943396, "percentage": 98.11, "elapsed_time": "1:35:57", "remaining_time": "0:01:50", "throughput": 4245.19, "total_tokens": 24441312} {"current_steps": 37445, "total_steps": 38160, "loss": 0.4341, "lr": 1.0720345785795727e-06, "epoch": 19.62526205450734, "percentage": 98.13, "elapsed_time": "1:35:58", "remaining_time": "0:01:49", "throughput": 4245.16, "total_tokens": 24443840} {"current_steps": 37450, "total_steps": 38160, "loss": 0.3171, "lr": 1.0571195667998802e-06, "epoch": 19.627882599580712, "percentage": 98.14, "elapsed_time": "1:35:58", "remaining_time": "0:01:49", "throughput": 4245.23, "total_tokens": 24447520} {"current_steps": 37455, "total_steps": 38160, "loss": 0.4295, "lr": 1.042308928178526e-06, "epoch": 19.63050314465409, "percentage": 98.15, "elapsed_time": "1:35:59", "remaining_time": "0:01:48", "throughput": 4245.25, "total_tokens": 24450720} {"current_steps": 37460, "total_steps": 38160, "loss": 0.3405, "lr": 1.0276026658137538e-06, "epoch": 19.633123689727462, "percentage": 98.17, "elapsed_time": "1:36:00", "remaining_time": "0:01:47", "throughput": 4245.38, "total_tokens": 24455328} {"current_steps": 37465, "total_steps": 38160, "loss": 0.5044, "lr": 1.013000782781881e-06, "epoch": 19.63574423480084, "percentage": 98.18, "elapsed_time": "1:36:01", "remaining_time": "0:01:46", "throughput": 4245.41, "total_tokens": 24458496} {"current_steps": 37470, "total_steps": 38160, "loss": 0.5322, "lr": 9.985032821375195e-07, "epoch": 19.638364779874212, "percentage": 98.19, "elapsed_time": "1:36:01", "remaining_time": "0:01:46", "throughput": 4245.48, "total_tokens": 24462432} {"current_steps": 37475, "total_steps": 38160, "loss": 0.4428, "lr": 9.841101669134101e-07, "epoch": 19.64098532494759, "percentage": 98.2, "elapsed_time": "1:36:02", "remaining_time": "0:01:45", "throughput": 4245.55, "total_tokens": 24466240} {"current_steps": 37480, "total_steps": 38160, "loss": 0.2781, "lr": 9.69821440120311e-07, "epoch": 19.643605870020963, "percentage": 98.22, "elapsed_time": "1:36:03", "remaining_time": "0:01:44", "throughput": 4245.75, "total_tokens": 24472064} {"current_steps": 37485, "total_steps": 38160, "loss": 0.3946, "lr": 9.556371047473866e-07, "epoch": 19.64622641509434, "percentage": 98.23, "elapsed_time": "1:36:04", "remaining_time": "0:01:43", "throughput": 4245.72, "total_tokens": 24474496} {"current_steps": 37490, "total_steps": 38160, "loss": 0.4054, "lr": 9.415571637617082e-07, "epoch": 19.648846960167717, "percentage": 98.24, "elapsed_time": "1:36:05", "remaining_time": "0:01:43", "throughput": 4245.77, "total_tokens": 24478016} {"current_steps": 37495, "total_steps": 38160, "loss": 0.442, "lr": 9.275816201087528e-07, "epoch": 19.65146750524109, "percentage": 98.26, "elapsed_time": "1:36:05", "remaining_time": "0:01:42", "throughput": 4245.77, "total_tokens": 24481024} {"current_steps": 37500, "total_steps": 38160, "loss": 0.407, "lr": 9.137104767120153e-07, "epoch": 19.654088050314467, "percentage": 98.27, "elapsed_time": "1:36:06", "remaining_time": "0:01:41", "throughput": 4245.85, "total_tokens": 24484864} {"current_steps": 37505, "total_steps": 38160, "loss": 0.4181, "lr": 8.999437364731189e-07, "epoch": 19.65670859538784, "percentage": 98.28, "elapsed_time": "1:36:07", "remaining_time": "0:01:40", "throughput": 4245.91, "total_tokens": 24488480} {"current_steps": 37510, "total_steps": 38160, "loss": 0.5786, "lr": 8.862814022720378e-07, "epoch": 19.659329140461217, "percentage": 98.3, "elapsed_time": "1:36:08", "remaining_time": "0:01:39", "throughput": 4245.9, "total_tokens": 24491136} {"current_steps": 37515, "total_steps": 38160, "loss": 0.4672, "lr": 8.727234769666526e-07, "epoch": 19.66194968553459, "percentage": 98.31, "elapsed_time": "1:36:08", "remaining_time": "0:01:39", "throughput": 4245.97, "total_tokens": 24494944} {"current_steps": 37520, "total_steps": 38160, "loss": 0.3444, "lr": 8.592699633931389e-07, "epoch": 19.664570230607968, "percentage": 98.32, "elapsed_time": "1:36:09", "remaining_time": "0:01:38", "throughput": 4245.98, "total_tokens": 24497920} {"current_steps": 37525, "total_steps": 38160, "loss": 0.4458, "lr": 8.459208643659122e-07, "epoch": 19.66719077568134, "percentage": 98.34, "elapsed_time": "1:36:10", "remaining_time": "0:01:37", "throughput": 4245.98, "total_tokens": 24500800} {"current_steps": 37530, "total_steps": 38160, "loss": 0.5145, "lr": 8.326761826773499e-07, "epoch": 19.669811320754718, "percentage": 98.35, "elapsed_time": "1:36:11", "remaining_time": "0:01:36", "throughput": 4246.04, "total_tokens": 24504416} {"current_steps": 37535, "total_steps": 38160, "loss": 0.4289, "lr": 8.195359210981246e-07, "epoch": 19.67243186582809, "percentage": 98.36, "elapsed_time": "1:36:11", "remaining_time": "0:01:36", "throughput": 4246.1, "total_tokens": 24508000} {"current_steps": 37540, "total_steps": 38160, "loss": 0.4948, "lr": 8.065000823770929e-07, "epoch": 19.67505241090147, "percentage": 98.38, "elapsed_time": "1:36:12", "remaining_time": "0:01:35", "throughput": 4246.29, "total_tokens": 24513280} {"current_steps": 37545, "total_steps": 38160, "loss": 0.4286, "lr": 7.935686692410737e-07, "epoch": 19.677672955974842, "percentage": 98.39, "elapsed_time": "1:36:13", "remaining_time": "0:01:34", "throughput": 4246.28, "total_tokens": 24516000} {"current_steps": 37550, "total_steps": 38160, "loss": 0.3642, "lr": 7.807416843952364e-07, "epoch": 19.68029350104822, "percentage": 98.4, "elapsed_time": "1:36:14", "remaining_time": "0:01:33", "throughput": 4246.26, "total_tokens": 24518624} {"current_steps": 37555, "total_steps": 38160, "loss": 0.4408, "lr": 7.68019130522879e-07, "epoch": 19.682914046121592, "percentage": 98.41, "elapsed_time": "1:36:14", "remaining_time": "0:01:33", "throughput": 4246.31, "total_tokens": 24522144} {"current_steps": 37560, "total_steps": 38160, "loss": 0.3726, "lr": 7.554010102853726e-07, "epoch": 19.68553459119497, "percentage": 98.43, "elapsed_time": "1:36:15", "remaining_time": "0:01:32", "throughput": 4246.34, "total_tokens": 24525312} {"current_steps": 37565, "total_steps": 38160, "loss": 0.5036, "lr": 7.428873263223279e-07, "epoch": 19.688155136268342, "percentage": 98.44, "elapsed_time": "1:36:16", "remaining_time": "0:01:31", "throughput": 4246.35, "total_tokens": 24528288} {"current_steps": 37570, "total_steps": 38160, "loss": 0.4381, "lr": 7.304780812513734e-07, "epoch": 19.69077568134172, "percentage": 98.45, "elapsed_time": "1:36:16", "remaining_time": "0:01:30", "throughput": 4246.33, "total_tokens": 24531040} {"current_steps": 37575, "total_steps": 38160, "loss": 0.4578, "lr": 7.181732776684325e-07, "epoch": 19.693396226415093, "percentage": 98.47, "elapsed_time": "1:36:17", "remaining_time": "0:01:29", "throughput": 4246.35, "total_tokens": 24534240} {"current_steps": 37580, "total_steps": 38160, "loss": 0.4476, "lr": 7.059729181475572e-07, "epoch": 19.69601677148847, "percentage": 98.48, "elapsed_time": "1:36:18", "remaining_time": "0:01:29", "throughput": 4246.33, "total_tokens": 24536864} {"current_steps": 37585, "total_steps": 38160, "loss": 0.4015, "lr": 6.938770052409282e-07, "epoch": 19.698637316561843, "percentage": 98.49, "elapsed_time": "1:36:19", "remaining_time": "0:01:28", "throughput": 4246.37, "total_tokens": 24540160} {"current_steps": 37590, "total_steps": 38160, "loss": 0.4856, "lr": 6.81885541478855e-07, "epoch": 19.70125786163522, "percentage": 98.51, "elapsed_time": "1:36:19", "remaining_time": "0:01:27", "throughput": 4246.37, "total_tokens": 24543040} {"current_steps": 37595, "total_steps": 38160, "loss": 0.379, "lr": 6.699985293697197e-07, "epoch": 19.703878406708597, "percentage": 98.52, "elapsed_time": "1:36:20", "remaining_time": "0:01:26", "throughput": 4246.35, "total_tokens": 24545792} {"current_steps": 37600, "total_steps": 38160, "loss": 0.4576, "lr": 6.582159714003111e-07, "epoch": 19.70649895178197, "percentage": 98.53, "elapsed_time": "1:36:21", "remaining_time": "0:01:26", "throughput": 4246.34, "total_tokens": 24548512} {"current_steps": 37605, "total_steps": 38160, "loss": 0.3742, "lr": 6.465378700352687e-07, "epoch": 19.709119496855347, "percentage": 98.55, "elapsed_time": "1:36:21", "remaining_time": "0:01:25", "throughput": 4246.32, "total_tokens": 24551200} {"current_steps": 37610, "total_steps": 38160, "loss": 0.4091, "lr": 6.349642277176382e-07, "epoch": 19.71174004192872, "percentage": 98.56, "elapsed_time": "1:36:22", "remaining_time": "0:01:24", "throughput": 4246.32, "total_tokens": 24554016} {"current_steps": 37615, "total_steps": 38160, "loss": 0.4998, "lr": 6.23495046868372e-07, "epoch": 19.714360587002098, "percentage": 98.57, "elapsed_time": "1:36:23", "remaining_time": "0:01:23", "throughput": 4246.41, "total_tokens": 24557952} {"current_steps": 37620, "total_steps": 38160, "loss": 0.44, "lr": 6.121303298868286e-07, "epoch": 19.71698113207547, "percentage": 98.58, "elapsed_time": "1:36:23", "remaining_time": "0:01:23", "throughput": 4246.45, "total_tokens": 24561408} {"current_steps": 37625, "total_steps": 38160, "loss": 0.4321, "lr": 6.008700791502175e-07, "epoch": 19.719601677148848, "percentage": 98.6, "elapsed_time": "1:36:24", "remaining_time": "0:01:22", "throughput": 4246.46, "total_tokens": 24564352} {"current_steps": 37630, "total_steps": 38160, "loss": 0.4027, "lr": 5.8971429701421e-07, "epoch": 19.72222222222222, "percentage": 98.61, "elapsed_time": "1:36:25", "remaining_time": "0:01:21", "throughput": 4246.44, "total_tokens": 24567008} {"current_steps": 37635, "total_steps": 38160, "loss": 0.3835, "lr": 5.786629858123283e-07, "epoch": 19.7248427672956, "percentage": 98.62, "elapsed_time": "1:36:25", "remaining_time": "0:01:20", "throughput": 4246.43, "total_tokens": 24569824} {"current_steps": 37640, "total_steps": 38160, "loss": 0.4211, "lr": 5.677161478565008e-07, "epoch": 19.72746331236897, "percentage": 98.64, "elapsed_time": "1:36:26", "remaining_time": "0:01:19", "throughput": 4246.45, "total_tokens": 24572960} {"current_steps": 37645, "total_steps": 38160, "loss": 0.473, "lr": 5.56873785436618e-07, "epoch": 19.73008385744235, "percentage": 98.65, "elapsed_time": "1:36:27", "remaining_time": "0:01:19", "throughput": 4246.53, "total_tokens": 24576864} {"current_steps": 37650, "total_steps": 38160, "loss": 0.4471, "lr": 5.4613590082081e-07, "epoch": 19.732704402515722, "percentage": 98.66, "elapsed_time": "1:36:28", "remaining_time": "0:01:18", "throughput": 4246.51, "total_tokens": 24579520} {"current_steps": 37655, "total_steps": 38160, "loss": 0.3851, "lr": 5.355024962552801e-07, "epoch": 19.7353249475891, "percentage": 98.68, "elapsed_time": "1:36:28", "remaining_time": "0:01:17", "throughput": 4246.56, "total_tokens": 24583136} {"current_steps": 37660, "total_steps": 38160, "loss": 0.2345, "lr": 5.249735739644157e-07, "epoch": 19.737945492662472, "percentage": 98.69, "elapsed_time": "1:36:29", "remaining_time": "0:01:16", "throughput": 4246.6, "total_tokens": 24586528} {"current_steps": 37665, "total_steps": 38160, "loss": 0.4754, "lr": 5.145491361508436e-07, "epoch": 19.74056603773585, "percentage": 98.7, "elapsed_time": "1:36:30", "remaining_time": "0:01:16", "throughput": 4246.62, "total_tokens": 24589696} {"current_steps": 37670, "total_steps": 38160, "loss": 0.5156, "lr": 5.042291849950975e-07, "epoch": 19.743186582809223, "percentage": 98.72, "elapsed_time": "1:36:31", "remaining_time": "0:01:15", "throughput": 4246.74, "total_tokens": 24594208} {"current_steps": 37675, "total_steps": 38160, "loss": 0.4156, "lr": 4.940137226560615e-07, "epoch": 19.7458071278826, "percentage": 98.73, "elapsed_time": "1:36:32", "remaining_time": "0:01:14", "throughput": 4246.76, "total_tokens": 24597312} {"current_steps": 37680, "total_steps": 38160, "loss": 0.3407, "lr": 4.839027512706928e-07, "epoch": 19.748427672955973, "percentage": 98.74, "elapsed_time": "1:36:32", "remaining_time": "0:01:13", "throughput": 4246.74, "total_tokens": 24600096} {"current_steps": 37685, "total_steps": 38160, "loss": 0.5401, "lr": 4.7389627295407743e-07, "epoch": 19.75104821802935, "percentage": 98.76, "elapsed_time": "1:36:33", "remaining_time": "0:01:13", "throughput": 4246.77, "total_tokens": 24603328} {"current_steps": 37690, "total_steps": 38160, "loss": 0.3149, "lr": 4.6399428979948534e-07, "epoch": 19.753668763102727, "percentage": 98.77, "elapsed_time": "1:36:34", "remaining_time": "0:01:12", "throughput": 4246.83, "total_tokens": 24606944} {"current_steps": 37695, "total_steps": 38160, "loss": 0.4805, "lr": 4.541968038782596e-07, "epoch": 19.7562893081761, "percentage": 98.78, "elapsed_time": "1:36:34", "remaining_time": "0:01:11", "throughput": 4246.87, "total_tokens": 24610304} {"current_steps": 37700, "total_steps": 38160, "loss": 0.3042, "lr": 4.445038172399829e-07, "epoch": 19.758909853249477, "percentage": 98.79, "elapsed_time": "1:36:35", "remaining_time": "0:01:10", "throughput": 4246.85, "total_tokens": 24612992} {"current_steps": 37705, "total_steps": 38160, "loss": 0.543, "lr": 4.3491533191225563e-07, "epoch": 19.76153039832285, "percentage": 98.81, "elapsed_time": "1:36:36", "remaining_time": "0:01:09", "throughput": 4246.9, "total_tokens": 24616448} {"current_steps": 37710, "total_steps": 38160, "loss": 0.4542, "lr": 4.254313499009177e-07, "epoch": 19.764150943396228, "percentage": 98.82, "elapsed_time": "1:36:36", "remaining_time": "0:01:09", "throughput": 4246.85, "total_tokens": 24618816} {"current_steps": 37715, "total_steps": 38160, "loss": 0.4084, "lr": 4.1605187318982664e-07, "epoch": 19.7667714884696, "percentage": 98.83, "elapsed_time": "1:36:37", "remaining_time": "0:01:08", "throughput": 4246.85, "total_tokens": 24621632} {"current_steps": 37720, "total_steps": 38160, "loss": 0.4402, "lr": 4.067769037411906e-07, "epoch": 19.769392033542978, "percentage": 98.85, "elapsed_time": "1:36:38", "remaining_time": "0:01:07", "throughput": 4246.9, "total_tokens": 24625280} {"current_steps": 37725, "total_steps": 38160, "loss": 0.3894, "lr": 3.9760644349517984e-07, "epoch": 19.77201257861635, "percentage": 98.86, "elapsed_time": "1:36:39", "remaining_time": "0:01:06", "throughput": 4246.89, "total_tokens": 24627936} {"current_steps": 37730, "total_steps": 38160, "loss": 0.4336, "lr": 3.885404943700932e-07, "epoch": 19.77463312368973, "percentage": 98.87, "elapsed_time": "1:36:39", "remaining_time": "0:01:06", "throughput": 4246.96, "total_tokens": 24631776} {"current_steps": 37735, "total_steps": 38160, "loss": 0.4126, "lr": 3.795790582624692e-07, "epoch": 19.7772536687631, "percentage": 98.89, "elapsed_time": "1:36:40", "remaining_time": "0:01:05", "throughput": 4246.93, "total_tokens": 24634272} {"current_steps": 37740, "total_steps": 38160, "loss": 0.4443, "lr": 3.707221370469749e-07, "epoch": 19.77987421383648, "percentage": 98.9, "elapsed_time": "1:36:41", "remaining_time": "0:01:04", "throughput": 4246.92, "total_tokens": 24637056} {"current_steps": 37745, "total_steps": 38160, "loss": 0.371, "lr": 3.6196973257629494e-07, "epoch": 19.782494758909852, "percentage": 98.91, "elapsed_time": "1:36:41", "remaining_time": "0:01:03", "throughput": 4246.95, "total_tokens": 24640320} {"current_steps": 37750, "total_steps": 38160, "loss": 0.3698, "lr": 3.533218466813537e-07, "epoch": 19.78511530398323, "percentage": 98.93, "elapsed_time": "1:36:42", "remaining_time": "0:01:03", "throughput": 4246.97, "total_tokens": 24643456} {"current_steps": 37755, "total_steps": 38160, "loss": 0.5827, "lr": 3.447784811712595e-07, "epoch": 19.787735849056602, "percentage": 98.94, "elapsed_time": "1:36:43", "remaining_time": "0:01:02", "throughput": 4246.96, "total_tokens": 24646144} {"current_steps": 37760, "total_steps": 38160, "loss": 0.4773, "lr": 3.363396378331385e-07, "epoch": 19.79035639412998, "percentage": 98.95, "elapsed_time": "1:36:43", "remaining_time": "0:01:01", "throughput": 4246.93, "total_tokens": 24648736} {"current_steps": 37765, "total_steps": 38160, "loss": 0.3514, "lr": 3.280053184323006e-07, "epoch": 19.792976939203353, "percentage": 98.96, "elapsed_time": "1:36:44", "remaining_time": "0:01:00", "throughput": 4246.92, "total_tokens": 24651456} {"current_steps": 37770, "total_steps": 38160, "loss": 0.4711, "lr": 3.1977552471218476e-07, "epoch": 19.79559748427673, "percentage": 98.98, "elapsed_time": "1:36:45", "remaining_time": "0:00:59", "throughput": 4246.93, "total_tokens": 24654560} {"current_steps": 37775, "total_steps": 38160, "loss": 0.4066, "lr": 3.116502583943581e-07, "epoch": 19.798218029350103, "percentage": 98.99, "elapsed_time": "1:36:46", "remaining_time": "0:00:59", "throughput": 4246.99, "total_tokens": 24658144} {"current_steps": 37780, "total_steps": 38160, "loss": 0.4813, "lr": 3.036295211785722e-07, "epoch": 19.80083857442348, "percentage": 99.0, "elapsed_time": "1:36:47", "remaining_time": "0:00:58", "throughput": 4247.23, "total_tokens": 24664576} {"current_steps": 37785, "total_steps": 38160, "loss": 0.4699, "lr": 2.957133147425961e-07, "epoch": 19.803459119496857, "percentage": 99.02, "elapsed_time": "1:36:47", "remaining_time": "0:00:57", "throughput": 4247.28, "total_tokens": 24668096} {"current_steps": 37790, "total_steps": 38160, "loss": 0.2858, "lr": 2.879016407425494e-07, "epoch": 19.80607966457023, "percentage": 99.03, "elapsed_time": "1:36:48", "remaining_time": "0:00:56", "throughput": 4247.25, "total_tokens": 24670592} {"current_steps": 37795, "total_steps": 38160, "loss": 0.501, "lr": 2.8019450081240295e-07, "epoch": 19.808700209643607, "percentage": 99.04, "elapsed_time": "1:36:49", "remaining_time": "0:00:56", "throughput": 4247.31, "total_tokens": 24674208} {"current_steps": 37800, "total_steps": 38160, "loss": 0.389, "lr": 2.7259189656447803e-07, "epoch": 19.81132075471698, "percentage": 99.06, "elapsed_time": "1:36:50", "remaining_time": "0:00:55", "throughput": 4247.27, "total_tokens": 24676672} {"current_steps": 37805, "total_steps": 38160, "loss": 0.4555, "lr": 2.650938295891692e-07, "epoch": 19.813941299790358, "percentage": 99.07, "elapsed_time": "1:36:50", "remaining_time": "0:00:54", "throughput": 4247.24, "total_tokens": 24679264} {"current_steps": 37810, "total_steps": 38160, "loss": 0.3648, "lr": 2.5770030145494395e-07, "epoch": 19.81656184486373, "percentage": 99.08, "elapsed_time": "1:36:51", "remaining_time": "0:00:53", "throughput": 4247.24, "total_tokens": 24682080} {"current_steps": 37815, "total_steps": 38160, "loss": 0.4169, "lr": 2.504113137083985e-07, "epoch": 19.819182389937108, "percentage": 99.1, "elapsed_time": "1:36:52", "remaining_time": "0:00:53", "throughput": 4247.3, "total_tokens": 24685888} {"current_steps": 37820, "total_steps": 38160, "loss": 0.3683, "lr": 2.4322686787442425e-07, "epoch": 19.82180293501048, "percentage": 99.11, "elapsed_time": "1:36:52", "remaining_time": "0:00:52", "throughput": 4247.3, "total_tokens": 24688800} {"current_steps": 37825, "total_steps": 38160, "loss": 0.4222, "lr": 2.3614696545581904e-07, "epoch": 19.82442348008386, "percentage": 99.12, "elapsed_time": "1:36:53", "remaining_time": "0:00:51", "throughput": 4247.36, "total_tokens": 24692416} {"current_steps": 37830, "total_steps": 38160, "loss": 0.4183, "lr": 2.2917160793367585e-07, "epoch": 19.82704402515723, "percentage": 99.14, "elapsed_time": "1:36:54", "remaining_time": "0:00:50", "throughput": 4247.35, "total_tokens": 24695296} {"current_steps": 37835, "total_steps": 38160, "loss": 0.3854, "lr": 2.2230079676716086e-07, "epoch": 19.82966457023061, "percentage": 99.15, "elapsed_time": "1:36:54", "remaining_time": "0:00:49", "throughput": 4247.34, "total_tokens": 24698016} {"current_steps": 37840, "total_steps": 38160, "loss": 0.4183, "lr": 2.1553453339356875e-07, "epoch": 19.832285115303982, "percentage": 99.16, "elapsed_time": "1:36:55", "remaining_time": "0:00:49", "throughput": 4247.4, "total_tokens": 24701696} {"current_steps": 37845, "total_steps": 38160, "loss": 0.425, "lr": 2.0887281922826738e-07, "epoch": 19.83490566037736, "percentage": 99.17, "elapsed_time": "1:36:56", "remaining_time": "0:00:48", "throughput": 4247.49, "total_tokens": 24705760} {"current_steps": 37850, "total_steps": 38160, "loss": 0.4983, "lr": 2.023156556648642e-07, "epoch": 19.837526205450732, "percentage": 99.19, "elapsed_time": "1:36:57", "remaining_time": "0:00:47", "throughput": 4247.56, "total_tokens": 24709504} {"current_steps": 37855, "total_steps": 38160, "loss": 0.5899, "lr": 1.9586304407503975e-07, "epoch": 19.84014675052411, "percentage": 99.2, "elapsed_time": "1:36:58", "remaining_time": "0:00:46", "throughput": 4247.58, "total_tokens": 24712640} {"current_steps": 37860, "total_steps": 38160, "loss": 0.6207, "lr": 1.8951498580860315e-07, "epoch": 19.842767295597483, "percentage": 99.21, "elapsed_time": "1:36:58", "remaining_time": "0:00:46", "throughput": 4247.61, "total_tokens": 24715808} {"current_steps": 37865, "total_steps": 38160, "loss": 0.3819, "lr": 1.832714821934922e-07, "epoch": 19.84538784067086, "percentage": 99.23, "elapsed_time": "1:36:59", "remaining_time": "0:00:45", "throughput": 4247.62, "total_tokens": 24718848} {"current_steps": 37870, "total_steps": 38160, "loss": 0.3563, "lr": 1.7713253453577328e-07, "epoch": 19.848008385744233, "percentage": 99.24, "elapsed_time": "1:37:00", "remaining_time": "0:00:44", "throughput": 4247.65, "total_tokens": 24722016} {"current_steps": 37875, "total_steps": 38160, "loss": 0.4327, "lr": 1.7109814411964132e-07, "epoch": 19.85062893081761, "percentage": 99.25, "elapsed_time": "1:37:00", "remaining_time": "0:00:43", "throughput": 4247.74, "total_tokens": 24725920} {"current_steps": 37880, "total_steps": 38160, "loss": 0.4288, "lr": 1.651683122074754e-07, "epoch": 19.853249475890987, "percentage": 99.27, "elapsed_time": "1:37:01", "remaining_time": "0:00:43", "throughput": 4247.84, "total_tokens": 24730112} {"current_steps": 37885, "total_steps": 38160, "loss": 0.4968, "lr": 1.5934304003961675e-07, "epoch": 19.85587002096436, "percentage": 99.28, "elapsed_time": "1:37:02", "remaining_time": "0:00:42", "throughput": 4247.86, "total_tokens": 24733248} {"current_steps": 37890, "total_steps": 38160, "loss": 0.4249, "lr": 1.5362232883475713e-07, "epoch": 19.858490566037737, "percentage": 99.29, "elapsed_time": "1:37:03", "remaining_time": "0:00:41", "throughput": 4247.89, "total_tokens": 24736576} {"current_steps": 37895, "total_steps": 38160, "loss": 0.404, "lr": 1.4800617978949492e-07, "epoch": 19.86111111111111, "percentage": 99.31, "elapsed_time": "1:37:04", "remaining_time": "0:00:40", "throughput": 4247.97, "total_tokens": 24740544} {"current_steps": 37900, "total_steps": 38160, "loss": 0.382, "lr": 1.424945940787792e-07, "epoch": 19.863731656184488, "percentage": 99.32, "elapsed_time": "1:37:04", "remaining_time": "0:00:39", "throughput": 4248.03, "total_tokens": 24744128} {"current_steps": 37905, "total_steps": 38160, "loss": 0.4799, "lr": 1.3708757285552098e-07, "epoch": 19.86635220125786, "percentage": 99.33, "elapsed_time": "1:37:05", "remaining_time": "0:00:39", "throughput": 4248.03, "total_tokens": 24747104} {"current_steps": 37910, "total_steps": 38160, "loss": 0.4759, "lr": 1.3178511725076004e-07, "epoch": 19.868972746331238, "percentage": 99.34, "elapsed_time": "1:37:06", "remaining_time": "0:00:38", "throughput": 4248.06, "total_tokens": 24750432} {"current_steps": 37915, "total_steps": 38160, "loss": 0.309, "lr": 1.265872283738312e-07, "epoch": 19.87159329140461, "percentage": 99.36, "elapsed_time": "1:37:06", "remaining_time": "0:00:37", "throughput": 4248.02, "total_tokens": 24752896} {"current_steps": 37920, "total_steps": 38160, "loss": 0.5311, "lr": 1.2149390731192033e-07, "epoch": 19.87421383647799, "percentage": 99.37, "elapsed_time": "1:37:07", "remaining_time": "0:00:36", "throughput": 4248.04, "total_tokens": 24756096} {"current_steps": 37925, "total_steps": 38160, "loss": 0.4147, "lr": 1.1650515513061955e-07, "epoch": 19.87683438155136, "percentage": 99.38, "elapsed_time": "1:37:08", "remaining_time": "0:00:36", "throughput": 4248.11, "total_tokens": 24759776} {"current_steps": 37930, "total_steps": 38160, "loss": 0.379, "lr": 1.1162097287342743e-07, "epoch": 19.87945492662474, "percentage": 99.4, "elapsed_time": "1:37:09", "remaining_time": "0:00:35", "throughput": 4248.11, "total_tokens": 24762720} {"current_steps": 37935, "total_steps": 38160, "loss": 0.3369, "lr": 1.0684136156213775e-07, "epoch": 19.882075471698112, "percentage": 99.41, "elapsed_time": "1:37:09", "remaining_time": "0:00:34", "throughput": 4248.18, "total_tokens": 24766528} {"current_steps": 37940, "total_steps": 38160, "loss": 0.4381, "lr": 1.0216632219650634e-07, "epoch": 19.88469601677149, "percentage": 99.42, "elapsed_time": "1:37:10", "remaining_time": "0:00:33", "throughput": 4248.27, "total_tokens": 24770496} {"current_steps": 37945, "total_steps": 38160, "loss": 0.5184, "lr": 9.759585575458418e-08, "epoch": 19.887316561844862, "percentage": 99.44, "elapsed_time": "1:37:11", "remaining_time": "0:00:33", "throughput": 4248.24, "total_tokens": 24773024} {"current_steps": 37950, "total_steps": 38160, "loss": 0.3776, "lr": 9.312996319238432e-08, "epoch": 19.88993710691824, "percentage": 99.45, "elapsed_time": "1:37:12", "remaining_time": "0:00:32", "throughput": 4248.25, "total_tokens": 24776064} {"current_steps": 37955, "total_steps": 38160, "loss": 0.4356, "lr": 8.876864544421493e-08, "epoch": 19.892557651991613, "percentage": 99.46, "elapsed_time": "1:37:12", "remaining_time": "0:00:31", "throughput": 4248.26, "total_tokens": 24779072} {"current_steps": 37960, "total_steps": 38160, "loss": 0.4974, "lr": 8.451190342229077e-08, "epoch": 19.89517819706499, "percentage": 99.48, "elapsed_time": "1:37:13", "remaining_time": "0:00:30", "throughput": 4248.31, "total_tokens": 24782560} {"current_steps": 37965, "total_steps": 38160, "loss": 0.4209, "lr": 8.035973801717722e-08, "epoch": 19.897798742138363, "percentage": 99.49, "elapsed_time": "1:37:14", "remaining_time": "0:00:29", "throughput": 4248.29, "total_tokens": 24785312} {"current_steps": 37970, "total_steps": 38160, "loss": 0.4835, "lr": 7.631215009740178e-08, "epoch": 19.90041928721174, "percentage": 99.5, "elapsed_time": "1:37:14", "remaining_time": "0:00:29", "throughput": 4248.29, "total_tokens": 24788128} {"current_steps": 37975, "total_steps": 38160, "loss": 0.5781, "lr": 7.236914050973153e-08, "epoch": 19.903039832285117, "percentage": 99.52, "elapsed_time": "1:37:15", "remaining_time": "0:00:28", "throughput": 4248.25, "total_tokens": 24790496} {"current_steps": 37980, "total_steps": 38160, "loss": 0.3987, "lr": 6.853071007895117e-08, "epoch": 19.90566037735849, "percentage": 99.53, "elapsed_time": "1:37:16", "remaining_time": "0:00:27", "throughput": 4248.28, "total_tokens": 24793792} {"current_steps": 37985, "total_steps": 38160, "loss": 0.3117, "lr": 6.479685960797399e-08, "epoch": 19.908280922431867, "percentage": 99.54, "elapsed_time": "1:37:16", "remaining_time": "0:00:26", "throughput": 4248.31, "total_tokens": 24796992} {"current_steps": 37990, "total_steps": 38160, "loss": 0.4335, "lr": 6.116758987800841e-08, "epoch": 19.91090146750524, "percentage": 99.55, "elapsed_time": "1:37:17", "remaining_time": "0:00:26", "throughput": 4248.39, "total_tokens": 24800864} {"current_steps": 37995, "total_steps": 38160, "loss": 0.3512, "lr": 5.7642901648113924e-08, "epoch": 19.913522012578618, "percentage": 99.57, "elapsed_time": "1:37:18", "remaining_time": "0:00:25", "throughput": 4248.42, "total_tokens": 24804160} {"current_steps": 38000, "total_steps": 38160, "loss": 0.4339, "lr": 5.422279565570065e-08, "epoch": 19.91614255765199, "percentage": 99.58, "elapsed_time": "1:37:19", "remaining_time": "0:00:24", "throughput": 4248.42, "total_tokens": 24807072} {"current_steps": 38005, "total_steps": 38160, "loss": 0.3335, "lr": 5.090727261619632e-08, "epoch": 19.918763102725368, "percentage": 99.59, "elapsed_time": "1:37:20", "remaining_time": "0:00:23", "throughput": 4248.54, "total_tokens": 24811584} {"current_steps": 38010, "total_steps": 38160, "loss": 0.2925, "lr": 4.7696333223212765e-08, "epoch": 19.92138364779874, "percentage": 99.61, "elapsed_time": "1:37:20", "remaining_time": "0:00:23", "throughput": 4248.54, "total_tokens": 24814464} {"current_steps": 38015, "total_steps": 38160, "loss": 0.3734, "lr": 4.4589978148323884e-08, "epoch": 19.92400419287212, "percentage": 99.62, "elapsed_time": "1:37:21", "remaining_time": "0:00:22", "throughput": 4248.58, "total_tokens": 24817920} {"current_steps": 38020, "total_steps": 38160, "loss": 0.3705, "lr": 4.1588208041454244e-08, "epoch": 19.92662473794549, "percentage": 99.63, "elapsed_time": "1:37:22", "remaining_time": "0:00:21", "throughput": 4248.61, "total_tokens": 24821312} {"current_steps": 38025, "total_steps": 38160, "loss": 0.4274, "lr": 3.8691023530545985e-08, "epoch": 19.92924528301887, "percentage": 99.65, "elapsed_time": "1:37:22", "remaining_time": "0:00:20", "throughput": 4248.65, "total_tokens": 24824672} {"current_steps": 38030, "total_steps": 38160, "loss": 0.478, "lr": 3.589842522155884e-08, "epoch": 19.931865828092242, "percentage": 99.66, "elapsed_time": "1:37:23", "remaining_time": "0:00:19", "throughput": 4248.65, "total_tokens": 24827584} {"current_steps": 38035, "total_steps": 38160, "loss": 0.5188, "lr": 3.321041369874767e-08, "epoch": 19.93448637316562, "percentage": 99.67, "elapsed_time": "1:37:24", "remaining_time": "0:00:19", "throughput": 4248.74, "total_tokens": 24831680} {"current_steps": 38040, "total_steps": 38160, "loss": 0.3802, "lr": 3.0626989524384916e-08, "epoch": 19.937106918238992, "percentage": 99.69, "elapsed_time": "1:37:25", "remaining_time": "0:00:18", "throughput": 4248.79, "total_tokens": 24835168} {"current_steps": 38045, "total_steps": 38160, "loss": 0.4624, "lr": 2.8148153238927167e-08, "epoch": 19.93972746331237, "percentage": 99.7, "elapsed_time": "1:37:25", "remaining_time": "0:00:17", "throughput": 4248.82, "total_tokens": 24838432} {"current_steps": 38050, "total_steps": 38160, "loss": 0.3854, "lr": 2.5773905360904072e-08, "epoch": 19.942348008385743, "percentage": 99.71, "elapsed_time": "1:37:27", "remaining_time": "0:00:16", "throughput": 4249.03, "total_tokens": 24844096} {"current_steps": 38055, "total_steps": 38160, "loss": 0.4422, "lr": 2.3504246386918392e-08, "epoch": 19.94496855345912, "percentage": 99.72, "elapsed_time": "1:37:27", "remaining_time": "0:00:16", "throughput": 4249.1, "total_tokens": 24847872} {"current_steps": 38060, "total_steps": 38160, "loss": 0.423, "lr": 2.133917679186803e-08, "epoch": 19.947589098532493, "percentage": 99.74, "elapsed_time": "1:37:28", "remaining_time": "0:00:15", "throughput": 4249.16, "total_tokens": 24851520} {"current_steps": 38065, "total_steps": 38160, "loss": 0.4226, "lr": 1.9278697028557447e-08, "epoch": 19.95020964360587, "percentage": 99.75, "elapsed_time": "1:37:29", "remaining_time": "0:00:14", "throughput": 4249.16, "total_tokens": 24854656} {"current_steps": 38070, "total_steps": 38160, "loss": 0.4599, "lr": 1.7322807528086238e-08, "epoch": 19.952830188679247, "percentage": 99.76, "elapsed_time": "1:37:30", "remaining_time": "0:00:13", "throughput": 4249.2, "total_tokens": 24857952} {"current_steps": 38075, "total_steps": 38160, "loss": 0.5442, "lr": 1.547150869957159e-08, "epoch": 19.95545073375262, "percentage": 99.78, "elapsed_time": "1:37:30", "remaining_time": "0:00:13", "throughput": 4249.19, "total_tokens": 24860704} {"current_steps": 38080, "total_steps": 38160, "loss": 0.4286, "lr": 1.3724800930314806e-08, "epoch": 19.958071278825997, "percentage": 99.79, "elapsed_time": "1:37:31", "remaining_time": "0:00:12", "throughput": 4249.2, "total_tokens": 24863712} {"current_steps": 38085, "total_steps": 38160, "loss": 0.3009, "lr": 1.2082684585634773e-08, "epoch": 19.96069182389937, "percentage": 99.8, "elapsed_time": "1:37:32", "remaining_time": "0:00:11", "throughput": 4249.21, "total_tokens": 24866752} {"current_steps": 38090, "total_steps": 38160, "loss": 0.3789, "lr": 1.0545160009145516e-08, "epoch": 19.963312368972748, "percentage": 99.82, "elapsed_time": "1:37:32", "remaining_time": "0:00:10", "throughput": 4249.35, "total_tokens": 24871360} {"current_steps": 38095, "total_steps": 38160, "loss": 0.5999, "lr": 9.112227522423133e-09, "epoch": 19.96593291404612, "percentage": 99.83, "elapsed_time": "1:37:33", "remaining_time": "0:00:09", "throughput": 4249.44, "total_tokens": 24875488} {"current_steps": 38100, "total_steps": 38160, "loss": 0.4515, "lr": 7.783887425172331e-09, "epoch": 19.968553459119498, "percentage": 99.84, "elapsed_time": "1:37:34", "remaining_time": "0:00:09", "throughput": 4249.45, "total_tokens": 24878528} {"current_steps": 38105, "total_steps": 38160, "loss": 0.365, "lr": 6.560139995392955e-09, "epoch": 19.97117400419287, "percentage": 99.86, "elapsed_time": "1:37:35", "remaining_time": "0:00:08", "throughput": 4249.48, "total_tokens": 24881792} {"current_steps": 38110, "total_steps": 38160, "loss": 0.3327, "lr": 5.440985488935901e-09, "epoch": 19.97379454926625, "percentage": 99.87, "elapsed_time": "1:37:35", "remaining_time": "0:00:07", "throughput": 4249.5, "total_tokens": 24884928} {"current_steps": 38115, "total_steps": 38160, "loss": 0.33, "lr": 4.426424140058227e-09, "epoch": 19.97641509433962, "percentage": 99.88, "elapsed_time": "1:37:36", "remaining_time": "0:00:06", "throughput": 4249.47, "total_tokens": 24887488} {"current_steps": 38120, "total_steps": 38160, "loss": 0.4976, "lr": 3.5164561608680424e-09, "epoch": 19.979035639413, "percentage": 99.9, "elapsed_time": "1:37:37", "remaining_time": "0:00:06", "throughput": 4249.47, "total_tokens": 24890368} {"current_steps": 38125, "total_steps": 38160, "loss": 0.4701, "lr": 2.7110817417685953e-09, "epoch": 19.981656184486372, "percentage": 99.91, "elapsed_time": "1:37:37", "remaining_time": "0:00:05", "throughput": 4249.4, "total_tokens": 24892416} {"current_steps": 38130, "total_steps": 38160, "loss": 0.3155, "lr": 2.010301051291741e-09, "epoch": 19.98427672955975, "percentage": 99.92, "elapsed_time": "1:37:38", "remaining_time": "0:00:04", "throughput": 4249.42, "total_tokens": 24895552} {"current_steps": 38135, "total_steps": 38160, "loss": 0.4155, "lr": 1.4141142359314074e-09, "epoch": 19.986897274633122, "percentage": 99.93, "elapsed_time": "1:37:39", "remaining_time": "0:00:03", "throughput": 4249.48, "total_tokens": 24899296} {"current_steps": 38140, "total_steps": 38160, "loss": 0.386, "lr": 9.22521420476663e-10, "epoch": 19.9895178197065, "percentage": 99.95, "elapsed_time": "1:37:40", "remaining_time": "0:00:03", "throughput": 4249.5, "total_tokens": 24902432} {"current_steps": 38145, "total_steps": 38160, "loss": 0.4007, "lr": 5.355227077341596e-10, "epoch": 19.992138364779873, "percentage": 99.96, "elapsed_time": "1:37:40", "remaining_time": "0:00:02", "throughput": 4249.53, "total_tokens": 24905696} {"current_steps": 38150, "total_steps": 38160, "loss": 0.3734, "lr": 2.5311817863915566e-10, "epoch": 19.99475890985325, "percentage": 99.97, "elapsed_time": "1:37:41", "remaining_time": "0:00:01", "throughput": 4249.54, "total_tokens": 24908672} {"current_steps": 38155, "total_steps": 38160, "loss": 0.496, "lr": 7.53078923110273e-11, "epoch": 19.997379454926623, "percentage": 99.99, "elapsed_time": "1:37:42", "remaining_time": "0:00:00", "throughput": 4249.54, "total_tokens": 24911552} {"current_steps": 38160, "total_steps": 38160, "loss": 0.3567, "lr": 2.0918859422458526e-12, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "1:37:42", "remaining_time": "0:00:00", "throughput": 4249.37, "total_tokens": 24913312} {"current_steps": 38160, "total_steps": 38160, "eval_loss": 0.49418532848358154, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "1:37:56", "remaining_time": "0:00:00", "throughput": 4239.43, "total_tokens": 24913312} {"current_steps": 38160, "total_steps": 38160, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "1:37:58", "remaining_time": "0:00:00", "throughput": 4238.31, "total_tokens": 24913312}