{"current_steps": 5, "total_steps": 38160, "loss": 4.3366, "lr": 1.0482180293501048e-06, "epoch": 0.002620545073375262, "percentage": 0.01, "elapsed_time": "0:00:01", "remaining_time": "3:07:18", "throughput": 2216.28, "total_tokens": 3264} {"current_steps": 10, "total_steps": 38160, "loss": 4.3961, "lr": 2.358490566037736e-06, "epoch": 0.005241090146750524, "percentage": 0.03, "elapsed_time": "0:00:02", "remaining_time": "2:14:55", "throughput": 2774.8, "total_tokens": 5888} {"current_steps": 15, "total_steps": 38160, "loss": 4.3377, "lr": 3.668763102725367e-06, "epoch": 0.007861635220125786, "percentage": 0.04, "elapsed_time": "0:00:02", "remaining_time": "1:57:10", "throughput": 3067.47, "total_tokens": 8480} {"current_steps": 20, "total_steps": 38160, "loss": 3.2407, "lr": 4.979035639412998e-06, "epoch": 0.010482180293501049, "percentage": 0.05, "elapsed_time": "0:00:03", "remaining_time": "1:49:54", "throughput": 3322.21, "total_tokens": 11488} {"current_steps": 25, "total_steps": 38160, "loss": 2.08, "lr": 6.289308176100629e-06, "epoch": 0.01310272536687631, "percentage": 0.07, "elapsed_time": "0:00:04", "remaining_time": "1:46:51", "throughput": 3540.33, "total_tokens": 14880} {"current_steps": 30, "total_steps": 38160, "loss": 1.0257, "lr": 7.59958071278826e-06, "epoch": 0.015723270440251572, "percentage": 0.08, "elapsed_time": "0:00:04", "remaining_time": "1:45:36", "throughput": 3728.97, "total_tokens": 18592} {"current_steps": 35, "total_steps": 38160, "loss": 0.8789, "lr": 8.90985324947589e-06, "epoch": 0.018343815513626835, "percentage": 0.09, "elapsed_time": "0:00:05", "remaining_time": "1:42:52", "throughput": 3806.28, "total_tokens": 21568} {"current_steps": 40, "total_steps": 38160, "loss": 0.7281, "lr": 1.0220125786163522e-05, "epoch": 0.020964360587002098, "percentage": 0.1, "elapsed_time": "0:00:06", "remaining_time": "1:40:17", "throughput": 3826.35, "total_tokens": 24160} {"current_steps": 45, "total_steps": 38160, "loss": 0.7915, "lr": 1.1530398322851153e-05, "epoch": 0.02358490566037736, "percentage": 0.12, "elapsed_time": "0:00:07", "remaining_time": "1:38:53", "throughput": 3878.35, "total_tokens": 27168} {"current_steps": 50, "total_steps": 38160, "loss": 0.6498, "lr": 1.2840670859538784e-05, "epoch": 0.02620545073375262, "percentage": 0.13, "elapsed_time": "0:00:07", "remaining_time": "1:37:41", "throughput": 3911.3, "total_tokens": 30080} {"current_steps": 55, "total_steps": 38160, "loss": 0.7485, "lr": 1.4150943396226415e-05, "epoch": 0.028825995807127882, "percentage": 0.14, "elapsed_time": "0:00:08", "remaining_time": "1:36:10", "throughput": 3915.27, "total_tokens": 32608} {"current_steps": 60, "total_steps": 38160, "loss": 0.7152, "lr": 1.5461215932914046e-05, "epoch": 0.031446540880503145, "percentage": 0.16, "elapsed_time": "0:00:09", "remaining_time": "1:36:42", "throughput": 3988.73, "total_tokens": 36448} {"current_steps": 65, "total_steps": 38160, "loss": 0.4345, "lr": 1.6771488469601677e-05, "epoch": 0.034067085953878404, "percentage": 0.17, "elapsed_time": "0:00:09", "remaining_time": "1:35:21", "throughput": 3989.06, "total_tokens": 38944} {"current_steps": 70, "total_steps": 38160, "loss": 0.5775, "lr": 1.8081761006289308e-05, "epoch": 0.03668763102725367, "percentage": 0.18, "elapsed_time": "0:00:10", "remaining_time": "1:34:54", "throughput": 3996.32, "total_tokens": 41824} {"current_steps": 75, "total_steps": 38160, "loss": 0.5619, "lr": 1.9392033542976942e-05, "epoch": 0.03930817610062893, "percentage": 0.2, "elapsed_time": "0:00:11", "remaining_time": "1:34:30", "throughput": 4020.44, "total_tokens": 44896} {"current_steps": 80, "total_steps": 38160, "loss": 0.5432, "lr": 2.070230607966457e-05, "epoch": 0.041928721174004195, "percentage": 0.21, "elapsed_time": "0:00:11", "remaining_time": "1:33:44", "throughput": 4030.0, "total_tokens": 47616} {"current_steps": 85, "total_steps": 38160, "loss": 0.6556, "lr": 2.20125786163522e-05, "epoch": 0.044549266247379454, "percentage": 0.22, "elapsed_time": "0:00:12", "remaining_time": "1:33:08", "throughput": 4037.26, "total_tokens": 50368} {"current_steps": 90, "total_steps": 38160, "loss": 0.6779, "lr": 2.3322851153039832e-05, "epoch": 0.04716981132075472, "percentage": 0.24, "elapsed_time": "0:00:13", "remaining_time": "1:33:28", "throughput": 4073.76, "total_tokens": 54016} {"current_steps": 95, "total_steps": 38160, "loss": 0.4229, "lr": 2.4633123689727463e-05, "epoch": 0.04979035639412998, "percentage": 0.25, "elapsed_time": "0:00:14", "remaining_time": "1:33:52", "throughput": 4118.36, "total_tokens": 57888} {"current_steps": 100, "total_steps": 38160, "loss": 0.5745, "lr": 2.5943396226415097e-05, "epoch": 0.05241090146750524, "percentage": 0.26, "elapsed_time": "0:00:14", "remaining_time": "1:33:34", "throughput": 4136.39, "total_tokens": 61024} {"current_steps": 105, "total_steps": 38160, "loss": 0.5809, "lr": 2.7253668763102725e-05, "epoch": 0.055031446540880505, "percentage": 0.28, "elapsed_time": "0:00:15", "remaining_time": "1:33:42", "throughput": 4168.55, "total_tokens": 64672} {"current_steps": 110, "total_steps": 38160, "loss": 0.5085, "lr": 2.8563941299790356e-05, "epoch": 0.057651991614255764, "percentage": 0.29, "elapsed_time": "0:00:16", "remaining_time": "1:33:22", "throughput": 4174.8, "total_tokens": 67616} {"current_steps": 115, "total_steps": 38160, "loss": 0.521, "lr": 2.987421383647799e-05, "epoch": 0.06027253668763103, "percentage": 0.3, "elapsed_time": "0:00:16", "remaining_time": "1:33:30", "throughput": 4200.05, "total_tokens": 71232} {"current_steps": 120, "total_steps": 38160, "loss": 0.4112, "lr": 3.118448637316562e-05, "epoch": 0.06289308176100629, "percentage": 0.31, "elapsed_time": "0:00:17", "remaining_time": "1:33:41", "throughput": 4222.73, "total_tokens": 74880} {"current_steps": 125, "total_steps": 38160, "loss": 0.5647, "lr": 3.2494758909853245e-05, "epoch": 0.06551362683438156, "percentage": 0.33, "elapsed_time": "0:00:18", "remaining_time": "1:33:46", "throughput": 4241.63, "total_tokens": 78432} {"current_steps": 130, "total_steps": 38160, "loss": 0.4921, "lr": 3.380503144654088e-05, "epoch": 0.06813417190775681, "percentage": 0.34, "elapsed_time": "0:00:19", "remaining_time": "1:33:17", "throughput": 4237.51, "total_tokens": 81088} {"current_steps": 135, "total_steps": 38160, "loss": 0.5339, "lr": 3.5115303983228514e-05, "epoch": 0.07075471698113207, "percentage": 0.35, "elapsed_time": "0:00:19", "remaining_time": "1:33:29", "throughput": 4262.7, "total_tokens": 84896} {"current_steps": 140, "total_steps": 38160, "loss": 0.5942, "lr": 3.642557651991614e-05, "epoch": 0.07337526205450734, "percentage": 0.37, "elapsed_time": "0:00:20", "remaining_time": "1:33:50", "throughput": 4279.87, "total_tokens": 88736} {"current_steps": 145, "total_steps": 38160, "loss": 0.8808, "lr": 3.7735849056603776e-05, "epoch": 0.0759958071278826, "percentage": 0.38, "elapsed_time": "0:00:21", "remaining_time": "1:33:52", "throughput": 4292.92, "total_tokens": 92224} {"current_steps": 150, "total_steps": 38160, "loss": 0.5362, "lr": 3.90461215932914e-05, "epoch": 0.07861635220125786, "percentage": 0.39, "elapsed_time": "0:00:22", "remaining_time": "1:33:37", "throughput": 4293.23, "total_tokens": 95168} {"current_steps": 155, "total_steps": 38160, "loss": 0.5562, "lr": 4.035639412997904e-05, "epoch": 0.08123689727463312, "percentage": 0.41, "elapsed_time": "0:00:22", "remaining_time": "1:33:50", "throughput": 4310.07, "total_tokens": 98976} {"current_steps": 160, "total_steps": 38160, "loss": 0.469, "lr": 4.1666666666666665e-05, "epoch": 0.08385744234800839, "percentage": 0.42, "elapsed_time": "0:00:23", "remaining_time": "1:33:44", "throughput": 4314.39, "total_tokens": 102176} {"current_steps": 165, "total_steps": 38160, "loss": 0.464, "lr": 4.29769392033543e-05, "epoch": 0.08647798742138364, "percentage": 0.43, "elapsed_time": "0:00:24", "remaining_time": "1:33:52", "throughput": 4326.48, "total_tokens": 105824} {"current_steps": 170, "total_steps": 38160, "loss": 0.5105, "lr": 4.4287211740041934e-05, "epoch": 0.08909853249475891, "percentage": 0.45, "elapsed_time": "0:00:25", "remaining_time": "1:33:31", "throughput": 4321.19, "total_tokens": 108512} {"current_steps": 175, "total_steps": 38160, "loss": 0.523, "lr": 4.5597484276729555e-05, "epoch": 0.09171907756813417, "percentage": 0.46, "elapsed_time": "0:00:25", "remaining_time": "1:33:31", "throughput": 4327.47, "total_tokens": 111872} {"current_steps": 180, "total_steps": 38160, "loss": 0.4721, "lr": 4.690775681341719e-05, "epoch": 0.09433962264150944, "percentage": 0.47, "elapsed_time": "0:00:26", "remaining_time": "1:33:35", "throughput": 4341.91, "total_tokens": 115552} {"current_steps": 185, "total_steps": 38160, "loss": 0.6313, "lr": 4.8218029350104823e-05, "epoch": 0.09696016771488469, "percentage": 0.48, "elapsed_time": "0:00:27", "remaining_time": "1:33:31", "throughput": 4345.34, "total_tokens": 118784} {"current_steps": 190, "total_steps": 38160, "loss": 0.4303, "lr": 4.952830188679246e-05, "epoch": 0.09958071278825996, "percentage": 0.5, "elapsed_time": "0:00:28", "remaining_time": "1:33:39", "throughput": 4357.49, "total_tokens": 122528} {"current_steps": 195, "total_steps": 38160, "loss": 0.5259, "lr": 5.0838574423480085e-05, "epoch": 0.10220125786163523, "percentage": 0.51, "elapsed_time": "0:00:28", "remaining_time": "1:33:16", "throughput": 4349.25, "total_tokens": 125024} {"current_steps": 200, "total_steps": 38160, "loss": 0.5996, "lr": 5.214884696016771e-05, "epoch": 0.10482180293501048, "percentage": 0.52, "elapsed_time": "0:00:29", "remaining_time": "1:33:09", "throughput": 4349.31, "total_tokens": 128096} {"current_steps": 205, "total_steps": 38160, "loss": 0.6745, "lr": 5.345911949685535e-05, "epoch": 0.10744234800838574, "percentage": 0.54, "elapsed_time": "0:00:30", "remaining_time": "1:32:46", "throughput": 4340.7, "total_tokens": 130496} {"current_steps": 210, "total_steps": 38160, "loss": 0.5892, "lr": 5.4769392033542975e-05, "epoch": 0.11006289308176101, "percentage": 0.55, "elapsed_time": "0:00:30", "remaining_time": "1:32:29", "throughput": 4335.98, "total_tokens": 133152} {"current_steps": 215, "total_steps": 38160, "loss": 0.6939, "lr": 5.607966457023061e-05, "epoch": 0.11268343815513626, "percentage": 0.56, "elapsed_time": "0:00:31", "remaining_time": "1:32:26", "throughput": 4339.45, "total_tokens": 136384} {"current_steps": 220, "total_steps": 38160, "loss": 0.6202, "lr": 5.7389937106918244e-05, "epoch": 0.11530398322851153, "percentage": 0.58, "elapsed_time": "0:00:32", "remaining_time": "1:32:19", "throughput": 4341.18, "total_tokens": 139456} {"current_steps": 225, "total_steps": 38160, "loss": 0.626, "lr": 5.870020964360587e-05, "epoch": 0.1179245283018868, "percentage": 0.59, "elapsed_time": "0:00:32", "remaining_time": "1:32:19", "throughput": 4346.4, "total_tokens": 142816} {"current_steps": 230, "total_steps": 38160, "loss": 0.5322, "lr": 6.00104821802935e-05, "epoch": 0.12054507337526206, "percentage": 0.6, "elapsed_time": "0:00:33", "remaining_time": "1:32:09", "throughput": 4345.53, "total_tokens": 145696} {"current_steps": 235, "total_steps": 38160, "loss": 0.6419, "lr": 6.132075471698113e-05, "epoch": 0.12316561844863731, "percentage": 0.62, "elapsed_time": "0:00:34", "remaining_time": "1:32:08", "throughput": 4350.41, "total_tokens": 149024} {"current_steps": 240, "total_steps": 38160, "loss": 0.5641, "lr": 6.263102725366875e-05, "epoch": 0.12578616352201258, "percentage": 0.63, "elapsed_time": "0:00:34", "remaining_time": "1:31:58", "throughput": 4347.37, "total_tokens": 151840} {"current_steps": 245, "total_steps": 38160, "loss": 0.6886, "lr": 6.39412997903564e-05, "epoch": 0.12840670859538783, "percentage": 0.64, "elapsed_time": "0:00:35", "remaining_time": "1:32:04", "throughput": 4354.86, "total_tokens": 155456} {"current_steps": 250, "total_steps": 38160, "loss": 0.5696, "lr": 6.525157232704402e-05, "epoch": 0.1310272536687631, "percentage": 0.66, "elapsed_time": "0:00:36", "remaining_time": "1:31:59", "throughput": 4355.42, "total_tokens": 158528} {"current_steps": 255, "total_steps": 38160, "loss": 0.5468, "lr": 6.656184486373166e-05, "epoch": 0.13364779874213836, "percentage": 0.67, "elapsed_time": "0:00:37", "remaining_time": "1:33:36", "throughput": 4406.81, "total_tokens": 166496} {"current_steps": 260, "total_steps": 38160, "loss": 0.5205, "lr": 6.787211740041929e-05, "epoch": 0.13626834381551362, "percentage": 0.68, "elapsed_time": "0:00:38", "remaining_time": "1:33:29", "throughput": 4406.65, "total_tokens": 169568} {"current_steps": 265, "total_steps": 38160, "loss": 0.6078, "lr": 6.918238993710691e-05, "epoch": 0.1388888888888889, "percentage": 0.69, "elapsed_time": "0:00:39", "remaining_time": "1:33:24", "throughput": 4406.91, "total_tokens": 172704} {"current_steps": 270, "total_steps": 38160, "loss": 0.7384, "lr": 7.049266247379455e-05, "epoch": 0.14150943396226415, "percentage": 0.71, "elapsed_time": "0:00:39", "remaining_time": "1:33:30", "throughput": 4414.05, "total_tokens": 176480} {"current_steps": 275, "total_steps": 38160, "loss": 0.5469, "lr": 7.180293501048218e-05, "epoch": 0.1441299790356394, "percentage": 0.72, "elapsed_time": "0:00:40", "remaining_time": "1:33:57", "throughput": 4433.35, "total_tokens": 181408} {"current_steps": 280, "total_steps": 38160, "loss": 0.5923, "lr": 7.311320754716982e-05, "epoch": 0.14675052410901468, "percentage": 0.73, "elapsed_time": "0:00:41", "remaining_time": "1:33:54", "throughput": 4435.18, "total_tokens": 184736} {"current_steps": 285, "total_steps": 38160, "loss": 0.5122, "lr": 7.442348008385745e-05, "epoch": 0.14937106918238993, "percentage": 0.75, "elapsed_time": "0:00:42", "remaining_time": "1:33:56", "throughput": 4440.69, "total_tokens": 188352} {"current_steps": 290, "total_steps": 38160, "loss": 0.4922, "lr": 7.573375262054507e-05, "epoch": 0.1519916142557652, "percentage": 0.76, "elapsed_time": "0:00:43", "remaining_time": "1:34:26", "throughput": 4457.2, "total_tokens": 193408} {"current_steps": 295, "total_steps": 38160, "loss": 0.4207, "lr": 7.70440251572327e-05, "epoch": 0.15461215932914046, "percentage": 0.77, "elapsed_time": "0:00:44", "remaining_time": "1:34:17", "throughput": 4455.63, "total_tokens": 196384} {"current_steps": 300, "total_steps": 38160, "loss": 0.6115, "lr": 7.835429769392034e-05, "epoch": 0.15723270440251572, "percentage": 0.79, "elapsed_time": "0:00:44", "remaining_time": "1:34:09", "throughput": 4453.36, "total_tokens": 199360} {"current_steps": 305, "total_steps": 38160, "loss": 0.5228, "lr": 7.966457023060797e-05, "epoch": 0.159853249475891, "percentage": 0.8, "elapsed_time": "0:00:45", "remaining_time": "1:34:10", "throughput": 4455.43, "total_tokens": 202848} {"current_steps": 310, "total_steps": 38160, "loss": 0.4791, "lr": 8.09748427672956e-05, "epoch": 0.16247379454926625, "percentage": 0.81, "elapsed_time": "0:00:46", "remaining_time": "1:34:25", "throughput": 4463.62, "total_tokens": 207104} {"current_steps": 315, "total_steps": 38160, "loss": 0.637, "lr": 8.228511530398323e-05, "epoch": 0.1650943396226415, "percentage": 0.83, "elapsed_time": "0:00:47", "remaining_time": "1:34:09", "throughput": 4457.23, "total_tokens": 209600} {"current_steps": 320, "total_steps": 38160, "loss": 0.611, "lr": 8.359538784067086e-05, "epoch": 0.16771488469601678, "percentage": 0.84, "elapsed_time": "0:00:47", "remaining_time": "1:34:11", "throughput": 4459.71, "total_tokens": 213152} {"current_steps": 325, "total_steps": 38160, "loss": 0.7027, "lr": 8.490566037735848e-05, "epoch": 0.17033542976939203, "percentage": 0.85, "elapsed_time": "0:00:48", "remaining_time": "1:33:56", "throughput": 4453.48, "total_tokens": 215616} {"current_steps": 330, "total_steps": 38160, "loss": 0.6089, "lr": 8.621593291404613e-05, "epoch": 0.17295597484276728, "percentage": 0.86, "elapsed_time": "0:00:49", "remaining_time": "1:33:48", "throughput": 4451.0, "total_tokens": 218528} {"current_steps": 335, "total_steps": 38160, "loss": 0.4405, "lr": 8.752620545073375e-05, "epoch": 0.17557651991614256, "percentage": 0.88, "elapsed_time": "0:00:49", "remaining_time": "1:33:46", "throughput": 4451.53, "total_tokens": 221824} {"current_steps": 340, "total_steps": 38160, "loss": 0.5055, "lr": 8.883647798742137e-05, "epoch": 0.17819706498951782, "percentage": 0.89, "elapsed_time": "0:00:50", "remaining_time": "1:33:46", "throughput": 4453.62, "total_tokens": 225280} {"current_steps": 345, "total_steps": 38160, "loss": 0.4572, "lr": 9.014675052410902e-05, "epoch": 0.18081761006289307, "percentage": 0.9, "elapsed_time": "0:00:51", "remaining_time": "1:34:20", "throughput": 4471.0, "total_tokens": 230912} {"current_steps": 350, "total_steps": 38160, "loss": 0.5646, "lr": 9.145702306079664e-05, "epoch": 0.18343815513626835, "percentage": 0.92, "elapsed_time": "0:00:52", "remaining_time": "1:34:22", "throughput": 4475.13, "total_tokens": 234592} {"current_steps": 355, "total_steps": 38160, "loss": 0.493, "lr": 9.276729559748428e-05, "epoch": 0.1860587002096436, "percentage": 0.93, "elapsed_time": "0:00:53", "remaining_time": "1:34:16", "throughput": 4473.31, "total_tokens": 237600} {"current_steps": 360, "total_steps": 38160, "loss": 0.6188, "lr": 9.407756813417191e-05, "epoch": 0.18867924528301888, "percentage": 0.94, "elapsed_time": "0:00:53", "remaining_time": "1:34:16", "throughput": 4475.5, "total_tokens": 241088} {"current_steps": 365, "total_steps": 38160, "loss": 0.5569, "lr": 9.538784067085953e-05, "epoch": 0.19129979035639413, "percentage": 0.96, "elapsed_time": "0:00:54", "remaining_time": "1:34:01", "throughput": 4469.52, "total_tokens": 243520} {"current_steps": 370, "total_steps": 38160, "loss": 0.742, "lr": 9.669811320754718e-05, "epoch": 0.19392033542976939, "percentage": 0.97, "elapsed_time": "0:00:55", "remaining_time": "1:34:07", "throughput": 4474.94, "total_tokens": 247456} {"current_steps": 375, "total_steps": 38160, "loss": 0.4974, "lr": 9.80083857442348e-05, "epoch": 0.19654088050314467, "percentage": 0.98, "elapsed_time": "0:00:56", "remaining_time": "1:34:05", "throughput": 4476.09, "total_tokens": 250784} {"current_steps": 380, "total_steps": 38160, "loss": 0.542, "lr": 9.931865828092243e-05, "epoch": 0.19916142557651992, "percentage": 1.0, "elapsed_time": "0:00:56", "remaining_time": "1:34:15", "throughput": 4483.88, "total_tokens": 255040} {"current_steps": 385, "total_steps": 38160, "loss": 0.6188, "lr": 0.00010062893081761007, "epoch": 0.20178197064989517, "percentage": 1.01, "elapsed_time": "0:00:57", "remaining_time": "1:34:11", "throughput": 4483.57, "total_tokens": 258240} {"current_steps": 390, "total_steps": 38160, "loss": 0.4524, "lr": 0.0001019392033542977, "epoch": 0.20440251572327045, "percentage": 1.02, "elapsed_time": "0:00:58", "remaining_time": "1:34:04", "throughput": 4480.67, "total_tokens": 261152} {"current_steps": 395, "total_steps": 38160, "loss": 0.5425, "lr": 0.00010324947589098532, "epoch": 0.2070230607966457, "percentage": 1.04, "elapsed_time": "0:00:59", "remaining_time": "1:34:02", "throughput": 4482.12, "total_tokens": 264544} {"current_steps": 400, "total_steps": 38160, "loss": 0.6098, "lr": 0.00010455974842767296, "epoch": 0.20964360587002095, "percentage": 1.05, "elapsed_time": "0:00:59", "remaining_time": "1:33:52", "throughput": 4477.24, "total_tokens": 267136} {"current_steps": 405, "total_steps": 38160, "loss": 0.4776, "lr": 0.00010587002096436059, "epoch": 0.21226415094339623, "percentage": 1.06, "elapsed_time": "0:01:00", "remaining_time": "1:33:50", "throughput": 4477.83, "total_tokens": 270464} {"current_steps": 410, "total_steps": 38160, "loss": 0.5049, "lr": 0.00010718029350104821, "epoch": 0.2148846960167715, "percentage": 1.07, "elapsed_time": "0:01:01", "remaining_time": "1:33:57", "throughput": 4483.44, "total_tokens": 274528} {"current_steps": 415, "total_steps": 38160, "loss": 0.4909, "lr": 0.00010849056603773586, "epoch": 0.21750524109014674, "percentage": 1.09, "elapsed_time": "0:01:01", "remaining_time": "1:33:51", "throughput": 4479.8, "total_tokens": 277376} {"current_steps": 420, "total_steps": 38160, "loss": 0.395, "lr": 0.00010980083857442348, "epoch": 0.22012578616352202, "percentage": 1.1, "elapsed_time": "0:01:02", "remaining_time": "1:33:38", "throughput": 4472.27, "total_tokens": 279616} {"current_steps": 425, "total_steps": 38160, "loss": 0.4555, "lr": 0.0001111111111111111, "epoch": 0.22274633123689727, "percentage": 1.11, "elapsed_time": "0:01:03", "remaining_time": "1:33:33", "throughput": 4470.51, "total_tokens": 282656} {"current_steps": 430, "total_steps": 38160, "loss": 0.5687, "lr": 0.00011242138364779875, "epoch": 0.22536687631027252, "percentage": 1.13, "elapsed_time": "0:01:03", "remaining_time": "1:33:27", "throughput": 4469.01, "total_tokens": 285600} {"current_steps": 435, "total_steps": 38160, "loss": 0.395, "lr": 0.00011373165618448637, "epoch": 0.2279874213836478, "percentage": 1.14, "elapsed_time": "0:01:04", "remaining_time": "1:33:32", "throughput": 4474.17, "total_tokens": 289568} {"current_steps": 440, "total_steps": 38160, "loss": 0.592, "lr": 0.00011504192872117402, "epoch": 0.23060796645702306, "percentage": 1.15, "elapsed_time": "0:01:05", "remaining_time": "1:33:30", "throughput": 4473.79, "total_tokens": 292768} {"current_steps": 445, "total_steps": 38160, "loss": 0.6336, "lr": 0.00011635220125786164, "epoch": 0.23322851153039834, "percentage": 1.17, "elapsed_time": "0:01:06", "remaining_time": "1:33:21", "throughput": 4470.61, "total_tokens": 295456} {"current_steps": 450, "total_steps": 38160, "loss": 0.5672, "lr": 0.00011766247379454926, "epoch": 0.2358490566037736, "percentage": 1.18, "elapsed_time": "0:01:06", "remaining_time": "1:33:27", "throughput": 4475.96, "total_tokens": 299488} {"current_steps": 455, "total_steps": 38160, "loss": 0.4676, "lr": 0.00011897274633123691, "epoch": 0.23846960167714884, "percentage": 1.19, "elapsed_time": "0:01:07", "remaining_time": "1:33:28", "throughput": 4476.61, "total_tokens": 302976} {"current_steps": 460, "total_steps": 38160, "loss": 0.5342, "lr": 0.00012028301886792453, "epoch": 0.24109014675052412, "percentage": 1.21, "elapsed_time": "0:01:08", "remaining_time": "1:33:28", "throughput": 4479.35, "total_tokens": 306560} {"current_steps": 465, "total_steps": 38160, "loss": 0.4462, "lr": 0.00012159329140461216, "epoch": 0.24371069182389937, "percentage": 1.22, "elapsed_time": "0:01:09", "remaining_time": "1:33:23", "throughput": 4477.61, "total_tokens": 309536} {"current_steps": 470, "total_steps": 38160, "loss": 0.5008, "lr": 0.0001229035639412998, "epoch": 0.24633123689727462, "percentage": 1.23, "elapsed_time": "0:01:09", "remaining_time": "1:33:18", "throughput": 4477.11, "total_tokens": 312576} {"current_steps": 475, "total_steps": 38160, "loss": 0.4987, "lr": 0.00012421383647798743, "epoch": 0.2489517819706499, "percentage": 1.24, "elapsed_time": "0:01:10", "remaining_time": "1:33:13", "throughput": 4476.34, "total_tokens": 315616} {"current_steps": 480, "total_steps": 38160, "loss": 0.5167, "lr": 0.00012552410901467507, "epoch": 0.25157232704402516, "percentage": 1.26, "elapsed_time": "0:01:11", "remaining_time": "1:33:13", "throughput": 4478.42, "total_tokens": 319136} {"current_steps": 485, "total_steps": 38160, "loss": 0.6978, "lr": 0.00012683438155136267, "epoch": 0.25419287211740044, "percentage": 1.27, "elapsed_time": "0:01:11", "remaining_time": "1:33:02", "throughput": 4471.92, "total_tokens": 321376} {"current_steps": 490, "total_steps": 38160, "loss": 0.5501, "lr": 0.0001281446540880503, "epoch": 0.25681341719077566, "percentage": 1.28, "elapsed_time": "0:01:12", "remaining_time": "1:33:02", "throughput": 4474.76, "total_tokens": 324928} {"current_steps": 495, "total_steps": 38160, "loss": 0.6535, "lr": 0.00012945492662473794, "epoch": 0.25943396226415094, "percentage": 1.3, "elapsed_time": "0:01:13", "remaining_time": "1:33:11", "throughput": 4480.87, "total_tokens": 329248} {"current_steps": 500, "total_steps": 38160, "loss": 0.6412, "lr": 0.00013076519916142558, "epoch": 0.2620545073375262, "percentage": 1.31, "elapsed_time": "0:01:14", "remaining_time": "1:33:06", "throughput": 4480.1, "total_tokens": 332288} {"current_steps": 505, "total_steps": 38160, "loss": 0.5217, "lr": 0.0001320754716981132, "epoch": 0.26467505241090145, "percentage": 1.32, "elapsed_time": "0:01:14", "remaining_time": "1:32:56", "throughput": 4476.05, "total_tokens": 334752} {"current_steps": 510, "total_steps": 38160, "loss": 0.5572, "lr": 0.00013338574423480085, "epoch": 0.2672955974842767, "percentage": 1.34, "elapsed_time": "0:01:15", "remaining_time": "1:32:53", "throughput": 4475.13, "total_tokens": 337856} {"current_steps": 515, "total_steps": 38160, "loss": 0.6406, "lr": 0.00013469601677148845, "epoch": 0.269916142557652, "percentage": 1.35, "elapsed_time": "0:01:16", "remaining_time": "1:32:57", "throughput": 4479.04, "total_tokens": 341792} {"current_steps": 520, "total_steps": 38160, "loss": 0.6394, "lr": 0.0001360062893081761, "epoch": 0.27253668763102723, "percentage": 1.36, "elapsed_time": "0:01:16", "remaining_time": "1:32:53", "throughput": 4477.69, "total_tokens": 344768} {"current_steps": 525, "total_steps": 38160, "loss": 0.4626, "lr": 0.00013731656184486375, "epoch": 0.2751572327044025, "percentage": 1.38, "elapsed_time": "0:01:17", "remaining_time": "1:32:45", "throughput": 4474.22, "total_tokens": 347360} {"current_steps": 530, "total_steps": 38160, "loss": 0.4874, "lr": 0.00013862683438155136, "epoch": 0.2777777777777778, "percentage": 1.39, "elapsed_time": "0:01:18", "remaining_time": "1:32:43", "throughput": 4474.55, "total_tokens": 350592} {"current_steps": 535, "total_steps": 38160, "loss": 0.491, "lr": 0.000139937106918239, "epoch": 0.280398322851153, "percentage": 1.4, "elapsed_time": "0:01:19", "remaining_time": "1:32:39", "throughput": 4472.75, "total_tokens": 353568} {"current_steps": 540, "total_steps": 38160, "loss": 0.6103, "lr": 0.00014124737945492663, "epoch": 0.2830188679245283, "percentage": 1.42, "elapsed_time": "0:01:19", "remaining_time": "1:32:32", "throughput": 4470.57, "total_tokens": 356320} {"current_steps": 545, "total_steps": 38160, "loss": 0.5264, "lr": 0.00014255765199161423, "epoch": 0.2856394129979036, "percentage": 1.43, "elapsed_time": "0:01:20", "remaining_time": "1:32:33", "throughput": 4473.59, "total_tokens": 359968} {"current_steps": 550, "total_steps": 38160, "loss": 0.4495, "lr": 0.0001438679245283019, "epoch": 0.2882599580712788, "percentage": 1.44, "elapsed_time": "0:01:21", "remaining_time": "1:32:27", "throughput": 4471.39, "total_tokens": 362752} {"current_steps": 555, "total_steps": 38160, "loss": 0.5891, "lr": 0.00014517819706498953, "epoch": 0.2908805031446541, "percentage": 1.45, "elapsed_time": "0:01:21", "remaining_time": "1:32:19", "throughput": 4468.24, "total_tokens": 365312} {"current_steps": 560, "total_steps": 38160, "loss": 0.4835, "lr": 0.00014648846960167716, "epoch": 0.29350104821802936, "percentage": 1.47, "elapsed_time": "0:01:22", "remaining_time": "1:32:20", "throughput": 4470.41, "total_tokens": 368896} {"current_steps": 565, "total_steps": 38160, "loss": 0.5361, "lr": 0.00014779874213836477, "epoch": 0.29612159329140464, "percentage": 1.48, "elapsed_time": "0:01:23", "remaining_time": "1:32:14", "throughput": 4468.48, "total_tokens": 371648} {"current_steps": 570, "total_steps": 38160, "loss": 0.5799, "lr": 0.00014910901467505243, "epoch": 0.29874213836477986, "percentage": 1.49, "elapsed_time": "0:01:23", "remaining_time": "1:32:12", "throughput": 4468.2, "total_tokens": 374848} {"current_steps": 575, "total_steps": 38160, "loss": 0.5398, "lr": 0.00015041928721174007, "epoch": 0.30136268343815514, "percentage": 1.51, "elapsed_time": "0:01:24", "remaining_time": "1:32:03", "throughput": 4463.68, "total_tokens": 377184} {"current_steps": 580, "total_steps": 38160, "loss": 0.6253, "lr": 0.00015172955974842767, "epoch": 0.3039832285115304, "percentage": 1.52, "elapsed_time": "0:01:25", "remaining_time": "1:32:10", "throughput": 4469.9, "total_tokens": 381504} {"current_steps": 585, "total_steps": 38160, "loss": 0.5353, "lr": 0.0001530398322851153, "epoch": 0.30660377358490565, "percentage": 1.53, "elapsed_time": "0:01:26", "remaining_time": "1:32:07", "throughput": 4469.61, "total_tokens": 384672} {"current_steps": 590, "total_steps": 38160, "loss": 0.5229, "lr": 0.00015435010482180294, "epoch": 0.30922431865828093, "percentage": 1.55, "elapsed_time": "0:01:26", "remaining_time": "1:32:19", "throughput": 4476.18, "total_tokens": 389376} {"current_steps": 595, "total_steps": 38160, "loss": 0.589, "lr": 0.00015566037735849058, "epoch": 0.3118448637316562, "percentage": 1.56, "elapsed_time": "0:01:27", "remaining_time": "1:32:17", "throughput": 4475.4, "total_tokens": 392512} {"current_steps": 600, "total_steps": 38160, "loss": 0.5162, "lr": 0.0001569706498951782, "epoch": 0.31446540880503143, "percentage": 1.57, "elapsed_time": "0:01:28", "remaining_time": "1:32:23", "throughput": 4481.71, "total_tokens": 396864} {"current_steps": 605, "total_steps": 38160, "loss": 0.4766, "lr": 0.00015828092243186584, "epoch": 0.3170859538784067, "percentage": 1.59, "elapsed_time": "0:01:29", "remaining_time": "1:32:16", "throughput": 4479.38, "total_tokens": 399520} {"current_steps": 610, "total_steps": 38160, "loss": 0.4859, "lr": 0.00015959119496855345, "epoch": 0.319706498951782, "percentage": 1.6, "elapsed_time": "0:01:29", "remaining_time": "1:32:12", "throughput": 4478.77, "total_tokens": 402560} {"current_steps": 615, "total_steps": 38160, "loss": 0.6413, "lr": 0.00016090146750524109, "epoch": 0.3223270440251572, "percentage": 1.61, "elapsed_time": "0:01:30", "remaining_time": "1:32:14", "throughput": 4480.71, "total_tokens": 406240} {"current_steps": 620, "total_steps": 38160, "loss": 0.5483, "lr": 0.00016221174004192875, "epoch": 0.3249475890985325, "percentage": 1.62, "elapsed_time": "0:01:31", "remaining_time": "1:32:08", "throughput": 4478.58, "total_tokens": 408960} {"current_steps": 625, "total_steps": 38160, "loss": 0.6812, "lr": 0.00016352201257861635, "epoch": 0.3275681341719078, "percentage": 1.64, "elapsed_time": "0:01:32", "remaining_time": "1:32:07", "throughput": 4479.0, "total_tokens": 412224} {"current_steps": 630, "total_steps": 38160, "loss": 0.4919, "lr": 0.000164832285115304, "epoch": 0.330188679245283, "percentage": 1.65, "elapsed_time": "0:01:32", "remaining_time": "1:32:04", "throughput": 4478.0, "total_tokens": 415296} {"current_steps": 635, "total_steps": 38160, "loss": 0.4547, "lr": 0.00016614255765199162, "epoch": 0.3328092243186583, "percentage": 1.66, "elapsed_time": "0:01:33", "remaining_time": "1:31:55", "throughput": 4473.36, "total_tokens": 417504} {"current_steps": 640, "total_steps": 38160, "loss": 0.5495, "lr": 0.00016745283018867923, "epoch": 0.33542976939203356, "percentage": 1.68, "elapsed_time": "0:01:33", "remaining_time": "1:31:50", "throughput": 4471.4, "total_tokens": 420288} {"current_steps": 645, "total_steps": 38160, "loss": 0.6852, "lr": 0.0001687631027253669, "epoch": 0.3380503144654088, "percentage": 1.69, "elapsed_time": "0:01:34", "remaining_time": "1:31:41", "throughput": 4466.98, "total_tokens": 422560} {"current_steps": 650, "total_steps": 38160, "loss": 0.6101, "lr": 0.00017007337526205453, "epoch": 0.34067085953878407, "percentage": 1.7, "elapsed_time": "0:01:35", "remaining_time": "1:31:38", "throughput": 4465.8, "total_tokens": 425472} {"current_steps": 655, "total_steps": 38160, "loss": 0.5264, "lr": 0.00017138364779874213, "epoch": 0.34329140461215935, "percentage": 1.72, "elapsed_time": "0:01:36", "remaining_time": "1:31:38", "throughput": 4467.79, "total_tokens": 429056} {"current_steps": 660, "total_steps": 38160, "loss": 0.492, "lr": 0.00017269392033542977, "epoch": 0.34591194968553457, "percentage": 1.73, "elapsed_time": "0:01:36", "remaining_time": "1:31:42", "throughput": 4471.28, "total_tokens": 433024} {"current_steps": 665, "total_steps": 38160, "loss": 0.5435, "lr": 0.0001740041928721174, "epoch": 0.34853249475890985, "percentage": 1.74, "elapsed_time": "0:01:37", "remaining_time": "1:31:37", "throughput": 4469.45, "total_tokens": 435776} {"current_steps": 670, "total_steps": 38160, "loss": 0.5188, "lr": 0.00017531446540880504, "epoch": 0.35115303983228513, "percentage": 1.76, "elapsed_time": "0:01:38", "remaining_time": "1:31:31", "throughput": 4467.1, "total_tokens": 438432} {"current_steps": 675, "total_steps": 38160, "loss": 0.5188, "lr": 0.00017662473794549267, "epoch": 0.35377358490566035, "percentage": 1.77, "elapsed_time": "0:01:38", "remaining_time": "1:31:35", "throughput": 4470.71, "total_tokens": 442400} {"current_steps": 680, "total_steps": 38160, "loss": 0.6068, "lr": 0.0001779350104821803, "epoch": 0.35639412997903563, "percentage": 1.78, "elapsed_time": "0:01:39", "remaining_time": "1:31:35", "throughput": 4472.14, "total_tokens": 445888} {"current_steps": 685, "total_steps": 38160, "loss": 0.4774, "lr": 0.0001792452830188679, "epoch": 0.3590146750524109, "percentage": 1.8, "elapsed_time": "0:01:40", "remaining_time": "1:31:31", "throughput": 4471.35, "total_tokens": 448864} {"current_steps": 690, "total_steps": 38160, "loss": 0.6968, "lr": 0.00018055555555555555, "epoch": 0.36163522012578614, "percentage": 1.81, "elapsed_time": "0:01:41", "remaining_time": "1:31:34", "throughput": 4473.86, "total_tokens": 452640} {"current_steps": 695, "total_steps": 38160, "loss": 0.6116, "lr": 0.0001818658280922432, "epoch": 0.3642557651991614, "percentage": 1.82, "elapsed_time": "0:01:41", "remaining_time": "1:31:28", "throughput": 4471.43, "total_tokens": 455296} {"current_steps": 700, "total_steps": 38160, "loss": 0.5421, "lr": 0.00018317610062893082, "epoch": 0.3668763102725367, "percentage": 1.83, "elapsed_time": "0:01:42", "remaining_time": "1:31:23", "throughput": 4468.57, "total_tokens": 457888} {"current_steps": 705, "total_steps": 38160, "loss": 0.6139, "lr": 0.00018448637316561845, "epoch": 0.3694968553459119, "percentage": 1.85, "elapsed_time": "0:01:43", "remaining_time": "1:31:25", "throughput": 4470.91, "total_tokens": 461664} {"current_steps": 710, "total_steps": 38160, "loss": 0.6136, "lr": 0.00018579664570230608, "epoch": 0.3721174004192872, "percentage": 1.86, "elapsed_time": "0:01:43", "remaining_time": "1:31:20", "throughput": 4468.87, "total_tokens": 464352} {"current_steps": 715, "total_steps": 38160, "loss": 0.6077, "lr": 0.0001871069182389937, "epoch": 0.3747379454926625, "percentage": 1.87, "elapsed_time": "0:01:44", "remaining_time": "1:31:24", "throughput": 4471.21, "total_tokens": 468256} {"current_steps": 720, "total_steps": 38160, "loss": 0.5133, "lr": 0.00018841719077568135, "epoch": 0.37735849056603776, "percentage": 1.89, "elapsed_time": "0:01:45", "remaining_time": "1:31:20", "throughput": 4469.71, "total_tokens": 471104} {"current_steps": 725, "total_steps": 38160, "loss": 0.6115, "lr": 0.000189727463312369, "epoch": 0.379979035639413, "percentage": 1.9, "elapsed_time": "0:01:46", "remaining_time": "1:31:15", "throughput": 4466.88, "total_tokens": 473696} {"current_steps": 730, "total_steps": 38160, "loss": 0.5122, "lr": 0.00019103773584905662, "epoch": 0.38259958071278827, "percentage": 1.91, "elapsed_time": "0:01:46", "remaining_time": "1:31:11", "throughput": 4465.2, "total_tokens": 476512} {"current_steps": 735, "total_steps": 38160, "loss": 0.5904, "lr": 0.00019234800838574423, "epoch": 0.38522012578616355, "percentage": 1.93, "elapsed_time": "0:01:47", "remaining_time": "1:31:12", "throughput": 4466.92, "total_tokens": 480128} {"current_steps": 740, "total_steps": 38160, "loss": 0.6301, "lr": 0.00019365828092243186, "epoch": 0.38784067085953877, "percentage": 1.94, "elapsed_time": "0:01:48", "remaining_time": "1:31:14", "throughput": 4468.92, "total_tokens": 483808} {"current_steps": 745, "total_steps": 38160, "loss": 0.5939, "lr": 0.00019496855345911953, "epoch": 0.39046121593291405, "percentage": 1.95, "elapsed_time": "0:01:48", "remaining_time": "1:31:08", "throughput": 4465.7, "total_tokens": 486240} {"current_steps": 750, "total_steps": 38160, "loss": 0.4792, "lr": 0.00019627882599580713, "epoch": 0.39308176100628933, "percentage": 1.97, "elapsed_time": "0:01:49", "remaining_time": "1:31:00", "throughput": 4461.74, "total_tokens": 488448} {"current_steps": 755, "total_steps": 38160, "loss": 0.5778, "lr": 0.00019758909853249477, "epoch": 0.39570230607966456, "percentage": 1.98, "elapsed_time": "0:01:50", "remaining_time": "1:30:57", "throughput": 4460.65, "total_tokens": 491392} {"current_steps": 760, "total_steps": 38160, "loss": 0.5299, "lr": 0.0001988993710691824, "epoch": 0.39832285115303984, "percentage": 1.99, "elapsed_time": "0:01:50", "remaining_time": "1:31:00", "throughput": 4463.19, "total_tokens": 495232} {"current_steps": 765, "total_steps": 38160, "loss": 0.4787, "lr": 0.00020020964360587, "epoch": 0.4009433962264151, "percentage": 2.0, "elapsed_time": "0:01:51", "remaining_time": "1:30:56", "throughput": 4461.82, "total_tokens": 498016} {"current_steps": 770, "total_steps": 38160, "loss": 0.5109, "lr": 0.00020151991614255767, "epoch": 0.40356394129979034, "percentage": 2.02, "elapsed_time": "0:01:52", "remaining_time": "1:30:54", "throughput": 4461.63, "total_tokens": 501152} {"current_steps": 775, "total_steps": 38160, "loss": 0.496, "lr": 0.0002028301886792453, "epoch": 0.4061844863731656, "percentage": 2.03, "elapsed_time": "0:01:52", "remaining_time": "1:30:50", "throughput": 4459.66, "total_tokens": 503872} {"current_steps": 780, "total_steps": 38160, "loss": 0.5207, "lr": 0.0002041404612159329, "epoch": 0.4088050314465409, "percentage": 2.04, "elapsed_time": "0:01:53", "remaining_time": "1:30:50", "throughput": 4460.84, "total_tokens": 507328} {"current_steps": 785, "total_steps": 38160, "loss": 0.4149, "lr": 0.00020545073375262055, "epoch": 0.4114255765199161, "percentage": 2.06, "elapsed_time": "0:01:54", "remaining_time": "1:30:51", "throughput": 4462.02, "total_tokens": 510912} {"current_steps": 790, "total_steps": 38160, "loss": 0.5954, "lr": 0.00020676100628930818, "epoch": 0.4140461215932914, "percentage": 2.07, "elapsed_time": "0:01:55", "remaining_time": "1:30:51", "throughput": 4462.65, "total_tokens": 514304} {"current_steps": 795, "total_steps": 38160, "loss": 0.4442, "lr": 0.00020807127882599581, "epoch": 0.4166666666666667, "percentage": 2.08, "elapsed_time": "0:01:55", "remaining_time": "1:30:49", "throughput": 4462.44, "total_tokens": 517440} {"current_steps": 800, "total_steps": 38160, "loss": 0.6763, "lr": 0.00020938155136268345, "epoch": 0.4192872117400419, "percentage": 2.1, "elapsed_time": "0:01:56", "remaining_time": "1:30:47", "throughput": 4461.66, "total_tokens": 520416} {"current_steps": 805, "total_steps": 38160, "loss": 0.6537, "lr": 0.00021069182389937108, "epoch": 0.4219077568134172, "percentage": 2.11, "elapsed_time": "0:01:57", "remaining_time": "1:30:44", "throughput": 4461.23, "total_tokens": 523456} {"current_steps": 810, "total_steps": 38160, "loss": 0.5032, "lr": 0.0002120020964360587, "epoch": 0.42452830188679247, "percentage": 2.12, "elapsed_time": "0:01:58", "remaining_time": "1:30:43", "throughput": 4461.74, "total_tokens": 526720} {"current_steps": 815, "total_steps": 38160, "loss": 0.4356, "lr": 0.00021331236897274632, "epoch": 0.4271488469601677, "percentage": 2.14, "elapsed_time": "0:01:58", "remaining_time": "1:30:44", "throughput": 4463.29, "total_tokens": 530272} {"current_steps": 820, "total_steps": 38160, "loss": 0.6282, "lr": 0.00021462264150943399, "epoch": 0.429769392033543, "percentage": 2.15, "elapsed_time": "0:01:59", "remaining_time": "1:30:42", "throughput": 4463.14, "total_tokens": 533408} {"current_steps": 825, "total_steps": 38160, "loss": 0.6366, "lr": 0.0002159329140461216, "epoch": 0.43238993710691825, "percentage": 2.16, "elapsed_time": "0:02:00", "remaining_time": "1:30:42", "throughput": 4463.43, "total_tokens": 536768} {"current_steps": 830, "total_steps": 38160, "loss": 0.6108, "lr": 0.00021724318658280923, "epoch": 0.4350104821802935, "percentage": 2.18, "elapsed_time": "0:02:01", "remaining_time": "1:30:47", "throughput": 4467.78, "total_tokens": 541184} {"current_steps": 835, "total_steps": 38160, "loss": 0.4637, "lr": 0.00021855345911949686, "epoch": 0.43763102725366876, "percentage": 2.19, "elapsed_time": "0:02:01", "remaining_time": "1:30:48", "throughput": 4468.06, "total_tokens": 544576} {"current_steps": 840, "total_steps": 38160, "loss": 0.5865, "lr": 0.00021986373165618447, "epoch": 0.44025157232704404, "percentage": 2.2, "elapsed_time": "0:02:02", "remaining_time": "1:30:56", "throughput": 4473.09, "total_tokens": 549408} {"current_steps": 845, "total_steps": 38160, "loss": 0.468, "lr": 0.00022117400419287213, "epoch": 0.44287211740041926, "percentage": 2.21, "elapsed_time": "0:02:03", "remaining_time": "1:30:51", "throughput": 4471.4, "total_tokens": 552032} {"current_steps": 850, "total_steps": 38160, "loss": 0.5104, "lr": 0.00022248427672955977, "epoch": 0.44549266247379454, "percentage": 2.23, "elapsed_time": "0:02:04", "remaining_time": "1:30:53", "throughput": 4473.88, "total_tokens": 555872} {"current_steps": 855, "total_steps": 38160, "loss": 0.6376, "lr": 0.00022379454926624737, "epoch": 0.4481132075471698, "percentage": 2.24, "elapsed_time": "0:02:04", "remaining_time": "1:30:52", "throughput": 4474.18, "total_tokens": 559136} {"current_steps": 860, "total_steps": 38160, "loss": 0.5296, "lr": 0.000225104821802935, "epoch": 0.45073375262054505, "percentage": 2.25, "elapsed_time": "0:02:05", "remaining_time": "1:30:49", "throughput": 4472.88, "total_tokens": 561984} {"current_steps": 865, "total_steps": 38160, "loss": 0.4832, "lr": 0.00022641509433962264, "epoch": 0.4533542976939203, "percentage": 2.27, "elapsed_time": "0:02:06", "remaining_time": "1:30:44", "throughput": 4470.03, "total_tokens": 564448} {"current_steps": 870, "total_steps": 38160, "loss": 0.5687, "lr": 0.00022772536687631028, "epoch": 0.4559748427672956, "percentage": 2.28, "elapsed_time": "0:02:06", "remaining_time": "1:30:38", "throughput": 4466.79, "total_tokens": 566752} {"current_steps": 875, "total_steps": 38160, "loss": 0.5288, "lr": 0.0002290356394129979, "epoch": 0.4585953878406709, "percentage": 2.29, "elapsed_time": "0:02:07", "remaining_time": "1:30:36", "throughput": 4466.63, "total_tokens": 569856} {"current_steps": 880, "total_steps": 38160, "loss": 0.5104, "lr": 0.00023034591194968554, "epoch": 0.4612159329140461, "percentage": 2.31, "elapsed_time": "0:02:08", "remaining_time": "1:30:35", "throughput": 4466.67, "total_tokens": 573056} {"current_steps": 885, "total_steps": 38160, "loss": 0.5814, "lr": 0.00023165618448637318, "epoch": 0.4638364779874214, "percentage": 2.32, "elapsed_time": "0:02:08", "remaining_time": "1:30:30", "throughput": 4465.02, "total_tokens": 575712} {"current_steps": 890, "total_steps": 38160, "loss": 0.4417, "lr": 0.00023296645702306079, "epoch": 0.46645702306079667, "percentage": 2.33, "elapsed_time": "0:02:09", "remaining_time": "1:30:29", "throughput": 4465.16, "total_tokens": 578880} {"current_steps": 895, "total_steps": 38160, "loss": 0.4844, "lr": 0.00023427672955974845, "epoch": 0.4690775681341719, "percentage": 2.35, "elapsed_time": "0:02:10", "remaining_time": "1:30:27", "throughput": 4464.31, "total_tokens": 581920} {"current_steps": 900, "total_steps": 38160, "loss": 0.5446, "lr": 0.00023558700209643608, "epoch": 0.4716981132075472, "percentage": 2.36, "elapsed_time": "0:02:11", "remaining_time": "1:30:23", "throughput": 4462.95, "total_tokens": 584672} {"current_steps": 905, "total_steps": 38160, "loss": 0.4763, "lr": 0.0002368972746331237, "epoch": 0.47431865828092246, "percentage": 2.37, "elapsed_time": "0:02:11", "remaining_time": "1:30:26", "throughput": 4465.65, "total_tokens": 588704} {"current_steps": 910, "total_steps": 38160, "loss": 0.5383, "lr": 0.00023820754716981132, "epoch": 0.4769392033542977, "percentage": 2.38, "elapsed_time": "0:02:12", "remaining_time": "1:30:24", "throughput": 4465.08, "total_tokens": 591712} {"current_steps": 915, "total_steps": 38160, "loss": 0.5598, "lr": 0.00023951781970649896, "epoch": 0.47955974842767296, "percentage": 2.4, "elapsed_time": "0:02:13", "remaining_time": "1:30:23", "throughput": 4466.19, "total_tokens": 595104} {"current_steps": 920, "total_steps": 38160, "loss": 0.494, "lr": 0.0002408280922431866, "epoch": 0.48218029350104824, "percentage": 2.41, "elapsed_time": "0:02:14", "remaining_time": "1:30:30", "throughput": 4470.86, "total_tokens": 599808} {"current_steps": 925, "total_steps": 38160, "loss": 0.4524, "lr": 0.00024213836477987423, "epoch": 0.48480083857442346, "percentage": 2.42, "elapsed_time": "0:02:14", "remaining_time": "1:30:27", "throughput": 4470.1, "total_tokens": 602720} {"current_steps": 930, "total_steps": 38160, "loss": 0.4922, "lr": 0.00024344863731656186, "epoch": 0.48742138364779874, "percentage": 2.44, "elapsed_time": "0:02:15", "remaining_time": "1:30:27", "throughput": 4470.91, "total_tokens": 606176} {"current_steps": 935, "total_steps": 38160, "loss": 0.4674, "lr": 0.00024475890985324947, "epoch": 0.490041928721174, "percentage": 2.45, "elapsed_time": "0:02:16", "remaining_time": "1:30:23", "throughput": 4469.18, "total_tokens": 608864} {"current_steps": 940, "total_steps": 38160, "loss": 0.5117, "lr": 0.0002460691823899371, "epoch": 0.49266247379454925, "percentage": 2.46, "elapsed_time": "0:02:16", "remaining_time": "1:30:22", "throughput": 4468.79, "total_tokens": 611968} {"current_steps": 945, "total_steps": 38160, "loss": 0.6172, "lr": 0.00024737945492662474, "epoch": 0.49528301886792453, "percentage": 2.48, "elapsed_time": "0:02:17", "remaining_time": "1:30:19", "throughput": 4468.12, "total_tokens": 614848} {"current_steps": 950, "total_steps": 38160, "loss": 0.665, "lr": 0.00024868972746331237, "epoch": 0.4979035639412998, "percentage": 2.49, "elapsed_time": "0:02:18", "remaining_time": "1:30:18", "throughput": 4468.02, "total_tokens": 618080} {"current_steps": 955, "total_steps": 38160, "loss": 0.3781, "lr": 0.00025, "epoch": 0.500524109014675, "percentage": 2.5, "elapsed_time": "0:02:18", "remaining_time": "1:30:14", "throughput": 4465.99, "total_tokens": 620736} {"current_steps": 960, "total_steps": 38160, "loss": 0.4699, "lr": 0.00025131027253668764, "epoch": 0.5031446540880503, "percentage": 2.52, "elapsed_time": "0:02:19", "remaining_time": "1:30:16", "throughput": 4467.9, "total_tokens": 624480} {"current_steps": 965, "total_steps": 38160, "loss": 0.4593, "lr": 0.0002526205450733753, "epoch": 0.5057651991614256, "percentage": 2.53, "elapsed_time": "0:02:20", "remaining_time": "1:30:18", "throughput": 4470.45, "total_tokens": 628448} {"current_steps": 970, "total_steps": 38160, "loss": 0.6066, "lr": 0.0002539308176100629, "epoch": 0.5083857442348009, "percentage": 2.54, "elapsed_time": "0:02:21", "remaining_time": "1:30:18", "throughput": 4471.55, "total_tokens": 632000} {"current_steps": 975, "total_steps": 38160, "loss": 0.6094, "lr": 0.0002552410901467505, "epoch": 0.5110062893081762, "percentage": 2.56, "elapsed_time": "0:02:22", "remaining_time": "1:30:20", "throughput": 4472.73, "total_tokens": 635680} {"current_steps": 980, "total_steps": 38160, "loss": 0.7542, "lr": 0.0002565513626834381, "epoch": 0.5136268343815513, "percentage": 2.57, "elapsed_time": "0:02:22", "remaining_time": "1:30:16", "throughput": 4471.82, "total_tokens": 638496} {"current_steps": 985, "total_steps": 38160, "loss": 0.4697, "lr": 0.0002578616352201258, "epoch": 0.5162473794549266, "percentage": 2.58, "elapsed_time": "0:02:23", "remaining_time": "1:30:18", "throughput": 4473.41, "total_tokens": 642272} {"current_steps": 990, "total_steps": 38160, "loss": 0.5283, "lr": 0.00025917190775681345, "epoch": 0.5188679245283019, "percentage": 2.59, "elapsed_time": "0:02:24", "remaining_time": "1:30:19", "throughput": 4474.5, "total_tokens": 645888} {"current_steps": 995, "total_steps": 38160, "loss": 0.3726, "lr": 0.0002604821802935011, "epoch": 0.5214884696016772, "percentage": 2.61, "elapsed_time": "0:02:25", "remaining_time": "1:30:33", "throughput": 4481.07, "total_tokens": 651808} {"current_steps": 1000, "total_steps": 38160, "loss": 0.5356, "lr": 0.0002617924528301887, "epoch": 0.5241090146750524, "percentage": 2.62, "elapsed_time": "0:02:26", "remaining_time": "1:30:34", "throughput": 4482.18, "total_tokens": 655488} {"current_steps": 1005, "total_steps": 38160, "loss": 0.4621, "lr": 0.0002631027253668763, "epoch": 0.5267295597484277, "percentage": 2.63, "elapsed_time": "0:02:26", "remaining_time": "1:30:34", "throughput": 4482.92, "total_tokens": 658976} {"current_steps": 1010, "total_steps": 38160, "loss": 0.4489, "lr": 0.00026441299790356393, "epoch": 0.5293501048218029, "percentage": 2.65, "elapsed_time": "0:02:27", "remaining_time": "1:30:32", "throughput": 4482.63, "total_tokens": 662048} {"current_steps": 1015, "total_steps": 38160, "loss": 0.5845, "lr": 0.00026572327044025156, "epoch": 0.5319706498951782, "percentage": 2.66, "elapsed_time": "0:02:28", "remaining_time": "1:30:28", "throughput": 4480.97, "total_tokens": 664640} {"current_steps": 1020, "total_steps": 38160, "loss": 0.489, "lr": 0.0002670335429769392, "epoch": 0.5345911949685535, "percentage": 2.67, "elapsed_time": "0:02:29", "remaining_time": "1:30:32", "throughput": 4484.34, "total_tokens": 669056} {"current_steps": 1025, "total_steps": 38160, "loss": 0.5195, "lr": 0.00026834381551362683, "epoch": 0.5372117400419287, "percentage": 2.69, "elapsed_time": "0:02:29", "remaining_time": "1:30:30", "throughput": 4483.78, "total_tokens": 672128} {"current_steps": 1030, "total_steps": 38160, "loss": 0.4863, "lr": 0.0002696540880503145, "epoch": 0.539832285115304, "percentage": 2.7, "elapsed_time": "0:02:30", "remaining_time": "1:30:28", "throughput": 4483.18, "total_tokens": 675136} {"current_steps": 1035, "total_steps": 38160, "loss": 0.6039, "lr": 0.0002709643605870021, "epoch": 0.5424528301886793, "percentage": 2.71, "elapsed_time": "0:02:31", "remaining_time": "1:30:30", "throughput": 4485.1, "total_tokens": 678976} {"current_steps": 1040, "total_steps": 38160, "loss": 0.6647, "lr": 0.00027227463312368973, "epoch": 0.5450733752620545, "percentage": 2.73, "elapsed_time": "0:02:32", "remaining_time": "1:30:28", "throughput": 4485.1, "total_tokens": 682176} {"current_steps": 1045, "total_steps": 38160, "loss": 0.5717, "lr": 0.00027358490566037737, "epoch": 0.5476939203354297, "percentage": 2.74, "elapsed_time": "0:02:32", "remaining_time": "1:30:24", "throughput": 4483.44, "total_tokens": 684768} {"current_steps": 1050, "total_steps": 38160, "loss": 0.5619, "lr": 0.000274895178197065, "epoch": 0.550314465408805, "percentage": 2.75, "elapsed_time": "0:02:33", "remaining_time": "1:30:21", "throughput": 4481.49, "total_tokens": 687392} {"current_steps": 1055, "total_steps": 38160, "loss": 0.4905, "lr": 0.00027620545073375264, "epoch": 0.5529350104821803, "percentage": 2.76, "elapsed_time": "0:02:34", "remaining_time": "1:30:19", "throughput": 4481.31, "total_tokens": 690496} {"current_steps": 1060, "total_steps": 38160, "loss": 0.6701, "lr": 0.00027751572327044027, "epoch": 0.5555555555555556, "percentage": 2.78, "elapsed_time": "0:02:34", "remaining_time": "1:30:16", "throughput": 4480.38, "total_tokens": 693376} {"current_steps": 1065, "total_steps": 38160, "loss": 0.4841, "lr": 0.00027882599580712785, "epoch": 0.5581761006289309, "percentage": 2.79, "elapsed_time": "0:02:35", "remaining_time": "1:30:12", "throughput": 4478.11, "total_tokens": 695808} {"current_steps": 1070, "total_steps": 38160, "loss": 0.491, "lr": 0.0002801362683438155, "epoch": 0.560796645702306, "percentage": 2.8, "elapsed_time": "0:02:36", "remaining_time": "1:30:12", "throughput": 4479.54, "total_tokens": 699424} {"current_steps": 1075, "total_steps": 38160, "loss": 0.5349, "lr": 0.0002814465408805031, "epoch": 0.5634171907756813, "percentage": 2.82, "elapsed_time": "0:02:36", "remaining_time": "1:30:14", "throughput": 4482.58, "total_tokens": 703584} {"current_steps": 1080, "total_steps": 38160, "loss": 0.5218, "lr": 0.0002827568134171908, "epoch": 0.5660377358490566, "percentage": 2.83, "elapsed_time": "0:02:37", "remaining_time": "1:30:10", "throughput": 4480.87, "total_tokens": 706144} {"current_steps": 1085, "total_steps": 38160, "loss": 0.5281, "lr": 0.00028406708595387844, "epoch": 0.5686582809224319, "percentage": 2.84, "elapsed_time": "0:02:38", "remaining_time": "1:30:07", "throughput": 4479.65, "total_tokens": 708864} {"current_steps": 1090, "total_steps": 38160, "loss": 0.5503, "lr": 0.0002853773584905661, "epoch": 0.5712788259958071, "percentage": 2.86, "elapsed_time": "0:02:38", "remaining_time": "1:30:07", "throughput": 4480.43, "total_tokens": 712352} {"current_steps": 1095, "total_steps": 38160, "loss": 0.7352, "lr": 0.00028668763102725366, "epoch": 0.5738993710691824, "percentage": 2.87, "elapsed_time": "0:02:39", "remaining_time": "1:30:04", "throughput": 4479.64, "total_tokens": 715296} {"current_steps": 1100, "total_steps": 38160, "loss": 0.4537, "lr": 0.0002879979035639413, "epoch": 0.5765199161425576, "percentage": 2.88, "elapsed_time": "0:02:40", "remaining_time": "1:30:03", "throughput": 4479.9, "total_tokens": 718528} {"current_steps": 1105, "total_steps": 38160, "loss": 0.4627, "lr": 0.00028930817610062893, "epoch": 0.5791404612159329, "percentage": 2.9, "elapsed_time": "0:02:42", "remaining_time": "1:30:43", "throughput": 4452.51, "total_tokens": 722752} {"current_steps": 1110, "total_steps": 38160, "loss": 0.4673, "lr": 0.00029061844863731656, "epoch": 0.5817610062893082, "percentage": 2.91, "elapsed_time": "0:02:43", "remaining_time": "1:30:42", "throughput": 4451.78, "total_tokens": 725824} {"current_steps": 1115, "total_steps": 38160, "loss": 0.5829, "lr": 0.0002919287211740042, "epoch": 0.5843815513626834, "percentage": 2.92, "elapsed_time": "0:02:43", "remaining_time": "1:30:44", "throughput": 4454.85, "total_tokens": 730080} {"current_steps": 1120, "total_steps": 38160, "loss": 0.5032, "lr": 0.00029323899371069183, "epoch": 0.5870020964360587, "percentage": 2.94, "elapsed_time": "0:02:44", "remaining_time": "1:30:43", "throughput": 4454.7, "total_tokens": 733216} {"current_steps": 1125, "total_steps": 38160, "loss": 0.6646, "lr": 0.00029454926624737946, "epoch": 0.589622641509434, "percentage": 2.95, "elapsed_time": "0:02:45", "remaining_time": "1:30:41", "throughput": 4454.78, "total_tokens": 736416} {"current_steps": 1130, "total_steps": 38160, "loss": 0.4559, "lr": 0.0002958595387840671, "epoch": 0.5922431865828093, "percentage": 2.96, "elapsed_time": "0:02:46", "remaining_time": "1:30:41", "throughput": 4455.13, "total_tokens": 739808} {"current_steps": 1135, "total_steps": 38160, "loss": 0.5518, "lr": 0.00029716981132075473, "epoch": 0.5948637316561844, "percentage": 2.97, "elapsed_time": "0:02:46", "remaining_time": "1:30:37", "throughput": 4453.64, "total_tokens": 742400} {"current_steps": 1140, "total_steps": 38160, "loss": 0.4005, "lr": 0.00029848008385744237, "epoch": 0.5974842767295597, "percentage": 2.99, "elapsed_time": "0:02:47", "remaining_time": "1:30:37", "throughput": 4454.14, "total_tokens": 745760} {"current_steps": 1145, "total_steps": 38160, "loss": 0.5925, "lr": 0.00029979035639413, "epoch": 0.600104821802935, "percentage": 3.0, "elapsed_time": "0:02:48", "remaining_time": "1:30:34", "throughput": 4453.74, "total_tokens": 748736} {"current_steps": 1150, "total_steps": 38160, "loss": 0.5357, "lr": 0.00030110062893081764, "epoch": 0.6027253668763103, "percentage": 3.01, "elapsed_time": "0:02:48", "remaining_time": "1:30:33", "throughput": 4454.07, "total_tokens": 752032} {"current_steps": 1155, "total_steps": 38160, "loss": 0.491, "lr": 0.00030241090146750527, "epoch": 0.6053459119496856, "percentage": 3.03, "elapsed_time": "0:02:49", "remaining_time": "1:30:38", "throughput": 4457.88, "total_tokens": 756736} {"current_steps": 1160, "total_steps": 38160, "loss": 0.4877, "lr": 0.00030372117400419285, "epoch": 0.6079664570230608, "percentage": 3.04, "elapsed_time": "0:02:50", "remaining_time": "1:30:36", "throughput": 4457.18, "total_tokens": 759680} {"current_steps": 1165, "total_steps": 38160, "loss": 0.5316, "lr": 0.0003050314465408805, "epoch": 0.610587002096436, "percentage": 3.05, "elapsed_time": "0:02:51", "remaining_time": "1:30:33", "throughput": 4456.38, "total_tokens": 762560} {"current_steps": 1170, "total_steps": 38160, "loss": 0.4494, "lr": 0.0003063417190775681, "epoch": 0.6132075471698113, "percentage": 3.07, "elapsed_time": "0:02:51", "remaining_time": "1:30:31", "throughput": 4456.07, "total_tokens": 765600} {"current_steps": 1175, "total_steps": 38160, "loss": 0.4, "lr": 0.00030765199161425575, "epoch": 0.6158280922431866, "percentage": 3.08, "elapsed_time": "0:02:52", "remaining_time": "1:30:30", "throughput": 4456.09, "total_tokens": 768736} {"current_steps": 1180, "total_steps": 38160, "loss": 0.6684, "lr": 0.00030896226415094344, "epoch": 0.6184486373165619, "percentage": 3.09, "elapsed_time": "0:02:53", "remaining_time": "1:30:28", "throughput": 4455.83, "total_tokens": 771872} {"current_steps": 1185, "total_steps": 38160, "loss": 0.619, "lr": 0.0003102725366876311, "epoch": 0.6210691823899371, "percentage": 3.11, "elapsed_time": "0:02:53", "remaining_time": "1:30:27", "throughput": 4455.58, "total_tokens": 775008} {"current_steps": 1190, "total_steps": 38160, "loss": 0.4269, "lr": 0.00031158280922431866, "epoch": 0.6236897274633124, "percentage": 3.12, "elapsed_time": "0:02:54", "remaining_time": "1:30:25", "throughput": 4454.89, "total_tokens": 777920} {"current_steps": 1195, "total_steps": 38160, "loss": 0.5171, "lr": 0.0003128930817610063, "epoch": 0.6263102725366876, "percentage": 3.13, "elapsed_time": "0:02:55", "remaining_time": "1:30:23", "throughput": 4455.15, "total_tokens": 781056} {"current_steps": 1200, "total_steps": 38160, "loss": 0.5798, "lr": 0.0003142033542976939, "epoch": 0.6289308176100629, "percentage": 3.14, "elapsed_time": "0:02:56", "remaining_time": "1:30:21", "throughput": 4455.03, "total_tokens": 784128} {"current_steps": 1205, "total_steps": 38160, "loss": 0.5388, "lr": 0.00031551362683438156, "epoch": 0.6315513626834381, "percentage": 3.16, "elapsed_time": "0:02:56", "remaining_time": "1:30:17", "throughput": 4453.28, "total_tokens": 786624} {"current_steps": 1210, "total_steps": 38160, "loss": 0.5321, "lr": 0.0003168238993710692, "epoch": 0.6341719077568134, "percentage": 3.17, "elapsed_time": "0:02:57", "remaining_time": "1:30:15", "throughput": 4452.83, "total_tokens": 789664} {"current_steps": 1215, "total_steps": 38160, "loss": 0.4326, "lr": 0.00031813417190775683, "epoch": 0.6367924528301887, "percentage": 3.18, "elapsed_time": "0:02:58", "remaining_time": "1:30:18", "throughput": 4455.05, "total_tokens": 793824} {"current_steps": 1220, "total_steps": 38160, "loss": 0.6322, "lr": 0.0003194444444444444, "epoch": 0.639412997903564, "percentage": 3.2, "elapsed_time": "0:02:58", "remaining_time": "1:30:15", "throughput": 4453.98, "total_tokens": 796544} {"current_steps": 1225, "total_steps": 38160, "loss": 0.4127, "lr": 0.00032075471698113204, "epoch": 0.6420335429769392, "percentage": 3.21, "elapsed_time": "0:02:59", "remaining_time": "1:30:12", "throughput": 4453.66, "total_tokens": 799520} {"current_steps": 1230, "total_steps": 38160, "loss": 0.3456, "lr": 0.00032206498951781973, "epoch": 0.6446540880503144, "percentage": 3.22, "elapsed_time": "0:03:00", "remaining_time": "1:30:10", "throughput": 4452.98, "total_tokens": 802464} {"current_steps": 1235, "total_steps": 38160, "loss": 0.5828, "lr": 0.00032337526205450737, "epoch": 0.6472746331236897, "percentage": 3.24, "elapsed_time": "0:03:00", "remaining_time": "1:30:08", "throughput": 4452.71, "total_tokens": 805536} {"current_steps": 1240, "total_steps": 38160, "loss": 0.3669, "lr": 0.000324685534591195, "epoch": 0.649895178197065, "percentage": 3.25, "elapsed_time": "0:03:01", "remaining_time": "1:30:06", "throughput": 4452.15, "total_tokens": 808448} {"current_steps": 1245, "total_steps": 38160, "loss": 0.4455, "lr": 0.00032599580712788263, "epoch": 0.6525157232704403, "percentage": 3.26, "elapsed_time": "0:03:02", "remaining_time": "1:30:07", "throughput": 4453.45, "total_tokens": 812160} {"current_steps": 1250, "total_steps": 38160, "loss": 0.637, "lr": 0.0003273060796645702, "epoch": 0.6551362683438156, "percentage": 3.28, "elapsed_time": "0:03:03", "remaining_time": "1:30:03", "throughput": 4452.16, "total_tokens": 814752} {"current_steps": 1255, "total_steps": 38160, "loss": 0.4277, "lr": 0.00032861635220125785, "epoch": 0.6577568134171907, "percentage": 3.29, "elapsed_time": "0:03:03", "remaining_time": "1:30:01", "throughput": 4451.26, "total_tokens": 817568} {"current_steps": 1260, "total_steps": 38160, "loss": 0.5027, "lr": 0.0003299266247379455, "epoch": 0.660377358490566, "percentage": 3.3, "elapsed_time": "0:03:04", "remaining_time": "1:29:58", "throughput": 4450.57, "total_tokens": 820384} {"current_steps": 1265, "total_steps": 38160, "loss": 0.3046, "lr": 0.0003312368972746331, "epoch": 0.6629979035639413, "percentage": 3.31, "elapsed_time": "0:03:04", "remaining_time": "1:29:55", "throughput": 4449.32, "total_tokens": 823040} {"current_steps": 1270, "total_steps": 38160, "loss": 0.5936, "lr": 0.00033254716981132075, "epoch": 0.6656184486373166, "percentage": 3.33, "elapsed_time": "0:03:05", "remaining_time": "1:29:51", "throughput": 4447.62, "total_tokens": 825600} {"current_steps": 1275, "total_steps": 38160, "loss": 0.5951, "lr": 0.0003338574423480084, "epoch": 0.6682389937106918, "percentage": 3.34, "elapsed_time": "0:03:06", "remaining_time": "1:29:48", "throughput": 4445.83, "total_tokens": 828032} {"current_steps": 1280, "total_steps": 38160, "loss": 0.4522, "lr": 0.0003351677148846961, "epoch": 0.6708595387840671, "percentage": 3.35, "elapsed_time": "0:03:06", "remaining_time": "1:29:47", "throughput": 4445.96, "total_tokens": 831296} {"current_steps": 1285, "total_steps": 38160, "loss": 0.6076, "lr": 0.00033647798742138366, "epoch": 0.6734800838574424, "percentage": 3.37, "elapsed_time": "0:03:07", "remaining_time": "1:29:45", "throughput": 4445.25, "total_tokens": 834208} {"current_steps": 1290, "total_steps": 38160, "loss": 0.4781, "lr": 0.0003377882599580713, "epoch": 0.6761006289308176, "percentage": 3.38, "elapsed_time": "0:03:08", "remaining_time": "1:29:46", "throughput": 4447.04, "total_tokens": 838048} {"current_steps": 1295, "total_steps": 38160, "loss": 0.5903, "lr": 0.0003390985324947589, "epoch": 0.6787211740041929, "percentage": 3.39, "elapsed_time": "0:03:09", "remaining_time": "1:29:45", "throughput": 4447.97, "total_tokens": 841536} {"current_steps": 1300, "total_steps": 38160, "loss": 0.4476, "lr": 0.00034040880503144656, "epoch": 0.6813417190775681, "percentage": 3.41, "elapsed_time": "0:03:09", "remaining_time": "1:29:46", "throughput": 4448.92, "total_tokens": 845184} {"current_steps": 1305, "total_steps": 38160, "loss": 0.442, "lr": 0.0003417190775681342, "epoch": 0.6839622641509434, "percentage": 3.42, "elapsed_time": "0:03:10", "remaining_time": "1:29:43", "throughput": 4448.21, "total_tokens": 848000} {"current_steps": 1310, "total_steps": 38160, "loss": 0.5777, "lr": 0.00034302935010482183, "epoch": 0.6865828092243187, "percentage": 3.43, "elapsed_time": "0:03:11", "remaining_time": "1:29:42", "throughput": 4447.86, "total_tokens": 851040} {"current_steps": 1315, "total_steps": 38160, "loss": 0.5948, "lr": 0.0003443396226415094, "epoch": 0.689203354297694, "percentage": 3.45, "elapsed_time": "0:03:12", "remaining_time": "1:29:39", "throughput": 4447.38, "total_tokens": 853920} {"current_steps": 1320, "total_steps": 38160, "loss": 0.513, "lr": 0.00034564989517819704, "epoch": 0.6918238993710691, "percentage": 3.46, "elapsed_time": "0:03:12", "remaining_time": "1:29:38", "throughput": 4448.2, "total_tokens": 857312} {"current_steps": 1325, "total_steps": 38160, "loss": 0.4137, "lr": 0.0003469601677148847, "epoch": 0.6944444444444444, "percentage": 3.47, "elapsed_time": "0:03:13", "remaining_time": "1:29:35", "throughput": 4446.87, "total_tokens": 859904} {"current_steps": 1330, "total_steps": 38160, "loss": 0.5575, "lr": 0.00034827044025157236, "epoch": 0.6970649895178197, "percentage": 3.49, "elapsed_time": "0:03:14", "remaining_time": "1:29:36", "throughput": 4448.57, "total_tokens": 863680} {"current_steps": 1335, "total_steps": 38160, "loss": 0.5729, "lr": 0.00034958071278826, "epoch": 0.699685534591195, "percentage": 3.5, "elapsed_time": "0:03:14", "remaining_time": "1:29:35", "throughput": 4448.67, "total_tokens": 866880} {"current_steps": 1340, "total_steps": 38160, "loss": 0.4186, "lr": 0.00035089098532494763, "epoch": 0.7023060796645703, "percentage": 3.51, "elapsed_time": "0:03:15", "remaining_time": "1:29:33", "throughput": 4448.24, "total_tokens": 869856} {"current_steps": 1345, "total_steps": 38160, "loss": 0.5439, "lr": 0.0003522012578616352, "epoch": 0.7049266247379455, "percentage": 3.52, "elapsed_time": "0:03:16", "remaining_time": "1:29:33", "throughput": 4449.2, "total_tokens": 873472} {"current_steps": 1350, "total_steps": 38160, "loss": 0.4465, "lr": 0.00035351153039832285, "epoch": 0.7075471698113207, "percentage": 3.54, "elapsed_time": "0:03:17", "remaining_time": "1:29:32", "throughput": 4449.41, "total_tokens": 876704} {"current_steps": 1355, "total_steps": 38160, "loss": 0.4769, "lr": 0.0003548218029350105, "epoch": 0.710167714884696, "percentage": 3.55, "elapsed_time": "0:03:17", "remaining_time": "1:29:33", "throughput": 4450.96, "total_tokens": 880576} {"current_steps": 1360, "total_steps": 38160, "loss": 0.4906, "lr": 0.0003561320754716981, "epoch": 0.7127882599580713, "percentage": 3.56, "elapsed_time": "0:03:18", "remaining_time": "1:29:32", "throughput": 4450.95, "total_tokens": 883680} {"current_steps": 1365, "total_steps": 38160, "loss": 0.5653, "lr": 0.00035744234800838575, "epoch": 0.7154088050314465, "percentage": 3.58, "elapsed_time": "0:03:19", "remaining_time": "1:29:29", "throughput": 4450.03, "total_tokens": 886464} {"current_steps": 1370, "total_steps": 38160, "loss": 0.5247, "lr": 0.0003587526205450734, "epoch": 0.7180293501048218, "percentage": 3.59, "elapsed_time": "0:03:19", "remaining_time": "1:29:28", "throughput": 4449.7, "total_tokens": 889536} {"current_steps": 1375, "total_steps": 38160, "loss": 0.507, "lr": 0.00036006289308176097, "epoch": 0.7206498951781971, "percentage": 3.6, "elapsed_time": "0:03:20", "remaining_time": "1:29:32", "throughput": 4452.79, "total_tokens": 894272} {"current_steps": 1380, "total_steps": 38160, "loss": 0.4721, "lr": 0.00036137316561844865, "epoch": 0.7232704402515723, "percentage": 3.62, "elapsed_time": "0:03:21", "remaining_time": "1:29:30", "throughput": 4452.09, "total_tokens": 897120} {"current_steps": 1385, "total_steps": 38160, "loss": 0.4942, "lr": 0.0003626834381551363, "epoch": 0.7258909853249476, "percentage": 3.63, "elapsed_time": "0:03:22", "remaining_time": "1:29:27", "throughput": 4451.18, "total_tokens": 899808} {"current_steps": 1390, "total_steps": 38160, "loss": 0.4896, "lr": 0.0003639937106918239, "epoch": 0.7285115303983228, "percentage": 3.64, "elapsed_time": "0:03:22", "remaining_time": "1:29:28", "throughput": 4452.43, "total_tokens": 903520} {"current_steps": 1395, "total_steps": 38160, "loss": 0.5451, "lr": 0.00036530398322851156, "epoch": 0.7311320754716981, "percentage": 3.66, "elapsed_time": "0:03:23", "remaining_time": "1:29:28", "throughput": 4453.51, "total_tokens": 907200} {"current_steps": 1400, "total_steps": 38160, "loss": 0.4845, "lr": 0.0003666142557651992, "epoch": 0.7337526205450734, "percentage": 3.67, "elapsed_time": "0:03:24", "remaining_time": "1:29:30", "throughput": 4455.68, "total_tokens": 911392} {"current_steps": 1405, "total_steps": 38160, "loss": 0.5145, "lr": 0.00036792452830188677, "epoch": 0.7363731656184487, "percentage": 3.68, "elapsed_time": "0:03:25", "remaining_time": "1:29:26", "throughput": 4453.09, "total_tokens": 913440} {"current_steps": 1410, "total_steps": 38160, "loss": 0.4958, "lr": 0.0003692348008385744, "epoch": 0.7389937106918238, "percentage": 3.69, "elapsed_time": "0:03:26", "remaining_time": "1:29:29", "throughput": 4455.5, "total_tokens": 917888} {"current_steps": 1415, "total_steps": 38160, "loss": 0.5504, "lr": 0.00037054507337526204, "epoch": 0.7416142557651991, "percentage": 3.71, "elapsed_time": "0:03:26", "remaining_time": "1:29:29", "throughput": 4456.12, "total_tokens": 921376} {"current_steps": 1420, "total_steps": 38160, "loss": 0.5504, "lr": 0.0003718553459119497, "epoch": 0.7442348008385744, "percentage": 3.72, "elapsed_time": "0:03:27", "remaining_time": "1:29:28", "throughput": 4456.66, "total_tokens": 924800} {"current_steps": 1425, "total_steps": 38160, "loss": 0.64, "lr": 0.0003731656184486373, "epoch": 0.7468553459119497, "percentage": 3.73, "elapsed_time": "0:03:28", "remaining_time": "1:29:26", "throughput": 4455.72, "total_tokens": 927648} {"current_steps": 1430, "total_steps": 38160, "loss": 0.4149, "lr": 0.000374475890985325, "epoch": 0.749475890985325, "percentage": 3.75, "elapsed_time": "0:03:28", "remaining_time": "1:29:23", "throughput": 4454.31, "total_tokens": 930144} {"current_steps": 1435, "total_steps": 38160, "loss": 0.413, "lr": 0.00037578616352201263, "epoch": 0.7520964360587002, "percentage": 3.76, "elapsed_time": "0:03:29", "remaining_time": "1:29:22", "throughput": 4453.92, "total_tokens": 933184} {"current_steps": 1440, "total_steps": 38160, "loss": 0.5526, "lr": 0.0003770964360587002, "epoch": 0.7547169811320755, "percentage": 3.77, "elapsed_time": "0:03:30", "remaining_time": "1:29:24", "throughput": 4455.84, "total_tokens": 937376} {"current_steps": 1445, "total_steps": 38160, "loss": 0.4662, "lr": 0.00037840670859538785, "epoch": 0.7573375262054507, "percentage": 3.79, "elapsed_time": "0:03:31", "remaining_time": "1:29:22", "throughput": 4454.83, "total_tokens": 940160} {"current_steps": 1450, "total_steps": 38160, "loss": 0.5484, "lr": 0.0003797169811320755, "epoch": 0.759958071278826, "percentage": 3.8, "elapsed_time": "0:03:31", "remaining_time": "1:29:19", "throughput": 4453.68, "total_tokens": 942816} {"current_steps": 1455, "total_steps": 38160, "loss": 0.5784, "lr": 0.0003810272536687631, "epoch": 0.7625786163522013, "percentage": 3.81, "elapsed_time": "0:03:32", "remaining_time": "1:29:18", "throughput": 4453.63, "total_tokens": 945952} {"current_steps": 1460, "total_steps": 38160, "loss": 0.3904, "lr": 0.00038233752620545075, "epoch": 0.7651991614255765, "percentage": 3.83, "elapsed_time": "0:03:33", "remaining_time": "1:29:18", "throughput": 4454.24, "total_tokens": 949472} {"current_steps": 1465, "total_steps": 38160, "loss": 0.5353, "lr": 0.0003836477987421384, "epoch": 0.7678197064989518, "percentage": 3.84, "elapsed_time": "0:03:33", "remaining_time": "1:29:17", "throughput": 4454.27, "total_tokens": 952672} {"current_steps": 1470, "total_steps": 38160, "loss": 0.5603, "lr": 0.00038495807127882596, "epoch": 0.7704402515723271, "percentage": 3.85, "elapsed_time": "0:03:34", "remaining_time": "1:29:14", "throughput": 4453.67, "total_tokens": 955520} {"current_steps": 1475, "total_steps": 38160, "loss": 0.5678, "lr": 0.0003862683438155136, "epoch": 0.7730607966457023, "percentage": 3.87, "elapsed_time": "0:03:35", "remaining_time": "1:29:13", "throughput": 4453.2, "total_tokens": 958464} {"current_steps": 1480, "total_steps": 38160, "loss": 0.4988, "lr": 0.0003875786163522013, "epoch": 0.7756813417190775, "percentage": 3.88, "elapsed_time": "0:03:35", "remaining_time": "1:29:09", "throughput": 4451.38, "total_tokens": 960768} {"current_steps": 1485, "total_steps": 38160, "loss": 0.6904, "lr": 0.0003888888888888889, "epoch": 0.7783018867924528, "percentage": 3.89, "elapsed_time": "0:03:36", "remaining_time": "1:29:06", "throughput": 4450.86, "total_tokens": 963616} {"current_steps": 1490, "total_steps": 38160, "loss": 0.7019, "lr": 0.00039019916142557656, "epoch": 0.7809224318658281, "percentage": 3.9, "elapsed_time": "0:03:37", "remaining_time": "1:29:09", "throughput": 4453.32, "total_tokens": 967936} {"current_steps": 1495, "total_steps": 38160, "loss": 0.481, "lr": 0.0003915094339622642, "epoch": 0.7835429769392034, "percentage": 3.92, "elapsed_time": "0:03:38", "remaining_time": "1:29:10", "throughput": 4454.56, "total_tokens": 971744} {"current_steps": 1500, "total_steps": 38160, "loss": 0.5369, "lr": 0.00039281970649895177, "epoch": 0.7861635220125787, "percentage": 3.93, "elapsed_time": "0:03:38", "remaining_time": "1:29:06", "throughput": 4452.85, "total_tokens": 974080} {"current_steps": 1505, "total_steps": 38160, "loss": 0.4812, "lr": 0.0003941299790356394, "epoch": 0.7887840670859538, "percentage": 3.94, "elapsed_time": "0:03:39", "remaining_time": "1:29:04", "throughput": 4452.33, "total_tokens": 976992} {"current_steps": 1510, "total_steps": 38160, "loss": 0.5068, "lr": 0.00039544025157232704, "epoch": 0.7914046121593291, "percentage": 3.96, "elapsed_time": "0:03:40", "remaining_time": "1:29:01", "throughput": 4451.25, "total_tokens": 979648} {"current_steps": 1515, "total_steps": 38160, "loss": 0.5554, "lr": 0.0003967505241090147, "epoch": 0.7940251572327044, "percentage": 3.97, "elapsed_time": "0:03:40", "remaining_time": "1:29:01", "throughput": 4451.88, "total_tokens": 983136} {"current_steps": 1520, "total_steps": 38160, "loss": 0.4946, "lr": 0.0003980607966457023, "epoch": 0.7966457023060797, "percentage": 3.98, "elapsed_time": "0:03:41", "remaining_time": "1:29:02", "throughput": 4453.29, "total_tokens": 986976} {"current_steps": 1525, "total_steps": 38160, "loss": 0.4699, "lr": 0.00039937106918238994, "epoch": 0.799266247379455, "percentage": 4.0, "elapsed_time": "0:03:42", "remaining_time": "1:29:01", "throughput": 4453.47, "total_tokens": 990272} {"current_steps": 1530, "total_steps": 38160, "loss": 0.4808, "lr": 0.0004006813417190776, "epoch": 0.8018867924528302, "percentage": 4.01, "elapsed_time": "0:03:43", "remaining_time": "1:29:03", "throughput": 4455.29, "total_tokens": 994368} {"current_steps": 1535, "total_steps": 38160, "loss": 0.4407, "lr": 0.0004019916142557652, "epoch": 0.8045073375262054, "percentage": 4.02, "elapsed_time": "0:03:43", "remaining_time": "1:29:02", "throughput": 4455.27, "total_tokens": 997504} {"current_steps": 1540, "total_steps": 38160, "loss": 0.568, "lr": 0.00040330188679245284, "epoch": 0.8071278825995807, "percentage": 4.04, "elapsed_time": "0:03:44", "remaining_time": "1:28:59", "throughput": 4454.63, "total_tokens": 1000352} {"current_steps": 1545, "total_steps": 38160, "loss": 0.58, "lr": 0.0004046121593291405, "epoch": 0.809748427672956, "percentage": 4.05, "elapsed_time": "0:03:45", "remaining_time": "1:28:58", "throughput": 4454.91, "total_tokens": 1003616} {"current_steps": 1550, "total_steps": 38160, "loss": 0.5682, "lr": 0.0004059224318658281, "epoch": 0.8123689727463312, "percentage": 4.06, "elapsed_time": "0:03:45", "remaining_time": "1:28:56", "throughput": 4454.03, "total_tokens": 1006240} {"current_steps": 1555, "total_steps": 38160, "loss": 0.5371, "lr": 0.00040723270440251575, "epoch": 0.8149895178197065, "percentage": 4.07, "elapsed_time": "0:03:46", "remaining_time": "1:28:55", "throughput": 4454.0, "total_tokens": 1009440} {"current_steps": 1560, "total_steps": 38160, "loss": 0.5506, "lr": 0.00040854297693920333, "epoch": 0.8176100628930818, "percentage": 4.09, "elapsed_time": "0:03:47", "remaining_time": "1:28:51", "throughput": 4452.75, "total_tokens": 1011936} {"current_steps": 1565, "total_steps": 38160, "loss": 0.4716, "lr": 0.00040985324947589096, "epoch": 0.820230607966457, "percentage": 4.1, "elapsed_time": "0:03:47", "remaining_time": "1:28:50", "throughput": 4452.69, "total_tokens": 1015040} {"current_steps": 1570, "total_steps": 38160, "loss": 0.5998, "lr": 0.0004111635220125786, "epoch": 0.8228511530398323, "percentage": 4.11, "elapsed_time": "0:03:48", "remaining_time": "1:28:49", "throughput": 4452.66, "total_tokens": 1018240} {"current_steps": 1575, "total_steps": 38160, "loss": 0.503, "lr": 0.00041247379454926623, "epoch": 0.8254716981132075, "percentage": 4.13, "elapsed_time": "0:03:49", "remaining_time": "1:28:50", "throughput": 4454.63, "total_tokens": 1022336} {"current_steps": 1580, "total_steps": 38160, "loss": 0.5135, "lr": 0.0004137840670859539, "epoch": 0.8280922431865828, "percentage": 4.14, "elapsed_time": "0:03:50", "remaining_time": "1:28:48", "throughput": 4454.0, "total_tokens": 1025184} {"current_steps": 1585, "total_steps": 38160, "loss": 0.5793, "lr": 0.00041509433962264155, "epoch": 0.8307127882599581, "percentage": 4.15, "elapsed_time": "0:03:50", "remaining_time": "1:28:48", "throughput": 4454.21, "total_tokens": 1028448} {"current_steps": 1590, "total_steps": 38160, "loss": 0.5545, "lr": 0.00041640461215932913, "epoch": 0.8333333333333334, "percentage": 4.17, "elapsed_time": "0:03:51", "remaining_time": "1:28:45", "throughput": 4453.04, "total_tokens": 1031072} {"current_steps": 1595, "total_steps": 38160, "loss": 0.476, "lr": 0.00041771488469601677, "epoch": 0.8359538784067087, "percentage": 4.18, "elapsed_time": "0:03:52", "remaining_time": "1:28:44", "throughput": 4453.05, "total_tokens": 1034208} {"current_steps": 1600, "total_steps": 38160, "loss": 0.4526, "lr": 0.0004190251572327044, "epoch": 0.8385744234800838, "percentage": 4.19, "elapsed_time": "0:03:53", "remaining_time": "1:28:46", "throughput": 4455.19, "total_tokens": 1038624} {"current_steps": 1605, "total_steps": 38160, "loss": 0.5629, "lr": 0.00042033542976939204, "epoch": 0.8411949685534591, "percentage": 4.21, "elapsed_time": "0:03:53", "remaining_time": "1:28:44", "throughput": 4453.91, "total_tokens": 1041152} {"current_steps": 1610, "total_steps": 38160, "loss": 0.4165, "lr": 0.00042164570230607967, "epoch": 0.8438155136268344, "percentage": 4.22, "elapsed_time": "0:03:54", "remaining_time": "1:28:41", "throughput": 4453.21, "total_tokens": 1043904} {"current_steps": 1615, "total_steps": 38160, "loss": 0.5203, "lr": 0.0004229559748427673, "epoch": 0.8464360587002097, "percentage": 4.23, "elapsed_time": "0:03:55", "remaining_time": "1:28:41", "throughput": 4453.86, "total_tokens": 1047456} {"current_steps": 1620, "total_steps": 38160, "loss": 0.5663, "lr": 0.00042426624737945494, "epoch": 0.8490566037735849, "percentage": 4.25, "elapsed_time": "0:03:55", "remaining_time": "1:28:39", "throughput": 4453.07, "total_tokens": 1050304} {"current_steps": 1625, "total_steps": 38160, "loss": 0.5146, "lr": 0.0004255765199161425, "epoch": 0.8516771488469602, "percentage": 4.26, "elapsed_time": "0:03:56", "remaining_time": "1:28:39", "throughput": 4453.15, "total_tokens": 1053600} {"current_steps": 1630, "total_steps": 38160, "loss": 0.3679, "lr": 0.0004268867924528302, "epoch": 0.8542976939203354, "percentage": 4.27, "elapsed_time": "0:03:57", "remaining_time": "1:28:38", "throughput": 4452.98, "total_tokens": 1056672} {"current_steps": 1635, "total_steps": 38160, "loss": 0.3992, "lr": 0.00042819706498951784, "epoch": 0.8569182389937107, "percentage": 4.28, "elapsed_time": "0:03:58", "remaining_time": "1:28:37", "throughput": 4452.86, "total_tokens": 1059904} {"current_steps": 1640, "total_steps": 38160, "loss": 0.5048, "lr": 0.0004295073375262055, "epoch": 0.859538784067086, "percentage": 4.3, "elapsed_time": "0:03:58", "remaining_time": "1:28:36", "throughput": 4453.5, "total_tokens": 1063360} {"current_steps": 1645, "total_steps": 38160, "loss": 0.508, "lr": 0.0004308176100628931, "epoch": 0.8621593291404612, "percentage": 4.31, "elapsed_time": "0:03:59", "remaining_time": "1:28:33", "throughput": 4452.06, "total_tokens": 1065728} {"current_steps": 1650, "total_steps": 38160, "loss": 0.481, "lr": 0.00043212788259958075, "epoch": 0.8647798742138365, "percentage": 4.32, "elapsed_time": "0:04:00", "remaining_time": "1:28:31", "throughput": 4451.19, "total_tokens": 1068448} {"current_steps": 1655, "total_steps": 38160, "loss": 0.5102, "lr": 0.0004334381551362683, "epoch": 0.8674004192872118, "percentage": 4.34, "elapsed_time": "0:04:00", "remaining_time": "1:28:28", "throughput": 4450.29, "total_tokens": 1071104} {"current_steps": 1660, "total_steps": 38160, "loss": 0.4178, "lr": 0.00043474842767295596, "epoch": 0.870020964360587, "percentage": 4.35, "elapsed_time": "0:04:01", "remaining_time": "1:28:30", "throughput": 4451.6, "total_tokens": 1075072} {"current_steps": 1665, "total_steps": 38160, "loss": 0.5128, "lr": 0.0004360587002096436, "epoch": 0.8726415094339622, "percentage": 4.36, "elapsed_time": "0:04:02", "remaining_time": "1:28:27", "throughput": 4450.98, "total_tokens": 1077824} {"current_steps": 1670, "total_steps": 38160, "loss": 0.4771, "lr": 0.00043736897274633123, "epoch": 0.8752620545073375, "percentage": 4.38, "elapsed_time": "0:04:02", "remaining_time": "1:28:26", "throughput": 4450.73, "total_tokens": 1080832} {"current_steps": 1675, "total_steps": 38160, "loss": 0.543, "lr": 0.00043867924528301886, "epoch": 0.8778825995807128, "percentage": 4.39, "elapsed_time": "0:04:03", "remaining_time": "1:28:25", "throughput": 4450.83, "total_tokens": 1084096} {"current_steps": 1680, "total_steps": 38160, "loss": 0.5159, "lr": 0.00043998951781970655, "epoch": 0.8805031446540881, "percentage": 4.4, "elapsed_time": "0:04:04", "remaining_time": "1:28:24", "throughput": 4450.39, "total_tokens": 1087104} {"current_steps": 1685, "total_steps": 38160, "loss": 0.5715, "lr": 0.00044129979035639413, "epoch": 0.8831236897274634, "percentage": 4.42, "elapsed_time": "0:04:04", "remaining_time": "1:28:22", "throughput": 4450.63, "total_tokens": 1090304} {"current_steps": 1690, "total_steps": 38160, "loss": 0.7883, "lr": 0.00044261006289308177, "epoch": 0.8857442348008385, "percentage": 4.43, "elapsed_time": "0:04:05", "remaining_time": "1:28:23", "throughput": 4451.75, "total_tokens": 1094112} {"current_steps": 1695, "total_steps": 38160, "loss": 0.5333, "lr": 0.0004439203354297694, "epoch": 0.8883647798742138, "percentage": 4.44, "elapsed_time": "0:04:06", "remaining_time": "1:28:26", "throughput": 4453.65, "total_tokens": 1098496} {"current_steps": 1700, "total_steps": 38160, "loss": 0.4503, "lr": 0.00044523060796645704, "epoch": 0.8909853249475891, "percentage": 4.45, "elapsed_time": "0:04:07", "remaining_time": "1:28:23", "throughput": 4452.38, "total_tokens": 1100992} {"current_steps": 1705, "total_steps": 38160, "loss": 0.5451, "lr": 0.00044654088050314467, "epoch": 0.8936058700209644, "percentage": 4.47, "elapsed_time": "0:04:07", "remaining_time": "1:28:21", "throughput": 4451.74, "total_tokens": 1103776} {"current_steps": 1710, "total_steps": 38160, "loss": 0.452, "lr": 0.0004478511530398323, "epoch": 0.8962264150943396, "percentage": 4.48, "elapsed_time": "0:04:08", "remaining_time": "1:28:18", "throughput": 4450.71, "total_tokens": 1106368} {"current_steps": 1715, "total_steps": 38160, "loss": 0.4424, "lr": 0.0004491614255765199, "epoch": 0.8988469601677149, "percentage": 4.49, "elapsed_time": "0:04:09", "remaining_time": "1:28:17", "throughput": 4450.3, "total_tokens": 1109376} {"current_steps": 1720, "total_steps": 38160, "loss": 0.4653, "lr": 0.0004504716981132075, "epoch": 0.9014675052410901, "percentage": 4.51, "elapsed_time": "0:04:09", "remaining_time": "1:28:16", "throughput": 4449.96, "total_tokens": 1112448} {"current_steps": 1725, "total_steps": 38160, "loss": 0.4825, "lr": 0.00045178197064989515, "epoch": 0.9040880503144654, "percentage": 4.52, "elapsed_time": "0:04:10", "remaining_time": "1:28:15", "throughput": 4449.67, "total_tokens": 1115520} {"current_steps": 1730, "total_steps": 38160, "loss": 0.6451, "lr": 0.00045309224318658284, "epoch": 0.9067085953878407, "percentage": 4.53, "elapsed_time": "0:04:11", "remaining_time": "1:28:14", "throughput": 4450.01, "total_tokens": 1118784} {"current_steps": 1735, "total_steps": 38160, "loss": 0.7135, "lr": 0.0004544025157232705, "epoch": 0.9093291404612159, "percentage": 4.55, "elapsed_time": "0:04:12", "remaining_time": "1:28:13", "throughput": 4450.44, "total_tokens": 1122112} {"current_steps": 1740, "total_steps": 38160, "loss": 0.4702, "lr": 0.0004557127882599581, "epoch": 0.9119496855345912, "percentage": 4.56, "elapsed_time": "0:04:12", "remaining_time": "1:28:13", "throughput": 4451.72, "total_tokens": 1125952} {"current_steps": 1745, "total_steps": 38160, "loss": 0.657, "lr": 0.0004570230607966457, "epoch": 0.9145702306079665, "percentage": 4.57, "elapsed_time": "0:04:13", "remaining_time": "1:28:12", "throughput": 4451.66, "total_tokens": 1129024} {"current_steps": 1750, "total_steps": 38160, "loss": 0.4666, "lr": 0.0004583333333333333, "epoch": 0.9171907756813418, "percentage": 4.59, "elapsed_time": "0:04:14", "remaining_time": "1:28:09", "throughput": 4450.34, "total_tokens": 1131488} {"current_steps": 1755, "total_steps": 38160, "loss": 0.4721, "lr": 0.00045964360587002096, "epoch": 0.9198113207547169, "percentage": 4.6, "elapsed_time": "0:04:14", "remaining_time": "1:28:07", "throughput": 4449.54, "total_tokens": 1134176} {"current_steps": 1760, "total_steps": 38160, "loss": 0.5269, "lr": 0.0004609538784067086, "epoch": 0.9224318658280922, "percentage": 4.61, "elapsed_time": "0:04:15", "remaining_time": "1:28:07", "throughput": 4450.54, "total_tokens": 1137888} {"current_steps": 1765, "total_steps": 38160, "loss": 0.615, "lr": 0.00046226415094339623, "epoch": 0.9250524109014675, "percentage": 4.63, "elapsed_time": "0:04:16", "remaining_time": "1:28:06", "throughput": 4450.92, "total_tokens": 1141184} {"current_steps": 1770, "total_steps": 38160, "loss": 0.5396, "lr": 0.00046357442348008386, "epoch": 0.9276729559748428, "percentage": 4.64, "elapsed_time": "0:04:17", "remaining_time": "1:28:04", "throughput": 4450.55, "total_tokens": 1144064} {"current_steps": 1775, "total_steps": 38160, "loss": 0.5017, "lr": 0.00046488469601677155, "epoch": 0.9302935010482181, "percentage": 4.65, "elapsed_time": "0:04:17", "remaining_time": "1:28:04", "throughput": 4451.24, "total_tokens": 1147584} {"current_steps": 1780, "total_steps": 38160, "loss": 0.4822, "lr": 0.00046619496855345913, "epoch": 0.9329140461215933, "percentage": 4.66, "elapsed_time": "0:04:19", "remaining_time": "1:28:15", "throughput": 4457.0, "total_tokens": 1154784} {"current_steps": 1785, "total_steps": 38160, "loss": 0.4725, "lr": 0.00046750524109014677, "epoch": 0.9355345911949685, "percentage": 4.68, "elapsed_time": "0:04:19", "remaining_time": "1:28:12", "throughput": 4456.25, "total_tokens": 1157440} {"current_steps": 1790, "total_steps": 38160, "loss": 0.6405, "lr": 0.0004688155136268344, "epoch": 0.9381551362683438, "percentage": 4.69, "elapsed_time": "0:04:20", "remaining_time": "1:28:10", "throughput": 4455.5, "total_tokens": 1160224} {"current_steps": 1795, "total_steps": 38160, "loss": 0.5172, "lr": 0.00047012578616352203, "epoch": 0.9407756813417191, "percentage": 4.7, "elapsed_time": "0:04:21", "remaining_time": "1:28:12", "throughput": 4457.44, "total_tokens": 1164480} {"current_steps": 1800, "total_steps": 38160, "loss": 0.3977, "lr": 0.00047143605870020967, "epoch": 0.9433962264150944, "percentage": 4.72, "elapsed_time": "0:04:22", "remaining_time": "1:28:13", "throughput": 4459.39, "total_tokens": 1168704} {"current_steps": 1805, "total_steps": 38160, "loss": 0.4354, "lr": 0.0004727463312368973, "epoch": 0.9460167714884696, "percentage": 4.73, "elapsed_time": "0:04:22", "remaining_time": "1:28:14", "throughput": 4460.25, "total_tokens": 1172384} {"current_steps": 1810, "total_steps": 38160, "loss": 0.4943, "lr": 0.0004740566037735849, "epoch": 0.9486373165618449, "percentage": 4.74, "elapsed_time": "0:04:23", "remaining_time": "1:28:12", "throughput": 4460.03, "total_tokens": 1175392} {"current_steps": 1815, "total_steps": 38160, "loss": 0.4631, "lr": 0.0004753668763102725, "epoch": 0.9512578616352201, "percentage": 4.76, "elapsed_time": "0:04:24", "remaining_time": "1:28:11", "throughput": 4459.73, "total_tokens": 1178368} {"current_steps": 1820, "total_steps": 38160, "loss": 0.4071, "lr": 0.00047667714884696015, "epoch": 0.9538784067085954, "percentage": 4.77, "elapsed_time": "0:04:25", "remaining_time": "1:28:11", "throughput": 4460.77, "total_tokens": 1182240} {"current_steps": 1825, "total_steps": 38160, "loss": 0.4638, "lr": 0.00047798742138364784, "epoch": 0.9564989517819706, "percentage": 4.78, "elapsed_time": "0:04:25", "remaining_time": "1:28:11", "throughput": 4460.83, "total_tokens": 1185504} {"current_steps": 1830, "total_steps": 38160, "loss": 0.4824, "lr": 0.0004792976939203355, "epoch": 0.9591194968553459, "percentage": 4.8, "elapsed_time": "0:04:26", "remaining_time": "1:28:09", "throughput": 4460.21, "total_tokens": 1188288} {"current_steps": 1835, "total_steps": 38160, "loss": 0.457, "lr": 0.0004806079664570231, "epoch": 0.9617400419287212, "percentage": 4.81, "elapsed_time": "0:04:27", "remaining_time": "1:28:09", "throughput": 4460.92, "total_tokens": 1192064} {"current_steps": 1840, "total_steps": 38160, "loss": 0.461, "lr": 0.0004819182389937107, "epoch": 0.9643605870020965, "percentage": 4.82, "elapsed_time": "0:04:27", "remaining_time": "1:28:08", "throughput": 4460.82, "total_tokens": 1195104} {"current_steps": 1845, "total_steps": 38160, "loss": 0.6006, "lr": 0.0004832285115303983, "epoch": 0.9669811320754716, "percentage": 4.83, "elapsed_time": "0:04:28", "remaining_time": "1:28:06", "throughput": 4460.17, "total_tokens": 1197920} {"current_steps": 1850, "total_steps": 38160, "loss": 0.4591, "lr": 0.00048453878406708596, "epoch": 0.9696016771488469, "percentage": 4.85, "elapsed_time": "0:04:29", "remaining_time": "1:28:04", "throughput": 4459.81, "total_tokens": 1200896} {"current_steps": 1855, "total_steps": 38160, "loss": 0.4771, "lr": 0.0004858490566037736, "epoch": 0.9722222222222222, "percentage": 4.86, "elapsed_time": "0:04:29", "remaining_time": "1:28:03", "throughput": 4459.74, "total_tokens": 1204032} {"current_steps": 1860, "total_steps": 38160, "loss": 0.4047, "lr": 0.0004871593291404612, "epoch": 0.9748427672955975, "percentage": 4.87, "elapsed_time": "0:04:30", "remaining_time": "1:28:02", "throughput": 4459.83, "total_tokens": 1207264} {"current_steps": 1865, "total_steps": 38160, "loss": 0.5478, "lr": 0.0004884696016771489, "epoch": 0.9774633123689728, "percentage": 4.89, "elapsed_time": "0:04:31", "remaining_time": "1:28:00", "throughput": 4459.16, "total_tokens": 1209984} {"current_steps": 1870, "total_steps": 38160, "loss": 0.4362, "lr": 0.0004897798742138365, "epoch": 0.980083857442348, "percentage": 4.9, "elapsed_time": "0:04:32", "remaining_time": "1:28:01", "throughput": 4460.16, "total_tokens": 1213856} {"current_steps": 1875, "total_steps": 38160, "loss": 0.4379, "lr": 0.0004910901467505241, "epoch": 0.9827044025157232, "percentage": 4.91, "elapsed_time": "0:04:32", "remaining_time": "1:28:01", "throughput": 4460.61, "total_tokens": 1217408} {"current_steps": 1880, "total_steps": 38160, "loss": 0.5103, "lr": 0.0004924004192872118, "epoch": 0.9853249475890985, "percentage": 4.93, "elapsed_time": "0:04:33", "remaining_time": "1:28:01", "throughput": 4461.24, "total_tokens": 1221024} {"current_steps": 1885, "total_steps": 38160, "loss": 0.4078, "lr": 0.0004937106918238993, "epoch": 0.9879454926624738, "percentage": 4.94, "elapsed_time": "0:04:34", "remaining_time": "1:28:01", "throughput": 4461.37, "total_tokens": 1224320} {"current_steps": 1890, "total_steps": 38160, "loss": 0.3956, "lr": 0.000495020964360587, "epoch": 0.9905660377358491, "percentage": 4.95, "elapsed_time": "0:04:35", "remaining_time": "1:28:01", "throughput": 4462.27, "total_tokens": 1228000} {"current_steps": 1895, "total_steps": 38160, "loss": 0.4922, "lr": 0.0004963312368972746, "epoch": 0.9931865828092243, "percentage": 4.97, "elapsed_time": "0:04:36", "remaining_time": "1:28:02", "throughput": 4464.22, "total_tokens": 1232320} {"current_steps": 1900, "total_steps": 38160, "loss": 0.5838, "lr": 0.0004976415094339623, "epoch": 0.9958071278825996, "percentage": 4.98, "elapsed_time": "0:04:37", "remaining_time": "1:28:09", "throughput": 4467.79, "total_tokens": 1238272} {"current_steps": 1905, "total_steps": 38160, "loss": 0.4991, "lr": 0.0004989517819706499, "epoch": 0.9984276729559748, "percentage": 4.99, "elapsed_time": "0:04:37", "remaining_time": "1:28:07", "throughput": 4467.65, "total_tokens": 1241344} {"current_steps": 1908, "total_steps": 38160, "eval_loss": 0.47990021109580994, "epoch": 1.0, "percentage": 5.0, "elapsed_time": "0:04:51", "remaining_time": "1:32:25", "throughput": 4258.72, "total_tokens": 1243048} {"current_steps": 1910, "total_steps": 38160, "loss": 0.4387, "lr": 0.0005002620545073376, "epoch": 1.00104821802935, "percentage": 5.01, "elapsed_time": "0:04:54", "remaining_time": "1:33:02", "throughput": 4231.21, "total_tokens": 1244520} {"current_steps": 1915, "total_steps": 38160, "loss": 0.4998, "lr": 0.0005015723270440253, "epoch": 1.0036687631027255, "percentage": 5.02, "elapsed_time": "0:04:54", "remaining_time": "1:33:00", "throughput": 4231.48, "total_tokens": 1247528} {"current_steps": 1920, "total_steps": 38160, "loss": 0.5969, "lr": 0.0005028825995807128, "epoch": 1.0062893081761006, "percentage": 5.03, "elapsed_time": "0:04:55", "remaining_time": "1:32:58", "throughput": 4232.05, "total_tokens": 1250824} {"current_steps": 1925, "total_steps": 38160, "loss": 0.5149, "lr": 0.0005041928721174004, "epoch": 1.0089098532494758, "percentage": 5.04, "elapsed_time": "0:04:56", "remaining_time": "1:32:57", "throughput": 4232.52, "total_tokens": 1254024} {"current_steps": 1930, "total_steps": 38160, "loss": 0.4696, "lr": 0.0005055031446540881, "epoch": 1.0115303983228512, "percentage": 5.06, "elapsed_time": "0:04:57", "remaining_time": "1:33:03", "throughput": 4237.56, "total_tokens": 1260328} {"current_steps": 1935, "total_steps": 38160, "loss": 0.6895, "lr": 0.0005068134171907757, "epoch": 1.0141509433962264, "percentage": 5.07, "elapsed_time": "0:04:58", "remaining_time": "1:33:01", "throughput": 4238.34, "total_tokens": 1263656} {"current_steps": 1940, "total_steps": 38160, "loss": 0.5358, "lr": 0.0005081236897274634, "epoch": 1.0167714884696017, "percentage": 5.08, "elapsed_time": "0:04:58", "remaining_time": "1:33:01", "throughput": 4240.0, "total_tokens": 1267528} {"current_steps": 1945, "total_steps": 38160, "loss": 0.6001, "lr": 0.000509433962264151, "epoch": 1.019392033542977, "percentage": 5.1, "elapsed_time": "0:04:59", "remaining_time": "1:32:59", "throughput": 4240.21, "total_tokens": 1270536} {"current_steps": 1950, "total_steps": 38160, "loss": 0.399, "lr": 0.0005107442348008385, "epoch": 1.0220125786163523, "percentage": 5.11, "elapsed_time": "0:05:00", "remaining_time": "1:32:56", "throughput": 4240.16, "total_tokens": 1273416} {"current_steps": 1955, "total_steps": 38160, "loss": 0.375, "lr": 0.0005120545073375262, "epoch": 1.0246331236897275, "percentage": 5.12, "elapsed_time": "0:05:00", "remaining_time": "1:32:54", "throughput": 4240.11, "total_tokens": 1276232} {"current_steps": 1960, "total_steps": 38160, "loss": 0.402, "lr": 0.0005133647798742138, "epoch": 1.0272536687631026, "percentage": 5.14, "elapsed_time": "0:05:01", "remaining_time": "1:32:52", "throughput": 4240.63, "total_tokens": 1279400} {"current_steps": 1965, "total_steps": 38160, "loss": 0.4461, "lr": 0.0005146750524109015, "epoch": 1.029874213836478, "percentage": 5.15, "elapsed_time": "0:05:02", "remaining_time": "1:32:53", "throughput": 4242.76, "total_tokens": 1283752} {"current_steps": 1970, "total_steps": 38160, "loss": 0.4364, "lr": 0.0005159853249475891, "epoch": 1.0324947589098532, "percentage": 5.16, "elapsed_time": "0:05:03", "remaining_time": "1:32:51", "throughput": 4243.45, "total_tokens": 1287048} {"current_steps": 1975, "total_steps": 38160, "loss": 0.5042, "lr": 0.0005172955974842768, "epoch": 1.0351153039832286, "percentage": 5.18, "elapsed_time": "0:05:03", "remaining_time": "1:32:48", "throughput": 4242.85, "total_tokens": 1289544} {"current_steps": 1980, "total_steps": 38160, "loss": 0.4788, "lr": 0.0005186058700209643, "epoch": 1.0377358490566038, "percentage": 5.19, "elapsed_time": "0:05:04", "remaining_time": "1:32:45", "throughput": 4242.88, "total_tokens": 1292392} {"current_steps": 1985, "total_steps": 38160, "loss": 0.5652, "lr": 0.0005199161425576519, "epoch": 1.040356394129979, "percentage": 5.2, "elapsed_time": "0:05:05", "remaining_time": "1:32:43", "throughput": 4243.1, "total_tokens": 1295400} {"current_steps": 1990, "total_steps": 38160, "loss": 0.5139, "lr": 0.0005212264150943396, "epoch": 1.0429769392033543, "percentage": 5.21, "elapsed_time": "0:05:05", "remaining_time": "1:32:40", "throughput": 4243.0, "total_tokens": 1298152} {"current_steps": 1995, "total_steps": 38160, "loss": 0.5943, "lr": 0.0005225366876310272, "epoch": 1.0455974842767295, "percentage": 5.23, "elapsed_time": "0:05:06", "remaining_time": "1:32:39", "throughput": 4243.53, "total_tokens": 1301384} {"current_steps": 2000, "total_steps": 38160, "loss": 0.5438, "lr": 0.000523846960167715, "epoch": 1.0482180293501049, "percentage": 5.24, "elapsed_time": "0:05:07", "remaining_time": "1:32:36", "throughput": 4243.66, "total_tokens": 1304296} {"current_steps": 2005, "total_steps": 38160, "loss": 0.5838, "lr": 0.0005251572327044026, "epoch": 1.05083857442348, "percentage": 5.25, "elapsed_time": "0:05:08", "remaining_time": "1:32:34", "throughput": 4243.57, "total_tokens": 1307048} {"current_steps": 2010, "total_steps": 38160, "loss": 0.4636, "lr": 0.0005264675052410901, "epoch": 1.0534591194968554, "percentage": 5.27, "elapsed_time": "0:05:08", "remaining_time": "1:32:33", "throughput": 4244.99, "total_tokens": 1310792} {"current_steps": 2015, "total_steps": 38160, "loss": 0.6042, "lr": 0.0005277777777777778, "epoch": 1.0560796645702306, "percentage": 5.28, "elapsed_time": "0:05:09", "remaining_time": "1:32:30", "throughput": 4244.79, "total_tokens": 1313448} {"current_steps": 2020, "total_steps": 38160, "loss": 0.4096, "lr": 0.0005290880503144654, "epoch": 1.0587002096436058, "percentage": 5.29, "elapsed_time": "0:05:10", "remaining_time": "1:32:27", "throughput": 4244.6, "total_tokens": 1316200} {"current_steps": 2025, "total_steps": 38160, "loss": 0.7931, "lr": 0.0005303983228511531, "epoch": 1.0613207547169812, "percentage": 5.31, "elapsed_time": "0:05:10", "remaining_time": "1:32:26", "throughput": 4245.64, "total_tokens": 1319720} {"current_steps": 2030, "total_steps": 38160, "loss": 0.5444, "lr": 0.0005317085953878407, "epoch": 1.0639412997903563, "percentage": 5.32, "elapsed_time": "0:05:11", "remaining_time": "1:32:26", "throughput": 4246.83, "total_tokens": 1323432} {"current_steps": 2035, "total_steps": 38160, "loss": 0.4949, "lr": 0.0005330188679245284, "epoch": 1.0665618448637317, "percentage": 5.33, "elapsed_time": "0:05:12", "remaining_time": "1:32:24", "throughput": 4247.51, "total_tokens": 1326760} {"current_steps": 2040, "total_steps": 38160, "loss": 0.4619, "lr": 0.000534329140461216, "epoch": 1.069182389937107, "percentage": 5.35, "elapsed_time": "0:05:13", "remaining_time": "1:32:23", "throughput": 4248.23, "total_tokens": 1330120} {"current_steps": 2045, "total_steps": 38160, "loss": 0.5418, "lr": 0.0005356394129979035, "epoch": 1.0718029350104823, "percentage": 5.36, "elapsed_time": "0:05:13", "remaining_time": "1:32:21", "throughput": 4248.26, "total_tokens": 1333032} {"current_steps": 2050, "total_steps": 38160, "loss": 0.5808, "lr": 0.0005369496855345912, "epoch": 1.0744234800838575, "percentage": 5.37, "elapsed_time": "0:05:14", "remaining_time": "1:32:19", "throughput": 4248.94, "total_tokens": 1336296} {"current_steps": 2055, "total_steps": 38160, "loss": 0.3735, "lr": 0.0005382599580712788, "epoch": 1.0770440251572326, "percentage": 5.39, "elapsed_time": "0:05:15", "remaining_time": "1:32:18", "throughput": 4249.63, "total_tokens": 1339592} {"current_steps": 2060, "total_steps": 38160, "loss": 0.4939, "lr": 0.0005395702306079665, "epoch": 1.079664570230608, "percentage": 5.4, "elapsed_time": "0:05:15", "remaining_time": "1:32:16", "throughput": 4249.78, "total_tokens": 1342664} {"current_steps": 2065, "total_steps": 38160, "loss": 0.5871, "lr": 0.0005408805031446541, "epoch": 1.0822851153039832, "percentage": 5.41, "elapsed_time": "0:05:16", "remaining_time": "1:32:13", "throughput": 4249.47, "total_tokens": 1345288} {"current_steps": 2070, "total_steps": 38160, "loss": 0.4675, "lr": 0.0005421907756813418, "epoch": 1.0849056603773586, "percentage": 5.42, "elapsed_time": "0:05:17", "remaining_time": "1:32:11", "throughput": 4250.07, "total_tokens": 1348488} {"current_steps": 2075, "total_steps": 38160, "loss": 0.6155, "lr": 0.0005435010482180293, "epoch": 1.0875262054507338, "percentage": 5.44, "elapsed_time": "0:05:18", "remaining_time": "1:32:12", "throughput": 4252.02, "total_tokens": 1352712} {"current_steps": 2080, "total_steps": 38160, "loss": 0.4465, "lr": 0.0005448113207547169, "epoch": 1.090146750524109, "percentage": 5.45, "elapsed_time": "0:05:18", "remaining_time": "1:32:10", "throughput": 4251.73, "total_tokens": 1355496} {"current_steps": 2085, "total_steps": 38160, "loss": 0.52, "lr": 0.0005461215932914046, "epoch": 1.0927672955974843, "percentage": 5.46, "elapsed_time": "0:05:19", "remaining_time": "1:32:12", "throughput": 4254.73, "total_tokens": 1360552} {"current_steps": 2090, "total_steps": 38160, "loss": 0.428, "lr": 0.0005474318658280922, "epoch": 1.0953878406708595, "percentage": 5.48, "elapsed_time": "0:05:20", "remaining_time": "1:32:10", "throughput": 4254.81, "total_tokens": 1363432} {"current_steps": 2095, "total_steps": 38160, "loss": 0.3868, "lr": 0.0005487421383647799, "epoch": 1.0980083857442349, "percentage": 5.49, "elapsed_time": "0:05:21", "remaining_time": "1:32:09", "throughput": 4255.51, "total_tokens": 1366824} {"current_steps": 2100, "total_steps": 38160, "loss": 0.5607, "lr": 0.0005500524109014676, "epoch": 1.10062893081761, "percentage": 5.5, "elapsed_time": "0:05:21", "remaining_time": "1:32:07", "throughput": 4256.57, "total_tokens": 1370312} {"current_steps": 2105, "total_steps": 38160, "loss": 0.7055, "lr": 0.0005513626834381551, "epoch": 1.1032494758909852, "percentage": 5.52, "elapsed_time": "0:05:22", "remaining_time": "1:32:05", "throughput": 4256.64, "total_tokens": 1373160} {"current_steps": 2110, "total_steps": 38160, "loss": 0.5473, "lr": 0.0005526729559748428, "epoch": 1.1058700209643606, "percentage": 5.53, "elapsed_time": "0:05:23", "remaining_time": "1:32:03", "throughput": 4256.58, "total_tokens": 1376008} {"current_steps": 2115, "total_steps": 38160, "loss": 0.5465, "lr": 0.0005539832285115304, "epoch": 1.1084905660377358, "percentage": 5.54, "elapsed_time": "0:05:23", "remaining_time": "1:31:59", "throughput": 4255.96, "total_tokens": 1378440} {"current_steps": 2120, "total_steps": 38160, "loss": 0.5314, "lr": 0.0005552935010482181, "epoch": 1.1111111111111112, "percentage": 5.56, "elapsed_time": "0:05:24", "remaining_time": "1:31:59", "throughput": 4257.13, "total_tokens": 1382152} {"current_steps": 2125, "total_steps": 38160, "loss": 0.6587, "lr": 0.0005566037735849057, "epoch": 1.1137316561844863, "percentage": 5.57, "elapsed_time": "0:05:25", "remaining_time": "1:31:57", "throughput": 4257.6, "total_tokens": 1385416} {"current_steps": 2130, "total_steps": 38160, "loss": 0.4586, "lr": 0.0005579140461215934, "epoch": 1.1163522012578617, "percentage": 5.58, "elapsed_time": "0:05:26", "remaining_time": "1:31:57", "throughput": 4259.01, "total_tokens": 1389288} {"current_steps": 2135, "total_steps": 38160, "loss": 0.5157, "lr": 0.000559224318658281, "epoch": 1.118972746331237, "percentage": 5.59, "elapsed_time": "0:05:26", "remaining_time": "1:31:55", "throughput": 4259.01, "total_tokens": 1392136} {"current_steps": 2140, "total_steps": 38160, "loss": 0.4965, "lr": 0.0005605345911949685, "epoch": 1.121593291404612, "percentage": 5.61, "elapsed_time": "0:05:27", "remaining_time": "1:31:53", "throughput": 4259.27, "total_tokens": 1395208} {"current_steps": 2145, "total_steps": 38160, "loss": 0.4232, "lr": 0.0005618448637316562, "epoch": 1.1242138364779874, "percentage": 5.62, "elapsed_time": "0:05:28", "remaining_time": "1:31:51", "throughput": 4259.28, "total_tokens": 1398024} {"current_steps": 2150, "total_steps": 38160, "loss": 0.4574, "lr": 0.0005631551362683438, "epoch": 1.1268343815513626, "percentage": 5.63, "elapsed_time": "0:05:28", "remaining_time": "1:31:49", "throughput": 4259.67, "total_tokens": 1401256} {"current_steps": 2155, "total_steps": 38160, "loss": 0.3676, "lr": 0.0005644654088050315, "epoch": 1.129454926624738, "percentage": 5.65, "elapsed_time": "0:05:29", "remaining_time": "1:31:46", "throughput": 4259.21, "total_tokens": 1403848} {"current_steps": 2160, "total_steps": 38160, "loss": 0.5891, "lr": 0.0005657756813417191, "epoch": 1.1320754716981132, "percentage": 5.66, "elapsed_time": "0:05:30", "remaining_time": "1:31:47", "throughput": 4261.04, "total_tokens": 1408040} {"current_steps": 2165, "total_steps": 38160, "loss": 0.6175, "lr": 0.0005670859538784067, "epoch": 1.1346960167714886, "percentage": 5.67, "elapsed_time": "0:05:31", "remaining_time": "1:31:46", "throughput": 4262.08, "total_tokens": 1411688} {"current_steps": 2170, "total_steps": 38160, "loss": 0.6036, "lr": 0.0005683962264150943, "epoch": 1.1373165618448637, "percentage": 5.69, "elapsed_time": "0:05:32", "remaining_time": "1:31:46", "throughput": 4263.26, "total_tokens": 1415464} {"current_steps": 2175, "total_steps": 38160, "loss": 0.4133, "lr": 0.0005697064989517819, "epoch": 1.139937106918239, "percentage": 5.7, "elapsed_time": "0:05:32", "remaining_time": "1:31:45", "throughput": 4263.62, "total_tokens": 1418664} {"current_steps": 2180, "total_steps": 38160, "loss": 0.4336, "lr": 0.0005710167714884696, "epoch": 1.1425576519916143, "percentage": 5.71, "elapsed_time": "0:05:33", "remaining_time": "1:31:44", "throughput": 4264.33, "total_tokens": 1422088} {"current_steps": 2185, "total_steps": 38160, "loss": 0.4393, "lr": 0.0005723270440251572, "epoch": 1.1451781970649895, "percentage": 5.73, "elapsed_time": "0:05:34", "remaining_time": "1:31:41", "throughput": 4264.26, "total_tokens": 1424872} {"current_steps": 2190, "total_steps": 38160, "loss": 0.6248, "lr": 0.0005736373165618449, "epoch": 1.1477987421383649, "percentage": 5.74, "elapsed_time": "0:05:35", "remaining_time": "1:31:42", "throughput": 4266.5, "total_tokens": 1429320} {"current_steps": 2195, "total_steps": 38160, "loss": 0.4801, "lr": 0.0005749475890985325, "epoch": 1.15041928721174, "percentage": 5.75, "elapsed_time": "0:05:35", "remaining_time": "1:31:43", "throughput": 4268.64, "total_tokens": 1433704} {"current_steps": 2200, "total_steps": 38160, "loss": 0.5103, "lr": 0.0005762578616352201, "epoch": 1.1530398322851152, "percentage": 5.77, "elapsed_time": "0:05:36", "remaining_time": "1:31:41", "throughput": 4269.03, "total_tokens": 1436872} {"current_steps": 2205, "total_steps": 38160, "loss": 0.4957, "lr": 0.0005775681341719078, "epoch": 1.1556603773584906, "percentage": 5.78, "elapsed_time": "0:05:37", "remaining_time": "1:31:39", "throughput": 4269.68, "total_tokens": 1440104} {"current_steps": 2210, "total_steps": 38160, "loss": 0.6599, "lr": 0.0005788784067085954, "epoch": 1.1582809224318658, "percentage": 5.79, "elapsed_time": "0:05:37", "remaining_time": "1:31:37", "throughput": 4269.94, "total_tokens": 1443176} {"current_steps": 2215, "total_steps": 38160, "loss": 0.4622, "lr": 0.0005801886792452831, "epoch": 1.1609014675052411, "percentage": 5.8, "elapsed_time": "0:05:38", "remaining_time": "1:31:36", "throughput": 4270.36, "total_tokens": 1446440} {"current_steps": 2220, "total_steps": 38160, "loss": 0.4721, "lr": 0.0005814989517819707, "epoch": 1.1635220125786163, "percentage": 5.82, "elapsed_time": "0:05:39", "remaining_time": "1:31:36", "throughput": 4271.46, "total_tokens": 1450120} {"current_steps": 2225, "total_steps": 38160, "loss": 0.4728, "lr": 0.0005828092243186583, "epoch": 1.1661425576519917, "percentage": 5.83, "elapsed_time": "0:05:40", "remaining_time": "1:31:35", "throughput": 4272.31, "total_tokens": 1453608} {"current_steps": 2230, "total_steps": 38160, "loss": 0.6287, "lr": 0.000584119496855346, "epoch": 1.1687631027253669, "percentage": 5.84, "elapsed_time": "0:05:41", "remaining_time": "1:31:35", "throughput": 4274.25, "total_tokens": 1457832} {"current_steps": 2235, "total_steps": 38160, "loss": 0.543, "lr": 0.0005854297693920335, "epoch": 1.171383647798742, "percentage": 5.86, "elapsed_time": "0:05:41", "remaining_time": "1:31:36", "throughput": 4276.41, "total_tokens": 1462280} {"current_steps": 2240, "total_steps": 38160, "loss": 0.4937, "lr": 0.0005867400419287212, "epoch": 1.1740041928721174, "percentage": 5.87, "elapsed_time": "0:05:42", "remaining_time": "1:31:35", "throughput": 4277.56, "total_tokens": 1466024} {"current_steps": 2245, "total_steps": 38160, "loss": 0.4739, "lr": 0.0005880503144654088, "epoch": 1.1766247379454926, "percentage": 5.88, "elapsed_time": "0:05:43", "remaining_time": "1:31:33", "throughput": 4277.42, "total_tokens": 1468872} {"current_steps": 2250, "total_steps": 38160, "loss": 0.4959, "lr": 0.0005893605870020965, "epoch": 1.179245283018868, "percentage": 5.9, "elapsed_time": "0:05:44", "remaining_time": "1:31:30", "throughput": 4276.86, "total_tokens": 1471336} {"current_steps": 2255, "total_steps": 38160, "loss": 0.6223, "lr": 0.0005906708595387841, "epoch": 1.1818658280922432, "percentage": 5.91, "elapsed_time": "0:05:44", "remaining_time": "1:31:27", "throughput": 4276.47, "total_tokens": 1473928} {"current_steps": 2260, "total_steps": 38160, "loss": 0.428, "lr": 0.0005919811320754716, "epoch": 1.1844863731656186, "percentage": 5.92, "elapsed_time": "0:05:45", "remaining_time": "1:31:29", "throughput": 4278.94, "total_tokens": 1478728} {"current_steps": 2265, "total_steps": 38160, "loss": 0.4867, "lr": 0.0005932914046121593, "epoch": 1.1871069182389937, "percentage": 5.94, "elapsed_time": "0:05:46", "remaining_time": "1:31:27", "throughput": 4278.89, "total_tokens": 1481576} {"current_steps": 2270, "total_steps": 38160, "loss": 0.5201, "lr": 0.0005946016771488469, "epoch": 1.189727463312369, "percentage": 5.95, "elapsed_time": "0:05:46", "remaining_time": "1:31:24", "throughput": 4278.43, "total_tokens": 1484104} {"current_steps": 2275, "total_steps": 38160, "loss": 0.5939, "lr": 0.0005959119496855346, "epoch": 1.1923480083857443, "percentage": 5.96, "elapsed_time": "0:05:47", "remaining_time": "1:31:22", "throughput": 4278.55, "total_tokens": 1487048} {"current_steps": 2280, "total_steps": 38160, "loss": 0.4562, "lr": 0.0005972222222222222, "epoch": 1.1949685534591195, "percentage": 5.97, "elapsed_time": "0:05:48", "remaining_time": "1:31:20", "throughput": 4278.85, "total_tokens": 1490152} {"current_steps": 2285, "total_steps": 38160, "loss": 0.4346, "lr": 0.0005985324947589099, "epoch": 1.1975890985324948, "percentage": 5.99, "elapsed_time": "0:05:48", "remaining_time": "1:31:17", "throughput": 4278.25, "total_tokens": 1492648} {"current_steps": 2290, "total_steps": 38160, "loss": 0.5848, "lr": 0.0005998427672955975, "epoch": 1.20020964360587, "percentage": 6.0, "elapsed_time": "0:05:49", "remaining_time": "1:31:15", "throughput": 4277.88, "total_tokens": 1495272} {"current_steps": 2295, "total_steps": 38160, "loss": 0.5072, "lr": 0.000601153039832285, "epoch": 1.2028301886792452, "percentage": 6.01, "elapsed_time": "0:05:50", "remaining_time": "1:31:12", "throughput": 4277.34, "total_tokens": 1497832} {"current_steps": 2300, "total_steps": 38160, "loss": 0.4003, "lr": 0.0006024633123689728, "epoch": 1.2054507337526206, "percentage": 6.03, "elapsed_time": "0:05:51", "remaining_time": "1:31:12", "throughput": 4278.9, "total_tokens": 1501896} {"current_steps": 2305, "total_steps": 38160, "loss": 0.4761, "lr": 0.0006037735849056604, "epoch": 1.2080712788259957, "percentage": 6.04, "elapsed_time": "0:05:51", "remaining_time": "1:31:09", "throughput": 4278.28, "total_tokens": 1504328} {"current_steps": 2310, "total_steps": 38160, "loss": 0.5255, "lr": 0.0006050838574423481, "epoch": 1.2106918238993711, "percentage": 6.05, "elapsed_time": "0:05:52", "remaining_time": "1:31:09", "throughput": 4279.71, "total_tokens": 1508264} {"current_steps": 2315, "total_steps": 38160, "loss": 0.5938, "lr": 0.0006063941299790357, "epoch": 1.2133123689727463, "percentage": 6.07, "elapsed_time": "0:05:53", "remaining_time": "1:31:07", "throughput": 4279.56, "total_tokens": 1511048} {"current_steps": 2320, "total_steps": 38160, "loss": 0.679, "lr": 0.0006077044025157233, "epoch": 1.2159329140461215, "percentage": 6.08, "elapsed_time": "0:05:53", "remaining_time": "1:31:04", "throughput": 4279.6, "total_tokens": 1513928} {"current_steps": 2325, "total_steps": 38160, "loss": 0.4412, "lr": 0.000609014675052411, "epoch": 1.2185534591194969, "percentage": 6.09, "elapsed_time": "0:05:54", "remaining_time": "1:31:04", "throughput": 4280.43, "total_tokens": 1517512} {"current_steps": 2330, "total_steps": 38160, "loss": 0.391, "lr": 0.0006103249475890985, "epoch": 1.221174004192872, "percentage": 6.11, "elapsed_time": "0:05:55", "remaining_time": "1:31:03", "throughput": 4281.55, "total_tokens": 1521256} {"current_steps": 2335, "total_steps": 38160, "loss": 0.6336, "lr": 0.0006116352201257862, "epoch": 1.2237945492662474, "percentage": 6.12, "elapsed_time": "0:05:55", "remaining_time": "1:30:59", "throughput": 4280.13, "total_tokens": 1523144} {"current_steps": 2340, "total_steps": 38160, "loss": 0.5005, "lr": 0.0006129454926624738, "epoch": 1.2264150943396226, "percentage": 6.13, "elapsed_time": "0:05:56", "remaining_time": "1:31:01", "throughput": 4281.97, "total_tokens": 1527624} {"current_steps": 2345, "total_steps": 38160, "loss": 0.4744, "lr": 0.0006142557651991615, "epoch": 1.229035639412998, "percentage": 6.15, "elapsed_time": "0:05:57", "remaining_time": "1:31:01", "throughput": 4283.24, "total_tokens": 1531560} {"current_steps": 2350, "total_steps": 38160, "loss": 0.4903, "lr": 0.0006155660377358491, "epoch": 1.2316561844863732, "percentage": 6.16, "elapsed_time": "0:05:58", "remaining_time": "1:30:58", "throughput": 4282.33, "total_tokens": 1533832} {"current_steps": 2355, "total_steps": 38160, "loss": 0.5364, "lr": 0.0006168763102725366, "epoch": 1.2342767295597485, "percentage": 6.17, "elapsed_time": "0:05:58", "remaining_time": "1:30:55", "throughput": 4282.11, "total_tokens": 1536584} {"current_steps": 2360, "total_steps": 38160, "loss": 0.4857, "lr": 0.0006181865828092243, "epoch": 1.2368972746331237, "percentage": 6.18, "elapsed_time": "0:05:59", "remaining_time": "1:30:54", "throughput": 4282.18, "total_tokens": 1539720} {"current_steps": 2365, "total_steps": 38160, "loss": 0.3794, "lr": 0.0006194968553459119, "epoch": 1.2395178197064989, "percentage": 6.2, "elapsed_time": "0:06:00", "remaining_time": "1:30:53", "throughput": 4282.75, "total_tokens": 1543112} {"current_steps": 2370, "total_steps": 38160, "loss": 0.519, "lr": 0.0006208071278825996, "epoch": 1.2421383647798743, "percentage": 6.21, "elapsed_time": "0:06:01", "remaining_time": "1:30:52", "throughput": 4283.4, "total_tokens": 1546568} {"current_steps": 2375, "total_steps": 38160, "loss": 0.5325, "lr": 0.0006221174004192872, "epoch": 1.2447589098532494, "percentage": 6.22, "elapsed_time": "0:06:01", "remaining_time": "1:30:51", "throughput": 4283.99, "total_tokens": 1549864} {"current_steps": 2380, "total_steps": 38160, "loss": 0.4411, "lr": 0.0006234276729559748, "epoch": 1.2473794549266248, "percentage": 6.24, "elapsed_time": "0:06:02", "remaining_time": "1:30:48", "throughput": 4283.62, "total_tokens": 1552456} {"current_steps": 2385, "total_steps": 38160, "loss": 0.5765, "lr": 0.0006247379454926625, "epoch": 1.25, "percentage": 6.25, "elapsed_time": "0:06:03", "remaining_time": "1:30:46", "throughput": 4283.4, "total_tokens": 1555240} {"current_steps": 2390, "total_steps": 38160, "loss": 0.4217, "lr": 0.00062604821802935, "epoch": 1.2526205450733752, "percentage": 6.26, "elapsed_time": "0:06:03", "remaining_time": "1:30:45", "throughput": 4283.98, "total_tokens": 1558568} {"current_steps": 2395, "total_steps": 38160, "loss": 0.546, "lr": 0.0006273584905660377, "epoch": 1.2552410901467506, "percentage": 6.28, "elapsed_time": "0:06:04", "remaining_time": "1:30:42", "throughput": 4283.79, "total_tokens": 1561288} {"current_steps": 2400, "total_steps": 38160, "loss": 0.5648, "lr": 0.0006286687631027254, "epoch": 1.2578616352201257, "percentage": 6.29, "elapsed_time": "0:06:05", "remaining_time": "1:30:40", "throughput": 4283.77, "total_tokens": 1564200} {"current_steps": 2405, "total_steps": 38160, "loss": 0.5169, "lr": 0.0006299790356394131, "epoch": 1.2604821802935011, "percentage": 6.3, "elapsed_time": "0:06:05", "remaining_time": "1:30:38", "throughput": 4283.85, "total_tokens": 1567208} {"current_steps": 2410, "total_steps": 38160, "loss": 0.4424, "lr": 0.0006312893081761007, "epoch": 1.2631027253668763, "percentage": 6.32, "elapsed_time": "0:06:06", "remaining_time": "1:30:38", "throughput": 4285.32, "total_tokens": 1571240} {"current_steps": 2415, "total_steps": 38160, "loss": 0.504, "lr": 0.0006325995807127883, "epoch": 1.2657232704402515, "percentage": 6.33, "elapsed_time": "0:06:07", "remaining_time": "1:30:37", "throughput": 4285.56, "total_tokens": 1574376} {"current_steps": 2420, "total_steps": 38160, "loss": 0.5658, "lr": 0.000633909853249476, "epoch": 1.2683438155136268, "percentage": 6.34, "elapsed_time": "0:06:08", "remaining_time": "1:30:36", "throughput": 4286.13, "total_tokens": 1577672} {"current_steps": 2425, "total_steps": 38160, "loss": 0.4414, "lr": 0.0006352201257861635, "epoch": 1.270964360587002, "percentage": 6.35, "elapsed_time": "0:06:08", "remaining_time": "1:30:35", "throughput": 4286.9, "total_tokens": 1581192} {"current_steps": 2430, "total_steps": 38160, "loss": 0.4289, "lr": 0.0006365303983228512, "epoch": 1.2735849056603774, "percentage": 6.37, "elapsed_time": "0:06:09", "remaining_time": "1:30:33", "throughput": 4287.29, "total_tokens": 1584424} {"current_steps": 2435, "total_steps": 38160, "loss": 0.5018, "lr": 0.0006378406708595388, "epoch": 1.2762054507337526, "percentage": 6.38, "elapsed_time": "0:06:10", "remaining_time": "1:30:33", "throughput": 4287.87, "total_tokens": 1587912} {"current_steps": 2440, "total_steps": 38160, "loss": 0.3716, "lr": 0.0006391509433962265, "epoch": 1.2788259958071277, "percentage": 6.39, "elapsed_time": "0:06:11", "remaining_time": "1:30:32", "throughput": 4288.86, "total_tokens": 1591624} {"current_steps": 2445, "total_steps": 38160, "loss": 0.5233, "lr": 0.0006404612159329141, "epoch": 1.2814465408805031, "percentage": 6.41, "elapsed_time": "0:06:11", "remaining_time": "1:30:30", "throughput": 4288.72, "total_tokens": 1594376} {"current_steps": 2450, "total_steps": 38160, "loss": 0.4619, "lr": 0.0006417714884696016, "epoch": 1.2840670859538785, "percentage": 6.42, "elapsed_time": "0:06:12", "remaining_time": "1:30:29", "throughput": 4289.12, "total_tokens": 1597608} {"current_steps": 2455, "total_steps": 38160, "loss": 0.4558, "lr": 0.0006430817610062893, "epoch": 1.2866876310272537, "percentage": 6.43, "elapsed_time": "0:06:13", "remaining_time": "1:30:26", "throughput": 4288.63, "total_tokens": 1600136} {"current_steps": 2460, "total_steps": 38160, "loss": 0.495, "lr": 0.0006443920335429769, "epoch": 1.2893081761006289, "percentage": 6.45, "elapsed_time": "0:06:13", "remaining_time": "1:30:25", "throughput": 4289.26, "total_tokens": 1603592} {"current_steps": 2465, "total_steps": 38160, "loss": 0.6001, "lr": 0.0006457023060796646, "epoch": 1.2919287211740043, "percentage": 6.46, "elapsed_time": "0:06:14", "remaining_time": "1:30:23", "throughput": 4289.25, "total_tokens": 1606504} {"current_steps": 2470, "total_steps": 38160, "loss": 0.4403, "lr": 0.0006470125786163522, "epoch": 1.2945492662473794, "percentage": 6.47, "elapsed_time": "0:06:15", "remaining_time": "1:30:29", "throughput": 4293.01, "total_tokens": 1613064} {"current_steps": 2475, "total_steps": 38160, "loss": 0.4773, "lr": 0.0006483228511530398, "epoch": 1.2971698113207548, "percentage": 6.49, "elapsed_time": "0:06:16", "remaining_time": "1:30:27", "throughput": 4293.16, "total_tokens": 1616136} {"current_steps": 2480, "total_steps": 38160, "loss": 0.4508, "lr": 0.0006496331236897275, "epoch": 1.29979035639413, "percentage": 6.5, "elapsed_time": "0:06:17", "remaining_time": "1:30:25", "throughput": 4292.84, "total_tokens": 1618792} {"current_steps": 2485, "total_steps": 38160, "loss": 0.4108, "lr": 0.000650943396226415, "epoch": 1.3024109014675052, "percentage": 6.51, "elapsed_time": "0:06:17", "remaining_time": "1:30:22", "throughput": 4292.06, "total_tokens": 1621096} {"current_steps": 2490, "total_steps": 38160, "loss": 0.4194, "lr": 0.0006522536687631027, "epoch": 1.3050314465408805, "percentage": 6.53, "elapsed_time": "0:06:18", "remaining_time": "1:30:19", "throughput": 4291.64, "total_tokens": 1623720} {"current_steps": 2495, "total_steps": 38160, "loss": 0.51, "lr": 0.0006535639412997903, "epoch": 1.3076519916142557, "percentage": 6.54, "elapsed_time": "0:06:19", "remaining_time": "1:30:18", "throughput": 4291.95, "total_tokens": 1626888} {"current_steps": 2500, "total_steps": 38160, "loss": 0.6266, "lr": 0.0006548742138364781, "epoch": 1.310272536687631, "percentage": 6.55, "elapsed_time": "0:06:19", "remaining_time": "1:30:17", "throughput": 4292.67, "total_tokens": 1630472} {"current_steps": 2505, "total_steps": 38160, "loss": 0.4654, "lr": 0.0006561844863731657, "epoch": 1.3128930817610063, "percentage": 6.56, "elapsed_time": "0:06:20", "remaining_time": "1:30:15", "throughput": 4292.42, "total_tokens": 1633192} {"current_steps": 2510, "total_steps": 38160, "loss": 0.5465, "lr": 0.0006574947589098533, "epoch": 1.3155136268343814, "percentage": 6.58, "elapsed_time": "0:06:21", "remaining_time": "1:30:15", "throughput": 4293.7, "total_tokens": 1637128} {"current_steps": 2515, "total_steps": 38160, "loss": 0.5135, "lr": 0.000658805031446541, "epoch": 1.3181341719077568, "percentage": 6.59, "elapsed_time": "0:06:22", "remaining_time": "1:30:14", "throughput": 4294.23, "total_tokens": 1640456} {"current_steps": 2520, "total_steps": 38160, "loss": 0.6134, "lr": 0.0006601153039832285, "epoch": 1.320754716981132, "percentage": 6.6, "elapsed_time": "0:06:22", "remaining_time": "1:30:13", "throughput": 4295.0, "total_tokens": 1644008} {"current_steps": 2525, "total_steps": 38160, "loss": 0.4634, "lr": 0.0006614255765199162, "epoch": 1.3233752620545074, "percentage": 6.62, "elapsed_time": "0:06:23", "remaining_time": "1:30:13", "throughput": 4295.87, "total_tokens": 1647720} {"current_steps": 2530, "total_steps": 38160, "loss": 0.6304, "lr": 0.0006627358490566038, "epoch": 1.3259958071278826, "percentage": 6.63, "elapsed_time": "0:06:24", "remaining_time": "1:30:10", "throughput": 4295.65, "total_tokens": 1650440} {"current_steps": 2535, "total_steps": 38160, "loss": 0.5914, "lr": 0.0006640461215932914, "epoch": 1.3286163522012577, "percentage": 6.64, "elapsed_time": "0:06:24", "remaining_time": "1:30:09", "throughput": 4295.57, "total_tokens": 1653352} {"current_steps": 2540, "total_steps": 38160, "loss": 0.4623, "lr": 0.0006653563941299791, "epoch": 1.3312368972746331, "percentage": 6.66, "elapsed_time": "0:06:25", "remaining_time": "1:30:07", "throughput": 4295.62, "total_tokens": 1656360} {"current_steps": 2545, "total_steps": 38160, "loss": 0.6201, "lr": 0.0006666666666666666, "epoch": 1.3338574423480085, "percentage": 6.67, "elapsed_time": "0:06:26", "remaining_time": "1:30:05", "throughput": 4295.71, "total_tokens": 1659336} {"current_steps": 2550, "total_steps": 38160, "loss": 0.7107, "lr": 0.0006679769392033543, "epoch": 1.3364779874213837, "percentage": 6.68, "elapsed_time": "0:06:26", "remaining_time": "1:30:03", "throughput": 4295.23, "total_tokens": 1661896} {"current_steps": 2555, "total_steps": 38160, "loss": 0.3833, "lr": 0.0006692872117400419, "epoch": 1.3390985324947589, "percentage": 6.7, "elapsed_time": "0:06:27", "remaining_time": "1:30:03", "throughput": 4296.36, "total_tokens": 1665832} {"current_steps": 2560, "total_steps": 38160, "loss": 0.5444, "lr": 0.0006705974842767296, "epoch": 1.3417190775681342, "percentage": 6.71, "elapsed_time": "0:06:28", "remaining_time": "1:30:01", "throughput": 4296.03, "total_tokens": 1668520} {"current_steps": 2565, "total_steps": 38160, "loss": 0.4662, "lr": 0.0006719077568134172, "epoch": 1.3443396226415094, "percentage": 6.72, "elapsed_time": "0:06:29", "remaining_time": "1:29:59", "throughput": 4296.64, "total_tokens": 1671912} {"current_steps": 2570, "total_steps": 38160, "loss": 0.4916, "lr": 0.0006732180293501048, "epoch": 1.3469601677148848, "percentage": 6.73, "elapsed_time": "0:06:29", "remaining_time": "1:29:58", "throughput": 4296.93, "total_tokens": 1675080} {"current_steps": 2575, "total_steps": 38160, "loss": 0.3431, "lr": 0.0006745283018867925, "epoch": 1.34958071278826, "percentage": 6.75, "elapsed_time": "0:06:30", "remaining_time": "1:30:03", "throughput": 4300.57, "total_tokens": 1681512} {"current_steps": 2580, "total_steps": 38160, "loss": 0.4818, "lr": 0.00067583857442348, "epoch": 1.3522012578616351, "percentage": 6.76, "elapsed_time": "0:06:31", "remaining_time": "1:30:02", "throughput": 4301.16, "total_tokens": 1685000} {"current_steps": 2585, "total_steps": 38160, "loss": 0.4459, "lr": 0.0006771488469601677, "epoch": 1.3548218029350105, "percentage": 6.77, "elapsed_time": "0:06:32", "remaining_time": "1:30:00", "throughput": 4300.7, "total_tokens": 1687528} {"current_steps": 2590, "total_steps": 38160, "loss": 0.6047, "lr": 0.0006784591194968553, "epoch": 1.3574423480083857, "percentage": 6.79, "elapsed_time": "0:06:33", "remaining_time": "1:29:57", "throughput": 4300.43, "total_tokens": 1690280} {"current_steps": 2595, "total_steps": 38160, "loss": 0.4013, "lr": 0.0006797693920335431, "epoch": 1.360062893081761, "percentage": 6.8, "elapsed_time": "0:06:33", "remaining_time": "1:29:56", "throughput": 4300.51, "total_tokens": 1693352} {"current_steps": 2600, "total_steps": 38160, "loss": 0.4774, "lr": 0.0006810796645702307, "epoch": 1.3626834381551363, "percentage": 6.81, "elapsed_time": "0:06:34", "remaining_time": "1:29:55", "throughput": 4300.61, "total_tokens": 1696456} {"current_steps": 2605, "total_steps": 38160, "loss": 0.4359, "lr": 0.0006823899371069183, "epoch": 1.3653039832285114, "percentage": 6.83, "elapsed_time": "0:06:35", "remaining_time": "1:29:55", "throughput": 4301.97, "total_tokens": 1700488} {"current_steps": 2610, "total_steps": 38160, "loss": 0.4523, "lr": 0.0006837002096436059, "epoch": 1.3679245283018868, "percentage": 6.84, "elapsed_time": "0:06:35", "remaining_time": "1:29:53", "throughput": 4301.75, "total_tokens": 1703304} {"current_steps": 2615, "total_steps": 38160, "loss": 0.5371, "lr": 0.0006850104821802935, "epoch": 1.370545073375262, "percentage": 6.85, "elapsed_time": "0:06:36", "remaining_time": "1:29:50", "throughput": 4301.31, "total_tokens": 1705864} {"current_steps": 2620, "total_steps": 38160, "loss": 0.6124, "lr": 0.0006863207547169812, "epoch": 1.3731656184486374, "percentage": 6.87, "elapsed_time": "0:06:37", "remaining_time": "1:29:48", "throughput": 4301.08, "total_tokens": 1708616} {"current_steps": 2625, "total_steps": 38160, "loss": 0.4809, "lr": 0.0006876310272536688, "epoch": 1.3757861635220126, "percentage": 6.88, "elapsed_time": "0:06:38", "remaining_time": "1:29:48", "throughput": 4301.89, "total_tokens": 1712232} {"current_steps": 2630, "total_steps": 38160, "loss": 0.3278, "lr": 0.0006889412997903564, "epoch": 1.3784067085953877, "percentage": 6.89, "elapsed_time": "0:06:38", "remaining_time": "1:29:46", "throughput": 4301.9, "total_tokens": 1715144} {"current_steps": 2635, "total_steps": 38160, "loss": 0.4597, "lr": 0.0006902515723270441, "epoch": 1.381027253668763, "percentage": 6.91, "elapsed_time": "0:06:39", "remaining_time": "1:29:43", "throughput": 4301.54, "total_tokens": 1717800} {"current_steps": 2640, "total_steps": 38160, "loss": 0.4859, "lr": 0.0006915618448637316, "epoch": 1.3836477987421385, "percentage": 6.92, "elapsed_time": "0:06:40", "remaining_time": "1:29:42", "throughput": 4301.9, "total_tokens": 1721128} {"current_steps": 2645, "total_steps": 38160, "loss": 0.4524, "lr": 0.0006928721174004193, "epoch": 1.3862683438155137, "percentage": 6.93, "elapsed_time": "0:06:40", "remaining_time": "1:29:41", "throughput": 4302.18, "total_tokens": 1724328} {"current_steps": 2650, "total_steps": 38160, "loss": 0.5577, "lr": 0.0006941823899371069, "epoch": 1.3888888888888888, "percentage": 6.94, "elapsed_time": "0:06:41", "remaining_time": "1:29:41", "throughput": 4303.35, "total_tokens": 1728328} {"current_steps": 2655, "total_steps": 38160, "loss": 0.473, "lr": 0.0006954926624737946, "epoch": 1.3915094339622642, "percentage": 6.96, "elapsed_time": "0:06:42", "remaining_time": "1:29:39", "throughput": 4303.16, "total_tokens": 1731080} {"current_steps": 2660, "total_steps": 38160, "loss": 0.5375, "lr": 0.0006968029350104822, "epoch": 1.3941299790356394, "percentage": 6.97, "elapsed_time": "0:06:43", "remaining_time": "1:29:41", "throughput": 4305.32, "total_tokens": 1736008} {"current_steps": 2665, "total_steps": 38160, "loss": 0.4075, "lr": 0.0006981132075471698, "epoch": 1.3967505241090148, "percentage": 6.98, "elapsed_time": "0:06:43", "remaining_time": "1:29:40", "throughput": 4305.76, "total_tokens": 1739368} {"current_steps": 2670, "total_steps": 38160, "loss": 0.6998, "lr": 0.0006994234800838574, "epoch": 1.39937106918239, "percentage": 7.0, "elapsed_time": "0:06:44", "remaining_time": "1:29:38", "throughput": 4305.83, "total_tokens": 1742408} {"current_steps": 2675, "total_steps": 38160, "loss": 0.5335, "lr": 0.000700733752620545, "epoch": 1.4019916142557651, "percentage": 7.01, "elapsed_time": "0:06:45", "remaining_time": "1:29:38", "throughput": 4306.74, "total_tokens": 1746120} {"current_steps": 2680, "total_steps": 38160, "loss": 0.5233, "lr": 0.0007020440251572327, "epoch": 1.4046121593291405, "percentage": 7.02, "elapsed_time": "0:06:46", "remaining_time": "1:29:36", "throughput": 4306.75, "total_tokens": 1749096} {"current_steps": 2685, "total_steps": 38160, "loss": 0.5474, "lr": 0.0007033542976939203, "epoch": 1.4072327044025157, "percentage": 7.04, "elapsed_time": "0:06:46", "remaining_time": "1:29:34", "throughput": 4306.24, "total_tokens": 1751624} {"current_steps": 2690, "total_steps": 38160, "loss": 0.4435, "lr": 0.0007046645702306079, "epoch": 1.409853249475891, "percentage": 7.05, "elapsed_time": "0:06:47", "remaining_time": "1:29:32", "throughput": 4305.76, "total_tokens": 1754216} {"current_steps": 2695, "total_steps": 38160, "loss": 0.5723, "lr": 0.0007059748427672957, "epoch": 1.4124737945492662, "percentage": 7.06, "elapsed_time": "0:06:48", "remaining_time": "1:29:32", "throughput": 4306.93, "total_tokens": 1758280} {"current_steps": 2700, "total_steps": 38160, "loss": 0.4881, "lr": 0.0007072851153039833, "epoch": 1.4150943396226414, "percentage": 7.08, "elapsed_time": "0:06:48", "remaining_time": "1:29:30", "throughput": 4306.96, "total_tokens": 1761352} {"current_steps": 2705, "total_steps": 38160, "loss": 0.4421, "lr": 0.0007085953878406709, "epoch": 1.4177148846960168, "percentage": 7.09, "elapsed_time": "0:06:49", "remaining_time": "1:29:29", "throughput": 4307.24, "total_tokens": 1764648} {"current_steps": 2710, "total_steps": 38160, "loss": 0.6195, "lr": 0.0007099056603773585, "epoch": 1.420335429769392, "percentage": 7.1, "elapsed_time": "0:06:50", "remaining_time": "1:29:28", "throughput": 4307.24, "total_tokens": 1767592} {"current_steps": 2715, "total_steps": 38160, "loss": 0.4565, "lr": 0.0007112159329140462, "epoch": 1.4229559748427674, "percentage": 7.11, "elapsed_time": "0:06:51", "remaining_time": "1:29:34", "throughput": 4311.03, "total_tokens": 1774600} {"current_steps": 2720, "total_steps": 38160, "loss": 0.5814, "lr": 0.0007125262054507338, "epoch": 1.4255765199161425, "percentage": 7.13, "elapsed_time": "0:06:52", "remaining_time": "1:29:33", "throughput": 4311.65, "total_tokens": 1778248} {"current_steps": 2725, "total_steps": 38160, "loss": 0.4708, "lr": 0.0007138364779874214, "epoch": 1.4281970649895177, "percentage": 7.14, "elapsed_time": "0:06:53", "remaining_time": "1:29:32", "throughput": 4312.08, "total_tokens": 1781608} {"current_steps": 2730, "total_steps": 38160, "loss": 0.6384, "lr": 0.0007151467505241091, "epoch": 1.430817610062893, "percentage": 7.15, "elapsed_time": "0:06:53", "remaining_time": "1:29:31", "throughput": 4312.2, "total_tokens": 1784776} {"current_steps": 2735, "total_steps": 38160, "loss": 0.5616, "lr": 0.0007164570230607966, "epoch": 1.4334381551362683, "percentage": 7.17, "elapsed_time": "0:06:54", "remaining_time": "1:29:29", "throughput": 4312.04, "total_tokens": 1787688} {"current_steps": 2740, "total_steps": 38160, "loss": 0.5882, "lr": 0.0007177672955974843, "epoch": 1.4360587002096437, "percentage": 7.18, "elapsed_time": "0:06:55", "remaining_time": "1:29:28", "throughput": 4312.53, "total_tokens": 1791016} {"current_steps": 2745, "total_steps": 38160, "loss": 0.5074, "lr": 0.0007190775681341719, "epoch": 1.4386792452830188, "percentage": 7.19, "elapsed_time": "0:06:56", "remaining_time": "1:29:27", "throughput": 4312.87, "total_tokens": 1794280} {"current_steps": 2750, "total_steps": 38160, "loss": 0.3968, "lr": 0.0007203878406708596, "epoch": 1.441299790356394, "percentage": 7.21, "elapsed_time": "0:06:56", "remaining_time": "1:29:26", "throughput": 4313.06, "total_tokens": 1797480} {"current_steps": 2755, "total_steps": 38160, "loss": 0.6271, "lr": 0.0007216981132075472, "epoch": 1.4439203354297694, "percentage": 7.22, "elapsed_time": "0:06:57", "remaining_time": "1:29:25", "throughput": 4313.74, "total_tokens": 1801160} {"current_steps": 2760, "total_steps": 38160, "loss": 0.6007, "lr": 0.0007230083857442348, "epoch": 1.4465408805031448, "percentage": 7.23, "elapsed_time": "0:06:58", "remaining_time": "1:29:23", "throughput": 4313.04, "total_tokens": 1803464} {"current_steps": 2765, "total_steps": 38160, "loss": 0.4611, "lr": 0.0007243186582809224, "epoch": 1.44916142557652, "percentage": 7.25, "elapsed_time": "0:06:58", "remaining_time": "1:29:22", "throughput": 4313.28, "total_tokens": 1806728} {"current_steps": 2770, "total_steps": 38160, "loss": 0.4343, "lr": 0.00072562893081761, "epoch": 1.4517819706498951, "percentage": 7.26, "elapsed_time": "0:06:59", "remaining_time": "1:29:21", "throughput": 4313.59, "total_tokens": 1810088} {"current_steps": 2775, "total_steps": 38160, "loss": 0.4314, "lr": 0.0007269392033542977, "epoch": 1.4544025157232705, "percentage": 7.27, "elapsed_time": "0:07:00", "remaining_time": "1:29:23", "throughput": 4315.75, "total_tokens": 1815144} {"current_steps": 2780, "total_steps": 38160, "loss": 0.4187, "lr": 0.0007282494758909853, "epoch": 1.4570230607966457, "percentage": 7.29, "elapsed_time": "0:07:01", "remaining_time": "1:29:22", "throughput": 4316.49, "total_tokens": 1818792} {"current_steps": 2785, "total_steps": 38160, "loss": 0.6008, "lr": 0.0007295597484276729, "epoch": 1.459643605870021, "percentage": 7.3, "elapsed_time": "0:07:02", "remaining_time": "1:29:20", "throughput": 4316.55, "total_tokens": 1821768} {"current_steps": 2790, "total_steps": 38160, "loss": 0.6171, "lr": 0.0007308700209643606, "epoch": 1.4622641509433962, "percentage": 7.31, "elapsed_time": "0:07:02", "remaining_time": "1:29:20", "throughput": 4317.41, "total_tokens": 1825512} {"current_steps": 2795, "total_steps": 38160, "loss": 0.3789, "lr": 0.0007321802935010483, "epoch": 1.4648846960167714, "percentage": 7.32, "elapsed_time": "0:07:03", "remaining_time": "1:29:19", "throughput": 4317.96, "total_tokens": 1828968} {"current_steps": 2800, "total_steps": 38160, "loss": 0.5442, "lr": 0.0007334905660377359, "epoch": 1.4675052410901468, "percentage": 7.34, "elapsed_time": "0:07:04", "remaining_time": "1:29:16", "throughput": 4317.28, "total_tokens": 1831336} {"current_steps": 2805, "total_steps": 38160, "loss": 0.5314, "lr": 0.0007348008385744235, "epoch": 1.470125786163522, "percentage": 7.35, "elapsed_time": "0:07:04", "remaining_time": "1:29:15", "throughput": 4317.5, "total_tokens": 1834536} {"current_steps": 2810, "total_steps": 38160, "loss": 0.4684, "lr": 0.0007361111111111112, "epoch": 1.4727463312368974, "percentage": 7.36, "elapsed_time": "0:07:05", "remaining_time": "1:29:14", "throughput": 4317.41, "total_tokens": 1837480} {"current_steps": 2815, "total_steps": 38160, "loss": 0.5823, "lr": 0.0007374213836477988, "epoch": 1.4753668763102725, "percentage": 7.38, "elapsed_time": "0:07:06", "remaining_time": "1:29:12", "throughput": 4317.82, "total_tokens": 1840808} {"current_steps": 2820, "total_steps": 38160, "loss": 0.6257, "lr": 0.0007387316561844864, "epoch": 1.4779874213836477, "percentage": 7.39, "elapsed_time": "0:07:07", "remaining_time": "1:29:12", "throughput": 4318.43, "total_tokens": 1844392} {"current_steps": 2825, "total_steps": 38160, "loss": 0.3899, "lr": 0.0007400419287211741, "epoch": 1.480607966457023, "percentage": 7.4, "elapsed_time": "0:07:07", "remaining_time": "1:29:11", "throughput": 4319.07, "total_tokens": 1848008} {"current_steps": 2830, "total_steps": 38160, "loss": 0.4283, "lr": 0.0007413522012578616, "epoch": 1.4832285115303983, "percentage": 7.42, "elapsed_time": "0:07:08", "remaining_time": "1:29:10", "throughput": 4318.89, "total_tokens": 1850888} {"current_steps": 2835, "total_steps": 38160, "loss": 0.697, "lr": 0.0007426624737945493, "epoch": 1.4858490566037736, "percentage": 7.43, "elapsed_time": "0:07:09", "remaining_time": "1:29:09", "throughput": 4319.35, "total_tokens": 1854312} {"current_steps": 2840, "total_steps": 38160, "loss": 0.4895, "lr": 0.0007439727463312369, "epoch": 1.4884696016771488, "percentage": 7.44, "elapsed_time": "0:07:10", "remaining_time": "1:29:10", "throughput": 4320.87, "total_tokens": 1858792} {"current_steps": 2845, "total_steps": 38160, "loss": 0.4691, "lr": 0.0007452830188679245, "epoch": 1.491090146750524, "percentage": 7.46, "elapsed_time": "0:07:10", "remaining_time": "1:29:08", "throughput": 4320.81, "total_tokens": 1861672} {"current_steps": 2850, "total_steps": 38160, "loss": 0.4469, "lr": 0.0007465932914046122, "epoch": 1.4937106918238994, "percentage": 7.47, "elapsed_time": "0:07:11", "remaining_time": "1:29:06", "throughput": 4320.49, "total_tokens": 1864360} {"current_steps": 2855, "total_steps": 38160, "loss": 0.4787, "lr": 0.0007479035639412998, "epoch": 1.4963312368972748, "percentage": 7.48, "elapsed_time": "0:07:12", "remaining_time": "1:29:04", "throughput": 4320.19, "total_tokens": 1867048} {"current_steps": 2860, "total_steps": 38160, "loss": 0.4734, "lr": 0.0007492138364779874, "epoch": 1.49895178197065, "percentage": 7.49, "elapsed_time": "0:07:12", "remaining_time": "1:29:03", "throughput": 4320.43, "total_tokens": 1870280} {"current_steps": 2865, "total_steps": 38160, "loss": 0.6569, "lr": 0.000750524109014675, "epoch": 1.501572327044025, "percentage": 7.51, "elapsed_time": "0:07:13", "remaining_time": "1:29:02", "throughput": 4320.99, "total_tokens": 1873896} {"current_steps": 2870, "total_steps": 38160, "loss": 0.5101, "lr": 0.0007518343815513627, "epoch": 1.5041928721174003, "percentage": 7.52, "elapsed_time": "0:07:14", "remaining_time": "1:29:00", "throughput": 4320.95, "total_tokens": 1876808} {"current_steps": 2875, "total_steps": 38160, "loss": 0.5233, "lr": 0.0007531446540880503, "epoch": 1.5068134171907757, "percentage": 7.53, "elapsed_time": "0:07:15", "remaining_time": "1:28:59", "throughput": 4321.44, "total_tokens": 1880168} {"current_steps": 2880, "total_steps": 38160, "loss": 0.4208, "lr": 0.0007544549266247379, "epoch": 1.509433962264151, "percentage": 7.55, "elapsed_time": "0:07:15", "remaining_time": "1:28:57", "throughput": 4321.09, "total_tokens": 1882824} {"current_steps": 2885, "total_steps": 38160, "loss": 0.4526, "lr": 0.0007557651991614256, "epoch": 1.5120545073375262, "percentage": 7.56, "elapsed_time": "0:07:16", "remaining_time": "1:28:56", "throughput": 4321.43, "total_tokens": 1886184} {"current_steps": 2890, "total_steps": 38160, "loss": 0.526, "lr": 0.0007570754716981131, "epoch": 1.5146750524109014, "percentage": 7.57, "elapsed_time": "0:07:17", "remaining_time": "1:28:54", "throughput": 4321.25, "total_tokens": 1888968} {"current_steps": 2895, "total_steps": 38160, "loss": 0.5918, "lr": 0.0007583857442348009, "epoch": 1.5172955974842768, "percentage": 7.59, "elapsed_time": "0:07:17", "remaining_time": "1:28:53", "throughput": 4321.48, "total_tokens": 1892232} {"current_steps": 2900, "total_steps": 38160, "loss": 0.4495, "lr": 0.0007596960167714885, "epoch": 1.519916142557652, "percentage": 7.6, "elapsed_time": "0:07:18", "remaining_time": "1:28:52", "throughput": 4321.57, "total_tokens": 1895240} {"current_steps": 2905, "total_steps": 38160, "loss": 0.3535, "lr": 0.0007610062893081762, "epoch": 1.5225366876310273, "percentage": 7.61, "elapsed_time": "0:07:19", "remaining_time": "1:28:52", "throughput": 4322.49, "total_tokens": 1899144} {"current_steps": 2910, "total_steps": 38160, "loss": 0.4514, "lr": 0.0007623165618448638, "epoch": 1.5251572327044025, "percentage": 7.63, "elapsed_time": "0:07:20", "remaining_time": "1:28:50", "throughput": 4322.25, "total_tokens": 1901896} {"current_steps": 2915, "total_steps": 38160, "loss": 0.4711, "lr": 0.0007636268343815514, "epoch": 1.5277777777777777, "percentage": 7.64, "elapsed_time": "0:07:20", "remaining_time": "1:28:48", "throughput": 4322.32, "total_tokens": 1904936} {"current_steps": 2920, "total_steps": 38160, "loss": 0.5089, "lr": 0.0007649371069182391, "epoch": 1.530398322851153, "percentage": 7.65, "elapsed_time": "0:07:21", "remaining_time": "1:28:47", "throughput": 4322.61, "total_tokens": 1908328} {"current_steps": 2925, "total_steps": 38160, "loss": 0.5612, "lr": 0.0007662473794549266, "epoch": 1.5330188679245285, "percentage": 7.67, "elapsed_time": "0:07:22", "remaining_time": "1:28:46", "throughput": 4322.84, "total_tokens": 1911496} {"current_steps": 2930, "total_steps": 38160, "loss": 0.4345, "lr": 0.0007675576519916143, "epoch": 1.5356394129979036, "percentage": 7.68, "elapsed_time": "0:07:22", "remaining_time": "1:28:44", "throughput": 4322.42, "total_tokens": 1913992} {"current_steps": 2935, "total_steps": 38160, "loss": 0.5532, "lr": 0.0007688679245283019, "epoch": 1.5382599580712788, "percentage": 7.69, "elapsed_time": "0:07:23", "remaining_time": "1:28:43", "throughput": 4323.04, "total_tokens": 1917640} {"current_steps": 2940, "total_steps": 38160, "loss": 0.3933, "lr": 0.0007701781970649895, "epoch": 1.540880503144654, "percentage": 7.7, "elapsed_time": "0:07:24", "remaining_time": "1:28:42", "throughput": 4323.08, "total_tokens": 1920616} {"current_steps": 2945, "total_steps": 38160, "loss": 0.4593, "lr": 0.0007714884696016772, "epoch": 1.5435010482180294, "percentage": 7.72, "elapsed_time": "0:07:24", "remaining_time": "1:28:39", "throughput": 4322.75, "total_tokens": 1923208} {"current_steps": 2950, "total_steps": 38160, "loss": 0.4172, "lr": 0.0007727987421383648, "epoch": 1.5461215932914047, "percentage": 7.73, "elapsed_time": "0:07:25", "remaining_time": "1:28:39", "throughput": 4323.49, "total_tokens": 1926952} {"current_steps": 2955, "total_steps": 38160, "loss": 0.4724, "lr": 0.0007741090146750524, "epoch": 1.54874213836478, "percentage": 7.74, "elapsed_time": "0:07:26", "remaining_time": "1:28:39", "throughput": 4324.34, "total_tokens": 1930696} {"current_steps": 2960, "total_steps": 38160, "loss": 0.4842, "lr": 0.00077541928721174, "epoch": 1.551362683438155, "percentage": 7.76, "elapsed_time": "0:07:27", "remaining_time": "1:28:37", "throughput": 4324.52, "total_tokens": 1933864} {"current_steps": 2965, "total_steps": 38160, "loss": 0.5093, "lr": 0.0007767295597484277, "epoch": 1.5539832285115303, "percentage": 7.77, "elapsed_time": "0:07:28", "remaining_time": "1:28:38", "throughput": 4326.1, "total_tokens": 1938440} {"current_steps": 2970, "total_steps": 38160, "loss": 0.5786, "lr": 0.0007780398322851153, "epoch": 1.5566037735849056, "percentage": 7.78, "elapsed_time": "0:07:28", "remaining_time": "1:28:38", "throughput": 4326.87, "total_tokens": 1942184} {"current_steps": 2975, "total_steps": 38160, "loss": 0.4438, "lr": 0.0007793501048218029, "epoch": 1.559224318658281, "percentage": 7.8, "elapsed_time": "0:07:29", "remaining_time": "1:28:37", "throughput": 4327.66, "total_tokens": 1945928} {"current_steps": 2980, "total_steps": 38160, "loss": 0.5561, "lr": 0.0007806603773584906, "epoch": 1.5618448637316562, "percentage": 7.81, "elapsed_time": "0:07:30", "remaining_time": "1:28:37", "throughput": 4328.17, "total_tokens": 1949416} {"current_steps": 2985, "total_steps": 38160, "loss": 0.4447, "lr": 0.0007819706498951781, "epoch": 1.5644654088050314, "percentage": 7.82, "elapsed_time": "0:07:31", "remaining_time": "1:28:35", "throughput": 4327.78, "total_tokens": 1952008} {"current_steps": 2990, "total_steps": 38160, "loss": 0.4526, "lr": 0.0007832809224318658, "epoch": 1.5670859538784065, "percentage": 7.84, "elapsed_time": "0:07:31", "remaining_time": "1:28:34", "throughput": 4328.56, "total_tokens": 1955656} {"current_steps": 2995, "total_steps": 38160, "loss": 0.6624, "lr": 0.0007845911949685535, "epoch": 1.569706498951782, "percentage": 7.85, "elapsed_time": "0:07:32", "remaining_time": "1:28:32", "throughput": 4328.55, "total_tokens": 1958632} {"current_steps": 3000, "total_steps": 38160, "loss": 0.4898, "lr": 0.0007859014675052411, "epoch": 1.5723270440251573, "percentage": 7.86, "elapsed_time": "0:07:33", "remaining_time": "1:28:30", "throughput": 4328.21, "total_tokens": 1961256} {"current_steps": 3005, "total_steps": 38160, "loss": 0.4196, "lr": 0.0007872117400419288, "epoch": 1.5749475890985325, "percentage": 7.87, "elapsed_time": "0:07:33", "remaining_time": "1:28:31", "throughput": 4329.45, "total_tokens": 1965480} {"current_steps": 3010, "total_steps": 38160, "loss": 0.4771, "lr": 0.0007885220125786164, "epoch": 1.5775681341719077, "percentage": 7.89, "elapsed_time": "0:07:34", "remaining_time": "1:28:29", "throughput": 4329.48, "total_tokens": 1968552} {"current_steps": 3015, "total_steps": 38160, "loss": 0.4646, "lr": 0.0007898322851153041, "epoch": 1.580188679245283, "percentage": 7.9, "elapsed_time": "0:07:35", "remaining_time": "1:28:27", "throughput": 4329.38, "total_tokens": 1971400} {"current_steps": 3020, "total_steps": 38160, "loss": 0.398, "lr": 0.0007911425576519916, "epoch": 1.5828092243186582, "percentage": 7.91, "elapsed_time": "0:07:36", "remaining_time": "1:28:26", "throughput": 4329.36, "total_tokens": 1974312} {"current_steps": 3025, "total_steps": 38160, "loss": 0.3763, "lr": 0.0007924528301886793, "epoch": 1.5854297693920336, "percentage": 7.93, "elapsed_time": "0:07:36", "remaining_time": "1:28:24", "throughput": 4329.02, "total_tokens": 1976904} {"current_steps": 3030, "total_steps": 38160, "loss": 0.5424, "lr": 0.0007937631027253669, "epoch": 1.5880503144654088, "percentage": 7.94, "elapsed_time": "0:07:37", "remaining_time": "1:28:21", "throughput": 4328.53, "total_tokens": 1979432} {"current_steps": 3035, "total_steps": 38160, "loss": 0.4991, "lr": 0.0007950733752620545, "epoch": 1.590670859538784, "percentage": 7.95, "elapsed_time": "0:07:38", "remaining_time": "1:28:21", "throughput": 4329.05, "total_tokens": 1982952} {"current_steps": 3040, "total_steps": 38160, "loss": 0.4756, "lr": 0.0007963836477987422, "epoch": 1.5932914046121593, "percentage": 7.97, "elapsed_time": "0:07:38", "remaining_time": "1:28:20", "throughput": 4329.62, "total_tokens": 1986408} {"current_steps": 3045, "total_steps": 38160, "loss": 0.4414, "lr": 0.0007976939203354298, "epoch": 1.5959119496855347, "percentage": 7.98, "elapsed_time": "0:07:39", "remaining_time": "1:28:18", "throughput": 4329.18, "total_tokens": 1988936} {"current_steps": 3050, "total_steps": 38160, "loss": 0.6301, "lr": 0.0007990041928721174, "epoch": 1.59853249475891, "percentage": 7.99, "elapsed_time": "0:07:40", "remaining_time": "1:28:17", "throughput": 4329.47, "total_tokens": 1992264} {"current_steps": 3055, "total_steps": 38160, "loss": 0.591, "lr": 0.000800314465408805, "epoch": 1.601153039832285, "percentage": 8.01, "elapsed_time": "0:07:40", "remaining_time": "1:28:15", "throughput": 4329.53, "total_tokens": 1995240} {"current_steps": 3060, "total_steps": 38160, "loss": 0.5291, "lr": 0.0008016247379454927, "epoch": 1.6037735849056602, "percentage": 8.02, "elapsed_time": "0:07:41", "remaining_time": "1:28:14", "throughput": 4329.78, "total_tokens": 1998408} {"current_steps": 3065, "total_steps": 38160, "loss": 0.485, "lr": 0.0008029350104821803, "epoch": 1.6063941299790356, "percentage": 8.03, "elapsed_time": "0:07:42", "remaining_time": "1:28:12", "throughput": 4329.8, "total_tokens": 2001416} {"current_steps": 3070, "total_steps": 38160, "loss": 0.4601, "lr": 0.0008042452830188679, "epoch": 1.609014675052411, "percentage": 8.05, "elapsed_time": "0:07:42", "remaining_time": "1:28:10", "throughput": 4329.17, "total_tokens": 2003752} {"current_steps": 3075, "total_steps": 38160, "loss": 0.467, "lr": 0.0008055555555555556, "epoch": 1.6116352201257862, "percentage": 8.06, "elapsed_time": "0:07:43", "remaining_time": "1:28:08", "throughput": 4329.16, "total_tokens": 2006728} {"current_steps": 3080, "total_steps": 38160, "loss": 0.4623, "lr": 0.0008068658280922431, "epoch": 1.6142557651991614, "percentage": 8.07, "elapsed_time": "0:07:44", "remaining_time": "1:28:07", "throughput": 4329.32, "total_tokens": 2009928} {"current_steps": 3085, "total_steps": 38160, "loss": 0.3521, "lr": 0.0008081761006289308, "epoch": 1.6168763102725365, "percentage": 8.08, "elapsed_time": "0:07:44", "remaining_time": "1:28:05", "throughput": 4329.07, "total_tokens": 2012648} {"current_steps": 3090, "total_steps": 38160, "loss": 0.4057, "lr": 0.0008094863731656184, "epoch": 1.619496855345912, "percentage": 8.1, "elapsed_time": "0:07:45", "remaining_time": "1:28:06", "throughput": 4330.43, "total_tokens": 2016936} {"current_steps": 3095, "total_steps": 38160, "loss": 0.3439, "lr": 0.0008107966457023061, "epoch": 1.6221174004192873, "percentage": 8.11, "elapsed_time": "0:07:46", "remaining_time": "1:28:04", "throughput": 4330.25, "total_tokens": 2019720} {"current_steps": 3100, "total_steps": 38160, "loss": 0.4394, "lr": 0.0008121069182389938, "epoch": 1.6247379454926625, "percentage": 8.12, "elapsed_time": "0:07:47", "remaining_time": "1:28:03", "throughput": 4330.23, "total_tokens": 2022760} {"current_steps": 3105, "total_steps": 38160, "loss": 0.4408, "lr": 0.0008134171907756814, "epoch": 1.6273584905660377, "percentage": 8.14, "elapsed_time": "0:07:47", "remaining_time": "1:28:01", "throughput": 4330.04, "total_tokens": 2025544} {"current_steps": 3110, "total_steps": 38160, "loss": 0.4214, "lr": 0.0008147274633123691, "epoch": 1.629979035639413, "percentage": 8.15, "elapsed_time": "0:07:48", "remaining_time": "1:28:00", "throughput": 4330.33, "total_tokens": 2028872} {"current_steps": 3115, "total_steps": 38160, "loss": 0.4243, "lr": 0.0008160377358490566, "epoch": 1.6325995807127882, "percentage": 8.16, "elapsed_time": "0:07:49", "remaining_time": "1:27:58", "throughput": 4330.3, "total_tokens": 2031816} {"current_steps": 3120, "total_steps": 38160, "loss": 0.5943, "lr": 0.0008173480083857443, "epoch": 1.6352201257861636, "percentage": 8.18, "elapsed_time": "0:07:49", "remaining_time": "1:27:56", "throughput": 4329.82, "total_tokens": 2034280} {"current_steps": 3125, "total_steps": 38160, "loss": 0.4913, "lr": 0.0008186582809224319, "epoch": 1.6378406708595388, "percentage": 8.19, "elapsed_time": "0:07:50", "remaining_time": "1:27:56", "throughput": 4330.59, "total_tokens": 2038056} {"current_steps": 3130, "total_steps": 38160, "loss": 0.5348, "lr": 0.0008199685534591195, "epoch": 1.640461215932914, "percentage": 8.2, "elapsed_time": "0:07:51", "remaining_time": "1:27:54", "throughput": 4330.71, "total_tokens": 2041192} {"current_steps": 3135, "total_steps": 38160, "loss": 0.4764, "lr": 0.0008212788259958072, "epoch": 1.6430817610062893, "percentage": 8.22, "elapsed_time": "0:07:51", "remaining_time": "1:27:52", "throughput": 4330.3, "total_tokens": 2043720} {"current_steps": 3140, "total_steps": 38160, "loss": 0.5506, "lr": 0.0008225890985324948, "epoch": 1.6457023060796647, "percentage": 8.23, "elapsed_time": "0:07:52", "remaining_time": "1:27:51", "throughput": 4330.38, "total_tokens": 2046792} {"current_steps": 3145, "total_steps": 38160, "loss": 0.633, "lr": 0.0008238993710691824, "epoch": 1.64832285115304, "percentage": 8.24, "elapsed_time": "0:07:53", "remaining_time": "1:27:50", "throughput": 4330.27, "total_tokens": 2049768} {"current_steps": 3150, "total_steps": 38160, "loss": 0.5126, "lr": 0.00082520964360587, "epoch": 1.650943396226415, "percentage": 8.25, "elapsed_time": "0:07:54", "remaining_time": "1:27:48", "throughput": 4330.38, "total_tokens": 2052840} {"current_steps": 3155, "total_steps": 38160, "loss": 0.5228, "lr": 0.0008265199161425576, "epoch": 1.6535639412997902, "percentage": 8.27, "elapsed_time": "0:07:54", "remaining_time": "1:27:46", "throughput": 4330.01, "total_tokens": 2055432} {"current_steps": 3160, "total_steps": 38160, "loss": 0.6153, "lr": 0.0008278301886792453, "epoch": 1.6561844863731656, "percentage": 8.28, "elapsed_time": "0:07:55", "remaining_time": "1:27:45", "throughput": 4330.35, "total_tokens": 2058792} {"current_steps": 3165, "total_steps": 38160, "loss": 0.4796, "lr": 0.0008291404612159329, "epoch": 1.658805031446541, "percentage": 8.29, "elapsed_time": "0:07:56", "remaining_time": "1:27:44", "throughput": 4330.51, "total_tokens": 2061960} {"current_steps": 3170, "total_steps": 38160, "loss": 0.63, "lr": 0.0008304507337526206, "epoch": 1.6614255765199162, "percentage": 8.31, "elapsed_time": "0:07:56", "remaining_time": "1:27:42", "throughput": 4330.27, "total_tokens": 2064712} {"current_steps": 3175, "total_steps": 38160, "loss": 0.4393, "lr": 0.0008317610062893081, "epoch": 1.6640461215932913, "percentage": 8.32, "elapsed_time": "0:07:57", "remaining_time": "1:27:42", "throughput": 4330.9, "total_tokens": 2068360} {"current_steps": 3180, "total_steps": 38160, "loss": 0.4699, "lr": 0.0008330712788259958, "epoch": 1.6666666666666665, "percentage": 8.33, "elapsed_time": "0:07:58", "remaining_time": "1:27:40", "throughput": 4330.87, "total_tokens": 2071304} {"current_steps": 3185, "total_steps": 38160, "loss": 0.6975, "lr": 0.0008343815513626834, "epoch": 1.669287211740042, "percentage": 8.35, "elapsed_time": "0:07:59", "remaining_time": "1:27:40", "throughput": 4331.53, "total_tokens": 2075016} {"current_steps": 3190, "total_steps": 38160, "loss": 0.4554, "lr": 0.000835691823899371, "epoch": 1.6719077568134173, "percentage": 8.36, "elapsed_time": "0:07:59", "remaining_time": "1:27:40", "throughput": 4332.38, "total_tokens": 2079016} {"current_steps": 3195, "total_steps": 38160, "loss": 0.377, "lr": 0.0008370020964360588, "epoch": 1.6745283018867925, "percentage": 8.37, "elapsed_time": "0:08:00", "remaining_time": "1:27:39", "throughput": 4332.4, "total_tokens": 2081960} {"current_steps": 3200, "total_steps": 38160, "loss": 0.4096, "lr": 0.0008383123689727464, "epoch": 1.6771488469601676, "percentage": 8.39, "elapsed_time": "0:08:01", "remaining_time": "1:27:37", "throughput": 4332.03, "total_tokens": 2084648} {"current_steps": 3205, "total_steps": 38160, "loss": 0.4549, "lr": 0.000839622641509434, "epoch": 1.679769392033543, "percentage": 8.4, "elapsed_time": "0:08:02", "remaining_time": "1:27:37", "throughput": 4333.18, "total_tokens": 2088840} {"current_steps": 3210, "total_steps": 38160, "loss": 0.4993, "lr": 0.0008409329140461216, "epoch": 1.6823899371069182, "percentage": 8.41, "elapsed_time": "0:08:02", "remaining_time": "1:27:36", "throughput": 4333.27, "total_tokens": 2091944} {"current_steps": 3215, "total_steps": 38160, "loss": 0.5405, "lr": 0.0008422431865828093, "epoch": 1.6850104821802936, "percentage": 8.43, "elapsed_time": "0:08:03", "remaining_time": "1:27:35", "throughput": 4333.47, "total_tokens": 2095144} {"current_steps": 3220, "total_steps": 38160, "loss": 0.5443, "lr": 0.0008435534591194969, "epoch": 1.6876310272536688, "percentage": 8.44, "elapsed_time": "0:08:04", "remaining_time": "1:27:34", "throughput": 4334.29, "total_tokens": 2098984} {"current_steps": 3225, "total_steps": 38160, "loss": 0.3469, "lr": 0.0008448637316561845, "epoch": 1.690251572327044, "percentage": 8.45, "elapsed_time": "0:08:04", "remaining_time": "1:27:33", "throughput": 4333.96, "total_tokens": 2101736} {"current_steps": 3230, "total_steps": 38160, "loss": 0.5256, "lr": 0.0008461740041928722, "epoch": 1.6928721174004193, "percentage": 8.46, "elapsed_time": "0:08:05", "remaining_time": "1:27:32", "throughput": 4334.08, "total_tokens": 2104904} {"current_steps": 3235, "total_steps": 38160, "loss": 0.5294, "lr": 0.0008474842767295598, "epoch": 1.6954926624737947, "percentage": 8.48, "elapsed_time": "0:08:06", "remaining_time": "1:27:31", "throughput": 4334.55, "total_tokens": 2108392} {"current_steps": 3240, "total_steps": 38160, "loss": 0.6037, "lr": 0.0008487945492662474, "epoch": 1.6981132075471699, "percentage": 8.49, "elapsed_time": "0:08:07", "remaining_time": "1:27:31", "throughput": 4335.48, "total_tokens": 2112360} {"current_steps": 3245, "total_steps": 38160, "loss": 0.512, "lr": 0.000850104821802935, "epoch": 1.700733752620545, "percentage": 8.5, "elapsed_time": "0:08:08", "remaining_time": "1:27:33", "throughput": 4337.53, "total_tokens": 2117992} {"current_steps": 3250, "total_steps": 38160, "loss": 0.411, "lr": 0.0008514150943396226, "epoch": 1.7033542976939202, "percentage": 8.52, "elapsed_time": "0:08:08", "remaining_time": "1:27:32", "throughput": 4337.62, "total_tokens": 2121096} {"current_steps": 3255, "total_steps": 38160, "loss": 0.4941, "lr": 0.0008527253668763103, "epoch": 1.7059748427672956, "percentage": 8.53, "elapsed_time": "0:08:09", "remaining_time": "1:27:32", "throughput": 4338.52, "total_tokens": 2125064} {"current_steps": 3260, "total_steps": 38160, "loss": 0.393, "lr": 0.0008540356394129979, "epoch": 1.708595387840671, "percentage": 8.54, "elapsed_time": "0:08:10", "remaining_time": "1:27:32", "throughput": 4339.37, "total_tokens": 2129032} {"current_steps": 3265, "total_steps": 38160, "loss": 0.5836, "lr": 0.0008553459119496856, "epoch": 1.7112159329140462, "percentage": 8.56, "elapsed_time": "0:08:11", "remaining_time": "1:27:30", "throughput": 4338.94, "total_tokens": 2131656} {"current_steps": 3270, "total_steps": 38160, "loss": 0.5959, "lr": 0.0008566561844863731, "epoch": 1.7138364779874213, "percentage": 8.57, "elapsed_time": "0:08:11", "remaining_time": "1:27:29", "throughput": 4338.95, "total_tokens": 2134760} {"current_steps": 3275, "total_steps": 38160, "loss": 0.5868, "lr": 0.0008579664570230608, "epoch": 1.7164570230607965, "percentage": 8.58, "elapsed_time": "0:08:12", "remaining_time": "1:27:28", "throughput": 4339.1, "total_tokens": 2137960} {"current_steps": 3280, "total_steps": 38160, "loss": 0.4612, "lr": 0.0008592767295597484, "epoch": 1.719077568134172, "percentage": 8.6, "elapsed_time": "0:08:13", "remaining_time": "1:27:26", "throughput": 4338.65, "total_tokens": 2140552} {"current_steps": 3285, "total_steps": 38160, "loss": 0.3742, "lr": 0.000860587002096436, "epoch": 1.7216981132075473, "percentage": 8.61, "elapsed_time": "0:08:14", "remaining_time": "1:27:24", "throughput": 4338.36, "total_tokens": 2143272} {"current_steps": 3290, "total_steps": 38160, "loss": 0.5275, "lr": 0.0008618972746331238, "epoch": 1.7243186582809225, "percentage": 8.62, "elapsed_time": "0:08:14", "remaining_time": "1:27:24", "throughput": 4339.38, "total_tokens": 2147304} {"current_steps": 3295, "total_steps": 38160, "loss": 0.666, "lr": 0.0008632075471698114, "epoch": 1.7269392033542976, "percentage": 8.63, "elapsed_time": "0:08:15", "remaining_time": "1:27:24", "throughput": 4340.71, "total_tokens": 2151624} {"current_steps": 3300, "total_steps": 38160, "loss": 0.5473, "lr": 0.000864517819706499, "epoch": 1.7295597484276728, "percentage": 8.65, "elapsed_time": "0:08:16", "remaining_time": "1:27:23", "throughput": 4340.35, "total_tokens": 2154248} {"current_steps": 3305, "total_steps": 38160, "loss": 0.5689, "lr": 0.0008658280922431866, "epoch": 1.7321802935010482, "percentage": 8.66, "elapsed_time": "0:08:17", "remaining_time": "1:27:21", "throughput": 4340.04, "total_tokens": 2157000} {"current_steps": 3310, "total_steps": 38160, "loss": 0.4344, "lr": 0.0008671383647798742, "epoch": 1.7348008385744236, "percentage": 8.67, "elapsed_time": "0:08:17", "remaining_time": "1:27:21", "throughput": 4340.87, "total_tokens": 2160904} {"current_steps": 3315, "total_steps": 38160, "loss": 0.5471, "lr": 0.0008684486373165619, "epoch": 1.7374213836477987, "percentage": 8.69, "elapsed_time": "0:08:18", "remaining_time": "1:27:19", "throughput": 4340.7, "total_tokens": 2163720} {"current_steps": 3320, "total_steps": 38160, "loss": 0.4304, "lr": 0.0008697589098532495, "epoch": 1.740041928721174, "percentage": 8.7, "elapsed_time": "0:08:19", "remaining_time": "1:27:19", "throughput": 4341.77, "total_tokens": 2167912} {"current_steps": 3325, "total_steps": 38160, "loss": 0.4638, "lr": 0.0008710691823899372, "epoch": 1.7426624737945493, "percentage": 8.71, "elapsed_time": "0:08:20", "remaining_time": "1:27:19", "throughput": 4342.35, "total_tokens": 2171592} {"current_steps": 3330, "total_steps": 38160, "loss": 0.5429, "lr": 0.0008723794549266247, "epoch": 1.7452830188679245, "percentage": 8.73, "elapsed_time": "0:08:20", "remaining_time": "1:27:17", "throughput": 4341.68, "total_tokens": 2173864} {"current_steps": 3335, "total_steps": 38160, "loss": 0.4438, "lr": 0.0008736897274633124, "epoch": 1.7479035639412999, "percentage": 8.74, "elapsed_time": "0:08:21", "remaining_time": "1:27:15", "throughput": 4341.5, "total_tokens": 2176744} {"current_steps": 3340, "total_steps": 38160, "loss": 0.6511, "lr": 0.000875, "epoch": 1.750524109014675, "percentage": 8.75, "elapsed_time": "0:08:22", "remaining_time": "1:27:13", "throughput": 4341.22, "total_tokens": 2179528} {"current_steps": 3345, "total_steps": 38160, "loss": 0.4411, "lr": 0.0008763102725366876, "epoch": 1.7531446540880502, "percentage": 8.77, "elapsed_time": "0:08:22", "remaining_time": "1:27:12", "throughput": 4341.58, "total_tokens": 2182856} {"current_steps": 3350, "total_steps": 38160, "loss": 0.4344, "lr": 0.0008776205450733753, "epoch": 1.7557651991614256, "percentage": 8.78, "elapsed_time": "0:08:23", "remaining_time": "1:27:11", "throughput": 4341.52, "total_tokens": 2185832} {"current_steps": 3355, "total_steps": 38160, "loss": 0.5057, "lr": 0.0008789308176100629, "epoch": 1.758385744234801, "percentage": 8.79, "elapsed_time": "0:08:24", "remaining_time": "1:27:10", "throughput": 4341.97, "total_tokens": 2189352} {"current_steps": 3360, "total_steps": 38160, "loss": 0.4654, "lr": 0.0008802410901467506, "epoch": 1.7610062893081762, "percentage": 8.81, "elapsed_time": "0:08:24", "remaining_time": "1:27:09", "throughput": 4341.9, "total_tokens": 2192264} {"current_steps": 3365, "total_steps": 38160, "loss": 0.4776, "lr": 0.0008815513626834381, "epoch": 1.7636268343815513, "percentage": 8.82, "elapsed_time": "0:08:25", "remaining_time": "1:27:08", "throughput": 4342.2, "total_tokens": 2195560} {"current_steps": 3370, "total_steps": 38160, "loss": 0.4305, "lr": 0.0008828616352201258, "epoch": 1.7662473794549265, "percentage": 8.83, "elapsed_time": "0:08:26", "remaining_time": "1:27:07", "throughput": 4342.59, "total_tokens": 2199080} {"current_steps": 3375, "total_steps": 38160, "loss": 0.403, "lr": 0.0008841719077568134, "epoch": 1.7688679245283019, "percentage": 8.84, "elapsed_time": "0:08:27", "remaining_time": "1:27:06", "throughput": 4342.88, "total_tokens": 2202408} {"current_steps": 3380, "total_steps": 38160, "loss": 0.5245, "lr": 0.000885482180293501, "epoch": 1.7714884696016773, "percentage": 8.86, "elapsed_time": "0:08:27", "remaining_time": "1:27:06", "throughput": 4343.41, "total_tokens": 2206056} {"current_steps": 3385, "total_steps": 38160, "loss": 0.4139, "lr": 0.0008867924528301887, "epoch": 1.7741090146750524, "percentage": 8.87, "elapsed_time": "0:08:28", "remaining_time": "1:27:04", "throughput": 4342.87, "total_tokens": 2208456} {"current_steps": 3390, "total_steps": 38160, "loss": 0.3706, "lr": 0.0008881027253668763, "epoch": 1.7767295597484276, "percentage": 8.88, "elapsed_time": "0:08:29", "remaining_time": "1:27:03", "throughput": 4343.2, "total_tokens": 2211848} {"current_steps": 3395, "total_steps": 38160, "loss": 0.402, "lr": 0.000889412997903564, "epoch": 1.7793501048218028, "percentage": 8.9, "elapsed_time": "0:08:29", "remaining_time": "1:27:02", "throughput": 4343.45, "total_tokens": 2215112} {"current_steps": 3400, "total_steps": 38160, "loss": 0.5224, "lr": 0.0008907232704402516, "epoch": 1.7819706498951782, "percentage": 8.91, "elapsed_time": "0:08:30", "remaining_time": "1:27:02", "throughput": 4344.66, "total_tokens": 2219528} {"current_steps": 3405, "total_steps": 38160, "loss": 0.5433, "lr": 0.0008920335429769392, "epoch": 1.7845911949685536, "percentage": 8.92, "elapsed_time": "0:08:31", "remaining_time": "1:27:02", "throughput": 4345.6, "total_tokens": 2223624} {"current_steps": 3410, "total_steps": 38160, "loss": 0.4873, "lr": 0.0008933438155136269, "epoch": 1.7872117400419287, "percentage": 8.94, "elapsed_time": "0:08:32", "remaining_time": "1:27:02", "throughput": 4346.29, "total_tokens": 2227464} {"current_steps": 3415, "total_steps": 38160, "loss": 0.4291, "lr": 0.0008946540880503145, "epoch": 1.789832285115304, "percentage": 8.95, "elapsed_time": "0:08:33", "remaining_time": "1:27:02", "throughput": 4346.98, "total_tokens": 2231240} {"current_steps": 3420, "total_steps": 38160, "loss": 0.5872, "lr": 0.0008959643605870022, "epoch": 1.7924528301886793, "percentage": 8.96, "elapsed_time": "0:08:34", "remaining_time": "1:27:01", "throughput": 4347.27, "total_tokens": 2234600} {"current_steps": 3425, "total_steps": 38160, "loss": 0.5048, "lr": 0.0008972746331236897, "epoch": 1.7950733752620545, "percentage": 8.98, "elapsed_time": "0:08:34", "remaining_time": "1:27:00", "throughput": 4347.61, "total_tokens": 2238056} {"current_steps": 3430, "total_steps": 38160, "loss": 0.4224, "lr": 0.0008985849056603774, "epoch": 1.7976939203354299, "percentage": 8.99, "elapsed_time": "0:08:35", "remaining_time": "1:26:59", "throughput": 4348.17, "total_tokens": 2241640} {"current_steps": 3435, "total_steps": 38160, "loss": 0.5282, "lr": 0.000899895178197065, "epoch": 1.800314465408805, "percentage": 9.0, "elapsed_time": "0:08:36", "remaining_time": "1:27:00", "throughput": 4349.11, "total_tokens": 2245832} {"current_steps": 3440, "total_steps": 38160, "loss": 0.7093, "lr": 0.0009012054507337526, "epoch": 1.8029350104821802, "percentage": 9.01, "elapsed_time": "0:08:37", "remaining_time": "1:26:58", "throughput": 4348.81, "total_tokens": 2248552} {"current_steps": 3445, "total_steps": 38160, "loss": 0.5474, "lr": 0.0009025157232704403, "epoch": 1.8055555555555556, "percentage": 9.03, "elapsed_time": "0:08:37", "remaining_time": "1:26:57", "throughput": 4348.69, "total_tokens": 2251432} {"current_steps": 3450, "total_steps": 38160, "loss": 0.5682, "lr": 0.0009038259958071279, "epoch": 1.808176100628931, "percentage": 9.04, "elapsed_time": "0:08:38", "remaining_time": "1:26:55", "throughput": 4348.68, "total_tokens": 2254408} {"current_steps": 3455, "total_steps": 38160, "loss": 0.6698, "lr": 0.0009051362683438156, "epoch": 1.8107966457023061, "percentage": 9.05, "elapsed_time": "0:08:39", "remaining_time": "1:26:53", "throughput": 4348.38, "total_tokens": 2257032} {"current_steps": 3460, "total_steps": 38160, "loss": 0.435, "lr": 0.0009064465408805031, "epoch": 1.8134171907756813, "percentage": 9.07, "elapsed_time": "0:08:39", "remaining_time": "1:26:51", "throughput": 4347.94, "total_tokens": 2259560} {"current_steps": 3465, "total_steps": 38160, "loss": 0.5373, "lr": 0.0009077568134171907, "epoch": 1.8160377358490565, "percentage": 9.08, "elapsed_time": "0:08:40", "remaining_time": "1:26:51", "throughput": 4348.54, "total_tokens": 2263240} {"current_steps": 3470, "total_steps": 38160, "loss": 0.4613, "lr": 0.0009090670859538784, "epoch": 1.8186582809224319, "percentage": 9.09, "elapsed_time": "0:08:41", "remaining_time": "1:26:51", "throughput": 4349.32, "total_tokens": 2267144} {"current_steps": 3475, "total_steps": 38160, "loss": 0.5479, "lr": 0.000910377358490566, "epoch": 1.8212788259958073, "percentage": 9.11, "elapsed_time": "0:08:42", "remaining_time": "1:26:50", "throughput": 4349.95, "total_tokens": 2270856} {"current_steps": 3480, "total_steps": 38160, "loss": 0.5688, "lr": 0.0009116876310272537, "epoch": 1.8238993710691824, "percentage": 9.12, "elapsed_time": "0:08:42", "remaining_time": "1:26:49", "throughput": 4349.79, "total_tokens": 2273672} {"current_steps": 3485, "total_steps": 38160, "loss": 0.4809, "lr": 0.0009129979035639413, "epoch": 1.8265199161425576, "percentage": 9.13, "elapsed_time": "0:08:43", "remaining_time": "1:26:47", "throughput": 4349.61, "total_tokens": 2276520} {"current_steps": 3490, "total_steps": 38160, "loss": 0.428, "lr": 0.000914308176100629, "epoch": 1.8291404612159328, "percentage": 9.15, "elapsed_time": "0:08:44", "remaining_time": "1:26:46", "throughput": 4349.43, "total_tokens": 2279368} {"current_steps": 3495, "total_steps": 38160, "loss": 0.7151, "lr": 0.0009156184486373166, "epoch": 1.8317610062893082, "percentage": 9.16, "elapsed_time": "0:08:44", "remaining_time": "1:26:44", "throughput": 4349.02, "total_tokens": 2281992} {"current_steps": 3500, "total_steps": 38160, "loss": 0.4417, "lr": 0.0009169287211740042, "epoch": 1.8343815513626835, "percentage": 9.17, "elapsed_time": "0:08:45", "remaining_time": "1:26:43", "throughput": 4349.53, "total_tokens": 2285576} {"current_steps": 3505, "total_steps": 38160, "loss": 0.4197, "lr": 0.0009182389937106919, "epoch": 1.8370020964360587, "percentage": 9.19, "elapsed_time": "0:08:46", "remaining_time": "1:26:41", "throughput": 4349.12, "total_tokens": 2288072} {"current_steps": 3510, "total_steps": 38160, "loss": 0.381, "lr": 0.0009195492662473795, "epoch": 1.8396226415094339, "percentage": 9.2, "elapsed_time": "0:08:46", "remaining_time": "1:26:40", "throughput": 4349.3, "total_tokens": 2291336} {"current_steps": 3515, "total_steps": 38160, "loss": 0.5317, "lr": 0.0009208595387840672, "epoch": 1.8422431865828093, "percentage": 9.21, "elapsed_time": "0:08:47", "remaining_time": "1:26:39", "throughput": 4349.14, "total_tokens": 2294152} {"current_steps": 3520, "total_steps": 38160, "loss": 0.3897, "lr": 0.0009221698113207547, "epoch": 1.8448637316561844, "percentage": 9.22, "elapsed_time": "0:08:48", "remaining_time": "1:26:37", "throughput": 4348.92, "total_tokens": 2296872} {"current_steps": 3525, "total_steps": 38160, "loss": 0.4716, "lr": 0.0009234800838574424, "epoch": 1.8474842767295598, "percentage": 9.24, "elapsed_time": "0:08:48", "remaining_time": "1:26:35", "throughput": 4348.61, "total_tokens": 2299528} {"current_steps": 3530, "total_steps": 38160, "loss": 0.6484, "lr": 0.00092479035639413, "epoch": 1.850104821802935, "percentage": 9.25, "elapsed_time": "0:08:49", "remaining_time": "1:26:33", "throughput": 4347.97, "total_tokens": 2301864} {"current_steps": 3535, "total_steps": 38160, "loss": 0.4412, "lr": 0.0009261006289308176, "epoch": 1.8527253668763102, "percentage": 9.26, "elapsed_time": "0:08:50", "remaining_time": "1:26:33", "throughput": 4348.97, "total_tokens": 2306088} {"current_steps": 3540, "total_steps": 38160, "loss": 0.5363, "lr": 0.0009274109014675053, "epoch": 1.8553459119496856, "percentage": 9.28, "elapsed_time": "0:08:50", "remaining_time": "1:26:32", "throughput": 4349.21, "total_tokens": 2309416} {"current_steps": 3545, "total_steps": 38160, "loss": 0.532, "lr": 0.0009287211740041929, "epoch": 1.857966457023061, "percentage": 9.29, "elapsed_time": "0:08:51", "remaining_time": "1:26:31", "throughput": 4349.05, "total_tokens": 2312328} {"current_steps": 3550, "total_steps": 38160, "loss": 0.5517, "lr": 0.0009300314465408806, "epoch": 1.8605870020964361, "percentage": 9.3, "elapsed_time": "0:08:52", "remaining_time": "1:26:29", "throughput": 4348.28, "total_tokens": 2314472} {"current_steps": 3555, "total_steps": 38160, "loss": 0.3898, "lr": 0.0009313417190775681, "epoch": 1.8632075471698113, "percentage": 9.32, "elapsed_time": "0:08:53", "remaining_time": "1:26:29", "throughput": 4349.21, "total_tokens": 2318664} {"current_steps": 3560, "total_steps": 38160, "loss": 0.5736, "lr": 0.0009326519916142557, "epoch": 1.8658280922431865, "percentage": 9.33, "elapsed_time": "0:08:54", "remaining_time": "1:26:31", "throughput": 4350.75, "total_tokens": 2323784} {"current_steps": 3565, "total_steps": 38160, "loss": 0.5279, "lr": 0.0009339622641509434, "epoch": 1.8684486373165619, "percentage": 9.34, "elapsed_time": "0:08:54", "remaining_time": "1:26:29", "throughput": 4350.54, "total_tokens": 2326536} {"current_steps": 3570, "total_steps": 38160, "loss": 0.4692, "lr": 0.000935272536687631, "epoch": 1.8710691823899372, "percentage": 9.36, "elapsed_time": "0:08:55", "remaining_time": "1:26:29", "throughput": 4351.26, "total_tokens": 2330440} {"current_steps": 3575, "total_steps": 38160, "loss": 0.5676, "lr": 0.0009365828092243187, "epoch": 1.8736897274633124, "percentage": 9.37, "elapsed_time": "0:08:56", "remaining_time": "1:26:30", "throughput": 4352.95, "total_tokens": 2335688} {"current_steps": 3580, "total_steps": 38160, "loss": 0.4477, "lr": 0.0009378930817610063, "epoch": 1.8763102725366876, "percentage": 9.38, "elapsed_time": "0:08:57", "remaining_time": "1:26:29", "throughput": 4352.8, "total_tokens": 2338568} {"current_steps": 3585, "total_steps": 38160, "loss": 0.5171, "lr": 0.0009392033542976939, "epoch": 1.8789308176100628, "percentage": 9.39, "elapsed_time": "0:08:58", "remaining_time": "1:26:28", "throughput": 4353.19, "total_tokens": 2342120} {"current_steps": 3590, "total_steps": 38160, "loss": 0.4159, "lr": 0.0009405136268343816, "epoch": 1.8815513626834381, "percentage": 9.41, "elapsed_time": "0:08:58", "remaining_time": "1:26:28", "throughput": 4354.05, "total_tokens": 2346184} {"current_steps": 3595, "total_steps": 38160, "loss": 0.5966, "lr": 0.0009418238993710692, "epoch": 1.8841719077568135, "percentage": 9.42, "elapsed_time": "0:08:59", "remaining_time": "1:26:27", "throughput": 4353.81, "total_tokens": 2348936} {"current_steps": 3600, "total_steps": 38160, "loss": 0.4844, "lr": 0.0009431341719077569, "epoch": 1.8867924528301887, "percentage": 9.43, "elapsed_time": "0:09:00", "remaining_time": "1:26:26", "throughput": 4353.8, "total_tokens": 2351976} {"current_steps": 3605, "total_steps": 38160, "loss": 0.4954, "lr": 0.0009444444444444445, "epoch": 1.8894129979035639, "percentage": 9.45, "elapsed_time": "0:09:01", "remaining_time": "1:26:27", "throughput": 4355.53, "total_tokens": 2357192} {"current_steps": 3610, "total_steps": 38160, "loss": 0.6317, "lr": 0.0009457547169811322, "epoch": 1.892033542976939, "percentage": 9.46, "elapsed_time": "0:09:01", "remaining_time": "1:26:26", "throughput": 4355.4, "total_tokens": 2360072} {"current_steps": 3615, "total_steps": 38160, "loss": 0.4669, "lr": 0.0009470649895178197, "epoch": 1.8946540880503144, "percentage": 9.47, "elapsed_time": "0:09:02", "remaining_time": "1:26:25", "throughput": 4355.86, "total_tokens": 2363656} {"current_steps": 3620, "total_steps": 38160, "loss": 0.5419, "lr": 0.0009483752620545073, "epoch": 1.8972746331236898, "percentage": 9.49, "elapsed_time": "0:09:03", "remaining_time": "1:26:23", "throughput": 4355.45, "total_tokens": 2366216} {"current_steps": 3625, "total_steps": 38160, "loss": 0.5239, "lr": 0.000949685534591195, "epoch": 1.899895178197065, "percentage": 9.5, "elapsed_time": "0:09:04", "remaining_time": "1:26:22", "throughput": 4355.57, "total_tokens": 2369448} {"current_steps": 3630, "total_steps": 38160, "loss": 0.6532, "lr": 0.0009509958071278826, "epoch": 1.9025157232704402, "percentage": 9.51, "elapsed_time": "0:09:04", "remaining_time": "1:26:21", "throughput": 4355.74, "total_tokens": 2372744} {"current_steps": 3635, "total_steps": 38160, "loss": 0.4249, "lr": 0.0009523060796645703, "epoch": 1.9051362683438156, "percentage": 9.53, "elapsed_time": "0:09:05", "remaining_time": "1:26:19", "throughput": 4355.13, "total_tokens": 2375080} {"current_steps": 3640, "total_steps": 38160, "loss": 0.5104, "lr": 0.0009536163522012579, "epoch": 1.9077568134171907, "percentage": 9.54, "elapsed_time": "0:09:06", "remaining_time": "1:26:18", "throughput": 4354.93, "total_tokens": 2377864} {"current_steps": 3645, "total_steps": 38160, "loss": 0.4972, "lr": 0.0009549266247379456, "epoch": 1.9103773584905661, "percentage": 9.55, "elapsed_time": "0:09:06", "remaining_time": "1:26:17", "throughput": 4355.16, "total_tokens": 2381224} {"current_steps": 3650, "total_steps": 38160, "loss": 0.5206, "lr": 0.0009562368972746331, "epoch": 1.9129979035639413, "percentage": 9.56, "elapsed_time": "0:09:07", "remaining_time": "1:26:16", "throughput": 4355.23, "total_tokens": 2384424} {"current_steps": 3655, "total_steps": 38160, "loss": 0.4534, "lr": 0.0009575471698113207, "epoch": 1.9156184486373165, "percentage": 9.58, "elapsed_time": "0:09:08", "remaining_time": "1:26:16", "throughput": 4356.52, "total_tokens": 2388936} {"current_steps": 3660, "total_steps": 38160, "loss": 0.5267, "lr": 0.0009588574423480084, "epoch": 1.9182389937106918, "percentage": 9.59, "elapsed_time": "0:09:09", "remaining_time": "1:26:16", "throughput": 4357.15, "total_tokens": 2392744} {"current_steps": 3665, "total_steps": 38160, "loss": 0.5947, "lr": 0.000960167714884696, "epoch": 1.9208595387840672, "percentage": 9.6, "elapsed_time": "0:09:09", "remaining_time": "1:26:14", "throughput": 4356.63, "total_tokens": 2395112} {"current_steps": 3670, "total_steps": 38160, "loss": 0.4281, "lr": 0.0009614779874213837, "epoch": 1.9234800838574424, "percentage": 9.62, "elapsed_time": "0:09:10", "remaining_time": "1:26:13", "throughput": 4356.81, "total_tokens": 2398344} {"current_steps": 3675, "total_steps": 38160, "loss": 0.5068, "lr": 0.0009627882599580712, "epoch": 1.9261006289308176, "percentage": 9.63, "elapsed_time": "0:09:11", "remaining_time": "1:26:12", "throughput": 4357.13, "total_tokens": 2401704} {"current_steps": 3680, "total_steps": 38160, "loss": 0.3746, "lr": 0.0009640985324947589, "epoch": 1.9287211740041927, "percentage": 9.64, "elapsed_time": "0:09:11", "remaining_time": "1:26:10", "throughput": 4356.68, "total_tokens": 2404168} {"current_steps": 3685, "total_steps": 38160, "loss": 0.3896, "lr": 0.0009654088050314465, "epoch": 1.9313417190775681, "percentage": 9.66, "elapsed_time": "0:09:12", "remaining_time": "1:26:09", "throughput": 4357.08, "total_tokens": 2407688} {"current_steps": 3690, "total_steps": 38160, "loss": 0.4068, "lr": 0.0009667190775681342, "epoch": 1.9339622641509435, "percentage": 9.67, "elapsed_time": "0:09:13", "remaining_time": "1:26:09", "throughput": 4357.76, "total_tokens": 2411528} {"current_steps": 3695, "total_steps": 38160, "loss": 0.5376, "lr": 0.0009680293501048219, "epoch": 1.9365828092243187, "percentage": 9.68, "elapsed_time": "0:09:14", "remaining_time": "1:26:08", "throughput": 4357.67, "total_tokens": 2414440} {"current_steps": 3700, "total_steps": 38160, "loss": 0.4284, "lr": 0.0009693396226415095, "epoch": 1.9392033542976939, "percentage": 9.7, "elapsed_time": "0:09:14", "remaining_time": "1:26:06", "throughput": 4357.67, "total_tokens": 2417448} {"current_steps": 3705, "total_steps": 38160, "loss": 0.4731, "lr": 0.0009706498951781972, "epoch": 1.941823899371069, "percentage": 9.71, "elapsed_time": "0:09:15", "remaining_time": "1:26:05", "throughput": 4357.82, "total_tokens": 2420680} {"current_steps": 3710, "total_steps": 38160, "loss": 0.4777, "lr": 0.0009719601677148847, "epoch": 1.9444444444444444, "percentage": 9.72, "elapsed_time": "0:09:16", "remaining_time": "1:26:04", "throughput": 4357.88, "total_tokens": 2423752} {"current_steps": 3715, "total_steps": 38160, "loss": 0.5005, "lr": 0.0009732704402515723, "epoch": 1.9470649895178198, "percentage": 9.74, "elapsed_time": "0:09:16", "remaining_time": "1:26:02", "throughput": 4357.44, "total_tokens": 2426216} {"current_steps": 3720, "total_steps": 38160, "loss": 0.5479, "lr": 0.00097458071278826, "epoch": 1.949685534591195, "percentage": 9.75, "elapsed_time": "0:09:17", "remaining_time": "1:26:01", "throughput": 4357.74, "total_tokens": 2429640} {"current_steps": 3725, "total_steps": 38160, "loss": 0.4347, "lr": 0.0009758909853249476, "epoch": 1.9523060796645701, "percentage": 9.76, "elapsed_time": "0:09:18", "remaining_time": "1:26:01", "throughput": 4358.18, "total_tokens": 2433224} {"current_steps": 3730, "total_steps": 38160, "loss": 0.5512, "lr": 0.0009772012578616353, "epoch": 1.9549266247379455, "percentage": 9.77, "elapsed_time": "0:09:19", "remaining_time": "1:26:01", "throughput": 4359.14, "total_tokens": 2437576} {"current_steps": 3735, "total_steps": 38160, "loss": 0.4763, "lr": 0.0009785115303983228, "epoch": 1.9575471698113207, "percentage": 9.79, "elapsed_time": "0:09:19", "remaining_time": "1:25:59", "throughput": 4358.68, "total_tokens": 2439976} {"current_steps": 3740, "total_steps": 38160, "loss": 0.4643, "lr": 0.0009798218029350107, "epoch": 1.960167714884696, "percentage": 9.8, "elapsed_time": "0:09:20", "remaining_time": "1:25:58", "throughput": 4358.89, "total_tokens": 2443272} {"current_steps": 3745, "total_steps": 38160, "loss": 0.561, "lr": 0.0009811320754716981, "epoch": 1.9627882599580713, "percentage": 9.81, "elapsed_time": "0:09:21", "remaining_time": "1:25:56", "throughput": 4358.53, "total_tokens": 2445832} {"current_steps": 3750, "total_steps": 38160, "loss": 0.3808, "lr": 0.0009824423480083858, "epoch": 1.9654088050314464, "percentage": 9.83, "elapsed_time": "0:09:21", "remaining_time": "1:25:55", "throughput": 4358.13, "total_tokens": 2448456} {"current_steps": 3755, "total_steps": 38160, "loss": 0.554, "lr": 0.0009837526205450735, "epoch": 1.9680293501048218, "percentage": 9.84, "elapsed_time": "0:09:22", "remaining_time": "1:25:53", "throughput": 4357.88, "total_tokens": 2451208} {"current_steps": 3760, "total_steps": 38160, "loss": 0.4463, "lr": 0.000985062893081761, "epoch": 1.9706498951781972, "percentage": 9.85, "elapsed_time": "0:09:23", "remaining_time": "1:25:52", "throughput": 4357.8, "total_tokens": 2454152} {"current_steps": 3765, "total_steps": 38160, "loss": 0.3922, "lr": 0.0009863731656184487, "epoch": 1.9732704402515724, "percentage": 9.87, "elapsed_time": "0:09:23", "remaining_time": "1:25:51", "throughput": 4358.19, "total_tokens": 2457736} {"current_steps": 3770, "total_steps": 38160, "loss": 0.5966, "lr": 0.0009876834381551364, "epoch": 1.9758909853249476, "percentage": 9.88, "elapsed_time": "0:09:24", "remaining_time": "1:25:51", "throughput": 4358.6, "total_tokens": 2461384} {"current_steps": 3775, "total_steps": 38160, "loss": 0.3799, "lr": 0.0009889937106918238, "epoch": 1.9785115303983227, "percentage": 9.89, "elapsed_time": "0:09:25", "remaining_time": "1:25:50", "throughput": 4358.87, "total_tokens": 2464776} {"current_steps": 3780, "total_steps": 38160, "loss": 0.4618, "lr": 0.0009903039832285115, "epoch": 1.9811320754716981, "percentage": 9.91, "elapsed_time": "0:09:26", "remaining_time": "1:25:48", "throughput": 4358.38, "total_tokens": 2467144} {"current_steps": 3785, "total_steps": 38160, "loss": 0.599, "lr": 0.0009916142557651992, "epoch": 1.9837526205450735, "percentage": 9.92, "elapsed_time": "0:09:26", "remaining_time": "1:25:46", "throughput": 4358.09, "total_tokens": 2469736} {"current_steps": 3790, "total_steps": 38160, "loss": 0.3779, "lr": 0.000992924528301887, "epoch": 1.9863731656184487, "percentage": 9.93, "elapsed_time": "0:09:27", "remaining_time": "1:25:47", "throughput": 4359.48, "total_tokens": 2474536} {"current_steps": 3795, "total_steps": 38160, "loss": 0.5266, "lr": 0.0009942348008385744, "epoch": 1.9889937106918238, "percentage": 9.94, "elapsed_time": "0:09:28", "remaining_time": "1:25:46", "throughput": 4359.56, "total_tokens": 2477704} {"current_steps": 3800, "total_steps": 38160, "loss": 0.4644, "lr": 0.000995545073375262, "epoch": 1.991614255765199, "percentage": 9.96, "elapsed_time": "0:09:28", "remaining_time": "1:25:44", "throughput": 4359.2, "total_tokens": 2480296} {"current_steps": 3805, "total_steps": 38160, "loss": 0.5545, "lr": 0.0009968553459119497, "epoch": 1.9942348008385744, "percentage": 9.97, "elapsed_time": "0:09:29", "remaining_time": "1:25:43", "throughput": 4359.17, "total_tokens": 2483368} {"current_steps": 3810, "total_steps": 38160, "loss": 0.3954, "lr": 0.0009981656184486372, "epoch": 1.9968553459119498, "percentage": 9.98, "elapsed_time": "0:09:30", "remaining_time": "1:25:42", "throughput": 4359.19, "total_tokens": 2486440} {"current_steps": 3815, "total_steps": 38160, "loss": 0.3548, "lr": 0.000999475890985325, "epoch": 1.999475890985325, "percentage": 10.0, "elapsed_time": "0:09:31", "remaining_time": "1:25:41", "throughput": 4359.1, "total_tokens": 2489352} {"current_steps": 3816, "total_steps": 38160, "eval_loss": 0.46972936391830444, "epoch": 2.0, "percentage": 10.0, "elapsed_time": "0:09:44", "remaining_time": "1:27:43", "throughput": 4256.73, "total_tokens": 2489456} {"current_steps": 3820, "total_steps": 38160, "loss": 0.5616, "lr": 0.0009999999811730266, "epoch": 2.0020964360587, "percentage": 10.01, "elapsed_time": "0:09:47", "remaining_time": "1:27:57", "throughput": 4244.8, "total_tokens": 2492112} {"current_steps": 3825, "total_steps": 38160, "loss": 0.3784, "lr": 0.000999999866119305, "epoch": 2.0047169811320753, "percentage": 10.02, "elapsed_time": "0:09:47", "remaining_time": "1:27:55", "throughput": 4244.66, "total_tokens": 2494800} {"current_steps": 3830, "total_steps": 38160, "loss": 0.4886, "lr": 0.000999999646471316, "epoch": 2.007337526205451, "percentage": 10.04, "elapsed_time": "0:09:48", "remaining_time": "1:27:55", "throughput": 4245.7, "total_tokens": 2498896} {"current_steps": 3835, "total_steps": 38160, "loss": 0.5382, "lr": 0.0009999993222291053, "epoch": 2.009958071278826, "percentage": 10.05, "elapsed_time": "0:09:49", "remaining_time": "1:27:54", "throughput": 4246.02, "total_tokens": 2502160} {"current_steps": 3840, "total_steps": 38160, "loss": 0.4978, "lr": 0.0009999988933927404, "epoch": 2.0125786163522013, "percentage": 10.06, "elapsed_time": "0:09:49", "remaining_time": "1:27:52", "throughput": 4245.8, "total_tokens": 2504752} {"current_steps": 3845, "total_steps": 38160, "loss": 0.4899, "lr": 0.0009999983599623115, "epoch": 2.0151991614255764, "percentage": 10.08, "elapsed_time": "0:09:50", "remaining_time": "1:27:50", "throughput": 4245.74, "total_tokens": 2507536} {"current_steps": 3850, "total_steps": 38160, "loss": 0.4819, "lr": 0.0009999977219379299, "epoch": 2.0178197064989516, "percentage": 10.09, "elapsed_time": "0:09:51", "remaining_time": "1:27:49", "throughput": 4245.72, "total_tokens": 2510352} {"current_steps": 3855, "total_steps": 38160, "loss": 0.43, "lr": 0.000999996979319729, "epoch": 2.020440251572327, "percentage": 10.1, "elapsed_time": "0:09:51", "remaining_time": "1:27:47", "throughput": 4245.39, "total_tokens": 2512784} {"current_steps": 3860, "total_steps": 38160, "loss": 0.4149, "lr": 0.0009999961321078645, "epoch": 2.0230607966457024, "percentage": 10.12, "elapsed_time": "0:09:52", "remaining_time": "1:27:46", "throughput": 4245.84, "total_tokens": 2516304} {"current_steps": 3865, "total_steps": 38160, "loss": 0.5254, "lr": 0.0009999951803025134, "epoch": 2.0256813417190775, "percentage": 10.13, "elapsed_time": "0:09:53", "remaining_time": "1:27:44", "throughput": 4245.88, "total_tokens": 2519184} {"current_steps": 3870, "total_steps": 38160, "loss": 0.5622, "lr": 0.0009999941239038747, "epoch": 2.0283018867924527, "percentage": 10.14, "elapsed_time": "0:09:54", "remaining_time": "1:27:43", "throughput": 4246.14, "total_tokens": 2522448} {"current_steps": 3875, "total_steps": 38160, "loss": 0.4468, "lr": 0.0009999929629121696, "epoch": 2.030922431865828, "percentage": 10.15, "elapsed_time": "0:09:54", "remaining_time": "1:27:42", "throughput": 4246.53, "total_tokens": 2525744} {"current_steps": 3880, "total_steps": 38160, "loss": 0.4294, "lr": 0.000999991697327641, "epoch": 2.0335429769392035, "percentage": 10.17, "elapsed_time": "0:09:55", "remaining_time": "1:27:40", "throughput": 4246.22, "total_tokens": 2528240} {"current_steps": 3885, "total_steps": 38160, "loss": 0.4618, "lr": 0.0009999903271505535, "epoch": 2.0361635220125787, "percentage": 10.18, "elapsed_time": "0:09:56", "remaining_time": "1:27:38", "throughput": 4245.91, "total_tokens": 2530928} {"current_steps": 3890, "total_steps": 38160, "loss": 0.4684, "lr": 0.0009999888523811935, "epoch": 2.038784067085954, "percentage": 10.19, "elapsed_time": "0:09:56", "remaining_time": "1:27:37", "throughput": 4245.93, "total_tokens": 2533936} {"current_steps": 3895, "total_steps": 38160, "loss": 0.5945, "lr": 0.00099998727301987, "epoch": 2.041404612159329, "percentage": 10.21, "elapsed_time": "0:09:57", "remaining_time": "1:27:35", "throughput": 4245.83, "total_tokens": 2536720} {"current_steps": 3900, "total_steps": 38160, "loss": 0.4606, "lr": 0.000999985589066913, "epoch": 2.0440251572327046, "percentage": 10.22, "elapsed_time": "0:09:58", "remaining_time": "1:27:35", "throughput": 4246.68, "total_tokens": 2540656} {"current_steps": 3905, "total_steps": 38160, "loss": 0.4367, "lr": 0.000999983800522675, "epoch": 2.04664570230608, "percentage": 10.23, "elapsed_time": "0:09:59", "remaining_time": "1:27:35", "throughput": 4247.88, "total_tokens": 2545040} {"current_steps": 3910, "total_steps": 38160, "loss": 0.718, "lr": 0.00099998190738753, "epoch": 2.049266247379455, "percentage": 10.25, "elapsed_time": "0:09:59", "remaining_time": "1:27:34", "throughput": 4247.75, "total_tokens": 2547888} {"current_steps": 3915, "total_steps": 38160, "loss": 0.3676, "lr": 0.000999979909661874, "epoch": 2.05188679245283, "percentage": 10.26, "elapsed_time": "0:10:00", "remaining_time": "1:27:32", "throughput": 4247.27, "total_tokens": 2550256} {"current_steps": 3920, "total_steps": 38160, "loss": 0.3702, "lr": 0.000999977807346125, "epoch": 2.0545073375262053, "percentage": 10.27, "elapsed_time": "0:10:01", "remaining_time": "1:27:31", "throughput": 4247.69, "total_tokens": 2553712} {"current_steps": 3925, "total_steps": 38160, "loss": 0.523, "lr": 0.000999975600440723, "epoch": 2.057127882599581, "percentage": 10.29, "elapsed_time": "0:10:01", "remaining_time": "1:27:30", "throughput": 4248.31, "total_tokens": 2557392} {"current_steps": 3930, "total_steps": 38160, "loss": 0.6425, "lr": 0.000999973288946129, "epoch": 2.059748427672956, "percentage": 10.3, "elapsed_time": "0:10:02", "remaining_time": "1:27:29", "throughput": 4248.62, "total_tokens": 2560656} {"current_steps": 3935, "total_steps": 38160, "loss": 0.4118, "lr": 0.0009999708728628271, "epoch": 2.0623689727463312, "percentage": 10.31, "elapsed_time": "0:10:03", "remaining_time": "1:27:28", "throughput": 4249.0, "total_tokens": 2563984} {"current_steps": 3940, "total_steps": 38160, "loss": 0.593, "lr": 0.0009999683521913227, "epoch": 2.0649895178197064, "percentage": 10.32, "elapsed_time": "0:10:04", "remaining_time": "1:27:27", "throughput": 4249.21, "total_tokens": 2567088} {"current_steps": 3945, "total_steps": 38160, "loss": 0.4266, "lr": 0.000999965726932143, "epoch": 2.0676100628930816, "percentage": 10.34, "elapsed_time": "0:10:04", "remaining_time": "1:27:25", "throughput": 4249.47, "total_tokens": 2570288} {"current_steps": 3950, "total_steps": 38160, "loss": 0.5064, "lr": 0.0009999629970858371, "epoch": 2.070230607966457, "percentage": 10.35, "elapsed_time": "0:10:05", "remaining_time": "1:27:24", "throughput": 4249.47, "total_tokens": 2573136} {"current_steps": 3955, "total_steps": 38160, "loss": 0.5041, "lr": 0.000999960162652976, "epoch": 2.0728511530398324, "percentage": 10.36, "elapsed_time": "0:10:06", "remaining_time": "1:27:23", "throughput": 4250.15, "total_tokens": 2576912} {"current_steps": 3960, "total_steps": 38160, "loss": 0.5134, "lr": 0.0009999572236341527, "epoch": 2.0754716981132075, "percentage": 10.38, "elapsed_time": "0:10:06", "remaining_time": "1:27:22", "throughput": 4250.16, "total_tokens": 2579824} {"current_steps": 3965, "total_steps": 38160, "loss": 0.4804, "lr": 0.000999954180029982, "epoch": 2.0780922431865827, "percentage": 10.39, "elapsed_time": "0:10:07", "remaining_time": "1:27:21", "throughput": 4250.88, "total_tokens": 2583664} {"current_steps": 3970, "total_steps": 38160, "loss": 0.4763, "lr": 0.0009999510318411007, "epoch": 2.080712788259958, "percentage": 10.4, "elapsed_time": "0:10:08", "remaining_time": "1:27:21", "throughput": 4251.49, "total_tokens": 2587344} {"current_steps": 3975, "total_steps": 38160, "loss": 0.4741, "lr": 0.0009999477790681673, "epoch": 2.0833333333333335, "percentage": 10.42, "elapsed_time": "0:10:09", "remaining_time": "1:27:20", "throughput": 4251.94, "total_tokens": 2590800} {"current_steps": 3980, "total_steps": 38160, "loss": 0.6152, "lr": 0.000999944421711862, "epoch": 2.0859538784067087, "percentage": 10.43, "elapsed_time": "0:10:10", "remaining_time": "1:27:18", "throughput": 4252.05, "total_tokens": 2593872} {"current_steps": 3985, "total_steps": 38160, "loss": 0.5628, "lr": 0.0009999409597728876, "epoch": 2.088574423480084, "percentage": 10.44, "elapsed_time": "0:10:10", "remaining_time": "1:27:17", "throughput": 4252.27, "total_tokens": 2596976} {"current_steps": 3990, "total_steps": 38160, "loss": 0.4711, "lr": 0.0009999373932519679, "epoch": 2.091194968553459, "percentage": 10.46, "elapsed_time": "0:10:11", "remaining_time": "1:27:15", "throughput": 4252.27, "total_tokens": 2599824} {"current_steps": 3995, "total_steps": 38160, "loss": 0.5345, "lr": 0.0009999337221498492, "epoch": 2.0938155136268346, "percentage": 10.47, "elapsed_time": "0:10:12", "remaining_time": "1:27:14", "throughput": 4252.45, "total_tokens": 2602992} {"current_steps": 4000, "total_steps": 38160, "loss": 0.3546, "lr": 0.0009999299464672996, "epoch": 2.0964360587002098, "percentage": 10.48, "elapsed_time": "0:10:12", "remaining_time": "1:27:13", "throughput": 4252.91, "total_tokens": 2606448} {"current_steps": 4005, "total_steps": 38160, "loss": 0.3515, "lr": 0.0009999260662051084, "epoch": 2.099056603773585, "percentage": 10.5, "elapsed_time": "0:10:13", "remaining_time": "1:27:13", "throughput": 4254.05, "total_tokens": 2610864} {"current_steps": 4010, "total_steps": 38160, "loss": 0.4228, "lr": 0.0009999220813640877, "epoch": 2.10167714884696, "percentage": 10.51, "elapsed_time": "0:10:14", "remaining_time": "1:27:12", "throughput": 4254.51, "total_tokens": 2614256} {"current_steps": 4015, "total_steps": 38160, "loss": 0.6422, "lr": 0.000999917991945071, "epoch": 2.1042976939203353, "percentage": 10.52, "elapsed_time": "0:10:15", "remaining_time": "1:27:11", "throughput": 4254.47, "total_tokens": 2617072} {"current_steps": 4020, "total_steps": 38160, "loss": 0.4634, "lr": 0.0009999137979489136, "epoch": 2.106918238993711, "percentage": 10.53, "elapsed_time": "0:10:15", "remaining_time": "1:27:09", "throughput": 4254.36, "total_tokens": 2619792} {"current_steps": 4025, "total_steps": 38160, "loss": 0.391, "lr": 0.000999909499376493, "epoch": 2.109538784067086, "percentage": 10.55, "elapsed_time": "0:10:16", "remaining_time": "1:27:07", "throughput": 4254.24, "total_tokens": 2622448} {"current_steps": 4030, "total_steps": 38160, "loss": 0.5344, "lr": 0.0009999050962287085, "epoch": 2.1121593291404612, "percentage": 10.56, "elapsed_time": "0:10:17", "remaining_time": "1:27:06", "throughput": 4254.23, "total_tokens": 2625328} {"current_steps": 4035, "total_steps": 38160, "loss": 0.5176, "lr": 0.0009999005885064811, "epoch": 2.1147798742138364, "percentage": 10.57, "elapsed_time": "0:10:17", "remaining_time": "1:27:04", "throughput": 4254.3, "total_tokens": 2628336} {"current_steps": 4040, "total_steps": 38160, "loss": 0.487, "lr": 0.0009998959762107537, "epoch": 2.1174004192872116, "percentage": 10.59, "elapsed_time": "0:10:18", "remaining_time": "1:27:06", "throughput": 4256.18, "total_tokens": 2634128} {"current_steps": 4045, "total_steps": 38160, "loss": 0.417, "lr": 0.0009998912593424914, "epoch": 2.120020964360587, "percentage": 10.6, "elapsed_time": "0:10:19", "remaining_time": "1:27:07", "throughput": 4257.34, "total_tokens": 2638672} {"current_steps": 4050, "total_steps": 38160, "loss": 0.5273, "lr": 0.0009998864379026804, "epoch": 2.1226415094339623, "percentage": 10.61, "elapsed_time": "0:10:20", "remaining_time": "1:27:06", "throughput": 4258.3, "total_tokens": 2642768} {"current_steps": 4055, "total_steps": 38160, "loss": 0.4735, "lr": 0.00099988151189233, "epoch": 2.1252620545073375, "percentage": 10.63, "elapsed_time": "0:10:21", "remaining_time": "1:27:05", "throughput": 4258.23, "total_tokens": 2645552} {"current_steps": 4060, "total_steps": 38160, "loss": 0.4296, "lr": 0.00099987648131247, "epoch": 2.1278825995807127, "percentage": 10.64, "elapsed_time": "0:10:21", "remaining_time": "1:27:03", "throughput": 4257.68, "total_tokens": 2647728} {"current_steps": 4065, "total_steps": 38160, "loss": 0.5692, "lr": 0.000999871346164153, "epoch": 2.130503144654088, "percentage": 10.65, "elapsed_time": "0:10:22", "remaining_time": "1:27:01", "throughput": 4258.01, "total_tokens": 2650992} {"current_steps": 4070, "total_steps": 38160, "loss": 0.522, "lr": 0.0009998661064484532, "epoch": 2.1331236897274635, "percentage": 10.67, "elapsed_time": "0:10:23", "remaining_time": "1:27:00", "throughput": 4257.97, "total_tokens": 2653744} {"current_steps": 4075, "total_steps": 38160, "loss": 0.298, "lr": 0.0009998607621664666, "epoch": 2.1357442348008386, "percentage": 10.68, "elapsed_time": "0:10:23", "remaining_time": "1:26:58", "throughput": 4257.74, "total_tokens": 2656336} {"current_steps": 4080, "total_steps": 38160, "loss": 0.7396, "lr": 0.0009998553133193113, "epoch": 2.138364779874214, "percentage": 10.69, "elapsed_time": "0:10:24", "remaining_time": "1:26:56", "throughput": 4257.72, "total_tokens": 2659216} {"current_steps": 4085, "total_steps": 38160, "loss": 0.5666, "lr": 0.0009998497599081272, "epoch": 2.140985324947589, "percentage": 10.7, "elapsed_time": "0:10:25", "remaining_time": "1:26:55", "throughput": 4257.74, "total_tokens": 2662224} {"current_steps": 4090, "total_steps": 38160, "loss": 0.3735, "lr": 0.0009998441019340761, "epoch": 2.1436058700209646, "percentage": 10.72, "elapsed_time": "0:10:26", "remaining_time": "1:26:55", "throughput": 4258.37, "total_tokens": 2665936} {"current_steps": 4095, "total_steps": 38160, "loss": 0.3677, "lr": 0.000999838339398341, "epoch": 2.1462264150943398, "percentage": 10.73, "elapsed_time": "0:10:26", "remaining_time": "1:26:54", "throughput": 4258.9, "total_tokens": 2669648} {"current_steps": 4100, "total_steps": 38160, "loss": 0.7111, "lr": 0.000999832472302128, "epoch": 2.148846960167715, "percentage": 10.74, "elapsed_time": "0:10:27", "remaining_time": "1:26:54", "throughput": 4259.58, "total_tokens": 2673552} {"current_steps": 4105, "total_steps": 38160, "loss": 0.631, "lr": 0.0009998265006466642, "epoch": 2.15146750524109, "percentage": 10.76, "elapsed_time": "0:10:28", "remaining_time": "1:26:52", "throughput": 4259.12, "total_tokens": 2675824} {"current_steps": 4110, "total_steps": 38160, "loss": 0.5383, "lr": 0.0009998204244331987, "epoch": 2.1540880503144653, "percentage": 10.77, "elapsed_time": "0:10:28", "remaining_time": "1:26:50", "throughput": 4258.75, "total_tokens": 2678256} {"current_steps": 4115, "total_steps": 38160, "loss": 0.4123, "lr": 0.0009998142436630027, "epoch": 2.156708595387841, "percentage": 10.78, "elapsed_time": "0:10:29", "remaining_time": "1:26:49", "throughput": 4259.53, "total_tokens": 2682224} {"current_steps": 4120, "total_steps": 38160, "loss": 0.3469, "lr": 0.0009998079583373692, "epoch": 2.159329140461216, "percentage": 10.8, "elapsed_time": "0:10:30", "remaining_time": "1:26:47", "throughput": 4259.37, "total_tokens": 2684848} {"current_steps": 4125, "total_steps": 38160, "loss": 0.5241, "lr": 0.0009998015684576128, "epoch": 2.161949685534591, "percentage": 10.81, "elapsed_time": "0:10:31", "remaining_time": "1:26:47", "throughput": 4260.12, "total_tokens": 2688816} {"current_steps": 4130, "total_steps": 38160, "loss": 0.9151, "lr": 0.0009997950740250703, "epoch": 2.1645702306079664, "percentage": 10.82, "elapsed_time": "0:10:31", "remaining_time": "1:26:46", "throughput": 4260.05, "total_tokens": 2691728} {"current_steps": 4135, "total_steps": 38160, "loss": 0.5796, "lr": 0.0009997884750411004, "epoch": 2.1671907756813416, "percentage": 10.84, "elapsed_time": "0:10:32", "remaining_time": "1:26:44", "throughput": 4260.04, "total_tokens": 2694608} {"current_steps": 4140, "total_steps": 38160, "loss": 0.5386, "lr": 0.0009997817715070832, "epoch": 2.169811320754717, "percentage": 10.85, "elapsed_time": "0:10:33", "remaining_time": "1:26:43", "throughput": 4260.3, "total_tokens": 2697872} {"current_steps": 4145, "total_steps": 38160, "loss": 0.4297, "lr": 0.0009997749634244213, "epoch": 2.1724318658280923, "percentage": 10.86, "elapsed_time": "0:10:33", "remaining_time": "1:26:42", "throughput": 4260.5, "total_tokens": 2701040} {"current_steps": 4150, "total_steps": 38160, "loss": 0.6311, "lr": 0.000999768050794539, "epoch": 2.1750524109014675, "percentage": 10.88, "elapsed_time": "0:10:34", "remaining_time": "1:26:40", "throughput": 4260.33, "total_tokens": 2703760} {"current_steps": 4155, "total_steps": 38160, "loss": 0.4769, "lr": 0.0009997610336188818, "epoch": 2.1776729559748427, "percentage": 10.89, "elapsed_time": "0:10:35", "remaining_time": "1:26:39", "throughput": 4260.17, "total_tokens": 2706480} {"current_steps": 4160, "total_steps": 38160, "loss": 0.3312, "lr": 0.0009997539118989183, "epoch": 2.180293501048218, "percentage": 10.9, "elapsed_time": "0:10:35", "remaining_time": "1:26:37", "throughput": 4260.29, "total_tokens": 2709488} {"current_steps": 4165, "total_steps": 38160, "loss": 0.4199, "lr": 0.0009997466856361376, "epoch": 2.1829140461215935, "percentage": 10.91, "elapsed_time": "0:10:36", "remaining_time": "1:26:36", "throughput": 4260.7, "total_tokens": 2712880} {"current_steps": 4170, "total_steps": 38160, "loss": 0.4885, "lr": 0.000999739354832052, "epoch": 2.1855345911949686, "percentage": 10.93, "elapsed_time": "0:10:37", "remaining_time": "1:26:35", "throughput": 4260.99, "total_tokens": 2716112} {"current_steps": 4175, "total_steps": 38160, "loss": 0.5274, "lr": 0.0009997319194881944, "epoch": 2.188155136268344, "percentage": 10.94, "elapsed_time": "0:10:38", "remaining_time": "1:26:34", "throughput": 4261.03, "total_tokens": 2719088} {"current_steps": 4180, "total_steps": 38160, "loss": 0.4615, "lr": 0.0009997243796061204, "epoch": 2.190775681341719, "percentage": 10.95, "elapsed_time": "0:10:38", "remaining_time": "1:26:33", "throughput": 4261.05, "total_tokens": 2722064} {"current_steps": 4185, "total_steps": 38160, "loss": 0.3371, "lr": 0.0009997167351874076, "epoch": 2.1933962264150946, "percentage": 10.97, "elapsed_time": "0:10:39", "remaining_time": "1:26:31", "throughput": 4261.11, "total_tokens": 2725072} {"current_steps": 4190, "total_steps": 38160, "loss": 0.4337, "lr": 0.0009997089862336548, "epoch": 2.1960167714884697, "percentage": 10.98, "elapsed_time": "0:10:40", "remaining_time": "1:26:30", "throughput": 4261.42, "total_tokens": 2728368} {"current_steps": 4195, "total_steps": 38160, "loss": 0.5336, "lr": 0.000999701132746483, "epoch": 2.198637316561845, "percentage": 10.99, "elapsed_time": "0:10:41", "remaining_time": "1:26:30", "throughput": 4261.96, "total_tokens": 2731984} {"current_steps": 4200, "total_steps": 38160, "loss": 0.4665, "lr": 0.0009996931747275352, "epoch": 2.20125786163522, "percentage": 11.01, "elapsed_time": "0:10:41", "remaining_time": "1:26:29", "throughput": 4262.56, "total_tokens": 2735632} {"current_steps": 4205, "total_steps": 38160, "loss": 0.5085, "lr": 0.000999685112178476, "epoch": 2.2038784067085953, "percentage": 11.02, "elapsed_time": "0:10:42", "remaining_time": "1:26:28", "throughput": 4262.84, "total_tokens": 2738928} {"current_steps": 4210, "total_steps": 38160, "loss": 0.4811, "lr": 0.0009996769451009922, "epoch": 2.2064989517819704, "percentage": 11.03, "elapsed_time": "0:10:43", "remaining_time": "1:26:28", "throughput": 4263.8, "total_tokens": 2743248} {"current_steps": 4215, "total_steps": 38160, "loss": 0.6042, "lr": 0.000999668673496792, "epoch": 2.209119496855346, "percentage": 11.05, "elapsed_time": "0:10:44", "remaining_time": "1:26:26", "throughput": 4263.43, "total_tokens": 2745744} {"current_steps": 4220, "total_steps": 38160, "loss": 0.4771, "lr": 0.0009996602973676057, "epoch": 2.211740041928721, "percentage": 11.06, "elapsed_time": "0:10:44", "remaining_time": "1:26:24", "throughput": 4263.24, "total_tokens": 2748432} {"current_steps": 4225, "total_steps": 38160, "loss": 0.5978, "lr": 0.0009996518167151858, "epoch": 2.2143605870020964, "percentage": 11.07, "elapsed_time": "0:10:45", "remaining_time": "1:26:23", "throughput": 4263.21, "total_tokens": 2751280} {"current_steps": 4230, "total_steps": 38160, "loss": 0.5655, "lr": 0.000999643231541306, "epoch": 2.2169811320754715, "percentage": 11.08, "elapsed_time": "0:10:46", "remaining_time": "1:26:21", "throughput": 4263.14, "total_tokens": 2754096} {"current_steps": 4235, "total_steps": 38160, "loss": 0.6119, "lr": 0.0009996345418477625, "epoch": 2.219601677148847, "percentage": 11.1, "elapsed_time": "0:10:46", "remaining_time": "1:26:20", "throughput": 4263.29, "total_tokens": 2757200} {"current_steps": 4240, "total_steps": 38160, "loss": 0.5338, "lr": 0.000999625747636373, "epoch": 2.2222222222222223, "percentage": 11.11, "elapsed_time": "0:10:47", "remaining_time": "1:26:19", "throughput": 4263.37, "total_tokens": 2760240} {"current_steps": 4245, "total_steps": 38160, "loss": 0.4632, "lr": 0.000999616848908977, "epoch": 2.2248427672955975, "percentage": 11.12, "elapsed_time": "0:10:48", "remaining_time": "1:26:18", "throughput": 4263.48, "total_tokens": 2763248} {"current_steps": 4250, "total_steps": 38160, "loss": 0.488, "lr": 0.0009996078456674363, "epoch": 2.2274633123689727, "percentage": 11.14, "elapsed_time": "0:10:48", "remaining_time": "1:26:16", "throughput": 4263.49, "total_tokens": 2766192} {"current_steps": 4255, "total_steps": 38160, "loss": 0.4971, "lr": 0.000999598737913634, "epoch": 2.230083857442348, "percentage": 11.15, "elapsed_time": "0:10:49", "remaining_time": "1:26:16", "throughput": 4264.22, "total_tokens": 2770160} {"current_steps": 4260, "total_steps": 38160, "loss": 0.4129, "lr": 0.0009995895256494755, "epoch": 2.2327044025157234, "percentage": 11.16, "elapsed_time": "0:10:50", "remaining_time": "1:26:15", "throughput": 4264.44, "total_tokens": 2773424} {"current_steps": 4265, "total_steps": 38160, "loss": 0.467, "lr": 0.000999580208876888, "epoch": 2.2353249475890986, "percentage": 11.18, "elapsed_time": "0:10:51", "remaining_time": "1:26:13", "throughput": 4264.4, "total_tokens": 2776240} {"current_steps": 4270, "total_steps": 38160, "loss": 0.489, "lr": 0.0009995707875978198, "epoch": 2.237945492662474, "percentage": 11.19, "elapsed_time": "0:10:51", "remaining_time": "1:26:12", "throughput": 4264.39, "total_tokens": 2779088} {"current_steps": 4275, "total_steps": 38160, "loss": 0.4194, "lr": 0.0009995612618142428, "epoch": 2.240566037735849, "percentage": 11.2, "elapsed_time": "0:10:52", "remaining_time": "1:26:11", "throughput": 4264.38, "total_tokens": 2782032} {"current_steps": 4280, "total_steps": 38160, "loss": 0.6451, "lr": 0.000999551631528149, "epoch": 2.243186582809224, "percentage": 11.22, "elapsed_time": "0:10:53", "remaining_time": "1:26:10", "throughput": 4265.15, "total_tokens": 2786000} {"current_steps": 4285, "total_steps": 38160, "loss": 0.3774, "lr": 0.000999541896741553, "epoch": 2.2458071278825997, "percentage": 11.23, "elapsed_time": "0:10:53", "remaining_time": "1:26:09", "throughput": 4265.61, "total_tokens": 2789584} {"current_steps": 4290, "total_steps": 38160, "loss": 0.5437, "lr": 0.0009995320574564912, "epoch": 2.248427672955975, "percentage": 11.24, "elapsed_time": "0:10:54", "remaining_time": "1:26:09", "throughput": 4265.89, "total_tokens": 2792976} {"current_steps": 4295, "total_steps": 38160, "loss": 0.5111, "lr": 0.000999522113675022, "epoch": 2.25104821802935, "percentage": 11.26, "elapsed_time": "0:10:55", "remaining_time": "1:26:07", "throughput": 4265.77, "total_tokens": 2795856} {"current_steps": 4300, "total_steps": 38160, "loss": 0.4938, "lr": 0.0009995120653992255, "epoch": 2.2536687631027252, "percentage": 11.27, "elapsed_time": "0:10:56", "remaining_time": "1:26:06", "throughput": 4265.43, "total_tokens": 2798384} {"current_steps": 4305, "total_steps": 38160, "loss": 0.369, "lr": 0.0009995019126312035, "epoch": 2.2562893081761004, "percentage": 11.28, "elapsed_time": "0:10:56", "remaining_time": "1:26:04", "throughput": 4265.63, "total_tokens": 2801552} {"current_steps": 4310, "total_steps": 38160, "loss": 0.5605, "lr": 0.0009994916553730802, "epoch": 2.258909853249476, "percentage": 11.29, "elapsed_time": "0:10:57", "remaining_time": "1:26:03", "throughput": 4265.84, "total_tokens": 2804816} {"current_steps": 4315, "total_steps": 38160, "loss": 0.77, "lr": 0.000999481293627001, "epoch": 2.261530398322851, "percentage": 11.31, "elapsed_time": "0:10:58", "remaining_time": "1:26:02", "throughput": 4265.64, "total_tokens": 2807536} {"current_steps": 4320, "total_steps": 38160, "loss": 0.4729, "lr": 0.0009994708273951337, "epoch": 2.2641509433962264, "percentage": 11.32, "elapsed_time": "0:10:59", "remaining_time": "1:26:02", "throughput": 4266.8, "total_tokens": 2812080} {"current_steps": 4325, "total_steps": 38160, "loss": 0.5175, "lr": 0.0009994602566796673, "epoch": 2.2667714884696015, "percentage": 11.33, "elapsed_time": "0:10:59", "remaining_time": "1:26:01", "throughput": 4266.56, "total_tokens": 2814768} {"current_steps": 4330, "total_steps": 38160, "loss": 0.5362, "lr": 0.0009994495814828136, "epoch": 2.269392033542977, "percentage": 11.35, "elapsed_time": "0:11:00", "remaining_time": "1:25:59", "throughput": 4266.3, "total_tokens": 2817328} {"current_steps": 4335, "total_steps": 38160, "loss": 0.6179, "lr": 0.0009994388018068055, "epoch": 2.2720125786163523, "percentage": 11.36, "elapsed_time": "0:11:01", "remaining_time": "1:25:58", "throughput": 4266.53, "total_tokens": 2820624} {"current_steps": 4340, "total_steps": 38160, "loss": 0.396, "lr": 0.0009994279176538977, "epoch": 2.2746331236897275, "percentage": 11.37, "elapsed_time": "0:11:01", "remaining_time": "1:25:58", "throughput": 4267.33, "total_tokens": 2824720} {"current_steps": 4345, "total_steps": 38160, "loss": 0.5895, "lr": 0.0009994169290263675, "epoch": 2.2772536687631026, "percentage": 11.39, "elapsed_time": "0:11:02", "remaining_time": "1:25:57", "throughput": 4268.03, "total_tokens": 2828560} {"current_steps": 4350, "total_steps": 38160, "loss": 0.5509, "lr": 0.0009994058359265132, "epoch": 2.279874213836478, "percentage": 11.4, "elapsed_time": "0:11:03", "remaining_time": "1:25:57", "throughput": 4268.35, "total_tokens": 2832080} {"current_steps": 4355, "total_steps": 38160, "loss": 0.5834, "lr": 0.0009993946383566558, "epoch": 2.2824947589098534, "percentage": 11.41, "elapsed_time": "0:11:04", "remaining_time": "1:25:55", "throughput": 4268.03, "total_tokens": 2834640} {"current_steps": 4360, "total_steps": 38160, "loss": 0.4968, "lr": 0.0009993833363191374, "epoch": 2.2851153039832286, "percentage": 11.43, "elapsed_time": "0:11:04", "remaining_time": "1:25:53", "throughput": 4267.75, "total_tokens": 2837136} {"current_steps": 4365, "total_steps": 38160, "loss": 0.479, "lr": 0.0009993719298163222, "epoch": 2.2877358490566038, "percentage": 11.44, "elapsed_time": "0:11:05", "remaining_time": "1:25:53", "throughput": 4268.39, "total_tokens": 2841040} {"current_steps": 4370, "total_steps": 38160, "loss": 0.5332, "lr": 0.0009993604188505965, "epoch": 2.290356394129979, "percentage": 11.45, "elapsed_time": "0:11:06", "remaining_time": "1:25:51", "throughput": 4268.39, "total_tokens": 2843984} {"current_steps": 4375, "total_steps": 38160, "loss": 0.6361, "lr": 0.000999348803424368, "epoch": 2.2929769392033545, "percentage": 11.46, "elapsed_time": "0:11:06", "remaining_time": "1:25:50", "throughput": 4268.37, "total_tokens": 2846832} {"current_steps": 4380, "total_steps": 38160, "loss": 0.4098, "lr": 0.000999337083540067, "epoch": 2.2955974842767297, "percentage": 11.48, "elapsed_time": "0:11:07", "remaining_time": "1:25:49", "throughput": 4268.89, "total_tokens": 2850512} {"current_steps": 4385, "total_steps": 38160, "loss": 0.3743, "lr": 0.0009993252592001448, "epoch": 2.298218029350105, "percentage": 11.49, "elapsed_time": "0:11:08", "remaining_time": "1:25:49", "throughput": 4269.74, "total_tokens": 2854800} {"current_steps": 4390, "total_steps": 38160, "loss": 0.3949, "lr": 0.0009993133304070747, "epoch": 2.30083857442348, "percentage": 11.5, "elapsed_time": "0:11:09", "remaining_time": "1:25:48", "throughput": 4269.6, "total_tokens": 2857552} {"current_steps": 4395, "total_steps": 38160, "loss": 0.4984, "lr": 0.0009993012971633527, "epoch": 2.3034591194968552, "percentage": 11.52, "elapsed_time": "0:11:09", "remaining_time": "1:25:47", "throughput": 4269.58, "total_tokens": 2860432} {"current_steps": 4400, "total_steps": 38160, "loss": 0.5719, "lr": 0.0009992891594714952, "epoch": 2.3060796645702304, "percentage": 11.53, "elapsed_time": "0:11:10", "remaining_time": "1:25:45", "throughput": 4269.72, "total_tokens": 2863568} {"current_steps": 4405, "total_steps": 38160, "loss": 0.411, "lr": 0.0009992769173340422, "epoch": 2.308700209643606, "percentage": 11.54, "elapsed_time": "0:11:11", "remaining_time": "1:25:43", "throughput": 4269.38, "total_tokens": 2865968} {"current_steps": 4410, "total_steps": 38160, "loss": 0.6423, "lr": 0.000999264570753554, "epoch": 2.311320754716981, "percentage": 11.56, "elapsed_time": "0:11:11", "remaining_time": "1:25:42", "throughput": 4269.35, "total_tokens": 2868848} {"current_steps": 4415, "total_steps": 38160, "loss": 0.425, "lr": 0.0009992521197326135, "epoch": 2.3139412997903563, "percentage": 11.57, "elapsed_time": "0:11:12", "remaining_time": "1:25:41", "throughput": 4269.4, "total_tokens": 2871792} {"current_steps": 4420, "total_steps": 38160, "loss": 0.491, "lr": 0.0009992395642738252, "epoch": 2.3165618448637315, "percentage": 11.58, "elapsed_time": "0:11:13", "remaining_time": "1:25:40", "throughput": 4269.44, "total_tokens": 2874832} {"current_steps": 4425, "total_steps": 38160, "loss": 0.4954, "lr": 0.0009992269043798158, "epoch": 2.319182389937107, "percentage": 11.6, "elapsed_time": "0:11:14", "remaining_time": "1:25:38", "throughput": 4269.37, "total_tokens": 2877648} {"current_steps": 4430, "total_steps": 38160, "loss": 0.5049, "lr": 0.0009992141400532336, "epoch": 2.3218029350104823, "percentage": 11.61, "elapsed_time": "0:11:14", "remaining_time": "1:25:36", "throughput": 4268.97, "total_tokens": 2880016} {"current_steps": 4435, "total_steps": 38160, "loss": 0.6229, "lr": 0.0009992012712967484, "epoch": 2.3244234800838575, "percentage": 11.62, "elapsed_time": "0:11:15", "remaining_time": "1:25:35", "throughput": 4269.05, "total_tokens": 2883184} {"current_steps": 4440, "total_steps": 38160, "loss": 0.4027, "lr": 0.0009991882981130525, "epoch": 2.3270440251572326, "percentage": 11.64, "elapsed_time": "0:11:16", "remaining_time": "1:25:35", "throughput": 4269.85, "total_tokens": 2887408} {"current_steps": 4445, "total_steps": 38160, "loss": 0.2889, "lr": 0.0009991752205048597, "epoch": 2.329664570230608, "percentage": 11.65, "elapsed_time": "0:11:17", "remaining_time": "1:25:37", "throughput": 4271.39, "total_tokens": 2892912} {"current_steps": 4450, "total_steps": 38160, "loss": 0.5234, "lr": 0.0009991620384749058, "epoch": 2.3322851153039834, "percentage": 11.66, "elapsed_time": "0:11:17", "remaining_time": "1:25:35", "throughput": 4271.18, "total_tokens": 2895504} {"current_steps": 4455, "total_steps": 38160, "loss": 0.5843, "lr": 0.0009991487520259479, "epoch": 2.3349056603773586, "percentage": 11.67, "elapsed_time": "0:11:18", "remaining_time": "1:25:35", "throughput": 4272.38, "total_tokens": 2900208} {"current_steps": 4460, "total_steps": 38160, "loss": 0.403, "lr": 0.000999135361160766, "epoch": 2.3375262054507338, "percentage": 11.69, "elapsed_time": "0:11:19", "remaining_time": "1:25:34", "throughput": 4272.68, "total_tokens": 2903568} {"current_steps": 4465, "total_steps": 38160, "loss": 0.5729, "lr": 0.0009991218658821608, "epoch": 2.340146750524109, "percentage": 11.7, "elapsed_time": "0:11:20", "remaining_time": "1:25:33", "throughput": 4272.91, "total_tokens": 2906864} {"current_steps": 4470, "total_steps": 38160, "loss": 0.4312, "lr": 0.0009991082661929556, "epoch": 2.342767295597484, "percentage": 11.71, "elapsed_time": "0:11:21", "remaining_time": "1:25:33", "throughput": 4273.41, "total_tokens": 2910480} {"current_steps": 4475, "total_steps": 38160, "loss": 0.4303, "lr": 0.000999094562095995, "epoch": 2.3453878406708597, "percentage": 11.73, "elapsed_time": "0:11:21", "remaining_time": "1:25:31", "throughput": 4273.48, "total_tokens": 2913552} {"current_steps": 4480, "total_steps": 38160, "loss": 0.5476, "lr": 0.0009990807535941461, "epoch": 2.348008385744235, "percentage": 11.74, "elapsed_time": "0:11:22", "remaining_time": "1:25:30", "throughput": 4273.39, "total_tokens": 2916368} {"current_steps": 4485, "total_steps": 38160, "loss": 0.5049, "lr": 0.0009990668406902976, "epoch": 2.35062893081761, "percentage": 11.75, "elapsed_time": "0:11:23", "remaining_time": "1:25:28", "throughput": 4273.19, "total_tokens": 2918960} {"current_steps": 4490, "total_steps": 38160, "loss": 0.4902, "lr": 0.0009990528233873594, "epoch": 2.353249475890985, "percentage": 11.77, "elapsed_time": "0:11:23", "remaining_time": "1:25:28", "throughput": 4273.72, "total_tokens": 2922768} {"current_steps": 4495, "total_steps": 38160, "loss": 0.5043, "lr": 0.0009990387016882642, "epoch": 2.3558700209643604, "percentage": 11.78, "elapsed_time": "0:11:24", "remaining_time": "1:25:27", "throughput": 4273.83, "total_tokens": 2925840} {"current_steps": 4500, "total_steps": 38160, "loss": 0.4153, "lr": 0.000999024475595966, "epoch": 2.358490566037736, "percentage": 11.79, "elapsed_time": "0:11:25", "remaining_time": "1:25:26", "throughput": 4274.01, "total_tokens": 2929008} {"current_steps": 4505, "total_steps": 38160, "loss": 0.4942, "lr": 0.0009990101451134406, "epoch": 2.361111111111111, "percentage": 11.81, "elapsed_time": "0:11:25", "remaining_time": "1:25:24", "throughput": 4273.74, "total_tokens": 2931632} {"current_steps": 4510, "total_steps": 38160, "loss": 0.558, "lr": 0.0009989957102436858, "epoch": 2.3637316561844863, "percentage": 11.82, "elapsed_time": "0:11:26", "remaining_time": "1:25:24", "throughput": 4274.6, "total_tokens": 2935824} {"current_steps": 4515, "total_steps": 38160, "loss": 0.3717, "lr": 0.0009989811709897212, "epoch": 2.3663522012578615, "percentage": 11.83, "elapsed_time": "0:11:27", "remaining_time": "1:25:23", "throughput": 4274.6, "total_tokens": 2938832} {"current_steps": 4520, "total_steps": 38160, "loss": 0.4439, "lr": 0.0009989665273545884, "epoch": 2.368972746331237, "percentage": 11.84, "elapsed_time": "0:11:28", "remaining_time": "1:25:22", "throughput": 4274.8, "total_tokens": 2942096} {"current_steps": 4525, "total_steps": 38160, "loss": 0.4734, "lr": 0.0009989517793413507, "epoch": 2.3715932914046123, "percentage": 11.86, "elapsed_time": "0:11:29", "remaining_time": "1:25:21", "throughput": 4275.37, "total_tokens": 2945968} {"current_steps": 4530, "total_steps": 38160, "loss": 0.5304, "lr": 0.000998936926953093, "epoch": 2.3742138364779874, "percentage": 11.87, "elapsed_time": "0:11:29", "remaining_time": "1:25:21", "throughput": 4275.71, "total_tokens": 2949456} {"current_steps": 4535, "total_steps": 38160, "loss": 0.4956, "lr": 0.0009989219701929224, "epoch": 2.3768343815513626, "percentage": 11.88, "elapsed_time": "0:11:30", "remaining_time": "1:25:20", "throughput": 4275.79, "total_tokens": 2952592} {"current_steps": 4540, "total_steps": 38160, "loss": 0.3549, "lr": 0.0009989069090639675, "epoch": 2.379454926624738, "percentage": 11.9, "elapsed_time": "0:11:31", "remaining_time": "1:25:18", "throughput": 4275.92, "total_tokens": 2955760} {"current_steps": 4545, "total_steps": 38160, "loss": 0.2994, "lr": 0.0009988917435693793, "epoch": 2.3820754716981134, "percentage": 11.91, "elapsed_time": "0:11:31", "remaining_time": "1:25:17", "throughput": 4275.96, "total_tokens": 2958768} {"current_steps": 4550, "total_steps": 38160, "loss": 0.394, "lr": 0.0009988764737123297, "epoch": 2.3846960167714886, "percentage": 11.92, "elapsed_time": "0:11:32", "remaining_time": "1:25:16", "throughput": 4275.83, "total_tokens": 2961552} {"current_steps": 4555, "total_steps": 38160, "loss": 0.4398, "lr": 0.0009988610994960134, "epoch": 2.3873165618448637, "percentage": 11.94, "elapsed_time": "0:11:33", "remaining_time": "1:25:15", "throughput": 4275.78, "total_tokens": 2964464} {"current_steps": 4560, "total_steps": 38160, "loss": 0.525, "lr": 0.0009988456209236464, "epoch": 2.389937106918239, "percentage": 11.95, "elapsed_time": "0:11:33", "remaining_time": "1:25:13", "throughput": 4275.38, "total_tokens": 2966832} {"current_steps": 4565, "total_steps": 38160, "loss": 0.47, "lr": 0.0009988300379984668, "epoch": 2.392557651991614, "percentage": 11.96, "elapsed_time": "0:11:34", "remaining_time": "1:25:12", "throughput": 4275.48, "total_tokens": 2969968} {"current_steps": 4570, "total_steps": 38160, "loss": 0.4392, "lr": 0.0009988143507237341, "epoch": 2.3951781970649897, "percentage": 11.98, "elapsed_time": "0:11:35", "remaining_time": "1:25:11", "throughput": 4275.49, "total_tokens": 2973040} {"current_steps": 4575, "total_steps": 38160, "loss": 0.5265, "lr": 0.00099879855910273, "epoch": 2.397798742138365, "percentage": 11.99, "elapsed_time": "0:11:36", "remaining_time": "1:25:11", "throughput": 4276.57, "total_tokens": 2977520} {"current_steps": 4580, "total_steps": 38160, "loss": 0.4019, "lr": 0.0009987826631387578, "epoch": 2.40041928721174, "percentage": 12.0, "elapsed_time": "0:11:36", "remaining_time": "1:25:10", "throughput": 4276.83, "total_tokens": 2980880} {"current_steps": 4585, "total_steps": 38160, "loss": 0.6019, "lr": 0.000998766662835143, "epoch": 2.403039832285115, "percentage": 12.02, "elapsed_time": "0:11:37", "remaining_time": "1:25:08", "throughput": 4276.74, "total_tokens": 2983632} {"current_steps": 4590, "total_steps": 38160, "loss": 0.4581, "lr": 0.0009987505581952325, "epoch": 2.4056603773584904, "percentage": 12.03, "elapsed_time": "0:11:38", "remaining_time": "1:25:07", "throughput": 4276.54, "total_tokens": 2986256} {"current_steps": 4595, "total_steps": 38160, "loss": 0.4396, "lr": 0.0009987343492223954, "epoch": 2.408280922431866, "percentage": 12.04, "elapsed_time": "0:11:39", "remaining_time": "1:25:07", "throughput": 4277.8, "total_tokens": 2991056} {"current_steps": 4600, "total_steps": 38160, "loss": 0.3692, "lr": 0.0009987180359200222, "epoch": 2.410901467505241, "percentage": 12.05, "elapsed_time": "0:11:39", "remaining_time": "1:25:06", "throughput": 4278.02, "total_tokens": 2994320} {"current_steps": 4605, "total_steps": 38160, "loss": 0.4061, "lr": 0.0009987016182915257, "epoch": 2.4135220125786163, "percentage": 12.07, "elapsed_time": "0:11:40", "remaining_time": "1:25:05", "throughput": 4277.9, "total_tokens": 2997104} {"current_steps": 4610, "total_steps": 38160, "loss": 0.4986, "lr": 0.0009986850963403398, "epoch": 2.4161425576519915, "percentage": 12.08, "elapsed_time": "0:11:41", "remaining_time": "1:25:03", "throughput": 4277.93, "total_tokens": 3000112} {"current_steps": 4615, "total_steps": 38160, "loss": 0.4438, "lr": 0.0009986684700699214, "epoch": 2.418763102725367, "percentage": 12.09, "elapsed_time": "0:11:42", "remaining_time": "1:25:03", "throughput": 4278.24, "total_tokens": 3003568} {"current_steps": 4620, "total_steps": 38160, "loss": 0.4113, "lr": 0.000998651739483748, "epoch": 2.4213836477987423, "percentage": 12.11, "elapsed_time": "0:11:42", "remaining_time": "1:25:02", "throughput": 4278.99, "total_tokens": 3007696} {"current_steps": 4625, "total_steps": 38160, "loss": 0.5354, "lr": 0.0009986349045853196, "epoch": 2.4240041928721174, "percentage": 12.12, "elapsed_time": "0:11:43", "remaining_time": "1:25:02", "throughput": 4279.54, "total_tokens": 3011472} {"current_steps": 4630, "total_steps": 38160, "loss": 0.4428, "lr": 0.000998617965378158, "epoch": 2.4266247379454926, "percentage": 12.13, "elapsed_time": "0:11:44", "remaining_time": "1:25:00", "throughput": 4279.45, "total_tokens": 3014320} {"current_steps": 4635, "total_steps": 38160, "loss": 0.6018, "lr": 0.0009986009218658064, "epoch": 2.4292452830188678, "percentage": 12.15, "elapsed_time": "0:11:45", "remaining_time": "1:25:00", "throughput": 4280.14, "total_tokens": 3018224} {"current_steps": 4640, "total_steps": 38160, "loss": 0.5243, "lr": 0.0009985837740518306, "epoch": 2.431865828092243, "percentage": 12.16, "elapsed_time": "0:11:45", "remaining_time": "1:24:59", "throughput": 4280.02, "total_tokens": 3021072} {"current_steps": 4645, "total_steps": 38160, "loss": 0.3662, "lr": 0.0009985665219398173, "epoch": 2.4344863731656186, "percentage": 12.17, "elapsed_time": "0:11:46", "remaining_time": "1:24:57", "throughput": 4279.67, "total_tokens": 3023600} {"current_steps": 4650, "total_steps": 38160, "loss": 0.4896, "lr": 0.0009985491655333755, "epoch": 2.4371069182389937, "percentage": 12.19, "elapsed_time": "0:11:47", "remaining_time": "1:24:56", "throughput": 4279.77, "total_tokens": 3026768} {"current_steps": 4655, "total_steps": 38160, "loss": 0.5012, "lr": 0.000998531704836136, "epoch": 2.439727463312369, "percentage": 12.2, "elapsed_time": "0:11:48", "remaining_time": "1:24:59", "throughput": 4281.79, "total_tokens": 3033424} {"current_steps": 4660, "total_steps": 38160, "loss": 0.4783, "lr": 0.0009985141398517513, "epoch": 2.442348008385744, "percentage": 12.21, "elapsed_time": "0:11:49", "remaining_time": "1:24:57", "throughput": 4281.45, "total_tokens": 3035952} {"current_steps": 4665, "total_steps": 38160, "loss": 0.4844, "lr": 0.000998496470583896, "epoch": 2.4449685534591197, "percentage": 12.22, "elapsed_time": "0:11:49", "remaining_time": "1:24:56", "throughput": 4281.61, "total_tokens": 3039216} {"current_steps": 4670, "total_steps": 38160, "loss": 0.7001, "lr": 0.0009984786970362663, "epoch": 2.447589098532495, "percentage": 12.24, "elapsed_time": "0:11:50", "remaining_time": "1:24:55", "throughput": 4281.69, "total_tokens": 3042224} {"current_steps": 4675, "total_steps": 38160, "loss": 0.4197, "lr": 0.00099846081921258, "epoch": 2.45020964360587, "percentage": 12.25, "elapsed_time": "0:11:51", "remaining_time": "1:24:53", "throughput": 4281.39, "total_tokens": 3044752} {"current_steps": 4680, "total_steps": 38160, "loss": 0.5594, "lr": 0.000998442837116577, "epoch": 2.452830188679245, "percentage": 12.26, "elapsed_time": "0:11:51", "remaining_time": "1:24:53", "throughput": 4281.74, "total_tokens": 3048336} {"current_steps": 4685, "total_steps": 38160, "loss": 0.4458, "lr": 0.0009984247507520193, "epoch": 2.4554507337526204, "percentage": 12.28, "elapsed_time": "0:11:52", "remaining_time": "1:24:51", "throughput": 4281.47, "total_tokens": 3050864} {"current_steps": 4690, "total_steps": 38160, "loss": 0.4659, "lr": 0.0009984065601226896, "epoch": 2.458071278825996, "percentage": 12.29, "elapsed_time": "0:11:53", "remaining_time": "1:24:50", "throughput": 4281.38, "total_tokens": 3053712} {"current_steps": 4695, "total_steps": 38160, "loss": 0.6641, "lr": 0.0009983882652323942, "epoch": 2.460691823899371, "percentage": 12.3, "elapsed_time": "0:11:53", "remaining_time": "1:24:49", "throughput": 4281.58, "total_tokens": 3056944} {"current_steps": 4700, "total_steps": 38160, "loss": 0.5122, "lr": 0.0009983698660849592, "epoch": 2.4633123689727463, "percentage": 12.32, "elapsed_time": "0:11:54", "remaining_time": "1:24:48", "throughput": 4281.76, "total_tokens": 3060176} {"current_steps": 4705, "total_steps": 38160, "loss": 0.7305, "lr": 0.0009983513626842342, "epoch": 2.4659329140461215, "percentage": 12.33, "elapsed_time": "0:11:55", "remaining_time": "1:24:46", "throughput": 4281.24, "total_tokens": 3062352} {"current_steps": 4710, "total_steps": 38160, "loss": 0.4793, "lr": 0.0009983327550340893, "epoch": 2.468553459119497, "percentage": 12.34, "elapsed_time": "0:11:55", "remaining_time": "1:24:44", "throughput": 4280.97, "total_tokens": 3064848} {"current_steps": 4715, "total_steps": 38160, "loss": 0.5454, "lr": 0.0009983140431384177, "epoch": 2.4711740041928723, "percentage": 12.36, "elapsed_time": "0:11:56", "remaining_time": "1:24:43", "throughput": 4281.3, "total_tokens": 3068368} {"current_steps": 4720, "total_steps": 38160, "loss": 0.6006, "lr": 0.0009982952270011331, "epoch": 2.4737945492662474, "percentage": 12.37, "elapsed_time": "0:11:57", "remaining_time": "1:24:42", "throughput": 4281.47, "total_tokens": 3071536} {"current_steps": 4725, "total_steps": 38160, "loss": 0.3713, "lr": 0.000998276306626172, "epoch": 2.4764150943396226, "percentage": 12.38, "elapsed_time": "0:11:58", "remaining_time": "1:24:41", "throughput": 4281.34, "total_tokens": 3074224} {"current_steps": 4730, "total_steps": 38160, "loss": 0.5426, "lr": 0.000998257282017492, "epoch": 2.4790356394129978, "percentage": 12.4, "elapsed_time": "0:11:58", "remaining_time": "1:24:40", "throughput": 4281.77, "total_tokens": 3077744} {"current_steps": 4735, "total_steps": 38160, "loss": 0.5018, "lr": 0.0009982381531790732, "epoch": 2.481656184486373, "percentage": 12.41, "elapsed_time": "0:11:59", "remaining_time": "1:24:38", "throughput": 4281.73, "total_tokens": 3080656} {"current_steps": 4740, "total_steps": 38160, "loss": 0.4918, "lr": 0.0009982189201149167, "epoch": 2.4842767295597485, "percentage": 12.42, "elapsed_time": "0:12:00", "remaining_time": "1:24:38", "throughput": 4282.26, "total_tokens": 3084624} {"current_steps": 4745, "total_steps": 38160, "loss": 0.4389, "lr": 0.0009981995828290465, "epoch": 2.4868972746331237, "percentage": 12.43, "elapsed_time": "0:12:01", "remaining_time": "1:24:37", "throughput": 4282.42, "total_tokens": 3087760} {"current_steps": 4750, "total_steps": 38160, "loss": 0.51, "lr": 0.0009981801413255068, "epoch": 2.489517819706499, "percentage": 12.45, "elapsed_time": "0:12:01", "remaining_time": "1:24:36", "throughput": 4282.92, "total_tokens": 3091440} {"current_steps": 4755, "total_steps": 38160, "loss": 0.4885, "lr": 0.0009981605956083657, "epoch": 2.492138364779874, "percentage": 12.46, "elapsed_time": "0:12:02", "remaining_time": "1:24:35", "throughput": 4282.79, "total_tokens": 3094192} {"current_steps": 4760, "total_steps": 38160, "loss": 0.4191, "lr": 0.000998140945681711, "epoch": 2.4947589098532497, "percentage": 12.47, "elapsed_time": "0:12:03", "remaining_time": "1:24:34", "throughput": 4283.08, "total_tokens": 3097584} {"current_steps": 4765, "total_steps": 38160, "loss": 0.4948, "lr": 0.0009981211915496536, "epoch": 2.497379454926625, "percentage": 12.49, "elapsed_time": "0:12:03", "remaining_time": "1:24:34", "throughput": 4283.52, "total_tokens": 3101232} {"current_steps": 4770, "total_steps": 38160, "loss": 0.3329, "lr": 0.0009981013332163256, "epoch": 2.5, "percentage": 12.5, "elapsed_time": "0:12:04", "remaining_time": "1:24:32", "throughput": 4283.28, "total_tokens": 3103888} {"current_steps": 4775, "total_steps": 38160, "loss": 0.3867, "lr": 0.0009980813706858816, "epoch": 2.502620545073375, "percentage": 12.51, "elapsed_time": "0:12:05", "remaining_time": "1:24:35", "throughput": 4285.8, "total_tokens": 3111408} {"current_steps": 4780, "total_steps": 38160, "loss": 0.406, "lr": 0.000998061303962497, "epoch": 2.5052410901467503, "percentage": 12.53, "elapsed_time": "0:12:06", "remaining_time": "1:24:34", "throughput": 4285.8, "total_tokens": 3114288} {"current_steps": 4785, "total_steps": 38160, "loss": 0.5473, "lr": 0.00099804113305037, "epoch": 2.507861635220126, "percentage": 12.54, "elapsed_time": "0:12:07", "remaining_time": "1:24:33", "throughput": 4285.88, "total_tokens": 3117296} {"current_steps": 4790, "total_steps": 38160, "loss": 0.3556, "lr": 0.0009980208579537199, "epoch": 2.510482180293501, "percentage": 12.55, "elapsed_time": "0:12:07", "remaining_time": "1:24:31", "throughput": 4285.57, "total_tokens": 3119792} {"current_steps": 4795, "total_steps": 38160, "loss": 0.5445, "lr": 0.000998000478676788, "epoch": 2.5131027253668763, "percentage": 12.57, "elapsed_time": "0:12:08", "remaining_time": "1:24:30", "throughput": 4285.45, "total_tokens": 3122544} {"current_steps": 4800, "total_steps": 38160, "loss": 0.4258, "lr": 0.0009979799952238373, "epoch": 2.5157232704402515, "percentage": 12.58, "elapsed_time": "0:12:09", "remaining_time": "1:24:28", "throughput": 4285.58, "total_tokens": 3125648} {"current_steps": 4805, "total_steps": 38160, "loss": 0.4371, "lr": 0.000997959407599153, "epoch": 2.518343815513627, "percentage": 12.59, "elapsed_time": "0:12:10", "remaining_time": "1:24:27", "throughput": 4285.43, "total_tokens": 3128400} {"current_steps": 4810, "total_steps": 38160, "loss": 0.4276, "lr": 0.000997938715807042, "epoch": 2.5209643605870022, "percentage": 12.6, "elapsed_time": "0:12:10", "remaining_time": "1:24:26", "throughput": 4285.38, "total_tokens": 3131280} {"current_steps": 4815, "total_steps": 38160, "loss": 0.506, "lr": 0.000997917919851832, "epoch": 2.5235849056603774, "percentage": 12.62, "elapsed_time": "0:12:11", "remaining_time": "1:24:24", "throughput": 4285.43, "total_tokens": 3134288} {"current_steps": 4820, "total_steps": 38160, "loss": 0.5153, "lr": 0.0009978970197378736, "epoch": 2.5262054507337526, "percentage": 12.63, "elapsed_time": "0:12:12", "remaining_time": "1:24:23", "throughput": 4285.14, "total_tokens": 3136784} {"current_steps": 4825, "total_steps": 38160, "loss": 0.5077, "lr": 0.0009978760154695392, "epoch": 2.5288259958071277, "percentage": 12.64, "elapsed_time": "0:12:12", "remaining_time": "1:24:22", "throughput": 4285.05, "total_tokens": 3139664} {"current_steps": 4830, "total_steps": 38160, "loss": 0.7152, "lr": 0.0009978549070512226, "epoch": 2.531446540880503, "percentage": 12.66, "elapsed_time": "0:12:13", "remaining_time": "1:24:21", "throughput": 4285.28, "total_tokens": 3142896} {"current_steps": 4835, "total_steps": 38160, "loss": 0.5313, "lr": 0.000997833694487339, "epoch": 2.5340670859538785, "percentage": 12.67, "elapsed_time": "0:12:14", "remaining_time": "1:24:20", "throughput": 4285.56, "total_tokens": 3146224} {"current_steps": 4840, "total_steps": 38160, "loss": 0.5414, "lr": 0.0009978123777823263, "epoch": 2.5366876310272537, "percentage": 12.68, "elapsed_time": "0:12:14", "remaining_time": "1:24:18", "throughput": 4285.5, "total_tokens": 3149136} {"current_steps": 4845, "total_steps": 38160, "loss": 0.5157, "lr": 0.0009977909569406434, "epoch": 2.539308176100629, "percentage": 12.7, "elapsed_time": "0:12:15", "remaining_time": "1:24:17", "throughput": 4285.45, "total_tokens": 3151984} {"current_steps": 4850, "total_steps": 38160, "loss": 0.5451, "lr": 0.0009977694319667713, "epoch": 2.541928721174004, "percentage": 12.71, "elapsed_time": "0:12:16", "remaining_time": "1:24:16", "throughput": 4285.77, "total_tokens": 3155440} {"current_steps": 4855, "total_steps": 38160, "loss": 0.3719, "lr": 0.0009977478028652131, "epoch": 2.5445492662473796, "percentage": 12.72, "elapsed_time": "0:12:17", "remaining_time": "1:24:16", "throughput": 4286.29, "total_tokens": 3159216} {"current_steps": 4860, "total_steps": 38160, "loss": 0.594, "lr": 0.000997726069640493, "epoch": 2.547169811320755, "percentage": 12.74, "elapsed_time": "0:12:17", "remaining_time": "1:24:15", "throughput": 4286.58, "total_tokens": 3162640} {"current_steps": 4865, "total_steps": 38160, "loss": 0.4393, "lr": 0.0009977042322971577, "epoch": 2.54979035639413, "percentage": 12.75, "elapsed_time": "0:12:18", "remaining_time": "1:24:14", "throughput": 4286.86, "total_tokens": 3165968} {"current_steps": 4870, "total_steps": 38160, "loss": 0.4271, "lr": 0.000997682290839775, "epoch": 2.552410901467505, "percentage": 12.76, "elapsed_time": "0:12:19", "remaining_time": "1:24:12", "throughput": 4286.73, "total_tokens": 3168688} {"current_steps": 4875, "total_steps": 38160, "loss": 0.5711, "lr": 0.0009976602452729348, "epoch": 2.5550314465408803, "percentage": 12.78, "elapsed_time": "0:12:19", "remaining_time": "1:24:12", "throughput": 4287.23, "total_tokens": 3172400} {"current_steps": 4880, "total_steps": 38160, "loss": 0.5878, "lr": 0.000997638095601249, "epoch": 2.5576519916142555, "percentage": 12.79, "elapsed_time": "0:12:20", "remaining_time": "1:24:11", "throughput": 4287.27, "total_tokens": 3175472} {"current_steps": 4885, "total_steps": 38160, "loss": 0.7429, "lr": 0.000997615841829351, "epoch": 2.560272536687631, "percentage": 12.8, "elapsed_time": "0:12:21", "remaining_time": "1:24:09", "throughput": 4286.98, "total_tokens": 3178032} {"current_steps": 4890, "total_steps": 38160, "loss": 0.3668, "lr": 0.000997593483961896, "epoch": 2.5628930817610063, "percentage": 12.81, "elapsed_time": "0:12:22", "remaining_time": "1:24:09", "throughput": 4287.49, "total_tokens": 3181744} {"current_steps": 4895, "total_steps": 38160, "loss": 0.4541, "lr": 0.0009975710220035607, "epoch": 2.5655136268343814, "percentage": 12.83, "elapsed_time": "0:12:22", "remaining_time": "1:24:07", "throughput": 4287.47, "total_tokens": 3184656} {"current_steps": 4900, "total_steps": 38160, "loss": 0.4705, "lr": 0.0009975484559590444, "epoch": 2.568134171907757, "percentage": 12.84, "elapsed_time": "0:12:23", "remaining_time": "1:24:06", "throughput": 4287.4, "total_tokens": 3187504} {"current_steps": 4905, "total_steps": 38160, "loss": 0.5153, "lr": 0.0009975257858330674, "epoch": 2.5707547169811322, "percentage": 12.85, "elapsed_time": "0:12:24", "remaining_time": "1:24:05", "throughput": 4287.51, "total_tokens": 3190608} {"current_steps": 4910, "total_steps": 38160, "loss": 0.5102, "lr": 0.0009975030116303723, "epoch": 2.5733752620545074, "percentage": 12.87, "elapsed_time": "0:12:24", "remaining_time": "1:24:04", "throughput": 4287.58, "total_tokens": 3193584} {"current_steps": 4915, "total_steps": 38160, "loss": 0.6332, "lr": 0.0009974801333557228, "epoch": 2.5759958071278826, "percentage": 12.88, "elapsed_time": "0:12:25", "remaining_time": "1:24:03", "throughput": 4288.12, "total_tokens": 3197488} {"current_steps": 4920, "total_steps": 38160, "loss": 0.5743, "lr": 0.000997457151013905, "epoch": 2.5786163522012577, "percentage": 12.89, "elapsed_time": "0:12:26", "remaining_time": "1:24:02", "throughput": 4288.24, "total_tokens": 3200592} {"current_steps": 4925, "total_steps": 38160, "loss": 0.4663, "lr": 0.0009974340646097264, "epoch": 2.581236897274633, "percentage": 12.91, "elapsed_time": "0:12:27", "remaining_time": "1:24:01", "throughput": 4288.66, "total_tokens": 3204208} {"current_steps": 4930, "total_steps": 38160, "loss": 0.5792, "lr": 0.0009974108741480166, "epoch": 2.5838574423480085, "percentage": 12.92, "elapsed_time": "0:12:27", "remaining_time": "1:24:01", "throughput": 4289.18, "total_tokens": 3208048} {"current_steps": 4935, "total_steps": 38160, "loss": 0.4394, "lr": 0.0009973875796336267, "epoch": 2.5864779874213837, "percentage": 12.93, "elapsed_time": "0:12:28", "remaining_time": "1:23:59", "throughput": 4288.93, "total_tokens": 3210576} {"current_steps": 4940, "total_steps": 38160, "loss": 0.3826, "lr": 0.0009973641810714295, "epoch": 2.589098532494759, "percentage": 12.95, "elapsed_time": "0:12:29", "remaining_time": "1:23:58", "throughput": 4289.05, "total_tokens": 3213648} {"current_steps": 4945, "total_steps": 38160, "loss": 0.6814, "lr": 0.00099734067846632, "epoch": 2.591719077568134, "percentage": 12.96, "elapsed_time": "0:12:29", "remaining_time": "1:23:57", "throughput": 4289.1, "total_tokens": 3216592} {"current_steps": 4950, "total_steps": 38160, "loss": 0.4692, "lr": 0.0009973170718232144, "epoch": 2.5943396226415096, "percentage": 12.97, "elapsed_time": "0:12:30", "remaining_time": "1:23:56", "throughput": 4289.24, "total_tokens": 3219760} {"current_steps": 4955, "total_steps": 38160, "loss": 0.694, "lr": 0.000997293361147051, "epoch": 2.596960167714885, "percentage": 12.98, "elapsed_time": "0:12:31", "remaining_time": "1:23:55", "throughput": 4289.86, "total_tokens": 3223600} {"current_steps": 4960, "total_steps": 38160, "loss": 0.5992, "lr": 0.0009972695464427904, "epoch": 2.59958071278826, "percentage": 13.0, "elapsed_time": "0:12:32", "remaining_time": "1:23:54", "throughput": 4289.76, "total_tokens": 3226416} {"current_steps": 4965, "total_steps": 38160, "loss": 0.3971, "lr": 0.0009972456277154134, "epoch": 2.602201257861635, "percentage": 13.01, "elapsed_time": "0:12:32", "remaining_time": "1:23:53", "throughput": 4290.27, "total_tokens": 3230288} {"current_steps": 4970, "total_steps": 38160, "loss": 0.5174, "lr": 0.000997221604969924, "epoch": 2.6048218029350103, "percentage": 13.02, "elapsed_time": "0:12:33", "remaining_time": "1:23:52", "throughput": 4290.22, "total_tokens": 3233104} {"current_steps": 4975, "total_steps": 38160, "loss": 0.5211, "lr": 0.0009971974782113475, "epoch": 2.6074423480083855, "percentage": 13.04, "elapsed_time": "0:12:34", "remaining_time": "1:23:52", "throughput": 4291.29, "total_tokens": 3237872} {"current_steps": 4980, "total_steps": 38160, "loss": 0.4539, "lr": 0.0009971732474447308, "epoch": 2.610062893081761, "percentage": 13.05, "elapsed_time": "0:12:35", "remaining_time": "1:23:52", "throughput": 4292.09, "total_tokens": 3242064} {"current_steps": 4985, "total_steps": 38160, "loss": 0.4767, "lr": 0.0009971489126751427, "epoch": 2.6126834381551363, "percentage": 13.06, "elapsed_time": "0:12:36", "remaining_time": "1:23:52", "throughput": 4292.52, "total_tokens": 3245712} {"current_steps": 4990, "total_steps": 38160, "loss": 0.4936, "lr": 0.0009971244739076742, "epoch": 2.6153039832285114, "percentage": 13.08, "elapsed_time": "0:12:36", "remaining_time": "1:23:50", "throughput": 4292.45, "total_tokens": 3248560} {"current_steps": 4995, "total_steps": 38160, "loss": 0.4937, "lr": 0.000997099931147437, "epoch": 2.617924528301887, "percentage": 13.09, "elapsed_time": "0:12:37", "remaining_time": "1:23:49", "throughput": 4292.44, "total_tokens": 3251440} {"current_steps": 5000, "total_steps": 38160, "loss": 0.4671, "lr": 0.0009970752843995654, "epoch": 2.620545073375262, "percentage": 13.1, "elapsed_time": "0:12:38", "remaining_time": "1:23:48", "throughput": 4292.59, "total_tokens": 3254640} {"current_steps": 5005, "total_steps": 38160, "loss": 0.4113, "lr": 0.0009970505336692153, "epoch": 2.6231656184486374, "percentage": 13.12, "elapsed_time": "0:12:38", "remaining_time": "1:23:47", "throughput": 4293.02, "total_tokens": 3258320} {"current_steps": 5010, "total_steps": 38160, "loss": 0.4355, "lr": 0.0009970256789615642, "epoch": 2.6257861635220126, "percentage": 13.13, "elapsed_time": "0:12:39", "remaining_time": "1:23:46", "throughput": 4292.95, "total_tokens": 3261168} {"current_steps": 5015, "total_steps": 38160, "loss": 0.5616, "lr": 0.0009970007202818115, "epoch": 2.6284067085953877, "percentage": 13.14, "elapsed_time": "0:12:40", "remaining_time": "1:23:45", "throughput": 4293.39, "total_tokens": 3264816} {"current_steps": 5020, "total_steps": 38160, "loss": 0.3743, "lr": 0.000996975657635178, "epoch": 2.631027253668763, "percentage": 13.16, "elapsed_time": "0:12:41", "remaining_time": "1:23:44", "throughput": 4293.57, "total_tokens": 3268080} {"current_steps": 5025, "total_steps": 38160, "loss": 0.5196, "lr": 0.000996950491026907, "epoch": 2.6336477987421385, "percentage": 13.17, "elapsed_time": "0:12:42", "remaining_time": "1:23:44", "throughput": 4294.47, "total_tokens": 3272528} {"current_steps": 5030, "total_steps": 38160, "loss": 0.5071, "lr": 0.0009969252204622624, "epoch": 2.6362683438155137, "percentage": 13.18, "elapsed_time": "0:12:42", "remaining_time": "1:23:43", "throughput": 4294.72, "total_tokens": 3275888} {"current_steps": 5035, "total_steps": 38160, "loss": 0.4195, "lr": 0.0009968998459465312, "epoch": 2.638888888888889, "percentage": 13.19, "elapsed_time": "0:12:43", "remaining_time": "1:23:44", "throughput": 4295.92, "total_tokens": 3281072} {"current_steps": 5040, "total_steps": 38160, "loss": 0.4925, "lr": 0.0009968743674850212, "epoch": 2.641509433962264, "percentage": 13.21, "elapsed_time": "0:12:44", "remaining_time": "1:23:45", "throughput": 4296.99, "total_tokens": 3285808} {"current_steps": 5045, "total_steps": 38160, "loss": 0.4312, "lr": 0.0009968487850830622, "epoch": 2.6441299790356396, "percentage": 13.22, "elapsed_time": "0:12:45", "remaining_time": "1:23:44", "throughput": 4297.18, "total_tokens": 3289168} {"current_steps": 5050, "total_steps": 38160, "loss": 0.6515, "lr": 0.0009968230987460055, "epoch": 2.646750524109015, "percentage": 13.23, "elapsed_time": "0:12:46", "remaining_time": "1:23:43", "throughput": 4297.31, "total_tokens": 3292336} {"current_steps": 5055, "total_steps": 38160, "loss": 0.4366, "lr": 0.0009967973084792246, "epoch": 2.64937106918239, "percentage": 13.25, "elapsed_time": "0:12:46", "remaining_time": "1:23:41", "throughput": 4297.19, "total_tokens": 3295024} {"current_steps": 5060, "total_steps": 38160, "loss": 0.6597, "lr": 0.0009967714142881145, "epoch": 2.651991614255765, "percentage": 13.26, "elapsed_time": "0:12:47", "remaining_time": "1:23:40", "throughput": 4297.06, "total_tokens": 3297776} {"current_steps": 5065, "total_steps": 38160, "loss": 0.3878, "lr": 0.0009967454161780923, "epoch": 2.6546121593291403, "percentage": 13.27, "elapsed_time": "0:12:48", "remaining_time": "1:23:38", "throughput": 4296.97, "total_tokens": 3300560} {"current_steps": 5070, "total_steps": 38160, "loss": 0.4905, "lr": 0.000996719314154596, "epoch": 2.6572327044025155, "percentage": 13.29, "elapsed_time": "0:12:48", "remaining_time": "1:23:38", "throughput": 4297.49, "total_tokens": 3304432} {"current_steps": 5075, "total_steps": 38160, "loss": 0.4738, "lr": 0.0009966931082230862, "epoch": 2.659853249475891, "percentage": 13.3, "elapsed_time": "0:12:49", "remaining_time": "1:23:37", "throughput": 4297.48, "total_tokens": 3307344} {"current_steps": 5080, "total_steps": 38160, "loss": 0.5092, "lr": 0.0009966667983890445, "epoch": 2.6624737945492662, "percentage": 13.31, "elapsed_time": "0:12:50", "remaining_time": "1:23:36", "throughput": 4297.92, "total_tokens": 3311056} {"current_steps": 5085, "total_steps": 38160, "loss": 0.4777, "lr": 0.000996640384657975, "epoch": 2.6650943396226414, "percentage": 13.33, "elapsed_time": "0:12:51", "remaining_time": "1:23:35", "throughput": 4297.74, "total_tokens": 3313712} {"current_steps": 5090, "total_steps": 38160, "loss": 0.4607, "lr": 0.0009966138670354028, "epoch": 2.667714884696017, "percentage": 13.34, "elapsed_time": "0:12:51", "remaining_time": "1:23:34", "throughput": 4298.08, "total_tokens": 3317232} {"current_steps": 5095, "total_steps": 38160, "loss": 0.617, "lr": 0.0009965872455268755, "epoch": 2.670335429769392, "percentage": 13.35, "elapsed_time": "0:12:52", "remaining_time": "1:23:33", "throughput": 4298.03, "total_tokens": 3320048} {"current_steps": 5100, "total_steps": 38160, "loss": 0.4534, "lr": 0.0009965605201379616, "epoch": 2.6729559748427674, "percentage": 13.36, "elapsed_time": "0:12:53", "remaining_time": "1:23:33", "throughput": 4298.96, "total_tokens": 3324720} {"current_steps": 5105, "total_steps": 38160, "loss": 0.4666, "lr": 0.000996533690874252, "epoch": 2.6755765199161425, "percentage": 13.38, "elapsed_time": "0:12:54", "remaining_time": "1:23:32", "throughput": 4298.97, "total_tokens": 3327696} {"current_steps": 5110, "total_steps": 38160, "loss": 0.3645, "lr": 0.0009965067577413593, "epoch": 2.6781970649895177, "percentage": 13.39, "elapsed_time": "0:12:54", "remaining_time": "1:23:30", "throughput": 4298.93, "total_tokens": 3330608} {"current_steps": 5115, "total_steps": 38160, "loss": 0.4875, "lr": 0.0009964797207449173, "epoch": 2.680817610062893, "percentage": 13.4, "elapsed_time": "0:12:55", "remaining_time": "1:23:29", "throughput": 4298.77, "total_tokens": 3333296} {"current_steps": 5120, "total_steps": 38160, "loss": 0.4475, "lr": 0.0009964525798905816, "epoch": 2.6834381551362685, "percentage": 13.42, "elapsed_time": "0:12:56", "remaining_time": "1:23:29", "throughput": 4299.56, "total_tokens": 3337552} {"current_steps": 5125, "total_steps": 38160, "loss": 0.4689, "lr": 0.0009964253351840303, "epoch": 2.6860587002096437, "percentage": 13.43, "elapsed_time": "0:12:57", "remaining_time": "1:23:28", "throughput": 4299.98, "total_tokens": 3341296} {"current_steps": 5130, "total_steps": 38160, "loss": 0.5171, "lr": 0.000996397986630962, "epoch": 2.688679245283019, "percentage": 13.44, "elapsed_time": "0:12:57", "remaining_time": "1:23:27", "throughput": 4299.77, "total_tokens": 3343920} {"current_steps": 5135, "total_steps": 38160, "loss": 0.4475, "lr": 0.0009963705342370982, "epoch": 2.691299790356394, "percentage": 13.46, "elapsed_time": "0:12:58", "remaining_time": "1:23:25", "throughput": 4299.69, "total_tokens": 3346736} {"current_steps": 5140, "total_steps": 38160, "loss": 0.4781, "lr": 0.000996342978008182, "epoch": 2.6939203354297696, "percentage": 13.47, "elapsed_time": "0:12:59", "remaining_time": "1:23:25", "throughput": 4300.1, "total_tokens": 3350320} {"current_steps": 5145, "total_steps": 38160, "loss": 0.4297, "lr": 0.000996315317949977, "epoch": 2.6965408805031448, "percentage": 13.48, "elapsed_time": "0:12:59", "remaining_time": "1:23:24", "throughput": 4300.24, "total_tokens": 3353552} {"current_steps": 5150, "total_steps": 38160, "loss": 0.518, "lr": 0.0009962875540682696, "epoch": 2.69916142557652, "percentage": 13.5, "elapsed_time": "0:13:00", "remaining_time": "1:23:23", "throughput": 4300.61, "total_tokens": 3357136} {"current_steps": 5155, "total_steps": 38160, "loss": 0.4417, "lr": 0.0009962596863688682, "epoch": 2.701781970649895, "percentage": 13.51, "elapsed_time": "0:13:01", "remaining_time": "1:23:22", "throughput": 4300.57, "total_tokens": 3360048} {"current_steps": 5160, "total_steps": 38160, "loss": 0.4198, "lr": 0.000996231714857602, "epoch": 2.7044025157232703, "percentage": 13.52, "elapsed_time": "0:13:02", "remaining_time": "1:23:21", "throughput": 4300.73, "total_tokens": 3363280} {"current_steps": 5165, "total_steps": 38160, "loss": 0.6311, "lr": 0.000996203639540322, "epoch": 2.7070230607966455, "percentage": 13.54, "elapsed_time": "0:13:02", "remaining_time": "1:23:19", "throughput": 4300.62, "total_tokens": 3366000} {"current_steps": 5170, "total_steps": 38160, "loss": 0.5092, "lr": 0.0009961754604229018, "epoch": 2.709643605870021, "percentage": 13.55, "elapsed_time": "0:13:03", "remaining_time": "1:23:19", "throughput": 4301.07, "total_tokens": 3369648} {"current_steps": 5175, "total_steps": 38160, "loss": 0.4661, "lr": 0.0009961471775112361, "epoch": 2.7122641509433962, "percentage": 13.56, "elapsed_time": "0:13:04", "remaining_time": "1:23:17", "throughput": 4301.01, "total_tokens": 3372528} {"current_steps": 5180, "total_steps": 38160, "loss": 0.5069, "lr": 0.000996118790811241, "epoch": 2.7148846960167714, "percentage": 13.57, "elapsed_time": "0:13:04", "remaining_time": "1:23:16", "throughput": 4301.14, "total_tokens": 3375728} {"current_steps": 5185, "total_steps": 38160, "loss": 0.435, "lr": 0.0009960903003288551, "epoch": 2.717505241090147, "percentage": 13.59, "elapsed_time": "0:13:05", "remaining_time": "1:23:15", "throughput": 4301.2, "total_tokens": 3378864} {"current_steps": 5190, "total_steps": 38160, "loss": 0.4216, "lr": 0.0009960617060700378, "epoch": 2.720125786163522, "percentage": 13.6, "elapsed_time": "0:13:06", "remaining_time": "1:23:14", "throughput": 4301.3, "total_tokens": 3381936} {"current_steps": 5195, "total_steps": 38160, "loss": 0.527, "lr": 0.000996033008040771, "epoch": 2.7227463312368974, "percentage": 13.61, "elapsed_time": "0:13:06", "remaining_time": "1:23:13", "throughput": 4301.06, "total_tokens": 3384464} {"current_steps": 5200, "total_steps": 38160, "loss": 0.5652, "lr": 0.0009960042062470583, "epoch": 2.7253668763102725, "percentage": 13.63, "elapsed_time": "0:13:07", "remaining_time": "1:23:11", "throughput": 4300.97, "total_tokens": 3387312} {"current_steps": 5205, "total_steps": 38160, "loss": 0.4463, "lr": 0.0009959753006949241, "epoch": 2.7279874213836477, "percentage": 13.64, "elapsed_time": "0:13:08", "remaining_time": "1:23:11", "throughput": 4301.63, "total_tokens": 3391376} {"current_steps": 5210, "total_steps": 38160, "loss": 0.4993, "lr": 0.0009959462913904154, "epoch": 2.730607966457023, "percentage": 13.65, "elapsed_time": "0:13:09", "remaining_time": "1:23:10", "throughput": 4301.63, "total_tokens": 3394352} {"current_steps": 5215, "total_steps": 38160, "loss": 0.54, "lr": 0.0009959171783396007, "epoch": 2.7332285115303985, "percentage": 13.67, "elapsed_time": "0:13:09", "remaining_time": "1:23:09", "throughput": 4301.72, "total_tokens": 3397456} {"current_steps": 5220, "total_steps": 38160, "loss": 0.5499, "lr": 0.00099588796154857, "epoch": 2.7358490566037736, "percentage": 13.68, "elapsed_time": "0:13:10", "remaining_time": "1:23:11", "throughput": 4303.34, "total_tokens": 3403792} {"current_steps": 5225, "total_steps": 38160, "loss": 0.5079, "lr": 0.000995858641023435, "epoch": 2.738469601677149, "percentage": 13.69, "elapsed_time": "0:13:11", "remaining_time": "1:23:10", "throughput": 4303.6, "total_tokens": 3407184} {"current_steps": 5230, "total_steps": 38160, "loss": 0.5329, "lr": 0.0009958292167703293, "epoch": 2.741090146750524, "percentage": 13.71, "elapsed_time": "0:13:12", "remaining_time": "1:23:09", "throughput": 4303.66, "total_tokens": 3410256} {"current_steps": 5235, "total_steps": 38160, "loss": 0.5545, "lr": 0.0009957996887954082, "epoch": 2.7437106918238996, "percentage": 13.72, "elapsed_time": "0:13:13", "remaining_time": "1:23:08", "throughput": 4303.63, "total_tokens": 3413168} {"current_steps": 5240, "total_steps": 38160, "loss": 0.6493, "lr": 0.0009957700571048486, "epoch": 2.7463312368972748, "percentage": 13.73, "elapsed_time": "0:13:13", "remaining_time": "1:23:06", "throughput": 4303.37, "total_tokens": 3415728} {"current_steps": 5245, "total_steps": 38160, "loss": 0.4034, "lr": 0.0009957403217048493, "epoch": 2.74895178197065, "percentage": 13.74, "elapsed_time": "0:13:14", "remaining_time": "1:23:06", "throughput": 4303.85, "total_tokens": 3419568} {"current_steps": 5250, "total_steps": 38160, "loss": 0.3652, "lr": 0.0009957104826016302, "epoch": 2.751572327044025, "percentage": 13.76, "elapsed_time": "0:13:15", "remaining_time": "1:23:05", "throughput": 4303.96, "total_tokens": 3422736} {"current_steps": 5255, "total_steps": 38160, "loss": 0.4344, "lr": 0.0009956805398014337, "epoch": 2.7541928721174003, "percentage": 13.77, "elapsed_time": "0:13:16", "remaining_time": "1:23:05", "throughput": 4304.89, "total_tokens": 3427472} {"current_steps": 5260, "total_steps": 38160, "loss": 0.4141, "lr": 0.0009956504933105231, "epoch": 2.7568134171907754, "percentage": 13.78, "elapsed_time": "0:13:16", "remaining_time": "1:23:04", "throughput": 4304.77, "total_tokens": 3430256} {"current_steps": 5265, "total_steps": 38160, "loss": 0.5857, "lr": 0.000995620343135184, "epoch": 2.759433962264151, "percentage": 13.8, "elapsed_time": "0:13:17", "remaining_time": "1:23:03", "throughput": 4304.82, "total_tokens": 3433328} {"current_steps": 5270, "total_steps": 38160, "loss": 0.4384, "lr": 0.0009955900892817235, "epoch": 2.762054507337526, "percentage": 13.81, "elapsed_time": "0:13:18", "remaining_time": "1:23:02", "throughput": 4305.47, "total_tokens": 3437456} {"current_steps": 5275, "total_steps": 38160, "loss": 0.3807, "lr": 0.0009955597317564703, "epoch": 2.7646750524109014, "percentage": 13.82, "elapsed_time": "0:13:19", "remaining_time": "1:23:01", "throughput": 4305.36, "total_tokens": 3440240} {"current_steps": 5280, "total_steps": 38160, "loss": 0.4722, "lr": 0.0009955292705657749, "epoch": 2.767295597484277, "percentage": 13.84, "elapsed_time": "0:13:19", "remaining_time": "1:23:00", "throughput": 4305.68, "total_tokens": 3443824} {"current_steps": 5285, "total_steps": 38160, "loss": 0.5572, "lr": 0.0009954987057160093, "epoch": 2.769916142557652, "percentage": 13.85, "elapsed_time": "0:13:20", "remaining_time": "1:22:59", "throughput": 4305.83, "total_tokens": 3447184} {"current_steps": 5290, "total_steps": 38160, "loss": 0.4287, "lr": 0.0009954680372135675, "epoch": 2.7725366876310273, "percentage": 13.86, "elapsed_time": "0:13:21", "remaining_time": "1:22:58", "throughput": 4305.95, "total_tokens": 3450320} {"current_steps": 5295, "total_steps": 38160, "loss": 0.5816, "lr": 0.000995437265064865, "epoch": 2.7751572327044025, "percentage": 13.88, "elapsed_time": "0:13:22", "remaining_time": "1:22:58", "throughput": 4306.73, "total_tokens": 3454640} {"current_steps": 5300, "total_steps": 38160, "loss": 0.4634, "lr": 0.0009954063892763387, "epoch": 2.7777777777777777, "percentage": 13.89, "elapsed_time": "0:13:22", "remaining_time": "1:22:57", "throughput": 4306.92, "total_tokens": 3458000} {"current_steps": 5305, "total_steps": 38160, "loss": 0.6013, "lr": 0.0009953754098544479, "epoch": 2.780398322851153, "percentage": 13.9, "elapsed_time": "0:13:23", "remaining_time": "1:22:57", "throughput": 4307.09, "total_tokens": 3461296} {"current_steps": 5310, "total_steps": 38160, "loss": 0.4116, "lr": 0.0009953443268056726, "epoch": 2.7830188679245285, "percentage": 13.92, "elapsed_time": "0:13:24", "remaining_time": "1:22:55", "throughput": 4307.15, "total_tokens": 3464336} {"current_steps": 5315, "total_steps": 38160, "loss": 0.5837, "lr": 0.0009953131401365155, "epoch": 2.7856394129979036, "percentage": 13.93, "elapsed_time": "0:13:24", "remaining_time": "1:22:54", "throughput": 4307.08, "total_tokens": 3467184} {"current_steps": 5320, "total_steps": 38160, "loss": 0.5457, "lr": 0.0009952818498535003, "epoch": 2.788259958071279, "percentage": 13.94, "elapsed_time": "0:13:25", "remaining_time": "1:22:53", "throughput": 4307.16, "total_tokens": 3470320} {"current_steps": 5325, "total_steps": 38160, "loss": 0.4116, "lr": 0.0009952504559631726, "epoch": 2.790880503144654, "percentage": 13.95, "elapsed_time": "0:13:26", "remaining_time": "1:22:53", "throughput": 4307.6, "total_tokens": 3474128} {"current_steps": 5330, "total_steps": 38160, "loss": 0.6511, "lr": 0.0009952189584720996, "epoch": 2.7935010482180296, "percentage": 13.97, "elapsed_time": "0:13:27", "remaining_time": "1:22:51", "throughput": 4307.15, "total_tokens": 3476336} {"current_steps": 5335, "total_steps": 38160, "loss": 0.537, "lr": 0.0009951873573868701, "epoch": 2.7961215932914047, "percentage": 13.98, "elapsed_time": "0:13:27", "remaining_time": "1:22:50", "throughput": 4307.52, "total_tokens": 3480016} {"current_steps": 5340, "total_steps": 38160, "loss": 0.4226, "lr": 0.000995155652714095, "epoch": 2.79874213836478, "percentage": 13.99, "elapsed_time": "0:13:28", "remaining_time": "1:22:49", "throughput": 4307.32, "total_tokens": 3482608} {"current_steps": 5345, "total_steps": 38160, "loss": 0.7051, "lr": 0.0009951238444604064, "epoch": 2.801362683438155, "percentage": 14.01, "elapsed_time": "0:13:29", "remaining_time": "1:22:47", "throughput": 4307.09, "total_tokens": 3485200} {"current_steps": 5350, "total_steps": 38160, "loss": 0.3597, "lr": 0.000995091932632458, "epoch": 2.8039832285115303, "percentage": 14.02, "elapsed_time": "0:13:29", "remaining_time": "1:22:46", "throughput": 4307.21, "total_tokens": 3488336} {"current_steps": 5355, "total_steps": 38160, "loss": 0.5557, "lr": 0.000995059917236926, "epoch": 2.8066037735849054, "percentage": 14.03, "elapsed_time": "0:13:30", "remaining_time": "1:22:46", "throughput": 4307.65, "total_tokens": 3492080} {"current_steps": 5360, "total_steps": 38160, "loss": 0.4424, "lr": 0.000995027798280507, "epoch": 2.809224318658281, "percentage": 14.05, "elapsed_time": "0:13:31", "remaining_time": "1:22:45", "throughput": 4308.15, "total_tokens": 3495952} {"current_steps": 5365, "total_steps": 38160, "loss": 0.435, "lr": 0.00099499557576992, "epoch": 2.811844863731656, "percentage": 14.06, "elapsed_time": "0:13:32", "remaining_time": "1:22:44", "throughput": 4307.71, "total_tokens": 3498224} {"current_steps": 5370, "total_steps": 38160, "loss": 0.5648, "lr": 0.000994963249711906, "epoch": 2.8144654088050314, "percentage": 14.07, "elapsed_time": "0:13:32", "remaining_time": "1:22:43", "throughput": 4308.06, "total_tokens": 3501872} {"current_steps": 5375, "total_steps": 38160, "loss": 0.4112, "lr": 0.000994930820113227, "epoch": 2.8170859538784065, "percentage": 14.09, "elapsed_time": "0:13:33", "remaining_time": "1:22:42", "throughput": 4308.13, "total_tokens": 3505008} {"current_steps": 5380, "total_steps": 38160, "loss": 0.3886, "lr": 0.0009948982869806668, "epoch": 2.819706498951782, "percentage": 14.1, "elapsed_time": "0:13:34", "remaining_time": "1:22:41", "throughput": 4308.15, "total_tokens": 3508016} {"current_steps": 5385, "total_steps": 38160, "loss": 0.5118, "lr": 0.0009948656503210311, "epoch": 2.8223270440251573, "percentage": 14.11, "elapsed_time": "0:13:35", "remaining_time": "1:22:41", "throughput": 4309.23, "total_tokens": 3512912} {"current_steps": 5390, "total_steps": 38160, "loss": 0.4644, "lr": 0.000994832910141147, "epoch": 2.8249475890985325, "percentage": 14.12, "elapsed_time": "0:13:35", "remaining_time": "1:22:40", "throughput": 4309.37, "total_tokens": 3516112} {"current_steps": 5395, "total_steps": 38160, "loss": 0.5736, "lr": 0.0009948000664478638, "epoch": 2.8275681341719077, "percentage": 14.14, "elapsed_time": "0:13:36", "remaining_time": "1:22:39", "throughput": 4309.18, "total_tokens": 3518800} {"current_steps": 5400, "total_steps": 38160, "loss": 0.4028, "lr": 0.0009947671192480515, "epoch": 2.830188679245283, "percentage": 14.15, "elapsed_time": "0:13:37", "remaining_time": "1:22:38", "throughput": 4309.68, "total_tokens": 3522608} {"current_steps": 5405, "total_steps": 38160, "loss": 0.502, "lr": 0.0009947340685486023, "epoch": 2.832809224318658, "percentage": 14.16, "elapsed_time": "0:13:38", "remaining_time": "1:22:38", "throughput": 4310.17, "total_tokens": 3526512} {"current_steps": 5410, "total_steps": 38160, "loss": 0.4383, "lr": 0.0009947009143564303, "epoch": 2.8354297693920336, "percentage": 14.18, "elapsed_time": "0:13:38", "remaining_time": "1:22:37", "throughput": 4310.11, "total_tokens": 3529456} {"current_steps": 5415, "total_steps": 38160, "loss": 0.4385, "lr": 0.0009946676566784708, "epoch": 2.838050314465409, "percentage": 14.19, "elapsed_time": "0:13:39", "remaining_time": "1:22:36", "throughput": 4310.12, "total_tokens": 3532464} {"current_steps": 5420, "total_steps": 38160, "loss": 0.4782, "lr": 0.000994634295521681, "epoch": 2.840670859538784, "percentage": 14.2, "elapsed_time": "0:13:40", "remaining_time": "1:22:35", "throughput": 4310.33, "total_tokens": 3535824} {"current_steps": 5425, "total_steps": 38160, "loss": 0.4993, "lr": 0.0009946008308930397, "epoch": 2.8432914046121596, "percentage": 14.22, "elapsed_time": "0:13:41", "remaining_time": "1:22:34", "throughput": 4310.84, "total_tokens": 3539696} {"current_steps": 5430, "total_steps": 38160, "loss": 0.4999, "lr": 0.0009945672627995473, "epoch": 2.8459119496855347, "percentage": 14.23, "elapsed_time": "0:13:41", "remaining_time": "1:22:34", "throughput": 4311.28, "total_tokens": 3543408} {"current_steps": 5435, "total_steps": 38160, "loss": 0.3971, "lr": 0.0009945335912482256, "epoch": 2.84853249475891, "percentage": 14.24, "elapsed_time": "0:13:42", "remaining_time": "1:22:33", "throughput": 4311.52, "total_tokens": 3546864} {"current_steps": 5440, "total_steps": 38160, "loss": 0.4553, "lr": 0.000994499816246119, "epoch": 2.851153039832285, "percentage": 14.26, "elapsed_time": "0:13:43", "remaining_time": "1:22:32", "throughput": 4311.53, "total_tokens": 3549904} {"current_steps": 5445, "total_steps": 38160, "loss": 0.4611, "lr": 0.000994465937800292, "epoch": 2.8537735849056602, "percentage": 14.27, "elapsed_time": "0:13:44", "remaining_time": "1:22:31", "throughput": 4311.68, "total_tokens": 3553072} {"current_steps": 5450, "total_steps": 38160, "loss": 0.3475, "lr": 0.0009944319559178321, "epoch": 2.8563941299790354, "percentage": 14.28, "elapsed_time": "0:13:44", "remaining_time": "1:22:30", "throughput": 4312.11, "total_tokens": 3556784} {"current_steps": 5455, "total_steps": 38160, "loss": 0.5035, "lr": 0.0009943978706058478, "epoch": 2.859014675052411, "percentage": 14.3, "elapsed_time": "0:13:45", "remaining_time": "1:22:30", "throughput": 4312.92, "total_tokens": 3561232} {"current_steps": 5460, "total_steps": 38160, "loss": 0.5045, "lr": 0.0009943636818714695, "epoch": 2.861635220125786, "percentage": 14.31, "elapsed_time": "0:13:46", "remaining_time": "1:22:29", "throughput": 4312.85, "total_tokens": 3564048} {"current_steps": 5465, "total_steps": 38160, "loss": 0.3893, "lr": 0.0009943293897218487, "epoch": 2.8642557651991614, "percentage": 14.32, "elapsed_time": "0:13:47", "remaining_time": "1:22:28", "throughput": 4313.19, "total_tokens": 3567664} {"current_steps": 5470, "total_steps": 38160, "loss": 0.4734, "lr": 0.0009942949941641594, "epoch": 2.8668763102725365, "percentage": 14.33, "elapsed_time": "0:13:47", "remaining_time": "1:22:27", "throughput": 4313.57, "total_tokens": 3571344} {"current_steps": 5475, "total_steps": 38160, "loss": 0.4485, "lr": 0.0009942604952055964, "epoch": 2.869496855345912, "percentage": 14.35, "elapsed_time": "0:13:48", "remaining_time": "1:22:26", "throughput": 4313.46, "total_tokens": 3574128} {"current_steps": 5480, "total_steps": 38160, "loss": 0.4769, "lr": 0.0009942258928533768, "epoch": 2.8721174004192873, "percentage": 14.36, "elapsed_time": "0:13:49", "remaining_time": "1:22:25", "throughput": 4313.68, "total_tokens": 3577552} {"current_steps": 5485, "total_steps": 38160, "loss": 0.672, "lr": 0.0009941911871147386, "epoch": 2.8747379454926625, "percentage": 14.37, "elapsed_time": "0:13:50", "remaining_time": "1:22:25", "throughput": 4313.99, "total_tokens": 3581040} {"current_steps": 5490, "total_steps": 38160, "loss": 0.4455, "lr": 0.000994156377996942, "epoch": 2.8773584905660377, "percentage": 14.39, "elapsed_time": "0:13:50", "remaining_time": "1:22:23", "throughput": 4313.85, "total_tokens": 3583760} {"current_steps": 5495, "total_steps": 38160, "loss": 0.5032, "lr": 0.0009941214655072692, "epoch": 2.879979035639413, "percentage": 14.4, "elapsed_time": "0:13:51", "remaining_time": "1:22:23", "throughput": 4314.36, "total_tokens": 3587632} {"current_steps": 5500, "total_steps": 38160, "loss": 0.4964, "lr": 0.0009940864496530226, "epoch": 2.882599580712788, "percentage": 14.41, "elapsed_time": "0:13:52", "remaining_time": "1:22:22", "throughput": 4314.54, "total_tokens": 3590960} {"current_steps": 5505, "total_steps": 38160, "loss": 0.3853, "lr": 0.000994051330441528, "epoch": 2.8852201257861636, "percentage": 14.43, "elapsed_time": "0:13:53", "remaining_time": "1:22:21", "throughput": 4314.92, "total_tokens": 3594672} {"current_steps": 5510, "total_steps": 38160, "loss": 0.4308, "lr": 0.0009940161078801312, "epoch": 2.8878406708595388, "percentage": 14.44, "elapsed_time": "0:13:53", "remaining_time": "1:22:20", "throughput": 4314.99, "total_tokens": 3597872} {"current_steps": 5515, "total_steps": 38160, "loss": 0.3603, "lr": 0.0009939807819762008, "epoch": 2.890461215932914, "percentage": 14.45, "elapsed_time": "0:13:54", "remaining_time": "1:22:19", "throughput": 4314.82, "total_tokens": 3600528} {"current_steps": 5520, "total_steps": 38160, "loss": 0.5159, "lr": 0.0009939453527371262, "epoch": 2.8930817610062896, "percentage": 14.47, "elapsed_time": "0:13:55", "remaining_time": "1:22:18", "throughput": 4314.73, "total_tokens": 3603344} {"current_steps": 5525, "total_steps": 38160, "loss": 0.4488, "lr": 0.0009939098201703193, "epoch": 2.8957023060796647, "percentage": 14.48, "elapsed_time": "0:13:55", "remaining_time": "1:22:17", "throughput": 4314.78, "total_tokens": 3606448} {"current_steps": 5530, "total_steps": 38160, "loss": 0.6639, "lr": 0.0009938741842832129, "epoch": 2.89832285115304, "percentage": 14.49, "elapsed_time": "0:13:56", "remaining_time": "1:22:16", "throughput": 4314.92, "total_tokens": 3609776} {"current_steps": 5535, "total_steps": 38160, "loss": 0.5016, "lr": 0.0009938384450832614, "epoch": 2.900943396226415, "percentage": 14.5, "elapsed_time": "0:13:57", "remaining_time": "1:22:14", "throughput": 4314.55, "total_tokens": 3612080} {"current_steps": 5540, "total_steps": 38160, "loss": 0.5243, "lr": 0.0009938026025779411, "epoch": 2.9035639412997902, "percentage": 14.52, "elapsed_time": "0:13:57", "remaining_time": "1:22:13", "throughput": 4314.82, "total_tokens": 3615504} {"current_steps": 5545, "total_steps": 38160, "loss": 0.658, "lr": 0.0009937666567747501, "epoch": 2.9061844863731654, "percentage": 14.53, "elapsed_time": "0:13:58", "remaining_time": "1:22:12", "throughput": 4314.58, "total_tokens": 3618096} {"current_steps": 5550, "total_steps": 38160, "loss": 0.4381, "lr": 0.0009937306076812076, "epoch": 2.908805031446541, "percentage": 14.54, "elapsed_time": "0:13:59", "remaining_time": "1:22:11", "throughput": 4314.67, "total_tokens": 3621296} {"current_steps": 5555, "total_steps": 38160, "loss": 0.4796, "lr": 0.0009936944553048548, "epoch": 2.911425576519916, "percentage": 14.56, "elapsed_time": "0:14:00", "remaining_time": "1:22:10", "throughput": 4314.92, "total_tokens": 3624784} {"current_steps": 5560, "total_steps": 38160, "loss": 0.5642, "lr": 0.0009936581996532543, "epoch": 2.9140461215932913, "percentage": 14.57, "elapsed_time": "0:14:00", "remaining_time": "1:22:10", "throughput": 4315.17, "total_tokens": 3628336} {"current_steps": 5565, "total_steps": 38160, "loss": 0.5979, "lr": 0.0009936218407339905, "epoch": 2.9166666666666665, "percentage": 14.58, "elapsed_time": "0:14:01", "remaining_time": "1:22:08", "throughput": 4315.12, "total_tokens": 3631280} {"current_steps": 5570, "total_steps": 38160, "loss": 0.6359, "lr": 0.0009935853785546691, "epoch": 2.919287211740042, "percentage": 14.6, "elapsed_time": "0:14:02", "remaining_time": "1:22:07", "throughput": 4315.19, "total_tokens": 3634448} {"current_steps": 5575, "total_steps": 38160, "loss": 0.471, "lr": 0.0009935488131229177, "epoch": 2.9219077568134173, "percentage": 14.61, "elapsed_time": "0:14:02", "remaining_time": "1:22:06", "throughput": 4314.99, "total_tokens": 3637072} {"current_steps": 5580, "total_steps": 38160, "loss": 0.6355, "lr": 0.000993512144446385, "epoch": 2.9245283018867925, "percentage": 14.62, "elapsed_time": "0:14:03", "remaining_time": "1:22:06", "throughput": 4315.33, "total_tokens": 3640880} {"current_steps": 5585, "total_steps": 38160, "loss": 0.5179, "lr": 0.000993475372532742, "epoch": 2.9271488469601676, "percentage": 14.64, "elapsed_time": "0:14:04", "remaining_time": "1:22:04", "throughput": 4315.03, "total_tokens": 3643312} {"current_steps": 5590, "total_steps": 38160, "loss": 0.4989, "lr": 0.0009934384973896812, "epoch": 2.929769392033543, "percentage": 14.65, "elapsed_time": "0:14:05", "remaining_time": "1:22:04", "throughput": 4315.49, "total_tokens": 3647152} {"current_steps": 5595, "total_steps": 38160, "loss": 0.5002, "lr": 0.0009934015190249162, "epoch": 2.932389937106918, "percentage": 14.66, "elapsed_time": "0:14:05", "remaining_time": "1:22:02", "throughput": 4315.34, "total_tokens": 3649904} {"current_steps": 5600, "total_steps": 38160, "loss": 0.3973, "lr": 0.0009933644374461822, "epoch": 2.9350104821802936, "percentage": 14.68, "elapsed_time": "0:14:06", "remaining_time": "1:22:02", "throughput": 4315.72, "total_tokens": 3653680} {"current_steps": 5605, "total_steps": 38160, "loss": 0.5719, "lr": 0.0009933272526612366, "epoch": 2.9376310272536688, "percentage": 14.69, "elapsed_time": "0:14:07", "remaining_time": "1:22:01", "throughput": 4316.04, "total_tokens": 3657328} {"current_steps": 5610, "total_steps": 38160, "loss": 0.492, "lr": 0.0009932899646778578, "epoch": 2.940251572327044, "percentage": 14.7, "elapsed_time": "0:14:08", "remaining_time": "1:22:01", "throughput": 4316.45, "total_tokens": 3661008} {"current_steps": 5615, "total_steps": 38160, "loss": 0.4808, "lr": 0.0009932525735038464, "epoch": 2.9428721174004195, "percentage": 14.71, "elapsed_time": "0:14:08", "remaining_time": "1:22:00", "throughput": 4316.45, "total_tokens": 3664144} {"current_steps": 5620, "total_steps": 38160, "loss": 0.4223, "lr": 0.0009932150791470238, "epoch": 2.9454926624737947, "percentage": 14.73, "elapsed_time": "0:14:09", "remaining_time": "1:21:58", "throughput": 4316.25, "total_tokens": 3666800} {"current_steps": 5625, "total_steps": 38160, "loss": 0.46, "lr": 0.0009931774816152334, "epoch": 2.94811320754717, "percentage": 14.74, "elapsed_time": "0:14:10", "remaining_time": "1:21:57", "throughput": 4316.31, "total_tokens": 3669936} {"current_steps": 5630, "total_steps": 38160, "loss": 0.3994, "lr": 0.0009931397809163406, "epoch": 2.950733752620545, "percentage": 14.75, "elapsed_time": "0:14:11", "remaining_time": "1:21:57", "throughput": 4316.68, "total_tokens": 3673584} {"current_steps": 5635, "total_steps": 38160, "loss": 0.4572, "lr": 0.0009931019770582316, "epoch": 2.95335429769392, "percentage": 14.77, "elapsed_time": "0:14:11", "remaining_time": "1:21:56", "throughput": 4316.84, "total_tokens": 3676816} {"current_steps": 5640, "total_steps": 38160, "loss": 0.5818, "lr": 0.0009930640700488143, "epoch": 2.9559748427672954, "percentage": 14.78, "elapsed_time": "0:14:12", "remaining_time": "1:21:55", "throughput": 4316.87, "total_tokens": 3679792} {"current_steps": 5645, "total_steps": 38160, "loss": 0.4964, "lr": 0.000993026059896019, "epoch": 2.958595387840671, "percentage": 14.79, "elapsed_time": "0:14:13", "remaining_time": "1:21:53", "throughput": 4316.84, "total_tokens": 3682704} {"current_steps": 5650, "total_steps": 38160, "loss": 0.4592, "lr": 0.0009929879466077968, "epoch": 2.961215932914046, "percentage": 14.81, "elapsed_time": "0:14:13", "remaining_time": "1:21:52", "throughput": 4316.99, "total_tokens": 3685968} {"current_steps": 5655, "total_steps": 38160, "loss": 0.4911, "lr": 0.0009929497301921202, "epoch": 2.9638364779874213, "percentage": 14.82, "elapsed_time": "0:14:14", "remaining_time": "1:21:51", "throughput": 4316.72, "total_tokens": 3688528} {"current_steps": 5660, "total_steps": 38160, "loss": 0.4989, "lr": 0.000992911410656984, "epoch": 2.9664570230607965, "percentage": 14.83, "elapsed_time": "0:14:15", "remaining_time": "1:21:51", "throughput": 4317.23, "total_tokens": 3692464} {"current_steps": 5665, "total_steps": 38160, "loss": 0.3933, "lr": 0.000992872988010404, "epoch": 2.969077568134172, "percentage": 14.85, "elapsed_time": "0:14:16", "remaining_time": "1:21:50", "throughput": 4317.43, "total_tokens": 3695920} {"current_steps": 5670, "total_steps": 38160, "loss": 0.6394, "lr": 0.0009928344622604183, "epoch": 2.9716981132075473, "percentage": 14.86, "elapsed_time": "0:14:16", "remaining_time": "1:21:49", "throughput": 4317.76, "total_tokens": 3699600} {"current_steps": 5675, "total_steps": 38160, "loss": 0.5498, "lr": 0.0009927958334150853, "epoch": 2.9743186582809225, "percentage": 14.87, "elapsed_time": "0:14:17", "remaining_time": "1:21:49", "throughput": 4317.98, "total_tokens": 3703024} {"current_steps": 5680, "total_steps": 38160, "loss": 0.3807, "lr": 0.0009927571014824862, "epoch": 2.9769392033542976, "percentage": 14.88, "elapsed_time": "0:14:18", "remaining_time": "1:21:48", "throughput": 4318.25, "total_tokens": 3706544} {"current_steps": 5685, "total_steps": 38160, "loss": 0.5953, "lr": 0.000992718266470723, "epoch": 2.979559748427673, "percentage": 14.9, "elapsed_time": "0:14:19", "remaining_time": "1:21:47", "throughput": 4318.23, "total_tokens": 3709584} {"current_steps": 5690, "total_steps": 38160, "loss": 0.5519, "lr": 0.00099267932838792, "epoch": 2.982180293501048, "percentage": 14.91, "elapsed_time": "0:14:19", "remaining_time": "1:21:47", "throughput": 4318.65, "total_tokens": 3713616} {"current_steps": 5695, "total_steps": 38160, "loss": 0.5175, "lr": 0.000992640287242222, "epoch": 2.9848008385744236, "percentage": 14.92, "elapsed_time": "0:14:20", "remaining_time": "1:21:45", "throughput": 4318.7, "total_tokens": 3716656} {"current_steps": 5700, "total_steps": 38160, "loss": 0.4071, "lr": 0.0009926011430417961, "epoch": 2.9874213836477987, "percentage": 14.94, "elapsed_time": "0:14:21", "remaining_time": "1:21:44", "throughput": 4318.55, "total_tokens": 3719504} {"current_steps": 5705, "total_steps": 38160, "loss": 0.4531, "lr": 0.0009925618957948312, "epoch": 2.990041928721174, "percentage": 14.95, "elapsed_time": "0:14:22", "remaining_time": "1:21:43", "throughput": 4318.61, "total_tokens": 3722672} {"current_steps": 5710, "total_steps": 38160, "loss": 0.4698, "lr": 0.0009925225455095373, "epoch": 2.9926624737945495, "percentage": 14.96, "elapsed_time": "0:14:22", "remaining_time": "1:21:42", "throughput": 4318.32, "total_tokens": 3725104} {"current_steps": 5715, "total_steps": 38160, "loss": 0.6194, "lr": 0.0009924830921941455, "epoch": 2.9952830188679247, "percentage": 14.98, "elapsed_time": "0:14:23", "remaining_time": "1:21:41", "throughput": 4318.37, "total_tokens": 3728272} {"current_steps": 5720, "total_steps": 38160, "loss": 0.4295, "lr": 0.0009924435358569096, "epoch": 2.9979035639413, "percentage": 14.99, "elapsed_time": "0:14:24", "remaining_time": "1:21:40", "throughput": 4318.43, "total_tokens": 3731344} {"current_steps": 5724, "total_steps": 38160, "eval_loss": 0.4684428870677948, "epoch": 3.0, "percentage": 15.0, "elapsed_time": "0:14:38", "remaining_time": "1:22:56", "throughput": 4251.16, "total_tokens": 3733736} {"current_steps": 5725, "total_steps": 38160, "loss": 0.4733, "lr": 0.000992403876506104, "epoch": 3.000524109014675, "percentage": 15.0, "elapsed_time": "0:14:39", "remaining_time": "1:23:05", "throughput": 4243.9, "total_tokens": 3734280} {"current_steps": 5730, "total_steps": 38160, "loss": 0.4046, "lr": 0.000992364114150025, "epoch": 3.00314465408805, "percentage": 15.02, "elapsed_time": "0:14:40", "remaining_time": "1:23:03", "throughput": 4243.65, "total_tokens": 3736776} {"current_steps": 5735, "total_steps": 38160, "loss": 0.4667, "lr": 0.0009923242487969908, "epoch": 3.0057651991614254, "percentage": 15.03, "elapsed_time": "0:14:41", "remaining_time": "1:23:02", "throughput": 4243.46, "total_tokens": 3739496} {"current_steps": 5740, "total_steps": 38160, "loss": 0.3941, "lr": 0.0009922842804553403, "epoch": 3.008385744234801, "percentage": 15.04, "elapsed_time": "0:14:41", "remaining_time": "1:23:00", "throughput": 4243.2, "total_tokens": 3741992} {"current_steps": 5745, "total_steps": 38160, "loss": 0.5477, "lr": 0.0009922442091334345, "epoch": 3.011006289308176, "percentage": 15.06, "elapsed_time": "0:14:42", "remaining_time": "1:22:59", "throughput": 4242.99, "total_tokens": 3744488} {"current_steps": 5750, "total_steps": 38160, "loss": 0.5467, "lr": 0.0009922040348396561, "epoch": 3.0136268343815513, "percentage": 15.07, "elapsed_time": "0:14:43", "remaining_time": "1:22:58", "throughput": 4243.15, "total_tokens": 3747688} {"current_steps": 5755, "total_steps": 38160, "loss": 0.4798, "lr": 0.000992163757582409, "epoch": 3.0162473794549265, "percentage": 15.08, "elapsed_time": "0:14:44", "remaining_time": "1:22:58", "throughput": 4244.46, "total_tokens": 3753064} {"current_steps": 5760, "total_steps": 38160, "loss": 0.5391, "lr": 0.0009921233773701188, "epoch": 3.018867924528302, "percentage": 15.09, "elapsed_time": "0:14:44", "remaining_time": "1:22:57", "throughput": 4244.59, "total_tokens": 3756136} {"current_steps": 5765, "total_steps": 38160, "loss": 0.5437, "lr": 0.0009920828942112322, "epoch": 3.0214884696016773, "percentage": 15.11, "elapsed_time": "0:14:45", "remaining_time": "1:22:56", "throughput": 4244.49, "total_tokens": 3758888} {"current_steps": 5770, "total_steps": 38160, "loss": 0.3819, "lr": 0.0009920423081142184, "epoch": 3.0241090146750524, "percentage": 15.12, "elapsed_time": "0:14:46", "remaining_time": "1:22:55", "throughput": 4244.52, "total_tokens": 3761832} {"current_steps": 5775, "total_steps": 38160, "loss": 0.4776, "lr": 0.0009920016190875672, "epoch": 3.0267295597484276, "percentage": 15.13, "elapsed_time": "0:14:47", "remaining_time": "1:22:54", "throughput": 4244.65, "total_tokens": 3765032} {"current_steps": 5780, "total_steps": 38160, "loss": 0.5643, "lr": 0.00099196082713979, "epoch": 3.029350104821803, "percentage": 15.15, "elapsed_time": "0:14:47", "remaining_time": "1:22:52", "throughput": 4244.68, "total_tokens": 3767944} {"current_steps": 5785, "total_steps": 38160, "loss": 0.4569, "lr": 0.0009919199322794207, "epoch": 3.0319706498951784, "percentage": 15.16, "elapsed_time": "0:14:48", "remaining_time": "1:22:51", "throughput": 4244.79, "total_tokens": 3771112} {"current_steps": 5790, "total_steps": 38160, "loss": 0.5821, "lr": 0.0009918789345150136, "epoch": 3.0345911949685536, "percentage": 15.17, "elapsed_time": "0:14:49", "remaining_time": "1:22:50", "throughput": 4244.78, "total_tokens": 3773960} {"current_steps": 5795, "total_steps": 38160, "loss": 0.5608, "lr": 0.000991837833855145, "epoch": 3.0372117400419287, "percentage": 15.19, "elapsed_time": "0:14:49", "remaining_time": "1:22:49", "throughput": 4244.91, "total_tokens": 3777192} {"current_steps": 5800, "total_steps": 38160, "loss": 0.5248, "lr": 0.000991796630308413, "epoch": 3.039832285115304, "percentage": 15.2, "elapsed_time": "0:14:50", "remaining_time": "1:22:48", "throughput": 4245.09, "total_tokens": 3780488} {"current_steps": 5805, "total_steps": 38160, "loss": 0.4793, "lr": 0.0009917553238834363, "epoch": 3.042452830188679, "percentage": 15.21, "elapsed_time": "0:14:51", "remaining_time": "1:22:48", "throughput": 4245.61, "total_tokens": 3784328} {"current_steps": 5810, "total_steps": 38160, "loss": 0.4975, "lr": 0.0009917139145888562, "epoch": 3.0450733752620547, "percentage": 15.23, "elapsed_time": "0:14:51", "remaining_time": "1:22:46", "throughput": 4245.33, "total_tokens": 3786696} {"current_steps": 5815, "total_steps": 38160, "loss": 0.5632, "lr": 0.000991672402433335, "epoch": 3.04769392033543, "percentage": 15.24, "elapsed_time": "0:14:52", "remaining_time": "1:22:45", "throughput": 4245.42, "total_tokens": 3789768} {"current_steps": 5820, "total_steps": 38160, "loss": 0.5055, "lr": 0.0009916307874255565, "epoch": 3.050314465408805, "percentage": 15.25, "elapsed_time": "0:14:53", "remaining_time": "1:22:44", "throughput": 4245.54, "total_tokens": 3792936} {"current_steps": 5825, "total_steps": 38160, "loss": 0.5436, "lr": 0.000991589069574226, "epoch": 3.05293501048218, "percentage": 15.26, "elapsed_time": "0:14:54", "remaining_time": "1:22:43", "throughput": 4245.73, "total_tokens": 3796168} {"current_steps": 5830, "total_steps": 38160, "loss": 0.4811, "lr": 0.0009915472488880705, "epoch": 3.0555555555555554, "percentage": 15.28, "elapsed_time": "0:14:54", "remaining_time": "1:22:41", "throughput": 4245.49, "total_tokens": 3798696} {"current_steps": 5835, "total_steps": 38160, "loss": 0.4206, "lr": 0.0009915053253758386, "epoch": 3.058176100628931, "percentage": 15.29, "elapsed_time": "0:14:55", "remaining_time": "1:22:40", "throughput": 4245.69, "total_tokens": 3801992} {"current_steps": 5840, "total_steps": 38160, "loss": 0.3805, "lr": 0.0009914632990462998, "epoch": 3.060796645702306, "percentage": 15.3, "elapsed_time": "0:14:56", "remaining_time": "1:22:39", "throughput": 4245.5, "total_tokens": 3804648} {"current_steps": 5845, "total_steps": 38160, "loss": 0.651, "lr": 0.0009914211699082458, "epoch": 3.0634171907756813, "percentage": 15.32, "elapsed_time": "0:14:56", "remaining_time": "1:22:38", "throughput": 4245.9, "total_tokens": 3808296} {"current_steps": 5850, "total_steps": 38160, "loss": 0.502, "lr": 0.0009913789379704897, "epoch": 3.0660377358490565, "percentage": 15.33, "elapsed_time": "0:14:57", "remaining_time": "1:22:37", "throughput": 4246.14, "total_tokens": 3811688} {"current_steps": 5855, "total_steps": 38160, "loss": 0.45, "lr": 0.0009913366032418653, "epoch": 3.068658280922432, "percentage": 15.34, "elapsed_time": "0:14:58", "remaining_time": "1:22:38", "throughput": 4247.51, "total_tokens": 3817416} {"current_steps": 5860, "total_steps": 38160, "loss": 0.4744, "lr": 0.0009912941657312293, "epoch": 3.0712788259958073, "percentage": 15.36, "elapsed_time": "0:14:59", "remaining_time": "1:22:37", "throughput": 4247.42, "total_tokens": 3820168} {"current_steps": 5865, "total_steps": 38160, "loss": 0.43, "lr": 0.0009912516254474586, "epoch": 3.0738993710691824, "percentage": 15.37, "elapsed_time": "0:15:00", "remaining_time": "1:22:36", "throughput": 4247.73, "total_tokens": 3823720} {"current_steps": 5870, "total_steps": 38160, "loss": 0.4877, "lr": 0.0009912089823994525, "epoch": 3.0765199161425576, "percentage": 15.38, "elapsed_time": "0:15:00", "remaining_time": "1:22:36", "throughput": 4248.07, "total_tokens": 3827432} {"current_steps": 5875, "total_steps": 38160, "loss": 0.5218, "lr": 0.0009911662365961313, "epoch": 3.0791404612159328, "percentage": 15.4, "elapsed_time": "0:15:01", "remaining_time": "1:22:34", "throughput": 4247.8, "total_tokens": 3829832} {"current_steps": 5880, "total_steps": 38160, "loss": 0.4529, "lr": 0.000991123388046437, "epoch": 3.0817610062893084, "percentage": 15.41, "elapsed_time": "0:15:02", "remaining_time": "1:22:32", "throughput": 4247.43, "total_tokens": 3832040} {"current_steps": 5885, "total_steps": 38160, "loss": 0.4934, "lr": 0.0009910804367593328, "epoch": 3.0843815513626835, "percentage": 15.42, "elapsed_time": "0:15:02", "remaining_time": "1:22:31", "throughput": 4247.46, "total_tokens": 3834984} {"current_steps": 5890, "total_steps": 38160, "loss": 0.5013, "lr": 0.0009910373827438038, "epoch": 3.0870020964360587, "percentage": 15.44, "elapsed_time": "0:15:04", "remaining_time": "1:22:33", "throughput": 4249.28, "total_tokens": 3841800} {"current_steps": 5895, "total_steps": 38160, "loss": 0.4652, "lr": 0.0009909942260088562, "epoch": 3.089622641509434, "percentage": 15.45, "elapsed_time": "0:15:04", "remaining_time": "1:22:32", "throughput": 4249.14, "total_tokens": 3844456} {"current_steps": 5900, "total_steps": 38160, "loss": 0.3641, "lr": 0.0009909509665635184, "epoch": 3.092243186582809, "percentage": 15.46, "elapsed_time": "0:15:05", "remaining_time": "1:22:31", "throughput": 4249.38, "total_tokens": 3847912} {"current_steps": 5905, "total_steps": 38160, "loss": 0.3501, "lr": 0.0009909076044168394, "epoch": 3.0948637316561847, "percentage": 15.47, "elapsed_time": "0:15:06", "remaining_time": "1:22:30", "throughput": 4249.58, "total_tokens": 3851208} {"current_steps": 5910, "total_steps": 38160, "loss": 0.3668, "lr": 0.00099086413957789, "epoch": 3.09748427672956, "percentage": 15.49, "elapsed_time": "0:15:07", "remaining_time": "1:22:29", "throughput": 4249.95, "total_tokens": 3854920} {"current_steps": 5915, "total_steps": 38160, "loss": 0.477, "lr": 0.0009908205720557627, "epoch": 3.100104821802935, "percentage": 15.5, "elapsed_time": "0:15:07", "remaining_time": "1:22:28", "throughput": 4250.26, "total_tokens": 3858408} {"current_steps": 5920, "total_steps": 38160, "loss": 0.5255, "lr": 0.0009907769018595713, "epoch": 3.10272536687631, "percentage": 15.51, "elapsed_time": "0:15:08", "remaining_time": "1:22:27", "throughput": 4250.28, "total_tokens": 3861352} {"current_steps": 5925, "total_steps": 38160, "loss": 0.3984, "lr": 0.0009907331289984512, "epoch": 3.1053459119496853, "percentage": 15.53, "elapsed_time": "0:15:09", "remaining_time": "1:22:26", "throughput": 4250.51, "total_tokens": 3864680} {"current_steps": 5930, "total_steps": 38160, "loss": 0.4598, "lr": 0.000990689253481559, "epoch": 3.107966457023061, "percentage": 15.54, "elapsed_time": "0:15:09", "remaining_time": "1:22:25", "throughput": 4250.3, "total_tokens": 3867176} {"current_steps": 5935, "total_steps": 38160, "loss": 0.465, "lr": 0.000990645275318073, "epoch": 3.110587002096436, "percentage": 15.55, "elapsed_time": "0:15:10", "remaining_time": "1:22:23", "throughput": 4250.19, "total_tokens": 3869864} {"current_steps": 5940, "total_steps": 38160, "loss": 0.4659, "lr": 0.000990601194517193, "epoch": 3.1132075471698113, "percentage": 15.57, "elapsed_time": "0:15:11", "remaining_time": "1:22:22", "throughput": 4250.17, "total_tokens": 3872744} {"current_steps": 5945, "total_steps": 38160, "loss": 0.4715, "lr": 0.0009905570110881402, "epoch": 3.1158280922431865, "percentage": 15.58, "elapsed_time": "0:15:11", "remaining_time": "1:22:21", "throughput": 4250.3, "total_tokens": 3875880} {"current_steps": 5950, "total_steps": 38160, "loss": 0.3938, "lr": 0.0009905127250401573, "epoch": 3.1184486373165616, "percentage": 15.59, "elapsed_time": "0:15:12", "remaining_time": "1:22:20", "throughput": 4250.4, "total_tokens": 3879048} {"current_steps": 5955, "total_steps": 38160, "loss": 0.3319, "lr": 0.0009904683363825084, "epoch": 3.1210691823899372, "percentage": 15.61, "elapsed_time": "0:15:13", "remaining_time": "1:22:19", "throughput": 4250.6, "total_tokens": 3882376} {"current_steps": 5960, "total_steps": 38160, "loss": 0.4006, "lr": 0.0009904238451244791, "epoch": 3.1236897274633124, "percentage": 15.62, "elapsed_time": "0:15:14", "remaining_time": "1:22:18", "throughput": 4250.69, "total_tokens": 3885576} {"current_steps": 5965, "total_steps": 38160, "loss": 0.459, "lr": 0.0009903792512753764, "epoch": 3.1263102725366876, "percentage": 15.63, "elapsed_time": "0:15:14", "remaining_time": "1:22:17", "throughput": 4250.85, "total_tokens": 3888808} {"current_steps": 5970, "total_steps": 38160, "loss": 0.469, "lr": 0.0009903345548445289, "epoch": 3.1289308176100628, "percentage": 15.64, "elapsed_time": "0:15:15", "remaining_time": "1:22:16", "throughput": 4250.98, "total_tokens": 3891976} {"current_steps": 5975, "total_steps": 38160, "loss": 0.4712, "lr": 0.0009902897558412864, "epoch": 3.131551362683438, "percentage": 15.66, "elapsed_time": "0:15:16", "remaining_time": "1:22:15", "throughput": 4251.36, "total_tokens": 3895592} {"current_steps": 5980, "total_steps": 38160, "loss": 0.6429, "lr": 0.0009902448542750207, "epoch": 3.1341719077568135, "percentage": 15.67, "elapsed_time": "0:15:17", "remaining_time": "1:22:15", "throughput": 4251.7, "total_tokens": 3899336} {"current_steps": 5985, "total_steps": 38160, "loss": 0.4216, "lr": 0.0009901998501551245, "epoch": 3.1367924528301887, "percentage": 15.68, "elapsed_time": "0:15:17", "remaining_time": "1:22:14", "throughput": 4251.73, "total_tokens": 3902280} {"current_steps": 5990, "total_steps": 38160, "loss": 0.4468, "lr": 0.000990154743491012, "epoch": 3.139412997903564, "percentage": 15.7, "elapsed_time": "0:15:18", "remaining_time": "1:22:13", "throughput": 4251.98, "total_tokens": 3905672} {"current_steps": 5995, "total_steps": 38160, "loss": 0.4141, "lr": 0.0009901095342921193, "epoch": 3.142033542976939, "percentage": 15.71, "elapsed_time": "0:15:19", "remaining_time": "1:22:11", "throughput": 4251.88, "total_tokens": 3908392} {"current_steps": 6000, "total_steps": 38160, "loss": 0.5446, "lr": 0.0009900642225679035, "epoch": 3.1446540880503147, "percentage": 15.72, "elapsed_time": "0:15:20", "remaining_time": "1:22:11", "throughput": 4252.3, "total_tokens": 3912200} {"current_steps": 6005, "total_steps": 38160, "loss": 0.5572, "lr": 0.000990018808327843, "epoch": 3.14727463312369, "percentage": 15.74, "elapsed_time": "0:15:20", "remaining_time": "1:22:10", "throughput": 4252.37, "total_tokens": 3915304} {"current_steps": 6010, "total_steps": 38160, "loss": 0.5156, "lr": 0.0009899732915814386, "epoch": 3.149895178197065, "percentage": 15.75, "elapsed_time": "0:15:21", "remaining_time": "1:22:09", "throughput": 4252.69, "total_tokens": 3918952} {"current_steps": 6015, "total_steps": 38160, "loss": 0.6279, "lr": 0.0009899276723382112, "epoch": 3.15251572327044, "percentage": 15.76, "elapsed_time": "0:15:22", "remaining_time": "1:22:08", "throughput": 4252.63, "total_tokens": 3921864} {"current_steps": 6020, "total_steps": 38160, "loss": 0.4129, "lr": 0.0009898819506077043, "epoch": 3.1551362683438153, "percentage": 15.78, "elapsed_time": "0:15:22", "remaining_time": "1:22:07", "throughput": 4252.85, "total_tokens": 3925256} {"current_steps": 6025, "total_steps": 38160, "loss": 0.4149, "lr": 0.0009898361263994823, "epoch": 3.157756813417191, "percentage": 15.79, "elapsed_time": "0:15:23", "remaining_time": "1:22:05", "throughput": 4252.48, "total_tokens": 3927432} {"current_steps": 6030, "total_steps": 38160, "loss": 0.4447, "lr": 0.0009897901997231308, "epoch": 3.160377358490566, "percentage": 15.8, "elapsed_time": "0:15:24", "remaining_time": "1:22:05", "throughput": 4252.98, "total_tokens": 3931368} {"current_steps": 6035, "total_steps": 38160, "loss": 0.4313, "lr": 0.0009897441705882576, "epoch": 3.1629979035639413, "percentage": 15.81, "elapsed_time": "0:15:25", "remaining_time": "1:22:04", "throughput": 4253.09, "total_tokens": 3934504} {"current_steps": 6040, "total_steps": 38160, "loss": 0.4469, "lr": 0.0009896980390044908, "epoch": 3.1656184486373165, "percentage": 15.83, "elapsed_time": "0:15:25", "remaining_time": "1:22:03", "throughput": 4253.07, "total_tokens": 3937384} {"current_steps": 6045, "total_steps": 38160, "loss": 0.5967, "lr": 0.0009896518049814812, "epoch": 3.1682389937106916, "percentage": 15.84, "elapsed_time": "0:15:26", "remaining_time": "1:22:01", "throughput": 4253.03, "total_tokens": 3940168} {"current_steps": 6050, "total_steps": 38160, "loss": 0.4171, "lr": 0.0009896054685289005, "epoch": 3.1708595387840672, "percentage": 15.85, "elapsed_time": "0:15:27", "remaining_time": "1:22:00", "throughput": 4252.73, "total_tokens": 3942504} {"current_steps": 6055, "total_steps": 38160, "loss": 0.4972, "lr": 0.0009895590296564412, "epoch": 3.1734800838574424, "percentage": 15.87, "elapsed_time": "0:15:27", "remaining_time": "1:21:59", "throughput": 4252.82, "total_tokens": 3945480} {"current_steps": 6060, "total_steps": 38160, "loss": 0.4607, "lr": 0.000989512488373818, "epoch": 3.1761006289308176, "percentage": 15.88, "elapsed_time": "0:15:28", "remaining_time": "1:21:57", "throughput": 4252.91, "total_tokens": 3948520} {"current_steps": 6065, "total_steps": 38160, "loss": 0.5499, "lr": 0.0009894658446907671, "epoch": 3.1787211740041927, "percentage": 15.89, "elapsed_time": "0:15:29", "remaining_time": "1:21:57", "throughput": 4253.64, "total_tokens": 3952904} {"current_steps": 6070, "total_steps": 38160, "loss": 0.4733, "lr": 0.0009894190986170458, "epoch": 3.181341719077568, "percentage": 15.91, "elapsed_time": "0:15:29", "remaining_time": "1:21:56", "throughput": 4253.61, "total_tokens": 3955816} {"current_steps": 6075, "total_steps": 38160, "loss": 0.4823, "lr": 0.0009893722501624323, "epoch": 3.1839622641509435, "percentage": 15.92, "elapsed_time": "0:15:30", "remaining_time": "1:21:54", "throughput": 4253.28, "total_tokens": 3958120} {"current_steps": 6080, "total_steps": 38160, "loss": 0.53, "lr": 0.0009893252993367272, "epoch": 3.1865828092243187, "percentage": 15.93, "elapsed_time": "0:15:31", "remaining_time": "1:21:53", "throughput": 4253.05, "total_tokens": 3960520} {"current_steps": 6085, "total_steps": 38160, "loss": 0.5046, "lr": 0.000989278246149752, "epoch": 3.189203354297694, "percentage": 15.95, "elapsed_time": "0:15:31", "remaining_time": "1:21:52", "throughput": 4252.97, "total_tokens": 3963208} {"current_steps": 6090, "total_steps": 38160, "loss": 0.5343, "lr": 0.0009892310906113497, "epoch": 3.191823899371069, "percentage": 15.96, "elapsed_time": "0:15:32", "remaining_time": "1:21:51", "throughput": 4253.2, "total_tokens": 3966568} {"current_steps": 6095, "total_steps": 38160, "loss": 0.5541, "lr": 0.0009891838327313847, "epoch": 3.1944444444444446, "percentage": 15.97, "elapsed_time": "0:15:33", "remaining_time": "1:21:50", "throughput": 4253.58, "total_tokens": 3970184} {"current_steps": 6100, "total_steps": 38160, "loss": 0.5266, "lr": 0.000989136472519743, "epoch": 3.19706498951782, "percentage": 15.99, "elapsed_time": "0:15:34", "remaining_time": "1:21:49", "throughput": 4253.64, "total_tokens": 3973192} {"current_steps": 6105, "total_steps": 38160, "loss": 0.4266, "lr": 0.0009890890099863313, "epoch": 3.199685534591195, "percentage": 16.0, "elapsed_time": "0:15:34", "remaining_time": "1:21:47", "throughput": 4253.46, "total_tokens": 3975656} {"current_steps": 6110, "total_steps": 38160, "loss": 0.4226, "lr": 0.0009890414451410787, "epoch": 3.20230607966457, "percentage": 16.01, "elapsed_time": "0:15:35", "remaining_time": "1:21:46", "throughput": 4253.8, "total_tokens": 3979240} {"current_steps": 6115, "total_steps": 38160, "loss": 0.4542, "lr": 0.0009889937779939348, "epoch": 3.2049266247379453, "percentage": 16.02, "elapsed_time": "0:15:36", "remaining_time": "1:21:46", "throughput": 4254.44, "total_tokens": 3983464} {"current_steps": 6120, "total_steps": 38160, "loss": 0.5238, "lr": 0.0009889460085548715, "epoch": 3.207547169811321, "percentage": 16.04, "elapsed_time": "0:15:37", "remaining_time": "1:21:45", "throughput": 4254.57, "total_tokens": 3986568} {"current_steps": 6125, "total_steps": 38160, "loss": 0.4544, "lr": 0.0009888981368338815, "epoch": 3.210167714884696, "percentage": 16.05, "elapsed_time": "0:15:37", "remaining_time": "1:21:44", "throughput": 4254.45, "total_tokens": 3989224} {"current_steps": 6130, "total_steps": 38160, "loss": 0.6113, "lr": 0.0009888501628409789, "epoch": 3.2127882599580713, "percentage": 16.06, "elapsed_time": "0:15:38", "remaining_time": "1:21:43", "throughput": 4254.77, "total_tokens": 3992648} {"current_steps": 6135, "total_steps": 38160, "loss": 0.4341, "lr": 0.0009888020865861991, "epoch": 3.2154088050314464, "percentage": 16.08, "elapsed_time": "0:15:39", "remaining_time": "1:21:41", "throughput": 4254.77, "total_tokens": 3995528} {"current_steps": 6140, "total_steps": 38160, "loss": 0.4694, "lr": 0.0009887539080795996, "epoch": 3.2180293501048216, "percentage": 16.09, "elapsed_time": "0:15:39", "remaining_time": "1:21:40", "throughput": 4254.87, "total_tokens": 3998536} {"current_steps": 6145, "total_steps": 38160, "loss": 0.4904, "lr": 0.0009887056273312584, "epoch": 3.220649895178197, "percentage": 16.1, "elapsed_time": "0:15:40", "remaining_time": "1:21:39", "throughput": 4254.76, "total_tokens": 4001224} {"current_steps": 6150, "total_steps": 38160, "loss": 0.4354, "lr": 0.0009886572443512753, "epoch": 3.2232704402515724, "percentage": 16.12, "elapsed_time": "0:15:41", "remaining_time": "1:21:38", "throughput": 4254.89, "total_tokens": 4004328} {"current_steps": 6155, "total_steps": 38160, "loss": 0.4629, "lr": 0.0009886087591497717, "epoch": 3.2258909853249476, "percentage": 16.13, "elapsed_time": "0:15:41", "remaining_time": "1:21:37", "throughput": 4255.22, "total_tokens": 4007944} {"current_steps": 6160, "total_steps": 38160, "loss": 0.4849, "lr": 0.00098856017173689, "epoch": 3.2285115303983227, "percentage": 16.14, "elapsed_time": "0:15:42", "remaining_time": "1:21:36", "throughput": 4255.34, "total_tokens": 4011144} {"current_steps": 6165, "total_steps": 38160, "loss": 0.4174, "lr": 0.0009885114821227942, "epoch": 3.231132075471698, "percentage": 16.16, "elapsed_time": "0:15:43", "remaining_time": "1:21:35", "throughput": 4255.49, "total_tokens": 4014376} {"current_steps": 6170, "total_steps": 38160, "loss": 0.489, "lr": 0.0009884626903176696, "epoch": 3.2337526205450735, "percentage": 16.17, "elapsed_time": "0:15:44", "remaining_time": "1:21:35", "throughput": 4255.94, "total_tokens": 4018216} {"current_steps": 6175, "total_steps": 38160, "loss": 0.5073, "lr": 0.0009884137963317228, "epoch": 3.2363731656184487, "percentage": 16.18, "elapsed_time": "0:15:44", "remaining_time": "1:21:33", "throughput": 4255.9, "total_tokens": 4021032} {"current_steps": 6180, "total_steps": 38160, "loss": 0.5944, "lr": 0.000988364800175182, "epoch": 3.238993710691824, "percentage": 16.19, "elapsed_time": "0:15:45", "remaining_time": "1:21:32", "throughput": 4255.82, "total_tokens": 4024040} {"current_steps": 6185, "total_steps": 38160, "loss": 0.3505, "lr": 0.0009883157018582966, "epoch": 3.241614255765199, "percentage": 16.21, "elapsed_time": "0:15:46", "remaining_time": "1:21:32", "throughput": 4255.92, "total_tokens": 4027336} {"current_steps": 6190, "total_steps": 38160, "loss": 0.5446, "lr": 0.0009882665013913373, "epoch": 3.2442348008385746, "percentage": 16.22, "elapsed_time": "0:15:47", "remaining_time": "1:21:31", "throughput": 4256.0, "total_tokens": 4030472} {"current_steps": 6195, "total_steps": 38160, "loss": 0.4677, "lr": 0.0009882171987845962, "epoch": 3.24685534591195, "percentage": 16.23, "elapsed_time": "0:15:47", "remaining_time": "1:21:30", "throughput": 4256.44, "total_tokens": 4034312} {"current_steps": 6200, "total_steps": 38160, "loss": 0.4686, "lr": 0.000988167794048387, "epoch": 3.249475890985325, "percentage": 16.25, "elapsed_time": "0:15:48", "remaining_time": "1:21:30", "throughput": 4257.13, "total_tokens": 4038632} {"current_steps": 6205, "total_steps": 38160, "loss": 0.5439, "lr": 0.0009881182871930448, "epoch": 3.2520964360587, "percentage": 16.26, "elapsed_time": "0:15:49", "remaining_time": "1:21:29", "throughput": 4257.76, "total_tokens": 4042824} {"current_steps": 6210, "total_steps": 38160, "loss": 0.4668, "lr": 0.0009880686782289256, "epoch": 3.2547169811320753, "percentage": 16.27, "elapsed_time": "0:15:50", "remaining_time": "1:21:28", "throughput": 4257.77, "total_tokens": 4045896} {"current_steps": 6215, "total_steps": 38160, "loss": 0.5267, "lr": 0.000988018967166407, "epoch": 3.257337526205451, "percentage": 16.29, "elapsed_time": "0:15:50", "remaining_time": "1:21:27", "throughput": 4257.74, "total_tokens": 4048712} {"current_steps": 6220, "total_steps": 38160, "loss": 0.509, "lr": 0.0009879691540158884, "epoch": 3.259958071278826, "percentage": 16.3, "elapsed_time": "0:15:51", "remaining_time": "1:21:26", "throughput": 4257.5, "total_tokens": 4051176} {"current_steps": 6225, "total_steps": 38160, "loss": 0.3601, "lr": 0.0009879192387877895, "epoch": 3.2625786163522013, "percentage": 16.31, "elapsed_time": "0:15:52", "remaining_time": "1:21:25", "throughput": 4257.47, "total_tokens": 4054056} {"current_steps": 6230, "total_steps": 38160, "loss": 0.4355, "lr": 0.0009878692214925523, "epoch": 3.2651991614255764, "percentage": 16.33, "elapsed_time": "0:15:53", "remaining_time": "1:21:24", "throughput": 4258.02, "total_tokens": 4058120} {"current_steps": 6235, "total_steps": 38160, "loss": 0.5397, "lr": 0.00098781910214064, "epoch": 3.2678197064989516, "percentage": 16.34, "elapsed_time": "0:15:53", "remaining_time": "1:21:23", "throughput": 4257.91, "total_tokens": 4060840} {"current_steps": 6240, "total_steps": 38160, "loss": 0.543, "lr": 0.0009877688807425368, "epoch": 3.270440251572327, "percentage": 16.35, "elapsed_time": "0:15:54", "remaining_time": "1:21:22", "throughput": 4258.08, "total_tokens": 4064136} {"current_steps": 6245, "total_steps": 38160, "loss": 0.4707, "lr": 0.0009877185573087487, "epoch": 3.2730607966457024, "percentage": 16.37, "elapsed_time": "0:15:55", "remaining_time": "1:21:21", "throughput": 4257.94, "total_tokens": 4066824} {"current_steps": 6250, "total_steps": 38160, "loss": 0.6259, "lr": 0.0009876681318498025, "epoch": 3.2756813417190775, "percentage": 16.38, "elapsed_time": "0:15:55", "remaining_time": "1:21:20", "throughput": 4257.97, "total_tokens": 4069864} {"current_steps": 6255, "total_steps": 38160, "loss": 0.3532, "lr": 0.0009876176043762466, "epoch": 3.2783018867924527, "percentage": 16.39, "elapsed_time": "0:15:56", "remaining_time": "1:21:19", "throughput": 4258.0, "total_tokens": 4072936} {"current_steps": 6260, "total_steps": 38160, "loss": 0.6389, "lr": 0.000987566974898651, "epoch": 3.280922431865828, "percentage": 16.4, "elapsed_time": "0:15:57", "remaining_time": "1:21:17", "throughput": 4257.77, "total_tokens": 4075400} {"current_steps": 6265, "total_steps": 38160, "loss": 0.5006, "lr": 0.0009875162434276065, "epoch": 3.2835429769392035, "percentage": 16.42, "elapsed_time": "0:15:57", "remaining_time": "1:21:16", "throughput": 4257.89, "total_tokens": 4078696} {"current_steps": 6270, "total_steps": 38160, "loss": 0.4968, "lr": 0.000987465409973726, "epoch": 3.2861635220125787, "percentage": 16.43, "elapsed_time": "0:15:58", "remaining_time": "1:21:16", "throughput": 4258.45, "total_tokens": 4082824} {"current_steps": 6275, "total_steps": 38160, "loss": 0.5836, "lr": 0.0009874144745476432, "epoch": 3.288784067085954, "percentage": 16.44, "elapsed_time": "0:15:59", "remaining_time": "1:21:15", "throughput": 4258.28, "total_tokens": 4085448} {"current_steps": 6280, "total_steps": 38160, "loss": 0.527, "lr": 0.0009873634371600126, "epoch": 3.291404612159329, "percentage": 16.46, "elapsed_time": "0:16:00", "remaining_time": "1:21:13", "throughput": 4258.29, "total_tokens": 4088424} {"current_steps": 6285, "total_steps": 38160, "loss": 0.5667, "lr": 0.0009873122978215115, "epoch": 3.2940251572327046, "percentage": 16.47, "elapsed_time": "0:16:00", "remaining_time": "1:21:13", "throughput": 4258.46, "total_tokens": 4091752} {"current_steps": 6290, "total_steps": 38160, "loss": 0.473, "lr": 0.000987261056542837, "epoch": 3.29664570230608, "percentage": 16.48, "elapsed_time": "0:16:01", "remaining_time": "1:21:11", "throughput": 4258.4, "total_tokens": 4094568} {"current_steps": 6295, "total_steps": 38160, "loss": 0.5049, "lr": 0.0009872097133347085, "epoch": 3.299266247379455, "percentage": 16.5, "elapsed_time": "0:16:02", "remaining_time": "1:21:10", "throughput": 4258.36, "total_tokens": 4097352} {"current_steps": 6300, "total_steps": 38160, "loss": 0.3926, "lr": 0.0009871582682078664, "epoch": 3.30188679245283, "percentage": 16.51, "elapsed_time": "0:16:02", "remaining_time": "1:21:09", "throughput": 4258.43, "total_tokens": 4100328} {"current_steps": 6305, "total_steps": 38160, "loss": 0.4389, "lr": 0.0009871067211730722, "epoch": 3.3045073375262053, "percentage": 16.52, "elapsed_time": "0:16:03", "remaining_time": "1:21:07", "throughput": 4258.18, "total_tokens": 4102728} {"current_steps": 6310, "total_steps": 38160, "loss": 0.3858, "lr": 0.0009870550722411093, "epoch": 3.307127882599581, "percentage": 16.54, "elapsed_time": "0:16:04", "remaining_time": "1:21:06", "throughput": 4258.05, "total_tokens": 4105352} {"current_steps": 6315, "total_steps": 38160, "loss": 0.4298, "lr": 0.000987003321422782, "epoch": 3.309748427672956, "percentage": 16.55, "elapsed_time": "0:16:04", "remaining_time": "1:21:05", "throughput": 4258.27, "total_tokens": 4108744} {"current_steps": 6320, "total_steps": 38160, "loss": 0.3658, "lr": 0.0009869514687289155, "epoch": 3.3123689727463312, "percentage": 16.56, "elapsed_time": "0:16:05", "remaining_time": "1:21:04", "throughput": 4258.47, "total_tokens": 4112168} {"current_steps": 6325, "total_steps": 38160, "loss": 0.6434, "lr": 0.0009868995141703576, "epoch": 3.3149895178197064, "percentage": 16.57, "elapsed_time": "0:16:06", "remaining_time": "1:21:03", "throughput": 4258.53, "total_tokens": 4115240} {"current_steps": 6330, "total_steps": 38160, "loss": 0.4707, "lr": 0.000986847457757976, "epoch": 3.3176100628930816, "percentage": 16.59, "elapsed_time": "0:16:06", "remaining_time": "1:21:02", "throughput": 4258.39, "total_tokens": 4117864} {"current_steps": 6335, "total_steps": 38160, "loss": 0.4729, "lr": 0.0009867952995026605, "epoch": 3.320230607966457, "percentage": 16.6, "elapsed_time": "0:16:07", "remaining_time": "1:21:02", "throughput": 4259.03, "total_tokens": 4121960} {"current_steps": 6340, "total_steps": 38160, "loss": 0.5743, "lr": 0.0009867430394153221, "epoch": 3.3228511530398324, "percentage": 16.61, "elapsed_time": "0:16:08", "remaining_time": "1:21:01", "throughput": 4259.12, "total_tokens": 4125160} {"current_steps": 6345, "total_steps": 38160, "loss": 0.539, "lr": 0.0009866906775068927, "epoch": 3.3254716981132075, "percentage": 16.63, "elapsed_time": "0:16:09", "remaining_time": "1:21:00", "throughput": 4259.12, "total_tokens": 4128168} {"current_steps": 6350, "total_steps": 38160, "loss": 0.5723, "lr": 0.0009866382137883262, "epoch": 3.3280922431865827, "percentage": 16.64, "elapsed_time": "0:16:10", "remaining_time": "1:21:01", "throughput": 4260.5, "total_tokens": 4134632} {"current_steps": 6355, "total_steps": 38160, "loss": 0.5318, "lr": 0.0009865856482705973, "epoch": 3.330712788259958, "percentage": 16.65, "elapsed_time": "0:16:11", "remaining_time": "1:21:00", "throughput": 4260.76, "total_tokens": 4138088} {"current_steps": 6360, "total_steps": 38160, "loss": 0.435, "lr": 0.0009865329809647019, "epoch": 3.3333333333333335, "percentage": 16.67, "elapsed_time": "0:16:11", "remaining_time": "1:20:59", "throughput": 4261.02, "total_tokens": 4141608} {"current_steps": 6365, "total_steps": 38160, "loss": 0.4097, "lr": 0.0009864802118816575, "epoch": 3.3359538784067087, "percentage": 16.68, "elapsed_time": "0:16:12", "remaining_time": "1:20:58", "throughput": 4261.1, "total_tokens": 4144712} {"current_steps": 6370, "total_steps": 38160, "loss": 0.4182, "lr": 0.0009864273410325028, "epoch": 3.338574423480084, "percentage": 16.69, "elapsed_time": "0:16:13", "remaining_time": "1:20:57", "throughput": 4261.11, "total_tokens": 4147624} {"current_steps": 6375, "total_steps": 38160, "loss": 0.3881, "lr": 0.000986374368428298, "epoch": 3.341194968553459, "percentage": 16.71, "elapsed_time": "0:16:14", "remaining_time": "1:20:56", "throughput": 4261.23, "total_tokens": 4150728} {"current_steps": 6380, "total_steps": 38160, "loss": 0.4407, "lr": 0.000986321294080124, "epoch": 3.3438155136268346, "percentage": 16.72, "elapsed_time": "0:16:14", "remaining_time": "1:20:55", "throughput": 4261.38, "total_tokens": 4153928} {"current_steps": 6385, "total_steps": 38160, "loss": 0.4131, "lr": 0.0009862681179990838, "epoch": 3.3464360587002098, "percentage": 16.73, "elapsed_time": "0:16:15", "remaining_time": "1:20:54", "throughput": 4261.77, "total_tokens": 4157608} {"current_steps": 6390, "total_steps": 38160, "loss": 0.4505, "lr": 0.0009862148401963008, "epoch": 3.349056603773585, "percentage": 16.75, "elapsed_time": "0:16:16", "remaining_time": "1:20:53", "throughput": 4261.82, "total_tokens": 4160648} {"current_steps": 6395, "total_steps": 38160, "loss": 0.5034, "lr": 0.0009861614606829201, "epoch": 3.35167714884696, "percentage": 16.76, "elapsed_time": "0:16:16", "remaining_time": "1:20:52", "throughput": 4261.88, "total_tokens": 4163720} {"current_steps": 6400, "total_steps": 38160, "loss": 0.4649, "lr": 0.0009861079794701085, "epoch": 3.3542976939203353, "percentage": 16.77, "elapsed_time": "0:16:17", "remaining_time": "1:20:51", "throughput": 4262.01, "total_tokens": 4166920} {"current_steps": 6405, "total_steps": 38160, "loss": 0.3491, "lr": 0.000986054396569053, "epoch": 3.3569182389937104, "percentage": 16.78, "elapsed_time": "0:16:18", "remaining_time": "1:20:50", "throughput": 4262.08, "total_tokens": 4170024} {"current_steps": 6410, "total_steps": 38160, "loss": 0.3968, "lr": 0.0009860007119909635, "epoch": 3.359538784067086, "percentage": 16.8, "elapsed_time": "0:16:19", "remaining_time": "1:20:49", "throughput": 4262.23, "total_tokens": 4173288} {"current_steps": 6415, "total_steps": 38160, "loss": 0.3658, "lr": 0.0009859469257470692, "epoch": 3.3621593291404612, "percentage": 16.81, "elapsed_time": "0:16:19", "remaining_time": "1:20:48", "throughput": 4261.98, "total_tokens": 4175688} {"current_steps": 6420, "total_steps": 38160, "loss": 0.4352, "lr": 0.0009858930378486223, "epoch": 3.3647798742138364, "percentage": 16.82, "elapsed_time": "0:16:20", "remaining_time": "1:20:47", "throughput": 4261.93, "total_tokens": 4178504} {"current_steps": 6425, "total_steps": 38160, "loss": 0.4098, "lr": 0.000985839048306895, "epoch": 3.3674004192872116, "percentage": 16.84, "elapsed_time": "0:16:21", "remaining_time": "1:20:45", "throughput": 4261.64, "total_tokens": 4180840} {"current_steps": 6430, "total_steps": 38160, "loss": 0.4578, "lr": 0.000985784957133182, "epoch": 3.370020964360587, "percentage": 16.85, "elapsed_time": "0:16:21", "remaining_time": "1:20:44", "throughput": 4261.9, "total_tokens": 4184328} {"current_steps": 6435, "total_steps": 38160, "loss": 0.5911, "lr": 0.0009857307643387975, "epoch": 3.3726415094339623, "percentage": 16.86, "elapsed_time": "0:16:22", "remaining_time": "1:20:44", "throughput": 4262.3, "total_tokens": 4188072} {"current_steps": 6440, "total_steps": 38160, "loss": 0.4443, "lr": 0.000985676469935079, "epoch": 3.3752620545073375, "percentage": 16.88, "elapsed_time": "0:16:23", "remaining_time": "1:20:43", "throughput": 4262.67, "total_tokens": 4191848} {"current_steps": 6445, "total_steps": 38160, "loss": 0.4261, "lr": 0.0009856220739333837, "epoch": 3.3778825995807127, "percentage": 16.89, "elapsed_time": "0:16:24", "remaining_time": "1:20:42", "throughput": 4262.51, "total_tokens": 4194440} {"current_steps": 6450, "total_steps": 38160, "loss": 0.5291, "lr": 0.000985567576345091, "epoch": 3.380503144654088, "percentage": 16.9, "elapsed_time": "0:16:24", "remaining_time": "1:20:41", "throughput": 4262.47, "total_tokens": 4197256} {"current_steps": 6455, "total_steps": 38160, "loss": 0.4742, "lr": 0.0009855129771816006, "epoch": 3.3831236897274635, "percentage": 16.92, "elapsed_time": "0:16:25", "remaining_time": "1:20:40", "throughput": 4262.8, "total_tokens": 4200872} {"current_steps": 6460, "total_steps": 38160, "loss": 0.4356, "lr": 0.0009854582764543347, "epoch": 3.3857442348008386, "percentage": 16.93, "elapsed_time": "0:16:26", "remaining_time": "1:20:39", "throughput": 4262.97, "total_tokens": 4204232} {"current_steps": 6465, "total_steps": 38160, "loss": 0.4427, "lr": 0.0009854034741747356, "epoch": 3.388364779874214, "percentage": 16.94, "elapsed_time": "0:16:26", "remaining_time": "1:20:38", "throughput": 4263.03, "total_tokens": 4207304} {"current_steps": 6470, "total_steps": 38160, "loss": 0.4228, "lr": 0.0009853485703542675, "epoch": 3.390985324947589, "percentage": 16.95, "elapsed_time": "0:16:27", "remaining_time": "1:20:37", "throughput": 4262.84, "total_tokens": 4209832} {"current_steps": 6475, "total_steps": 38160, "loss": 0.4525, "lr": 0.0009852935650044158, "epoch": 3.3936058700209646, "percentage": 16.97, "elapsed_time": "0:16:28", "remaining_time": "1:20:36", "throughput": 4262.98, "total_tokens": 4213128} {"current_steps": 6480, "total_steps": 38160, "loss": 0.3762, "lr": 0.0009852384581366866, "epoch": 3.3962264150943398, "percentage": 16.98, "elapsed_time": "0:16:28", "remaining_time": "1:20:35", "throughput": 4262.94, "total_tokens": 4215976} {"current_steps": 6485, "total_steps": 38160, "loss": 0.6441, "lr": 0.000985183249762608, "epoch": 3.398846960167715, "percentage": 16.99, "elapsed_time": "0:16:29", "remaining_time": "1:20:33", "throughput": 4262.79, "total_tokens": 4218632} {"current_steps": 6490, "total_steps": 38160, "loss": 0.5317, "lr": 0.000985127939893729, "epoch": 3.40146750524109, "percentage": 17.01, "elapsed_time": "0:16:30", "remaining_time": "1:20:32", "throughput": 4262.71, "total_tokens": 4221416} {"current_steps": 6495, "total_steps": 38160, "loss": 0.3771, "lr": 0.0009850725285416194, "epoch": 3.4040880503144653, "percentage": 17.02, "elapsed_time": "0:16:31", "remaining_time": "1:20:31", "throughput": 4262.72, "total_tokens": 4224392} {"current_steps": 6500, "total_steps": 38160, "loss": 0.4756, "lr": 0.0009850170157178707, "epoch": 3.4067085953878404, "percentage": 17.03, "elapsed_time": "0:16:31", "remaining_time": "1:20:30", "throughput": 4262.63, "total_tokens": 4227176} {"current_steps": 6505, "total_steps": 38160, "loss": 0.5219, "lr": 0.000984961401434096, "epoch": 3.409329140461216, "percentage": 17.05, "elapsed_time": "0:16:32", "remaining_time": "1:20:29", "throughput": 4262.57, "total_tokens": 4229960} {"current_steps": 6510, "total_steps": 38160, "loss": 0.4575, "lr": 0.0009849056857019285, "epoch": 3.411949685534591, "percentage": 17.06, "elapsed_time": "0:16:32", "remaining_time": "1:20:27", "throughput": 4262.22, "total_tokens": 4232136} {"current_steps": 6515, "total_steps": 38160, "loss": 0.5589, "lr": 0.0009848498685330238, "epoch": 3.4145702306079664, "percentage": 17.07, "elapsed_time": "0:16:33", "remaining_time": "1:20:26", "throughput": 4262.5, "total_tokens": 4235624} {"current_steps": 6520, "total_steps": 38160, "loss": 0.5505, "lr": 0.000984793949939058, "epoch": 3.4171907756813416, "percentage": 17.09, "elapsed_time": "0:16:34", "remaining_time": "1:20:26", "throughput": 4263.42, "total_tokens": 4240616} {"current_steps": 6525, "total_steps": 38160, "loss": 0.4711, "lr": 0.0009847379299317287, "epoch": 3.419811320754717, "percentage": 17.1, "elapsed_time": "0:16:35", "remaining_time": "1:20:25", "throughput": 4263.41, "total_tokens": 4243528} {"current_steps": 6530, "total_steps": 38160, "loss": 0.5071, "lr": 0.0009846818085227549, "epoch": 3.4224318658280923, "percentage": 17.11, "elapsed_time": "0:16:36", "remaining_time": "1:20:24", "throughput": 4263.76, "total_tokens": 4247208} {"current_steps": 6535, "total_steps": 38160, "loss": 0.3639, "lr": 0.000984625585723876, "epoch": 3.4250524109014675, "percentage": 17.13, "elapsed_time": "0:16:37", "remaining_time": "1:20:25", "throughput": 4264.76, "total_tokens": 4252424} {"current_steps": 6540, "total_steps": 38160, "loss": 0.5162, "lr": 0.0009845692615468536, "epoch": 3.4276729559748427, "percentage": 17.14, "elapsed_time": "0:16:37", "remaining_time": "1:20:24", "throughput": 4264.97, "total_tokens": 4255752} {"current_steps": 6545, "total_steps": 38160, "loss": 0.5301, "lr": 0.00098451283600347, "epoch": 3.430293501048218, "percentage": 17.15, "elapsed_time": "0:16:38", "remaining_time": "1:20:23", "throughput": 4264.82, "total_tokens": 4258472} {"current_steps": 6550, "total_steps": 38160, "loss": 0.4059, "lr": 0.0009844563091055286, "epoch": 3.4329140461215935, "percentage": 17.16, "elapsed_time": "0:16:39", "remaining_time": "1:20:21", "throughput": 4264.58, "total_tokens": 4260904} {"current_steps": 6555, "total_steps": 38160, "loss": 0.5742, "lr": 0.0009843996808648542, "epoch": 3.4355345911949686, "percentage": 17.18, "elapsed_time": "0:16:39", "remaining_time": "1:20:20", "throughput": 4264.73, "total_tokens": 4264104} {"current_steps": 6560, "total_steps": 38160, "loss": 0.5552, "lr": 0.000984342951293293, "epoch": 3.438155136268344, "percentage": 17.19, "elapsed_time": "0:16:40", "remaining_time": "1:20:20", "throughput": 4265.46, "total_tokens": 4268648} {"current_steps": 6565, "total_steps": 38160, "loss": 0.5316, "lr": 0.0009842861204027121, "epoch": 3.440775681341719, "percentage": 17.2, "elapsed_time": "0:16:41", "remaining_time": "1:20:20", "throughput": 4265.94, "total_tokens": 4272776} {"current_steps": 6570, "total_steps": 38160, "loss": 0.4802, "lr": 0.0009842291882049999, "epoch": 3.4433962264150946, "percentage": 17.22, "elapsed_time": "0:16:42", "remaining_time": "1:20:19", "throughput": 4265.99, "total_tokens": 4275784} {"current_steps": 6575, "total_steps": 38160, "loss": 0.5904, "lr": 0.0009841721547120658, "epoch": 3.4460167714884697, "percentage": 17.23, "elapsed_time": "0:16:43", "remaining_time": "1:20:18", "throughput": 4266.31, "total_tokens": 4279400} {"current_steps": 6580, "total_steps": 38160, "loss": 0.4039, "lr": 0.0009841150199358408, "epoch": 3.448637316561845, "percentage": 17.24, "elapsed_time": "0:16:43", "remaining_time": "1:20:17", "throughput": 4266.59, "total_tokens": 4282920} {"current_steps": 6585, "total_steps": 38160, "loss": 0.5152, "lr": 0.0009840577838882765, "epoch": 3.45125786163522, "percentage": 17.26, "elapsed_time": "0:16:44", "remaining_time": "1:20:17", "throughput": 4267.05, "total_tokens": 4286856} {"current_steps": 6590, "total_steps": 38160, "loss": 0.5301, "lr": 0.0009840004465813464, "epoch": 3.4538784067085953, "percentage": 17.27, "elapsed_time": "0:16:45", "remaining_time": "1:20:16", "throughput": 4267.26, "total_tokens": 4290216} {"current_steps": 6595, "total_steps": 38160, "loss": 0.6427, "lr": 0.0009839430080270445, "epoch": 3.4564989517819704, "percentage": 17.28, "elapsed_time": "0:16:46", "remaining_time": "1:20:15", "throughput": 4267.56, "total_tokens": 4293768} {"current_steps": 6600, "total_steps": 38160, "loss": 0.4518, "lr": 0.0009838854682373865, "epoch": 3.459119496855346, "percentage": 17.3, "elapsed_time": "0:16:46", "remaining_time": "1:20:14", "throughput": 4267.85, "total_tokens": 4297288} {"current_steps": 6605, "total_steps": 38160, "loss": 0.4622, "lr": 0.000983827827224409, "epoch": 3.461740041928721, "percentage": 17.31, "elapsed_time": "0:16:47", "remaining_time": "1:20:13", "throughput": 4267.57, "total_tokens": 4299592} {"current_steps": 6610, "total_steps": 38160, "loss": 0.4921, "lr": 0.0009837700850001698, "epoch": 3.4643605870020964, "percentage": 17.32, "elapsed_time": "0:16:48", "remaining_time": "1:20:12", "throughput": 4267.58, "total_tokens": 4302600} {"current_steps": 6615, "total_steps": 38160, "loss": 0.6014, "lr": 0.000983712241576748, "epoch": 3.4669811320754715, "percentage": 17.33, "elapsed_time": "0:16:48", "remaining_time": "1:20:11", "throughput": 4267.59, "total_tokens": 4305640} {"current_steps": 6620, "total_steps": 38160, "loss": 0.4482, "lr": 0.000983654296966244, "epoch": 3.469601677148847, "percentage": 17.35, "elapsed_time": "0:16:49", "remaining_time": "1:20:09", "throughput": 4267.37, "total_tokens": 4308168} {"current_steps": 6625, "total_steps": 38160, "loss": 0.4272, "lr": 0.0009835962511807786, "epoch": 3.4722222222222223, "percentage": 17.36, "elapsed_time": "0:16:50", "remaining_time": "1:20:08", "throughput": 4267.44, "total_tokens": 4311208} {"current_steps": 6630, "total_steps": 38160, "loss": 0.583, "lr": 0.0009835381042324948, "epoch": 3.4748427672955975, "percentage": 17.37, "elapsed_time": "0:16:50", "remaining_time": "1:20:07", "throughput": 4267.51, "total_tokens": 4314312} {"current_steps": 6635, "total_steps": 38160, "loss": 0.5285, "lr": 0.0009834798561335558, "epoch": 3.4774633123689727, "percentage": 17.39, "elapsed_time": "0:16:51", "remaining_time": "1:20:06", "throughput": 4267.4, "total_tokens": 4316936} {"current_steps": 6640, "total_steps": 38160, "loss": 0.4375, "lr": 0.000983421506896147, "epoch": 3.480083857442348, "percentage": 17.4, "elapsed_time": "0:16:52", "remaining_time": "1:20:05", "throughput": 4267.57, "total_tokens": 4320232} {"current_steps": 6645, "total_steps": 38160, "loss": 0.5677, "lr": 0.000983363056532474, "epoch": 3.4827044025157234, "percentage": 17.41, "elapsed_time": "0:16:53", "remaining_time": "1:20:05", "throughput": 4267.98, "total_tokens": 4324104} {"current_steps": 6650, "total_steps": 38160, "loss": 0.6485, "lr": 0.000983304505054764, "epoch": 3.4853249475890986, "percentage": 17.43, "elapsed_time": "0:16:53", "remaining_time": "1:20:04", "throughput": 4268.12, "total_tokens": 4327304} {"current_steps": 6655, "total_steps": 38160, "loss": 0.5302, "lr": 0.0009832458524752655, "epoch": 3.487945492662474, "percentage": 17.44, "elapsed_time": "0:16:54", "remaining_time": "1:20:03", "throughput": 4268.95, "total_tokens": 4332008} {"current_steps": 6660, "total_steps": 38160, "loss": 0.4827, "lr": 0.0009831870988062476, "epoch": 3.490566037735849, "percentage": 17.45, "elapsed_time": "0:16:55", "remaining_time": "1:20:02", "throughput": 4268.85, "total_tokens": 4334728} {"current_steps": 6665, "total_steps": 38160, "loss": 0.482, "lr": 0.0009831282440600014, "epoch": 3.4931865828092246, "percentage": 17.47, "elapsed_time": "0:16:56", "remaining_time": "1:20:01", "throughput": 4268.71, "total_tokens": 4337416} {"current_steps": 6670, "total_steps": 38160, "loss": 0.3768, "lr": 0.0009830692882488383, "epoch": 3.4958071278825997, "percentage": 17.48, "elapsed_time": "0:16:56", "remaining_time": "1:20:00", "throughput": 4268.72, "total_tokens": 4340328} {"current_steps": 6675, "total_steps": 38160, "loss": 0.4522, "lr": 0.000983010231385091, "epoch": 3.498427672955975, "percentage": 17.49, "elapsed_time": "0:16:57", "remaining_time": "1:19:59", "throughput": 4269.27, "total_tokens": 4344456} {"current_steps": 6680, "total_steps": 38160, "loss": 0.4429, "lr": 0.000982951073481114, "epoch": 3.50104821802935, "percentage": 17.51, "elapsed_time": "0:16:58", "remaining_time": "1:19:59", "throughput": 4269.54, "total_tokens": 4347944} {"current_steps": 6685, "total_steps": 38160, "loss": 0.5053, "lr": 0.0009828918145492823, "epoch": 3.5036687631027252, "percentage": 17.52, "elapsed_time": "0:16:59", "remaining_time": "1:19:57", "throughput": 4269.49, "total_tokens": 4350760} {"current_steps": 6690, "total_steps": 38160, "loss": 0.5075, "lr": 0.000982832454601992, "epoch": 3.5062893081761004, "percentage": 17.53, "elapsed_time": "0:16:59", "remaining_time": "1:19:57", "throughput": 4269.91, "total_tokens": 4354760} {"current_steps": 6695, "total_steps": 38160, "loss": 0.4261, "lr": 0.0009827729936516605, "epoch": 3.508909853249476, "percentage": 17.54, "elapsed_time": "0:17:00", "remaining_time": "1:19:56", "throughput": 4270.14, "total_tokens": 4358120} {"current_steps": 6700, "total_steps": 38160, "loss": 0.4412, "lr": 0.0009827134317107267, "epoch": 3.511530398322851, "percentage": 17.56, "elapsed_time": "0:17:01", "remaining_time": "1:19:55", "throughput": 4270.25, "total_tokens": 4361352} {"current_steps": 6705, "total_steps": 38160, "loss": 0.5416, "lr": 0.0009826537687916501, "epoch": 3.5141509433962264, "percentage": 17.57, "elapsed_time": "0:17:01", "remaining_time": "1:19:54", "throughput": 4270.0, "total_tokens": 4363784} {"current_steps": 6710, "total_steps": 38160, "loss": 0.451, "lr": 0.0009825940049069113, "epoch": 3.5167714884696015, "percentage": 17.58, "elapsed_time": "0:17:02", "remaining_time": "1:19:53", "throughput": 4270.31, "total_tokens": 4367400} {"current_steps": 6715, "total_steps": 38160, "loss": 0.5494, "lr": 0.0009825341400690126, "epoch": 3.519392033542977, "percentage": 17.6, "elapsed_time": "0:17:03", "remaining_time": "1:19:53", "throughput": 4271.08, "total_tokens": 4372232} {"current_steps": 6720, "total_steps": 38160, "loss": 0.4477, "lr": 0.0009824741742904767, "epoch": 3.5220125786163523, "percentage": 17.61, "elapsed_time": "0:17:04", "remaining_time": "1:19:52", "throughput": 4271.27, "total_tokens": 4375560} {"current_steps": 6725, "total_steps": 38160, "loss": 0.4837, "lr": 0.000982414107583848, "epoch": 3.5246331236897275, "percentage": 17.62, "elapsed_time": "0:17:05", "remaining_time": "1:19:51", "throughput": 4271.14, "total_tokens": 4378216} {"current_steps": 6730, "total_steps": 38160, "loss": 0.6063, "lr": 0.0009823539399616914, "epoch": 3.5272536687631026, "percentage": 17.64, "elapsed_time": "0:17:05", "remaining_time": "1:19:50", "throughput": 4270.97, "total_tokens": 4380744} {"current_steps": 6735, "total_steps": 38160, "loss": 0.4331, "lr": 0.0009822936714365938, "epoch": 3.529874213836478, "percentage": 17.65, "elapsed_time": "0:17:06", "remaining_time": "1:19:49", "throughput": 4271.25, "total_tokens": 4384264} {"current_steps": 6740, "total_steps": 38160, "loss": 0.6028, "lr": 0.0009822333020211623, "epoch": 3.532494758909853, "percentage": 17.66, "elapsed_time": "0:17:07", "remaining_time": "1:19:48", "throughput": 4271.73, "total_tokens": 4388200} {"current_steps": 6745, "total_steps": 38160, "loss": 0.4455, "lr": 0.0009821728317280256, "epoch": 3.5351153039832286, "percentage": 17.68, "elapsed_time": "0:17:07", "remaining_time": "1:19:47", "throughput": 4271.5, "total_tokens": 4390760} {"current_steps": 6750, "total_steps": 38160, "loss": 0.533, "lr": 0.0009821122605698336, "epoch": 3.5377358490566038, "percentage": 17.69, "elapsed_time": "0:17:08", "remaining_time": "1:19:46", "throughput": 4271.41, "total_tokens": 4393416} {"current_steps": 6755, "total_steps": 38160, "loss": 0.4864, "lr": 0.0009820515885592567, "epoch": 3.540356394129979, "percentage": 17.7, "elapsed_time": "0:17:09", "remaining_time": "1:19:45", "throughput": 4271.4, "total_tokens": 4396392} {"current_steps": 6760, "total_steps": 38160, "loss": 0.4414, "lr": 0.0009819908157089872, "epoch": 3.5429769392033545, "percentage": 17.71, "elapsed_time": "0:17:09", "remaining_time": "1:19:44", "throughput": 4271.48, "total_tokens": 4399496} {"current_steps": 6765, "total_steps": 38160, "loss": 0.4923, "lr": 0.0009819299420317379, "epoch": 3.5455974842767297, "percentage": 17.73, "elapsed_time": "0:17:10", "remaining_time": "1:19:43", "throughput": 4271.46, "total_tokens": 4402440} {"current_steps": 6770, "total_steps": 38160, "loss": 0.5752, "lr": 0.0009818689675402427, "epoch": 3.548218029350105, "percentage": 17.74, "elapsed_time": "0:17:11", "remaining_time": "1:19:42", "throughput": 4271.6, "total_tokens": 4405672} {"current_steps": 6775, "total_steps": 38160, "loss": 0.5709, "lr": 0.000981807892247257, "epoch": 3.55083857442348, "percentage": 17.75, "elapsed_time": "0:17:12", "remaining_time": "1:19:41", "throughput": 4271.7, "total_tokens": 4408872} {"current_steps": 6780, "total_steps": 38160, "loss": 0.4444, "lr": 0.0009817467161655571, "epoch": 3.5534591194968552, "percentage": 17.77, "elapsed_time": "0:17:12", "remaining_time": "1:19:39", "throughput": 4271.35, "total_tokens": 4411112} {"current_steps": 6785, "total_steps": 38160, "loss": 0.4056, "lr": 0.0009816854393079402, "epoch": 3.5560796645702304, "percentage": 17.78, "elapsed_time": "0:17:13", "remaining_time": "1:19:38", "throughput": 4271.45, "total_tokens": 4414248} {"current_steps": 6790, "total_steps": 38160, "loss": 0.5767, "lr": 0.0009816240616872247, "epoch": 3.558700209643606, "percentage": 17.79, "elapsed_time": "0:17:14", "remaining_time": "1:19:37", "throughput": 4271.46, "total_tokens": 4417160} {"current_steps": 6795, "total_steps": 38160, "loss": 0.4323, "lr": 0.0009815625833162502, "epoch": 3.561320754716981, "percentage": 17.81, "elapsed_time": "0:17:14", "remaining_time": "1:19:37", "throughput": 4271.89, "total_tokens": 4421032} {"current_steps": 6800, "total_steps": 38160, "loss": 0.6365, "lr": 0.0009815010042078772, "epoch": 3.5639412997903563, "percentage": 17.82, "elapsed_time": "0:17:15", "remaining_time": "1:19:35", "throughput": 4271.85, "total_tokens": 4423848} {"current_steps": 6805, "total_steps": 38160, "loss": 0.421, "lr": 0.0009814393243749873, "epoch": 3.5665618448637315, "percentage": 17.83, "elapsed_time": "0:17:16", "remaining_time": "1:19:34", "throughput": 4271.99, "total_tokens": 4427144} {"current_steps": 6810, "total_steps": 38160, "loss": 0.5413, "lr": 0.0009813775438304835, "epoch": 3.569182389937107, "percentage": 17.85, "elapsed_time": "0:17:16", "remaining_time": "1:19:33", "throughput": 4271.9, "total_tokens": 4429896} {"current_steps": 6815, "total_steps": 38160, "loss": 0.4846, "lr": 0.0009813156625872893, "epoch": 3.5718029350104823, "percentage": 17.86, "elapsed_time": "0:17:18", "remaining_time": "1:19:34", "throughput": 4272.98, "total_tokens": 4435720} {"current_steps": 6820, "total_steps": 38160, "loss": 0.4477, "lr": 0.0009812536806583494, "epoch": 3.5744234800838575, "percentage": 17.87, "elapsed_time": "0:17:18", "remaining_time": "1:19:33", "throughput": 4273.14, "total_tokens": 4439048} {"current_steps": 6825, "total_steps": 38160, "loss": 0.4957, "lr": 0.0009811915980566302, "epoch": 3.5770440251572326, "percentage": 17.89, "elapsed_time": "0:17:19", "remaining_time": "1:19:32", "throughput": 4273.12, "total_tokens": 4441928} {"current_steps": 6830, "total_steps": 38160, "loss": 0.4197, "lr": 0.0009811294147951182, "epoch": 3.579664570230608, "percentage": 17.9, "elapsed_time": "0:17:20", "remaining_time": "1:19:31", "throughput": 4273.3, "total_tokens": 4445160} {"current_steps": 6835, "total_steps": 38160, "loss": 0.5044, "lr": 0.000981067130886822, "epoch": 3.582285115303983, "percentage": 17.91, "elapsed_time": "0:17:20", "remaining_time": "1:19:30", "throughput": 4273.45, "total_tokens": 4448328} {"current_steps": 6840, "total_steps": 38160, "loss": 0.3976, "lr": 0.00098100474634477, "epoch": 3.5849056603773586, "percentage": 17.92, "elapsed_time": "0:17:21", "remaining_time": "1:19:29", "throughput": 4273.69, "total_tokens": 4451816} {"current_steps": 6845, "total_steps": 38160, "loss": 0.5091, "lr": 0.0009809422611820127, "epoch": 3.5875262054507338, "percentage": 17.94, "elapsed_time": "0:17:22", "remaining_time": "1:19:28", "throughput": 4273.76, "total_tokens": 4454856} {"current_steps": 6850, "total_steps": 38160, "loss": 0.5015, "lr": 0.0009808796754116212, "epoch": 3.590146750524109, "percentage": 17.95, "elapsed_time": "0:17:23", "remaining_time": "1:19:27", "throughput": 4273.66, "total_tokens": 4457544} {"current_steps": 6855, "total_steps": 38160, "loss": 0.5464, "lr": 0.0009808169890466879, "epoch": 3.5927672955974845, "percentage": 17.96, "elapsed_time": "0:17:23", "remaining_time": "1:19:26", "throughput": 4273.93, "total_tokens": 4461160} {"current_steps": 6860, "total_steps": 38160, "loss": 0.3941, "lr": 0.000980754202100326, "epoch": 3.5953878406708597, "percentage": 17.98, "elapsed_time": "0:17:24", "remaining_time": "1:19:26", "throughput": 4274.38, "total_tokens": 4465000} {"current_steps": 6865, "total_steps": 38160, "loss": 0.5051, "lr": 0.0009806913145856695, "epoch": 3.598008385744235, "percentage": 17.99, "elapsed_time": "0:17:25", "remaining_time": "1:19:25", "throughput": 4274.42, "total_tokens": 4467944} {"current_steps": 6870, "total_steps": 38160, "loss": 0.546, "lr": 0.0009806283265158741, "epoch": 3.60062893081761, "percentage": 18.0, "elapsed_time": "0:17:26", "remaining_time": "1:19:24", "throughput": 4274.89, "total_tokens": 4471880} {"current_steps": 6875, "total_steps": 38160, "loss": 0.4415, "lr": 0.0009805652379041162, "epoch": 3.603249475890985, "percentage": 18.02, "elapsed_time": "0:17:26", "remaining_time": "1:19:23", "throughput": 4274.56, "total_tokens": 4474184} {"current_steps": 6880, "total_steps": 38160, "loss": 0.4141, "lr": 0.000980502048763593, "epoch": 3.6058700209643604, "percentage": 18.03, "elapsed_time": "0:17:27", "remaining_time": "1:19:21", "throughput": 4274.32, "total_tokens": 4476584} {"current_steps": 6885, "total_steps": 38160, "loss": 0.4449, "lr": 0.0009804387591075233, "epoch": 3.608490566037736, "percentage": 18.04, "elapsed_time": "0:17:28", "remaining_time": "1:19:20", "throughput": 4274.37, "total_tokens": 4479592} {"current_steps": 6890, "total_steps": 38160, "loss": 0.4872, "lr": 0.000980375368949146, "epoch": 3.611111111111111, "percentage": 18.06, "elapsed_time": "0:17:28", "remaining_time": "1:19:19", "throughput": 4274.27, "total_tokens": 4482280} {"current_steps": 6895, "total_steps": 38160, "loss": 0.4099, "lr": 0.0009803118783017221, "epoch": 3.6137316561844863, "percentage": 18.07, "elapsed_time": "0:17:29", "remaining_time": "1:19:18", "throughput": 4274.28, "total_tokens": 4485224} {"current_steps": 6900, "total_steps": 38160, "loss": 0.5568, "lr": 0.0009802482871785329, "epoch": 3.6163522012578615, "percentage": 18.08, "elapsed_time": "0:17:30", "remaining_time": "1:19:17", "throughput": 4274.55, "total_tokens": 4488680} {"current_steps": 6905, "total_steps": 38160, "loss": 0.4953, "lr": 0.000980184595592881, "epoch": 3.618972746331237, "percentage": 18.09, "elapsed_time": "0:17:30", "remaining_time": "1:19:16", "throughput": 4274.8, "total_tokens": 4492104} {"current_steps": 6910, "total_steps": 38160, "loss": 0.4653, "lr": 0.00098012080355809, "epoch": 3.6215932914046123, "percentage": 18.11, "elapsed_time": "0:17:31", "remaining_time": "1:19:15", "throughput": 4274.87, "total_tokens": 4495240} {"current_steps": 6915, "total_steps": 38160, "loss": 0.3641, "lr": 0.0009800569110875043, "epoch": 3.6242138364779874, "percentage": 18.12, "elapsed_time": "0:17:32", "remaining_time": "1:19:14", "throughput": 4274.84, "total_tokens": 4498088} {"current_steps": 6920, "total_steps": 38160, "loss": 0.4432, "lr": 0.0009799929181944895, "epoch": 3.6268343815513626, "percentage": 18.13, "elapsed_time": "0:17:32", "remaining_time": "1:19:13", "throughput": 4274.95, "total_tokens": 4501224} {"current_steps": 6925, "total_steps": 38160, "loss": 0.5693, "lr": 0.0009799288248924325, "epoch": 3.629454926624738, "percentage": 18.15, "elapsed_time": "0:17:33", "remaining_time": "1:19:12", "throughput": 4274.81, "total_tokens": 4503784} {"current_steps": 6930, "total_steps": 38160, "loss": 0.4664, "lr": 0.0009798646311947404, "epoch": 3.632075471698113, "percentage": 18.16, "elapsed_time": "0:17:34", "remaining_time": "1:19:10", "throughput": 4274.74, "total_tokens": 4506568} {"current_steps": 6935, "total_steps": 38160, "loss": 0.3817, "lr": 0.0009798003371148422, "epoch": 3.6346960167714886, "percentage": 18.17, "elapsed_time": "0:17:34", "remaining_time": "1:19:09", "throughput": 4274.56, "total_tokens": 4509096} {"current_steps": 6940, "total_steps": 38160, "loss": 0.366, "lr": 0.0009797359426661873, "epoch": 3.6373165618448637, "percentage": 18.19, "elapsed_time": "0:17:35", "remaining_time": "1:19:08", "throughput": 4274.67, "total_tokens": 4512200} {"current_steps": 6945, "total_steps": 38160, "loss": 0.4411, "lr": 0.0009796714478622463, "epoch": 3.639937106918239, "percentage": 18.2, "elapsed_time": "0:17:36", "remaining_time": "1:19:07", "throughput": 4274.63, "total_tokens": 4514984} {"current_steps": 6950, "total_steps": 38160, "loss": 0.4541, "lr": 0.0009796068527165107, "epoch": 3.6425576519916145, "percentage": 18.21, "elapsed_time": "0:17:36", "remaining_time": "1:19:06", "throughput": 4274.93, "total_tokens": 4518568} {"current_steps": 6955, "total_steps": 38160, "loss": 0.8077, "lr": 0.0009795421572424935, "epoch": 3.6451781970649897, "percentage": 18.23, "elapsed_time": "0:17:37", "remaining_time": "1:19:05", "throughput": 4275.1, "total_tokens": 4521832} {"current_steps": 6960, "total_steps": 38160, "loss": 0.5581, "lr": 0.0009794773614537275, "epoch": 3.647798742138365, "percentage": 18.24, "elapsed_time": "0:17:38", "remaining_time": "1:19:05", "throughput": 4275.46, "total_tokens": 4525640} {"current_steps": 6965, "total_steps": 38160, "loss": 0.4386, "lr": 0.0009794124653637677, "epoch": 3.65041928721174, "percentage": 18.25, "elapsed_time": "0:17:39", "remaining_time": "1:19:04", "throughput": 4275.98, "total_tokens": 4529608} {"current_steps": 6970, "total_steps": 38160, "loss": 0.5619, "lr": 0.00097934746898619, "epoch": 3.653039832285115, "percentage": 18.27, "elapsed_time": "0:17:39", "remaining_time": "1:19:03", "throughput": 4275.88, "total_tokens": 4532328} {"current_steps": 6975, "total_steps": 38160, "loss": 0.505, "lr": 0.00097928237233459, "epoch": 3.6556603773584904, "percentage": 18.28, "elapsed_time": "0:17:40", "remaining_time": "1:19:02", "throughput": 4275.92, "total_tokens": 4535336} {"current_steps": 6980, "total_steps": 38160, "loss": 0.3757, "lr": 0.0009792171754225859, "epoch": 3.658280922431866, "percentage": 18.29, "elapsed_time": "0:17:41", "remaining_time": "1:19:01", "throughput": 4276.12, "total_tokens": 4538760} {"current_steps": 6985, "total_steps": 38160, "loss": 0.4245, "lr": 0.0009791518782638158, "epoch": 3.660901467505241, "percentage": 18.3, "elapsed_time": "0:17:42", "remaining_time": "1:19:03", "throughput": 4277.88, "total_tokens": 4546376} {"current_steps": 6990, "total_steps": 38160, "loss": 0.4953, "lr": 0.0009790864808719392, "epoch": 3.6635220125786163, "percentage": 18.32, "elapsed_time": "0:17:43", "remaining_time": "1:19:02", "throughput": 4278.34, "total_tokens": 4550376} {"current_steps": 6995, "total_steps": 38160, "loss": 0.5907, "lr": 0.0009790209832606365, "epoch": 3.6661425576519915, "percentage": 18.33, "elapsed_time": "0:17:44", "remaining_time": "1:19:01", "throughput": 4278.48, "total_tokens": 4553736} {"current_steps": 7000, "total_steps": 38160, "loss": 0.4317, "lr": 0.000978955385443609, "epoch": 3.668763102725367, "percentage": 18.34, "elapsed_time": "0:17:45", "remaining_time": "1:19:01", "throughput": 4278.53, "total_tokens": 4556936} {"current_steps": 7005, "total_steps": 38160, "loss": 0.4601, "lr": 0.0009788896874345792, "epoch": 3.6713836477987423, "percentage": 18.36, "elapsed_time": "0:17:45", "remaining_time": "1:18:59", "throughput": 4278.49, "total_tokens": 4559816} {"current_steps": 7010, "total_steps": 38160, "loss": 0.4487, "lr": 0.0009788238892472904, "epoch": 3.6740041928721174, "percentage": 18.37, "elapsed_time": "0:17:46", "remaining_time": "1:18:59", "throughput": 4279.27, "total_tokens": 4564520} {"current_steps": 7015, "total_steps": 38160, "loss": 0.5149, "lr": 0.0009787579908955063, "epoch": 3.6766247379454926, "percentage": 18.38, "elapsed_time": "0:17:47", "remaining_time": "1:18:58", "throughput": 4279.35, "total_tokens": 4567592} {"current_steps": 7020, "total_steps": 38160, "loss": 0.4925, "lr": 0.0009786919923930127, "epoch": 3.6792452830188678, "percentage": 18.4, "elapsed_time": "0:17:48", "remaining_time": "1:18:57", "throughput": 4279.32, "total_tokens": 4570408} {"current_steps": 7025, "total_steps": 38160, "loss": 0.4551, "lr": 0.0009786258937536155, "epoch": 3.681865828092243, "percentage": 18.41, "elapsed_time": "0:17:48", "remaining_time": "1:18:56", "throughput": 4279.3, "total_tokens": 4573320} {"current_steps": 7030, "total_steps": 38160, "loss": 0.5497, "lr": 0.0009785596949911418, "epoch": 3.6844863731656186, "percentage": 18.42, "elapsed_time": "0:17:49", "remaining_time": "1:18:55", "throughput": 4279.48, "total_tokens": 4576680} {"current_steps": 7035, "total_steps": 38160, "loss": 0.4808, "lr": 0.0009784933961194395, "epoch": 3.6871069182389937, "percentage": 18.44, "elapsed_time": "0:17:50", "remaining_time": "1:18:54", "throughput": 4279.36, "total_tokens": 4579368} {"current_steps": 7040, "total_steps": 38160, "loss": 0.611, "lr": 0.0009784269971523777, "epoch": 3.689727463312369, "percentage": 18.45, "elapsed_time": "0:17:50", "remaining_time": "1:18:53", "throughput": 4279.43, "total_tokens": 4582440} {"current_steps": 7045, "total_steps": 38160, "loss": 0.4147, "lr": 0.0009783604981038463, "epoch": 3.6923480083857445, "percentage": 18.46, "elapsed_time": "0:17:51", "remaining_time": "1:18:52", "throughput": 4279.33, "total_tokens": 4585128} {"current_steps": 7050, "total_steps": 38160, "loss": 0.4583, "lr": 0.000978293898987756, "epoch": 3.6949685534591197, "percentage": 18.47, "elapsed_time": "0:17:52", "remaining_time": "1:18:51", "throughput": 4279.38, "total_tokens": 4588168} {"current_steps": 7055, "total_steps": 38160, "loss": 0.4511, "lr": 0.000978227199818039, "epoch": 3.697589098532495, "percentage": 18.49, "elapsed_time": "0:17:52", "remaining_time": "1:18:50", "throughput": 4279.47, "total_tokens": 4591400} {"current_steps": 7060, "total_steps": 38160, "loss": 0.4781, "lr": 0.0009781604006086474, "epoch": 3.70020964360587, "percentage": 18.5, "elapsed_time": "0:17:53", "remaining_time": "1:18:49", "throughput": 4279.43, "total_tokens": 4594280} {"current_steps": 7065, "total_steps": 38160, "loss": 0.3747, "lr": 0.0009780935013735553, "epoch": 3.702830188679245, "percentage": 18.51, "elapsed_time": "0:17:54", "remaining_time": "1:18:48", "throughput": 4280.0, "total_tokens": 4598536} {"current_steps": 7070, "total_steps": 38160, "loss": 0.5027, "lr": 0.0009780265021267572, "epoch": 3.7054507337526204, "percentage": 18.53, "elapsed_time": "0:17:55", "remaining_time": "1:18:48", "throughput": 4280.35, "total_tokens": 4602440} {"current_steps": 7075, "total_steps": 38160, "loss": 0.4903, "lr": 0.0009779594028822682, "epoch": 3.708071278825996, "percentage": 18.54, "elapsed_time": "0:17:55", "remaining_time": "1:18:47", "throughput": 4280.34, "total_tokens": 4605352} {"current_steps": 7080, "total_steps": 38160, "loss": 0.3695, "lr": 0.0009778922036541252, "epoch": 3.710691823899371, "percentage": 18.55, "elapsed_time": "0:17:56", "remaining_time": "1:18:47", "throughput": 4281.09, "total_tokens": 4610152} {"current_steps": 7085, "total_steps": 38160, "loss": 0.3967, "lr": 0.0009778249044563852, "epoch": 3.7133123689727463, "percentage": 18.57, "elapsed_time": "0:17:57", "remaining_time": "1:18:46", "throughput": 4281.02, "total_tokens": 4612872} {"current_steps": 7090, "total_steps": 38160, "loss": 0.5534, "lr": 0.0009777575053031263, "epoch": 3.7159329140461215, "percentage": 18.58, "elapsed_time": "0:17:58", "remaining_time": "1:18:45", "throughput": 4281.57, "total_tokens": 4617064} {"current_steps": 7095, "total_steps": 38160, "loss": 0.5525, "lr": 0.000977690006208448, "epoch": 3.718553459119497, "percentage": 18.59, "elapsed_time": "0:17:59", "remaining_time": "1:18:45", "throughput": 4282.26, "total_tokens": 4621608} {"current_steps": 7100, "total_steps": 38160, "loss": 0.4814, "lr": 0.0009776224071864703, "epoch": 3.7211740041928723, "percentage": 18.61, "elapsed_time": "0:17:59", "remaining_time": "1:18:43", "throughput": 4281.96, "total_tokens": 4623880} {"current_steps": 7105, "total_steps": 38160, "loss": 0.4466, "lr": 0.000977554708251334, "epoch": 3.7237945492662474, "percentage": 18.62, "elapsed_time": "0:18:00", "remaining_time": "1:18:43", "throughput": 4282.07, "total_tokens": 4627080} {"current_steps": 7110, "total_steps": 38160, "loss": 0.4294, "lr": 0.0009774869094172007, "epoch": 3.7264150943396226, "percentage": 18.63, "elapsed_time": "0:18:01", "remaining_time": "1:18:42", "throughput": 4282.28, "total_tokens": 4630536} {"current_steps": 7115, "total_steps": 38160, "loss": 0.5182, "lr": 0.0009774190106982537, "epoch": 3.7290356394129978, "percentage": 18.65, "elapsed_time": "0:18:01", "remaining_time": "1:18:41", "throughput": 4282.2, "total_tokens": 4633256} {"current_steps": 7120, "total_steps": 38160, "loss": 0.4746, "lr": 0.0009773510121086962, "epoch": 3.731656184486373, "percentage": 18.66, "elapsed_time": "0:18:02", "remaining_time": "1:18:39", "throughput": 4282.17, "total_tokens": 4636104} {"current_steps": 7125, "total_steps": 38160, "loss": 0.4587, "lr": 0.0009772829136627528, "epoch": 3.7342767295597485, "percentage": 18.67, "elapsed_time": "0:18:03", "remaining_time": "1:18:38", "throughput": 4282.25, "total_tokens": 4639272} {"current_steps": 7130, "total_steps": 38160, "loss": 0.3604, "lr": 0.0009772147153746691, "epoch": 3.7368972746331237, "percentage": 18.68, "elapsed_time": "0:18:04", "remaining_time": "1:18:37", "throughput": 4282.08, "total_tokens": 4641800} {"current_steps": 7135, "total_steps": 38160, "loss": 0.5978, "lr": 0.0009771464172587112, "epoch": 3.739517819706499, "percentage": 18.7, "elapsed_time": "0:18:04", "remaining_time": "1:18:36", "throughput": 4282.23, "total_tokens": 4645160} {"current_steps": 7140, "total_steps": 38160, "loss": 0.3712, "lr": 0.0009770780193291667, "epoch": 3.742138364779874, "percentage": 18.71, "elapsed_time": "0:18:05", "remaining_time": "1:18:35", "throughput": 4282.41, "total_tokens": 4648488} {"current_steps": 7145, "total_steps": 38160, "loss": 0.4317, "lr": 0.000977009521600343, "epoch": 3.7447589098532497, "percentage": 18.72, "elapsed_time": "0:18:06", "remaining_time": "1:18:35", "throughput": 4282.61, "total_tokens": 4651944} {"current_steps": 7150, "total_steps": 38160, "loss": 0.5142, "lr": 0.0009769409240865696, "epoch": 3.747379454926625, "percentage": 18.74, "elapsed_time": "0:18:07", "remaining_time": "1:18:34", "throughput": 4283.04, "total_tokens": 4655816} {"current_steps": 7155, "total_steps": 38160, "loss": 0.4404, "lr": 0.0009768722268021959, "epoch": 3.75, "percentage": 18.75, "elapsed_time": "0:18:07", "remaining_time": "1:18:33", "throughput": 4283.08, "total_tokens": 4658824} {"current_steps": 7160, "total_steps": 38160, "loss": 0.5171, "lr": 0.000976803429761593, "epoch": 3.752620545073375, "percentage": 18.76, "elapsed_time": "0:18:08", "remaining_time": "1:18:32", "throughput": 4283.38, "total_tokens": 4662440} {"current_steps": 7165, "total_steps": 38160, "loss": 0.4572, "lr": 0.000976734532979152, "epoch": 3.7552410901467503, "percentage": 18.78, "elapsed_time": "0:18:09", "remaining_time": "1:18:32", "throughput": 4283.76, "total_tokens": 4666280} {"current_steps": 7170, "total_steps": 38160, "loss": 0.3967, "lr": 0.000976665536469286, "epoch": 3.757861635220126, "percentage": 18.79, "elapsed_time": "0:18:10", "remaining_time": "1:18:31", "throughput": 4283.92, "total_tokens": 4669544} {"current_steps": 7175, "total_steps": 38160, "loss": 0.4521, "lr": 0.0009765964402464276, "epoch": 3.760482180293501, "percentage": 18.8, "elapsed_time": "0:18:10", "remaining_time": "1:18:30", "throughput": 4283.88, "total_tokens": 4672392} {"current_steps": 7180, "total_steps": 38160, "loss": 0.5575, "lr": 0.0009765272443250312, "epoch": 3.7631027253668763, "percentage": 18.82, "elapsed_time": "0:18:11", "remaining_time": "1:18:29", "throughput": 4284.51, "total_tokens": 4676872} {"current_steps": 7185, "total_steps": 38160, "loss": 0.6078, "lr": 0.0009764579487195717, "epoch": 3.7657232704402515, "percentage": 18.83, "elapsed_time": "0:18:12", "remaining_time": "1:18:29", "throughput": 4284.82, "total_tokens": 4680520} {"current_steps": 7190, "total_steps": 38160, "loss": 0.4637, "lr": 0.0009763885534445452, "epoch": 3.768343815513627, "percentage": 18.84, "elapsed_time": "0:18:13", "remaining_time": "1:18:28", "throughput": 4284.82, "total_tokens": 4683464} {"current_steps": 7195, "total_steps": 38160, "loss": 0.4517, "lr": 0.0009763190585144682, "epoch": 3.7709643605870022, "percentage": 18.85, "elapsed_time": "0:18:13", "remaining_time": "1:18:27", "throughput": 4284.94, "total_tokens": 4686728} {"current_steps": 7200, "total_steps": 38160, "loss": 0.476, "lr": 0.0009762494639438783, "epoch": 3.7735849056603774, "percentage": 18.87, "elapsed_time": "0:18:14", "remaining_time": "1:18:26", "throughput": 4285.25, "total_tokens": 4690376} {"current_steps": 7205, "total_steps": 38160, "loss": 0.4421, "lr": 0.0009761797697473339, "epoch": 3.7762054507337526, "percentage": 18.88, "elapsed_time": "0:18:15", "remaining_time": "1:18:26", "throughput": 4285.99, "total_tokens": 4695304} {"current_steps": 7210, "total_steps": 38160, "loss": 0.5524, "lr": 0.0009761099759394142, "epoch": 3.7788259958071277, "percentage": 18.89, "elapsed_time": "0:18:16", "remaining_time": "1:18:25", "throughput": 4285.98, "total_tokens": 4698216} {"current_steps": 7215, "total_steps": 38160, "loss": 0.5829, "lr": 0.0009760400825347194, "epoch": 3.781446540880503, "percentage": 18.91, "elapsed_time": "0:18:16", "remaining_time": "1:18:24", "throughput": 4286.14, "total_tokens": 4701512} {"current_steps": 7220, "total_steps": 38160, "loss": 0.5409, "lr": 0.00097597008954787, "epoch": 3.7840670859538785, "percentage": 18.92, "elapsed_time": "0:18:17", "remaining_time": "1:18:23", "throughput": 4286.26, "total_tokens": 4704744} {"current_steps": 7225, "total_steps": 38160, "loss": 0.612, "lr": 0.0009758999969935083, "epoch": 3.7866876310272537, "percentage": 18.93, "elapsed_time": "0:18:18", "remaining_time": "1:18:22", "throughput": 4286.38, "total_tokens": 4707880} {"current_steps": 7230, "total_steps": 38160, "loss": 0.4144, "lr": 0.0009758298048862965, "epoch": 3.789308176100629, "percentage": 18.95, "elapsed_time": "0:18:19", "remaining_time": "1:18:21", "throughput": 4286.49, "total_tokens": 4711080} {"current_steps": 7235, "total_steps": 38160, "loss": 0.4047, "lr": 0.0009757595132409181, "epoch": 3.791928721174004, "percentage": 18.96, "elapsed_time": "0:18:19", "remaining_time": "1:18:21", "throughput": 4286.8, "total_tokens": 4714760} {"current_steps": 7240, "total_steps": 38160, "loss": 0.4132, "lr": 0.0009756891220720771, "epoch": 3.7945492662473796, "percentage": 18.97, "elapsed_time": "0:18:20", "remaining_time": "1:18:20", "throughput": 4287.06, "total_tokens": 4718248} {"current_steps": 7245, "total_steps": 38160, "loss": 0.7935, "lr": 0.0009756186313944988, "epoch": 3.797169811320755, "percentage": 18.99, "elapsed_time": "0:18:21", "remaining_time": "1:18:19", "throughput": 4287.19, "total_tokens": 4721480} {"current_steps": 7250, "total_steps": 38160, "loss": 0.4794, "lr": 0.0009755480412229291, "epoch": 3.79979035639413, "percentage": 19.0, "elapsed_time": "0:18:21", "remaining_time": "1:18:18", "throughput": 4287.17, "total_tokens": 4724328} {"current_steps": 7255, "total_steps": 38160, "loss": 0.4169, "lr": 0.0009754773515721343, "epoch": 3.802410901467505, "percentage": 19.01, "elapsed_time": "0:18:22", "remaining_time": "1:18:17", "throughput": 4287.23, "total_tokens": 4727432} {"current_steps": 7260, "total_steps": 38160, "loss": 0.5702, "lr": 0.0009754065624569022, "epoch": 3.8050314465408803, "percentage": 19.03, "elapsed_time": "0:18:23", "remaining_time": "1:18:16", "throughput": 4287.46, "total_tokens": 4730952} {"current_steps": 7265, "total_steps": 38160, "loss": 0.5236, "lr": 0.000975335673892041, "epoch": 3.8076519916142555, "percentage": 19.04, "elapsed_time": "0:18:24", "remaining_time": "1:18:15", "throughput": 4287.38, "total_tokens": 4733704} {"current_steps": 7270, "total_steps": 38160, "loss": 0.4985, "lr": 0.0009752646858923797, "epoch": 3.810272536687631, "percentage": 19.05, "elapsed_time": "0:18:24", "remaining_time": "1:18:14", "throughput": 4287.28, "total_tokens": 4736424} {"current_steps": 7275, "total_steps": 38160, "loss": 0.456, "lr": 0.0009751935984727683, "epoch": 3.8128930817610063, "percentage": 19.06, "elapsed_time": "0:18:25", "remaining_time": "1:18:13", "throughput": 4287.49, "total_tokens": 4739944} {"current_steps": 7280, "total_steps": 38160, "loss": 0.4036, "lr": 0.0009751224116480772, "epoch": 3.8155136268343814, "percentage": 19.08, "elapsed_time": "0:18:26", "remaining_time": "1:18:12", "throughput": 4287.81, "total_tokens": 4743656} {"current_steps": 7285, "total_steps": 38160, "loss": 0.4539, "lr": 0.0009750511254331982, "epoch": 3.818134171907757, "percentage": 19.09, "elapsed_time": "0:18:26", "remaining_time": "1:18:11", "throughput": 4287.74, "total_tokens": 4746440} {"current_steps": 7290, "total_steps": 38160, "loss": 0.4757, "lr": 0.0009749797398430433, "epoch": 3.8207547169811322, "percentage": 19.1, "elapsed_time": "0:18:27", "remaining_time": "1:18:10", "throughput": 4287.87, "total_tokens": 4749672} {"current_steps": 7295, "total_steps": 38160, "loss": 0.5758, "lr": 0.0009749082548925459, "epoch": 3.8233752620545074, "percentage": 19.12, "elapsed_time": "0:18:28", "remaining_time": "1:18:09", "throughput": 4288.12, "total_tokens": 4753224} {"current_steps": 7300, "total_steps": 38160, "loss": 0.4205, "lr": 0.0009748366705966593, "epoch": 3.8259958071278826, "percentage": 19.13, "elapsed_time": "0:18:29", "remaining_time": "1:18:08", "throughput": 4288.07, "total_tokens": 4756072} {"current_steps": 7305, "total_steps": 38160, "loss": 0.418, "lr": 0.0009747649869703588, "epoch": 3.8286163522012577, "percentage": 19.14, "elapsed_time": "0:18:29", "remaining_time": "1:18:07", "throughput": 4288.23, "total_tokens": 4759368} {"current_steps": 7310, "total_steps": 38160, "loss": 0.5881, "lr": 0.0009746932040286391, "epoch": 3.831236897274633, "percentage": 19.16, "elapsed_time": "0:18:30", "remaining_time": "1:18:06", "throughput": 4288.24, "total_tokens": 4762280} {"current_steps": 7315, "total_steps": 38160, "loss": 0.4295, "lr": 0.000974621321786517, "epoch": 3.8338574423480085, "percentage": 19.17, "elapsed_time": "0:18:31", "remaining_time": "1:18:05", "throughput": 4288.32, "total_tokens": 4765544} {"current_steps": 7320, "total_steps": 38160, "loss": 0.4743, "lr": 0.000974549340259029, "epoch": 3.8364779874213837, "percentage": 19.18, "elapsed_time": "0:18:31", "remaining_time": "1:18:04", "throughput": 4288.27, "total_tokens": 4768424} {"current_steps": 7325, "total_steps": 38160, "loss": 0.4627, "lr": 0.000974477259461233, "epoch": 3.839098532494759, "percentage": 19.2, "elapsed_time": "0:18:32", "remaining_time": "1:18:03", "throughput": 4288.32, "total_tokens": 4771464} {"current_steps": 7330, "total_steps": 38160, "loss": 0.4337, "lr": 0.0009744050794082074, "epoch": 3.841719077568134, "percentage": 19.21, "elapsed_time": "0:18:33", "remaining_time": "1:18:03", "throughput": 4288.64, "total_tokens": 4775208} {"current_steps": 7335, "total_steps": 38160, "loss": 0.3622, "lr": 0.0009743328001150515, "epoch": 3.8443396226415096, "percentage": 19.22, "elapsed_time": "0:18:34", "remaining_time": "1:18:01", "throughput": 4288.48, "total_tokens": 4777768} {"current_steps": 7340, "total_steps": 38160, "loss": 0.4101, "lr": 0.0009742604215968853, "epoch": 3.846960167714885, "percentage": 19.23, "elapsed_time": "0:18:34", "remaining_time": "1:18:01", "throughput": 4288.99, "total_tokens": 4781864} {"current_steps": 7345, "total_steps": 38160, "loss": 0.405, "lr": 0.0009741879438688495, "epoch": 3.84958071278826, "percentage": 19.25, "elapsed_time": "0:18:35", "remaining_time": "1:18:00", "throughput": 4289.17, "total_tokens": 4785352} {"current_steps": 7350, "total_steps": 38160, "loss": 0.4652, "lr": 0.0009741153669461058, "epoch": 3.852201257861635, "percentage": 19.26, "elapsed_time": "0:18:36", "remaining_time": "1:17:59", "throughput": 4288.98, "total_tokens": 4787848} {"current_steps": 7355, "total_steps": 38160, "loss": 0.3329, "lr": 0.0009740426908438362, "epoch": 3.8548218029350103, "percentage": 19.27, "elapsed_time": "0:18:37", "remaining_time": "1:17:58", "throughput": 4289.05, "total_tokens": 4790952} {"current_steps": 7360, "total_steps": 38160, "loss": 0.2973, "lr": 0.0009739699155772439, "epoch": 3.8574423480083855, "percentage": 19.29, "elapsed_time": "0:18:37", "remaining_time": "1:17:57", "throughput": 4289.43, "total_tokens": 4794824} {"current_steps": 7365, "total_steps": 38160, "loss": 0.4267, "lr": 0.0009738970411615525, "epoch": 3.860062893081761, "percentage": 19.3, "elapsed_time": "0:18:38", "remaining_time": "1:17:57", "throughput": 4289.52, "total_tokens": 4798120} {"current_steps": 7370, "total_steps": 38160, "loss": 0.4385, "lr": 0.0009738240676120067, "epoch": 3.8626834381551363, "percentage": 19.31, "elapsed_time": "0:18:39", "remaining_time": "1:17:56", "throughput": 4289.8, "total_tokens": 4801704} {"current_steps": 7375, "total_steps": 38160, "loss": 0.6351, "lr": 0.0009737509949438717, "epoch": 3.8653039832285114, "percentage": 19.33, "elapsed_time": "0:18:40", "remaining_time": "1:17:55", "throughput": 4289.88, "total_tokens": 4804776} {"current_steps": 7380, "total_steps": 38160, "loss": 0.6406, "lr": 0.0009736778231724333, "epoch": 3.867924528301887, "percentage": 19.34, "elapsed_time": "0:18:40", "remaining_time": "1:17:54", "throughput": 4289.76, "total_tokens": 4807496} {"current_steps": 7385, "total_steps": 38160, "loss": 0.4659, "lr": 0.0009736045523129982, "epoch": 3.870545073375262, "percentage": 19.35, "elapsed_time": "0:18:41", "remaining_time": "1:17:52", "throughput": 4289.65, "total_tokens": 4810152} {"current_steps": 7390, "total_steps": 38160, "loss": 0.3608, "lr": 0.0009735311823808938, "epoch": 3.8731656184486374, "percentage": 19.37, "elapsed_time": "0:18:42", "remaining_time": "1:17:52", "throughput": 4289.91, "total_tokens": 4813736} {"current_steps": 7395, "total_steps": 38160, "loss": 0.5668, "lr": 0.0009734577133914687, "epoch": 3.8757861635220126, "percentage": 19.38, "elapsed_time": "0:18:42", "remaining_time": "1:17:51", "throughput": 4290.03, "total_tokens": 4816904} {"current_steps": 7400, "total_steps": 38160, "loss": 0.4104, "lr": 0.0009733841453600914, "epoch": 3.8784067085953877, "percentage": 19.39, "elapsed_time": "0:18:43", "remaining_time": "1:17:50", "throughput": 4290.12, "total_tokens": 4820168} {"current_steps": 7405, "total_steps": 38160, "loss": 0.6474, "lr": 0.0009733104783021515, "epoch": 3.881027253668763, "percentage": 19.41, "elapsed_time": "0:18:44", "remaining_time": "1:17:49", "throughput": 4290.15, "total_tokens": 4823176} {"current_steps": 7410, "total_steps": 38160, "loss": 0.4528, "lr": 0.0009732367122330593, "epoch": 3.8836477987421385, "percentage": 19.42, "elapsed_time": "0:18:44", "remaining_time": "1:17:48", "throughput": 4290.24, "total_tokens": 4826344} {"current_steps": 7415, "total_steps": 38160, "loss": 0.4533, "lr": 0.0009731628471682459, "epoch": 3.8862683438155137, "percentage": 19.43, "elapsed_time": "0:18:45", "remaining_time": "1:17:47", "throughput": 4290.56, "total_tokens": 4830120} {"current_steps": 7420, "total_steps": 38160, "loss": 0.4436, "lr": 0.000973088883123163, "epoch": 3.888888888888889, "percentage": 19.44, "elapsed_time": "0:18:46", "remaining_time": "1:17:46", "throughput": 4290.73, "total_tokens": 4833576} {"current_steps": 7425, "total_steps": 38160, "loss": 0.3908, "lr": 0.0009730148201132829, "epoch": 3.891509433962264, "percentage": 19.46, "elapsed_time": "0:18:47", "remaining_time": "1:17:46", "throughput": 4290.76, "total_tokens": 4836776} {"current_steps": 7430, "total_steps": 38160, "loss": 0.6002, "lr": 0.0009729406581540991, "epoch": 3.8941299790356396, "percentage": 19.47, "elapsed_time": "0:18:48", "remaining_time": "1:17:45", "throughput": 4291.18, "total_tokens": 4840808} {"current_steps": 7435, "total_steps": 38160, "loss": 0.5569, "lr": 0.0009728663972611251, "epoch": 3.896750524109015, "percentage": 19.48, "elapsed_time": "0:18:49", "remaining_time": "1:17:46", "throughput": 4292.54, "total_tokens": 4847624} {"current_steps": 7440, "total_steps": 38160, "loss": 0.5714, "lr": 0.0009727920374498955, "epoch": 3.89937106918239, "percentage": 19.5, "elapsed_time": "0:18:49", "remaining_time": "1:17:45", "throughput": 4292.5, "total_tokens": 4850504} {"current_steps": 7445, "total_steps": 38160, "loss": 0.3912, "lr": 0.0009727175787359656, "epoch": 3.901991614255765, "percentage": 19.51, "elapsed_time": "0:18:50", "remaining_time": "1:17:44", "throughput": 4292.52, "total_tokens": 4853448} {"current_steps": 7450, "total_steps": 38160, "loss": 0.4788, "lr": 0.0009726430211349113, "epoch": 3.9046121593291403, "percentage": 19.52, "elapsed_time": "0:18:51", "remaining_time": "1:17:43", "throughput": 4292.36, "total_tokens": 4856040} {"current_steps": 7455, "total_steps": 38160, "loss": 0.5021, "lr": 0.0009725683646623291, "epoch": 3.9072327044025155, "percentage": 19.54, "elapsed_time": "0:18:52", "remaining_time": "1:17:42", "throughput": 4292.76, "total_tokens": 4859976} {"current_steps": 7460, "total_steps": 38160, "loss": 0.4916, "lr": 0.0009724936093338365, "epoch": 3.909853249475891, "percentage": 19.55, "elapsed_time": "0:18:52", "remaining_time": "1:17:42", "throughput": 4292.91, "total_tokens": 4863304} {"current_steps": 7465, "total_steps": 38160, "loss": 0.6107, "lr": 0.0009724187551650712, "epoch": 3.9124737945492662, "percentage": 19.56, "elapsed_time": "0:18:53", "remaining_time": "1:17:41", "throughput": 4292.96, "total_tokens": 4866568} {"current_steps": 7470, "total_steps": 38160, "loss": 0.5308, "lr": 0.0009723438021716919, "epoch": 3.9150943396226414, "percentage": 19.58, "elapsed_time": "0:18:54", "remaining_time": "1:17:40", "throughput": 4293.25, "total_tokens": 4870312} {"current_steps": 7475, "total_steps": 38160, "loss": 0.6377, "lr": 0.0009722687503693782, "epoch": 3.917714884696017, "percentage": 19.59, "elapsed_time": "0:18:55", "remaining_time": "1:17:39", "throughput": 4293.51, "total_tokens": 4873864} {"current_steps": 7480, "total_steps": 38160, "loss": 0.5481, "lr": 0.0009721935997738296, "epoch": 3.920335429769392, "percentage": 19.6, "elapsed_time": "0:18:55", "remaining_time": "1:17:38", "throughput": 4293.62, "total_tokens": 4877032} {"current_steps": 7485, "total_steps": 38160, "loss": 0.5004, "lr": 0.0009721183504007671, "epoch": 3.9229559748427674, "percentage": 19.61, "elapsed_time": "0:18:56", "remaining_time": "1:17:37", "throughput": 4293.69, "total_tokens": 4880136} {"current_steps": 7490, "total_steps": 38160, "loss": 0.4855, "lr": 0.0009720430022659319, "epoch": 3.9255765199161425, "percentage": 19.63, "elapsed_time": "0:18:57", "remaining_time": "1:17:37", "throughput": 4294.0, "total_tokens": 4883720} {"current_steps": 7495, "total_steps": 38160, "loss": 0.5803, "lr": 0.000971967555385086, "epoch": 3.9281970649895177, "percentage": 19.64, "elapsed_time": "0:18:57", "remaining_time": "1:17:35", "throughput": 4293.89, "total_tokens": 4886440} {"current_steps": 7500, "total_steps": 38160, "loss": 0.4955, "lr": 0.000971892009774012, "epoch": 3.930817610062893, "percentage": 19.65, "elapsed_time": "0:18:58", "remaining_time": "1:17:34", "throughput": 4293.7, "total_tokens": 4888936} {"current_steps": 7505, "total_steps": 38160, "loss": 0.5093, "lr": 0.0009718163654485133, "epoch": 3.9334381551362685, "percentage": 19.67, "elapsed_time": "0:18:59", "remaining_time": "1:17:33", "throughput": 4293.29, "total_tokens": 4890952} {"current_steps": 7510, "total_steps": 38160, "loss": 0.5502, "lr": 0.0009717406224244136, "epoch": 3.9360587002096437, "percentage": 19.68, "elapsed_time": "0:18:59", "remaining_time": "1:17:32", "throughput": 4293.22, "total_tokens": 4893736} {"current_steps": 7515, "total_steps": 38160, "loss": 0.5686, "lr": 0.0009716647807175575, "epoch": 3.938679245283019, "percentage": 19.69, "elapsed_time": "0:19:00", "remaining_time": "1:17:31", "throughput": 4293.5, "total_tokens": 4897384} {"current_steps": 7520, "total_steps": 38160, "loss": 0.4949, "lr": 0.0009715888403438105, "epoch": 3.941299790356394, "percentage": 19.71, "elapsed_time": "0:19:01", "remaining_time": "1:17:30", "throughput": 4293.65, "total_tokens": 4900808} {"current_steps": 7525, "total_steps": 38160, "loss": 0.7748, "lr": 0.0009715128013190581, "epoch": 3.9439203354297696, "percentage": 19.72, "elapsed_time": "0:19:02", "remaining_time": "1:17:29", "throughput": 4293.56, "total_tokens": 4903592} {"current_steps": 7530, "total_steps": 38160, "loss": 0.4723, "lr": 0.0009714366636592069, "epoch": 3.9465408805031448, "percentage": 19.73, "elapsed_time": "0:19:02", "remaining_time": "1:17:28", "throughput": 4293.77, "total_tokens": 4907048} {"current_steps": 7535, "total_steps": 38160, "loss": 0.484, "lr": 0.0009713604273801844, "epoch": 3.94916142557652, "percentage": 19.75, "elapsed_time": "0:19:03", "remaining_time": "1:17:27", "throughput": 4293.71, "total_tokens": 4909960} {"current_steps": 7540, "total_steps": 38160, "loss": 0.366, "lr": 0.0009712840924979378, "epoch": 3.951781970649895, "percentage": 19.76, "elapsed_time": "0:19:04", "remaining_time": "1:17:27", "throughput": 4294.02, "total_tokens": 4913768} {"current_steps": 7545, "total_steps": 38160, "loss": 0.5326, "lr": 0.0009712076590284357, "epoch": 3.9544025157232703, "percentage": 19.77, "elapsed_time": "0:19:05", "remaining_time": "1:17:26", "throughput": 4294.3, "total_tokens": 4917416} {"current_steps": 7550, "total_steps": 38160, "loss": 0.3757, "lr": 0.0009711311269876674, "epoch": 3.9570230607966455, "percentage": 19.79, "elapsed_time": "0:19:06", "remaining_time": "1:17:26", "throughput": 4294.92, "total_tokens": 4922056} {"current_steps": 7555, "total_steps": 38160, "loss": 0.5003, "lr": 0.0009710544963916421, "epoch": 3.959643605870021, "percentage": 19.8, "elapsed_time": "0:19:06", "remaining_time": "1:17:25", "throughput": 4295.0, "total_tokens": 4925320} {"current_steps": 7560, "total_steps": 38160, "loss": 0.6686, "lr": 0.0009709777672563903, "epoch": 3.9622641509433962, "percentage": 19.81, "elapsed_time": "0:19:07", "remaining_time": "1:17:24", "throughput": 4294.97, "total_tokens": 4928168} {"current_steps": 7565, "total_steps": 38160, "loss": 0.4528, "lr": 0.0009709009395979628, "epoch": 3.9648846960167714, "percentage": 19.82, "elapsed_time": "0:19:08", "remaining_time": "1:17:23", "throughput": 4294.95, "total_tokens": 4931176} {"current_steps": 7570, "total_steps": 38160, "loss": 0.4192, "lr": 0.0009708240134324311, "epoch": 3.967505241090147, "percentage": 19.84, "elapsed_time": "0:19:08", "remaining_time": "1:17:22", "throughput": 4295.39, "total_tokens": 4935304} {"current_steps": 7575, "total_steps": 38160, "loss": 0.5299, "lr": 0.0009707469887758871, "epoch": 3.970125786163522, "percentage": 19.85, "elapsed_time": "0:19:09", "remaining_time": "1:17:22", "throughput": 4295.55, "total_tokens": 4938600} {"current_steps": 7580, "total_steps": 38160, "loss": 0.4068, "lr": 0.0009706698656444437, "epoch": 3.9727463312368974, "percentage": 19.86, "elapsed_time": "0:19:10", "remaining_time": "1:17:20", "throughput": 4295.55, "total_tokens": 4941512} {"current_steps": 7585, "total_steps": 38160, "loss": 0.4638, "lr": 0.000970592644054234, "epoch": 3.9753668763102725, "percentage": 19.88, "elapsed_time": "0:19:11", "remaining_time": "1:17:20", "throughput": 4295.65, "total_tokens": 4944744} {"current_steps": 7590, "total_steps": 38160, "loss": 0.4887, "lr": 0.000970515324021412, "epoch": 3.9779874213836477, "percentage": 19.89, "elapsed_time": "0:19:11", "remaining_time": "1:17:19", "throughput": 4295.8, "total_tokens": 4948072} {"current_steps": 7595, "total_steps": 38160, "loss": 0.5549, "lr": 0.0009704379055621523, "epoch": 3.980607966457023, "percentage": 19.9, "elapsed_time": "0:19:12", "remaining_time": "1:17:18", "throughput": 4296.04, "total_tokens": 4951656} {"current_steps": 7600, "total_steps": 38160, "loss": 0.3052, "lr": 0.0009703603886926497, "epoch": 3.9832285115303985, "percentage": 19.92, "elapsed_time": "0:19:13", "remaining_time": "1:17:17", "throughput": 4296.37, "total_tokens": 4955400} {"current_steps": 7605, "total_steps": 38160, "loss": 0.428, "lr": 0.0009702827734291198, "epoch": 3.9858490566037736, "percentage": 19.93, "elapsed_time": "0:19:14", "remaining_time": "1:17:16", "throughput": 4296.44, "total_tokens": 4958568} {"current_steps": 7610, "total_steps": 38160, "loss": 0.4542, "lr": 0.0009702050597877992, "epoch": 3.988469601677149, "percentage": 19.94, "elapsed_time": "0:19:14", "remaining_time": "1:17:15", "throughput": 4296.47, "total_tokens": 4961608} {"current_steps": 7615, "total_steps": 38160, "loss": 0.4521, "lr": 0.0009701272477849444, "epoch": 3.991090146750524, "percentage": 19.96, "elapsed_time": "0:19:15", "remaining_time": "1:17:15", "throughput": 4296.74, "total_tokens": 4965288} {"current_steps": 7620, "total_steps": 38160, "loss": 0.4247, "lr": 0.0009700493374368327, "epoch": 3.9937106918238996, "percentage": 19.97, "elapsed_time": "0:19:16", "remaining_time": "1:17:14", "throughput": 4296.8, "total_tokens": 4968424} {"current_steps": 7625, "total_steps": 38160, "loss": 0.4994, "lr": 0.0009699713287597624, "epoch": 3.9963312368972748, "percentage": 19.98, "elapsed_time": "0:19:17", "remaining_time": "1:17:13", "throughput": 4297.08, "total_tokens": 4972200} {"current_steps": 7630, "total_steps": 38160, "loss": 0.515, "lr": 0.0009698932217700518, "epoch": 3.99895178197065, "percentage": 19.99, "elapsed_time": "0:19:17", "remaining_time": "1:17:12", "throughput": 4297.23, "total_tokens": 4975560} {"current_steps": 7632, "total_steps": 38160, "eval_loss": 0.4608750343322754, "epoch": 4.0, "percentage": 20.0, "elapsed_time": "0:19:31", "remaining_time": "1:18:07", "throughput": 4246.33, "total_tokens": 4976128} {"current_steps": 7635, "total_steps": 38160, "loss": 0.4732, "lr": 0.0009698150164840399, "epoch": 4.001572327044025, "percentage": 20.01, "elapsed_time": "0:19:33", "remaining_time": "1:18:13", "throughput": 4240.78, "total_tokens": 4977984} {"current_steps": 7640, "total_steps": 38160, "loss": 0.3771, "lr": 0.0009697367129180866, "epoch": 4.0041928721174, "percentage": 20.02, "elapsed_time": "0:19:34", "remaining_time": "1:18:11", "throughput": 4240.76, "total_tokens": 4980896} {"current_steps": 7645, "total_steps": 38160, "loss": 0.4093, "lr": 0.000969658311088572, "epoch": 4.006813417190775, "percentage": 20.03, "elapsed_time": "0:19:35", "remaining_time": "1:18:11", "throughput": 4241.04, "total_tokens": 4984512} {"current_steps": 7650, "total_steps": 38160, "loss": 0.4575, "lr": 0.0009695798110118969, "epoch": 4.009433962264151, "percentage": 20.05, "elapsed_time": "0:19:36", "remaining_time": "1:18:10", "throughput": 4241.36, "total_tokens": 4988320} {"current_steps": 7655, "total_steps": 38160, "loss": 0.6352, "lr": 0.0009695012127044824, "epoch": 4.012054507337526, "percentage": 20.06, "elapsed_time": "0:19:36", "remaining_time": "1:18:09", "throughput": 4241.44, "total_tokens": 4991392} {"current_steps": 7660, "total_steps": 38160, "loss": 0.4822, "lr": 0.0009694225161827707, "epoch": 4.014675052410902, "percentage": 20.07, "elapsed_time": "0:19:37", "remaining_time": "1:18:09", "throughput": 4241.96, "total_tokens": 4995680} {"current_steps": 7665, "total_steps": 38160, "loss": 0.5754, "lr": 0.0009693437214632241, "epoch": 4.017295597484277, "percentage": 20.09, "elapsed_time": "0:19:38", "remaining_time": "1:18:08", "throughput": 4242.31, "total_tokens": 4999424} {"current_steps": 7670, "total_steps": 38160, "loss": 0.5263, "lr": 0.0009692648285623256, "epoch": 4.019916142557652, "percentage": 20.1, "elapsed_time": "0:19:39", "remaining_time": "1:18:07", "throughput": 4242.25, "total_tokens": 5002272} {"current_steps": 7675, "total_steps": 38160, "loss": 0.409, "lr": 0.0009691858374965784, "epoch": 4.022536687631027, "percentage": 20.11, "elapsed_time": "0:19:39", "remaining_time": "1:18:06", "throughput": 4242.5, "total_tokens": 5005888} {"current_steps": 7680, "total_steps": 38160, "loss": 0.3479, "lr": 0.0009691067482825069, "epoch": 4.0251572327044025, "percentage": 20.13, "elapsed_time": "0:19:40", "remaining_time": "1:18:06", "throughput": 4242.78, "total_tokens": 5009600} {"current_steps": 7685, "total_steps": 38160, "loss": 0.4309, "lr": 0.0009690275609366554, "epoch": 4.027777777777778, "percentage": 20.14, "elapsed_time": "0:19:41", "remaining_time": "1:18:05", "throughput": 4243.21, "total_tokens": 5013568} {"current_steps": 7690, "total_steps": 38160, "loss": 0.4858, "lr": 0.0009689482754755891, "epoch": 4.030398322851153, "percentage": 20.15, "elapsed_time": "0:19:42", "remaining_time": "1:18:04", "throughput": 4243.32, "total_tokens": 5016800} {"current_steps": 7695, "total_steps": 38160, "loss": 0.5316, "lr": 0.0009688688919158938, "epoch": 4.033018867924528, "percentage": 20.17, "elapsed_time": "0:19:43", "remaining_time": "1:18:03", "throughput": 4243.44, "total_tokens": 5020032} {"current_steps": 7700, "total_steps": 38160, "loss": 0.4836, "lr": 0.0009687894102741754, "epoch": 4.035639412997903, "percentage": 20.18, "elapsed_time": "0:19:43", "remaining_time": "1:18:02", "throughput": 4243.52, "total_tokens": 5023168} {"current_steps": 7705, "total_steps": 38160, "loss": 0.3718, "lr": 0.0009687098305670605, "epoch": 4.038259958071279, "percentage": 20.19, "elapsed_time": "0:19:44", "remaining_time": "1:18:01", "throughput": 4243.92, "total_tokens": 5027040} {"current_steps": 7710, "total_steps": 38160, "loss": 0.6156, "lr": 0.0009686301528111964, "epoch": 4.040880503144654, "percentage": 20.2, "elapsed_time": "0:19:45", "remaining_time": "1:18:01", "throughput": 4243.93, "total_tokens": 5030112} {"current_steps": 7715, "total_steps": 38160, "loss": 0.3784, "lr": 0.0009685503770232507, "epoch": 4.04350104821803, "percentage": 20.22, "elapsed_time": "0:19:46", "remaining_time": "1:18:00", "throughput": 4244.11, "total_tokens": 5033600} {"current_steps": 7720, "total_steps": 38160, "loss": 0.2836, "lr": 0.0009684705032199117, "epoch": 4.046121593291405, "percentage": 20.23, "elapsed_time": "0:19:46", "remaining_time": "1:17:59", "throughput": 4244.06, "total_tokens": 5036416} {"current_steps": 7725, "total_steps": 38160, "loss": 0.5517, "lr": 0.0009683905314178881, "epoch": 4.04874213836478, "percentage": 20.24, "elapsed_time": "0:19:47", "remaining_time": "1:17:58", "throughput": 4244.18, "total_tokens": 5039552} {"current_steps": 7730, "total_steps": 38160, "loss": 0.4939, "lr": 0.000968310461633909, "epoch": 4.051362683438155, "percentage": 20.26, "elapsed_time": "0:19:48", "remaining_time": "1:17:57", "throughput": 4244.77, "total_tokens": 5044032} {"current_steps": 7735, "total_steps": 38160, "loss": 0.3713, "lr": 0.0009682302938847238, "epoch": 4.05398322851153, "percentage": 20.27, "elapsed_time": "0:19:49", "remaining_time": "1:17:56", "throughput": 4244.9, "total_tokens": 5047232} {"current_steps": 7740, "total_steps": 38160, "loss": 0.5267, "lr": 0.0009681500281871031, "epoch": 4.056603773584905, "percentage": 20.28, "elapsed_time": "0:19:49", "remaining_time": "1:17:56", "throughput": 4245.1, "total_tokens": 5050624} {"current_steps": 7745, "total_steps": 38160, "loss": 0.4549, "lr": 0.0009680696645578377, "epoch": 4.059224318658281, "percentage": 20.3, "elapsed_time": "0:19:50", "remaining_time": "1:17:55", "throughput": 4245.69, "total_tokens": 5055008} {"current_steps": 7750, "total_steps": 38160, "loss": 0.4513, "lr": 0.0009679892030137382, "epoch": 4.061844863731656, "percentage": 20.31, "elapsed_time": "0:19:51", "remaining_time": "1:17:54", "throughput": 4245.79, "total_tokens": 5058240} {"current_steps": 7755, "total_steps": 38160, "loss": 0.3369, "lr": 0.0009679086435716368, "epoch": 4.064465408805032, "percentage": 20.32, "elapsed_time": "0:19:52", "remaining_time": "1:17:53", "throughput": 4245.66, "total_tokens": 5060864} {"current_steps": 7760, "total_steps": 38160, "loss": 0.5655, "lr": 0.0009678279862483852, "epoch": 4.067085953878407, "percentage": 20.34, "elapsed_time": "0:19:52", "remaining_time": "1:17:52", "throughput": 4245.9, "total_tokens": 5064384} {"current_steps": 7765, "total_steps": 38160, "loss": 0.4359, "lr": 0.0009677472310608561, "epoch": 4.069706498951782, "percentage": 20.35, "elapsed_time": "0:19:53", "remaining_time": "1:17:52", "throughput": 4246.19, "total_tokens": 5068096} {"current_steps": 7770, "total_steps": 38160, "loss": 0.524, "lr": 0.0009676663780259427, "epoch": 4.072327044025157, "percentage": 20.36, "elapsed_time": "0:19:54", "remaining_time": "1:17:50", "throughput": 4246.15, "total_tokens": 5070944} {"current_steps": 7775, "total_steps": 38160, "loss": 0.5017, "lr": 0.0009675854271605583, "epoch": 4.0749475890985325, "percentage": 20.37, "elapsed_time": "0:19:55", "remaining_time": "1:17:50", "throughput": 4246.44, "total_tokens": 5074624} {"current_steps": 7780, "total_steps": 38160, "loss": 0.5619, "lr": 0.0009675043784816371, "epoch": 4.077568134171908, "percentage": 20.39, "elapsed_time": "0:19:55", "remaining_time": "1:17:49", "throughput": 4246.25, "total_tokens": 5077216} {"current_steps": 7785, "total_steps": 38160, "loss": 0.5168, "lr": 0.0009674232320061336, "epoch": 4.080188679245283, "percentage": 20.4, "elapsed_time": "0:19:56", "remaining_time": "1:17:47", "throughput": 4246.13, "total_tokens": 5079872} {"current_steps": 7790, "total_steps": 38160, "loss": 0.5498, "lr": 0.0009673419877510226, "epoch": 4.082809224318658, "percentage": 20.41, "elapsed_time": "0:19:57", "remaining_time": "1:17:46", "throughput": 4246.03, "total_tokens": 5082592} {"current_steps": 7795, "total_steps": 38160, "loss": 0.4107, "lr": 0.0009672606457332994, "epoch": 4.085429769392033, "percentage": 20.43, "elapsed_time": "0:19:57", "remaining_time": "1:17:45", "throughput": 4246.26, "total_tokens": 5086144} {"current_steps": 7800, "total_steps": 38160, "loss": 0.3619, "lr": 0.0009671792059699798, "epoch": 4.088050314465409, "percentage": 20.44, "elapsed_time": "0:19:58", "remaining_time": "1:17:45", "throughput": 4246.53, "total_tokens": 5089696} {"current_steps": 7805, "total_steps": 38160, "loss": 0.4513, "lr": 0.0009670976684781003, "epoch": 4.090670859538784, "percentage": 20.45, "elapsed_time": "0:19:59", "remaining_time": "1:17:44", "throughput": 4246.54, "total_tokens": 5092672} {"current_steps": 7810, "total_steps": 38160, "loss": 0.4722, "lr": 0.0009670160332747174, "epoch": 4.09329140461216, "percentage": 20.47, "elapsed_time": "0:19:59", "remaining_time": "1:17:42", "throughput": 4246.23, "total_tokens": 5094848} {"current_steps": 7815, "total_steps": 38160, "loss": 0.3624, "lr": 0.0009669343003769085, "epoch": 4.095911949685535, "percentage": 20.48, "elapsed_time": "0:20:00", "remaining_time": "1:17:41", "throughput": 4246.07, "total_tokens": 5097408} {"current_steps": 7820, "total_steps": 38160, "loss": 0.4902, "lr": 0.0009668524698017709, "epoch": 4.09853249475891, "percentage": 20.49, "elapsed_time": "0:20:01", "remaining_time": "1:17:40", "throughput": 4245.9, "total_tokens": 5099872} {"current_steps": 7825, "total_steps": 38160, "loss": 0.5524, "lr": 0.0009667705415664227, "epoch": 4.101153039832285, "percentage": 20.51, "elapsed_time": "0:20:01", "remaining_time": "1:17:39", "throughput": 4246.13, "total_tokens": 5103392} {"current_steps": 7830, "total_steps": 38160, "loss": 0.4388, "lr": 0.0009666885156880026, "epoch": 4.10377358490566, "percentage": 20.52, "elapsed_time": "0:20:02", "remaining_time": "1:17:37", "throughput": 4245.9, "total_tokens": 5105696} {"current_steps": 7835, "total_steps": 38160, "loss": 0.5564, "lr": 0.0009666063921836692, "epoch": 4.106394129979035, "percentage": 20.53, "elapsed_time": "0:20:03", "remaining_time": "1:17:37", "throughput": 4246.15, "total_tokens": 5109312} {"current_steps": 7840, "total_steps": 38160, "loss": 0.5581, "lr": 0.0009665241710706019, "epoch": 4.109014675052411, "percentage": 20.55, "elapsed_time": "0:20:03", "remaining_time": "1:17:35", "throughput": 4245.99, "total_tokens": 5111840} {"current_steps": 7845, "total_steps": 38160, "loss": 0.5677, "lr": 0.0009664418523660003, "epoch": 4.111635220125786, "percentage": 20.56, "elapsed_time": "0:20:04", "remaining_time": "1:17:34", "throughput": 4245.99, "total_tokens": 5114752} {"current_steps": 7850, "total_steps": 38160, "loss": 0.5428, "lr": 0.0009663594360870847, "epoch": 4.114255765199162, "percentage": 20.57, "elapsed_time": "0:20:05", "remaining_time": "1:17:33", "throughput": 4246.0, "total_tokens": 5117760} {"current_steps": 7855, "total_steps": 38160, "loss": 0.5209, "lr": 0.0009662769222510955, "epoch": 4.116876310272537, "percentage": 20.58, "elapsed_time": "0:20:06", "remaining_time": "1:17:33", "throughput": 4246.53, "total_tokens": 5122176} {"current_steps": 7860, "total_steps": 38160, "loss": 0.8199, "lr": 0.0009661943108752939, "epoch": 4.119496855345912, "percentage": 20.6, "elapsed_time": "0:20:06", "remaining_time": "1:17:32", "throughput": 4246.19, "total_tokens": 5124256} {"current_steps": 7865, "total_steps": 38160, "loss": 0.5559, "lr": 0.0009661116019769609, "epoch": 4.122117400419287, "percentage": 20.61, "elapsed_time": "0:20:07", "remaining_time": "1:17:30", "throughput": 4246.08, "total_tokens": 5126912} {"current_steps": 7870, "total_steps": 38160, "loss": 0.5484, "lr": 0.0009660287955733986, "epoch": 4.1247379454926625, "percentage": 20.62, "elapsed_time": "0:20:08", "remaining_time": "1:17:29", "throughput": 4246.21, "total_tokens": 5130144} {"current_steps": 7875, "total_steps": 38160, "loss": 0.4658, "lr": 0.0009659458916819289, "epoch": 4.127358490566038, "percentage": 20.64, "elapsed_time": "0:20:08", "remaining_time": "1:17:29", "throughput": 4246.31, "total_tokens": 5133440} {"current_steps": 7880, "total_steps": 38160, "loss": 0.552, "lr": 0.0009658628903198945, "epoch": 4.129979035639413, "percentage": 20.65, "elapsed_time": "0:20:10", "remaining_time": "1:17:30", "throughput": 4247.47, "total_tokens": 5140064} {"current_steps": 7885, "total_steps": 38160, "loss": 0.5201, "lr": 0.0009657797915046583, "epoch": 4.132599580712788, "percentage": 20.66, "elapsed_time": "0:20:10", "remaining_time": "1:17:28", "throughput": 4247.39, "total_tokens": 5142720} {"current_steps": 7890, "total_steps": 38160, "loss": 0.4648, "lr": 0.0009656965952536036, "epoch": 4.135220125786163, "percentage": 20.68, "elapsed_time": "0:20:11", "remaining_time": "1:17:27", "throughput": 4247.36, "total_tokens": 5145632} {"current_steps": 7895, "total_steps": 38160, "loss": 0.4251, "lr": 0.0009656133015841342, "epoch": 4.137840670859539, "percentage": 20.69, "elapsed_time": "0:20:12", "remaining_time": "1:17:26", "throughput": 4247.23, "total_tokens": 5148224} {"current_steps": 7900, "total_steps": 38160, "loss": 0.5702, "lr": 0.000965529910513674, "epoch": 4.140461215932914, "percentage": 20.7, "elapsed_time": "0:20:12", "remaining_time": "1:17:26", "throughput": 4247.59, "total_tokens": 5152096} {"current_steps": 7905, "total_steps": 38160, "loss": 0.5996, "lr": 0.0009654464220596676, "epoch": 4.1430817610062896, "percentage": 20.72, "elapsed_time": "0:20:13", "remaining_time": "1:17:25", "throughput": 4247.94, "total_tokens": 5155968} {"current_steps": 7910, "total_steps": 38160, "loss": 0.4524, "lr": 0.0009653628362395799, "epoch": 4.145702306079665, "percentage": 20.73, "elapsed_time": "0:20:14", "remaining_time": "1:17:24", "throughput": 4248.06, "total_tokens": 5159168} {"current_steps": 7915, "total_steps": 38160, "loss": 0.3846, "lr": 0.0009652791530708958, "epoch": 4.14832285115304, "percentage": 20.74, "elapsed_time": "0:20:15", "remaining_time": "1:17:23", "throughput": 4248.3, "total_tokens": 5162816} {"current_steps": 7920, "total_steps": 38160, "loss": 0.5538, "lr": 0.0009651953725711212, "epoch": 4.150943396226415, "percentage": 20.75, "elapsed_time": "0:20:16", "remaining_time": "1:17:23", "throughput": 4248.86, "total_tokens": 5167232} {"current_steps": 7925, "total_steps": 38160, "loss": 0.5103, "lr": 0.0009651114947577818, "epoch": 4.15356394129979, "percentage": 20.77, "elapsed_time": "0:20:16", "remaining_time": "1:17:22", "throughput": 4248.98, "total_tokens": 5170560} {"current_steps": 7930, "total_steps": 38160, "loss": 0.4012, "lr": 0.0009650275196484239, "epoch": 4.156184486373165, "percentage": 20.78, "elapsed_time": "0:20:17", "remaining_time": "1:17:21", "throughput": 4248.87, "total_tokens": 5173184} {"current_steps": 7935, "total_steps": 38160, "loss": 0.439, "lr": 0.0009649434472606144, "epoch": 4.158805031446541, "percentage": 20.79, "elapsed_time": "0:20:18", "remaining_time": "1:17:20", "throughput": 4248.93, "total_tokens": 5176288} {"current_steps": 7940, "total_steps": 38160, "loss": 0.4282, "lr": 0.00096485927761194, "epoch": 4.161425576519916, "percentage": 20.81, "elapsed_time": "0:20:19", "remaining_time": "1:17:20", "throughput": 4249.62, "total_tokens": 5181216} {"current_steps": 7945, "total_steps": 38160, "loss": 0.3656, "lr": 0.0009647750107200082, "epoch": 4.164046121593292, "percentage": 20.82, "elapsed_time": "0:20:19", "remaining_time": "1:17:19", "throughput": 4249.67, "total_tokens": 5184256} {"current_steps": 7950, "total_steps": 38160, "loss": 0.3605, "lr": 0.0009646906466024465, "epoch": 4.166666666666667, "percentage": 20.83, "elapsed_time": "0:20:20", "remaining_time": "1:17:18", "throughput": 4249.84, "total_tokens": 5187616} {"current_steps": 7955, "total_steps": 38160, "loss": 0.6301, "lr": 0.000964606185276903, "epoch": 4.169287211740042, "percentage": 20.85, "elapsed_time": "0:20:21", "remaining_time": "1:17:17", "throughput": 4249.61, "total_tokens": 5189952} {"current_steps": 7960, "total_steps": 38160, "loss": 0.5209, "lr": 0.0009645216267610461, "epoch": 4.171907756813417, "percentage": 20.86, "elapsed_time": "0:20:21", "remaining_time": "1:17:16", "throughput": 4249.47, "total_tokens": 5192608} {"current_steps": 7965, "total_steps": 38160, "loss": 0.4311, "lr": 0.0009644369710725644, "epoch": 4.1745283018867925, "percentage": 20.87, "elapsed_time": "0:20:22", "remaining_time": "1:17:15", "throughput": 4249.72, "total_tokens": 5196256} {"current_steps": 7970, "total_steps": 38160, "loss": 0.4506, "lr": 0.0009643522182291669, "epoch": 4.177148846960168, "percentage": 20.89, "elapsed_time": "0:20:23", "remaining_time": "1:17:14", "throughput": 4249.96, "total_tokens": 5199840} {"current_steps": 7975, "total_steps": 38160, "loss": 0.3182, "lr": 0.000964267368248583, "epoch": 4.179769392033543, "percentage": 20.9, "elapsed_time": "0:20:24", "remaining_time": "1:17:13", "throughput": 4249.89, "total_tokens": 5202688} {"current_steps": 7980, "total_steps": 38160, "loss": 0.6421, "lr": 0.0009641824211485623, "epoch": 4.182389937106918, "percentage": 20.91, "elapsed_time": "0:20:24", "remaining_time": "1:17:12", "throughput": 4249.74, "total_tokens": 5205248} {"current_steps": 7985, "total_steps": 38160, "loss": 0.4044, "lr": 0.0009640973769468747, "epoch": 4.185010482180293, "percentage": 20.93, "elapsed_time": "0:20:25", "remaining_time": "1:17:10", "throughput": 4249.55, "total_tokens": 5207648} {"current_steps": 7990, "total_steps": 38160, "loss": 0.4176, "lr": 0.0009640122356613105, "epoch": 4.187631027253669, "percentage": 20.94, "elapsed_time": "0:20:26", "remaining_time": "1:17:09", "throughput": 4249.43, "total_tokens": 5210272} {"current_steps": 7995, "total_steps": 38160, "loss": 0.5846, "lr": 0.0009639269973096805, "epoch": 4.190251572327044, "percentage": 20.95, "elapsed_time": "0:20:27", "remaining_time": "1:17:09", "throughput": 4250.04, "total_tokens": 5214848} {"current_steps": 8000, "total_steps": 38160, "loss": 0.4246, "lr": 0.0009638416619098154, "epoch": 4.1928721174004195, "percentage": 20.96, "elapsed_time": "0:20:27", "remaining_time": "1:17:08", "throughput": 4250.07, "total_tokens": 5217888} {"current_steps": 8005, "total_steps": 38160, "loss": 0.5191, "lr": 0.0009637562294795663, "epoch": 4.195492662473795, "percentage": 20.98, "elapsed_time": "0:20:28", "remaining_time": "1:17:07", "throughput": 4250.5, "total_tokens": 5221952} {"current_steps": 8010, "total_steps": 38160, "loss": 0.5484, "lr": 0.0009636707000368049, "epoch": 4.19811320754717, "percentage": 20.99, "elapsed_time": "0:20:29", "remaining_time": "1:17:07", "throughput": 4250.58, "total_tokens": 5225120} {"current_steps": 8015, "total_steps": 38160, "loss": 0.5317, "lr": 0.000963585073599423, "epoch": 4.200733752620545, "percentage": 21.0, "elapsed_time": "0:20:30", "remaining_time": "1:17:06", "throughput": 4250.71, "total_tokens": 5228448} {"current_steps": 8020, "total_steps": 38160, "loss": 0.5416, "lr": 0.0009634993501853323, "epoch": 4.20335429769392, "percentage": 21.02, "elapsed_time": "0:20:30", "remaining_time": "1:17:04", "throughput": 4250.57, "total_tokens": 5230976} {"current_steps": 8025, "total_steps": 38160, "loss": 0.5286, "lr": 0.0009634135298124656, "epoch": 4.205974842767295, "percentage": 21.03, "elapsed_time": "0:20:31", "remaining_time": "1:17:03", "throughput": 4250.68, "total_tokens": 5234112} {"current_steps": 8030, "total_steps": 38160, "loss": 0.6072, "lr": 0.0009633276124987752, "epoch": 4.2085953878406706, "percentage": 21.04, "elapsed_time": "0:20:32", "remaining_time": "1:17:03", "throughput": 4251.24, "total_tokens": 5238592} {"current_steps": 8035, "total_steps": 38160, "loss": 0.454, "lr": 0.0009632415982622342, "epoch": 4.211215932914046, "percentage": 21.06, "elapsed_time": "0:20:32", "remaining_time": "1:17:02", "throughput": 4251.26, "total_tokens": 5241568} {"current_steps": 8040, "total_steps": 38160, "loss": 0.379, "lr": 0.0009631554871208359, "epoch": 4.213836477987422, "percentage": 21.07, "elapsed_time": "0:20:33", "remaining_time": "1:17:01", "throughput": 4251.33, "total_tokens": 5244704} {"current_steps": 8045, "total_steps": 38160, "loss": 0.3711, "lr": 0.0009630692790925936, "epoch": 4.216457023060797, "percentage": 21.08, "elapsed_time": "0:20:34", "remaining_time": "1:17:00", "throughput": 4251.48, "total_tokens": 5248000} {"current_steps": 8050, "total_steps": 38160, "loss": 0.3997, "lr": 0.0009629829741955411, "epoch": 4.219077568134172, "percentage": 21.1, "elapsed_time": "0:20:35", "remaining_time": "1:17:00", "throughput": 4251.9, "total_tokens": 5252096} {"current_steps": 8055, "total_steps": 38160, "loss": 0.5583, "lr": 0.0009628965724477325, "epoch": 4.221698113207547, "percentage": 21.11, "elapsed_time": "0:20:35", "remaining_time": "1:16:59", "throughput": 4251.97, "total_tokens": 5255360} {"current_steps": 8060, "total_steps": 38160, "loss": 0.6131, "lr": 0.0009628100738672419, "epoch": 4.2243186582809225, "percentage": 21.12, "elapsed_time": "0:20:36", "remaining_time": "1:16:59", "throughput": 4252.44, "total_tokens": 5259712} {"current_steps": 8065, "total_steps": 38160, "loss": 0.4479, "lr": 0.0009627234784721637, "epoch": 4.226939203354298, "percentage": 21.13, "elapsed_time": "0:20:37", "remaining_time": "1:16:58", "throughput": 4252.53, "total_tokens": 5262912} {"current_steps": 8070, "total_steps": 38160, "loss": 0.4879, "lr": 0.0009626367862806129, "epoch": 4.229559748427673, "percentage": 21.15, "elapsed_time": "0:20:38", "remaining_time": "1:16:57", "throughput": 4252.45, "total_tokens": 5265664} {"current_steps": 8075, "total_steps": 38160, "loss": 0.4378, "lr": 0.0009625499973107246, "epoch": 4.232180293501048, "percentage": 21.16, "elapsed_time": "0:20:38", "remaining_time": "1:16:56", "throughput": 4252.61, "total_tokens": 5268928} {"current_steps": 8080, "total_steps": 38160, "loss": 0.5138, "lr": 0.0009624631115806537, "epoch": 4.234800838574423, "percentage": 21.17, "elapsed_time": "0:20:39", "remaining_time": "1:16:55", "throughput": 4252.66, "total_tokens": 5272032} {"current_steps": 8085, "total_steps": 38160, "loss": 0.4155, "lr": 0.0009623761291085761, "epoch": 4.237421383647799, "percentage": 21.19, "elapsed_time": "0:20:40", "remaining_time": "1:16:54", "throughput": 4252.84, "total_tokens": 5275520} {"current_steps": 8090, "total_steps": 38160, "loss": 0.4939, "lr": 0.0009622890499126873, "epoch": 4.240041928721174, "percentage": 21.2, "elapsed_time": "0:20:41", "remaining_time": "1:16:53", "throughput": 4252.89, "total_tokens": 5278528} {"current_steps": 8095, "total_steps": 38160, "loss": 0.647, "lr": 0.0009622018740112032, "epoch": 4.2426624737945495, "percentage": 21.21, "elapsed_time": "0:20:41", "remaining_time": "1:16:52", "throughput": 4252.87, "total_tokens": 5281536} {"current_steps": 8100, "total_steps": 38160, "loss": 0.464, "lr": 0.0009621146014223603, "epoch": 4.245283018867925, "percentage": 21.23, "elapsed_time": "0:20:42", "remaining_time": "1:16:52", "throughput": 4253.71, "total_tokens": 5287168} {"current_steps": 8105, "total_steps": 38160, "loss": 0.4096, "lr": 0.0009620272321644148, "epoch": 4.2479035639413, "percentage": 21.24, "elapsed_time": "0:20:43", "remaining_time": "1:16:52", "throughput": 4254.02, "total_tokens": 5291008} {"current_steps": 8110, "total_steps": 38160, "loss": 0.3822, "lr": 0.0009619397662556434, "epoch": 4.250524109014675, "percentage": 21.25, "elapsed_time": "0:20:44", "remaining_time": "1:16:51", "throughput": 4254.08, "total_tokens": 5294144} {"current_steps": 8115, "total_steps": 38160, "loss": 0.5843, "lr": 0.000961852203714343, "epoch": 4.25314465408805, "percentage": 21.27, "elapsed_time": "0:20:45", "remaining_time": "1:16:50", "throughput": 4254.11, "total_tokens": 5297184} {"current_steps": 8120, "total_steps": 38160, "loss": 0.4539, "lr": 0.0009617645445588307, "epoch": 4.255765199161425, "percentage": 21.28, "elapsed_time": "0:20:45", "remaining_time": "1:16:49", "throughput": 4254.24, "total_tokens": 5300480} {"current_steps": 8125, "total_steps": 38160, "loss": 0.486, "lr": 0.0009616767888074438, "epoch": 4.2583857442348005, "percentage": 21.29, "elapsed_time": "0:20:46", "remaining_time": "1:16:48", "throughput": 4254.41, "total_tokens": 5303936} {"current_steps": 8130, "total_steps": 38160, "loss": 0.4166, "lr": 0.0009615889364785397, "epoch": 4.261006289308176, "percentage": 21.31, "elapsed_time": "0:20:47", "remaining_time": "1:16:47", "throughput": 4254.4, "total_tokens": 5306816} {"current_steps": 8135, "total_steps": 38160, "loss": 0.4514, "lr": 0.000961500987590496, "epoch": 4.263626834381552, "percentage": 21.32, "elapsed_time": "0:20:48", "remaining_time": "1:16:46", "throughput": 4254.41, "total_tokens": 5309792} {"current_steps": 8140, "total_steps": 38160, "loss": 0.5788, "lr": 0.0009614129421617111, "epoch": 4.266247379454927, "percentage": 21.33, "elapsed_time": "0:20:48", "remaining_time": "1:16:45", "throughput": 4254.49, "total_tokens": 5313056} {"current_steps": 8145, "total_steps": 38160, "loss": 0.3641, "lr": 0.0009613248002106027, "epoch": 4.268867924528302, "percentage": 21.34, "elapsed_time": "0:20:49", "remaining_time": "1:16:44", "throughput": 4254.29, "total_tokens": 5315488} {"current_steps": 8150, "total_steps": 38160, "loss": 0.4101, "lr": 0.000961236561755609, "epoch": 4.271488469601677, "percentage": 21.36, "elapsed_time": "0:20:50", "remaining_time": "1:16:43", "throughput": 4254.21, "total_tokens": 5318272} {"current_steps": 8155, "total_steps": 38160, "loss": 0.4947, "lr": 0.0009611482268151888, "epoch": 4.274109014675052, "percentage": 21.37, "elapsed_time": "0:20:50", "remaining_time": "1:16:42", "throughput": 4254.29, "total_tokens": 5321408} {"current_steps": 8160, "total_steps": 38160, "loss": 0.4156, "lr": 0.0009610597954078206, "epoch": 4.276729559748428, "percentage": 21.38, "elapsed_time": "0:20:51", "remaining_time": "1:16:41", "throughput": 4254.77, "total_tokens": 5325696} {"current_steps": 8165, "total_steps": 38160, "loss": 0.5661, "lr": 0.0009609712675520031, "epoch": 4.279350104821803, "percentage": 21.4, "elapsed_time": "0:20:52", "remaining_time": "1:16:40", "throughput": 4254.84, "total_tokens": 5328832} {"current_steps": 8170, "total_steps": 38160, "loss": 0.4966, "lr": 0.0009608826432662556, "epoch": 4.281970649895178, "percentage": 21.41, "elapsed_time": "0:20:53", "remaining_time": "1:16:40", "throughput": 4255.07, "total_tokens": 5332448} {"current_steps": 8175, "total_steps": 38160, "loss": 0.5179, "lr": 0.0009607939225691172, "epoch": 4.284591194968553, "percentage": 21.42, "elapsed_time": "0:20:53", "remaining_time": "1:16:39", "throughput": 4255.14, "total_tokens": 5335520} {"current_steps": 8180, "total_steps": 38160, "loss": 0.3562, "lr": 0.0009607051054791472, "epoch": 4.287211740041929, "percentage": 21.44, "elapsed_time": "0:20:54", "remaining_time": "1:16:38", "throughput": 4255.52, "total_tokens": 5339328} {"current_steps": 8185, "total_steps": 38160, "loss": 0.4998, "lr": 0.000960616192014925, "epoch": 4.289832285115304, "percentage": 21.45, "elapsed_time": "0:20:55", "remaining_time": "1:16:37", "throughput": 4255.54, "total_tokens": 5342368} {"current_steps": 8190, "total_steps": 38160, "loss": 0.608, "lr": 0.0009605271821950506, "epoch": 4.2924528301886795, "percentage": 21.46, "elapsed_time": "0:20:56", "remaining_time": "1:16:36", "throughput": 4255.62, "total_tokens": 5345632} {"current_steps": 8195, "total_steps": 38160, "loss": 0.5878, "lr": 0.0009604380760381434, "epoch": 4.295073375262055, "percentage": 21.48, "elapsed_time": "0:20:56", "remaining_time": "1:16:35", "throughput": 4255.61, "total_tokens": 5348608} {"current_steps": 8200, "total_steps": 38160, "loss": 0.406, "lr": 0.0009603488735628439, "epoch": 4.29769392033543, "percentage": 21.49, "elapsed_time": "0:20:57", "remaining_time": "1:16:34", "throughput": 4255.67, "total_tokens": 5351776} {"current_steps": 8205, "total_steps": 38160, "loss": 0.6108, "lr": 0.0009602595747878118, "epoch": 4.300314465408805, "percentage": 21.5, "elapsed_time": "0:20:58", "remaining_time": "1:16:33", "throughput": 4255.68, "total_tokens": 5354880} {"current_steps": 8210, "total_steps": 38160, "loss": 0.4517, "lr": 0.0009601701797317278, "epoch": 4.30293501048218, "percentage": 21.51, "elapsed_time": "0:20:58", "remaining_time": "1:16:32", "throughput": 4255.68, "total_tokens": 5357824} {"current_steps": 8215, "total_steps": 38160, "loss": 0.441, "lr": 0.0009600806884132917, "epoch": 4.305555555555555, "percentage": 21.53, "elapsed_time": "0:20:59", "remaining_time": "1:16:31", "throughput": 4255.58, "total_tokens": 5360512} {"current_steps": 8220, "total_steps": 38160, "loss": 0.3925, "lr": 0.0009599911008512248, "epoch": 4.3081761006289305, "percentage": 21.54, "elapsed_time": "0:21:00", "remaining_time": "1:16:30", "throughput": 4255.79, "total_tokens": 5364064} {"current_steps": 8225, "total_steps": 38160, "loss": 0.5446, "lr": 0.0009599014170642674, "epoch": 4.310796645702306, "percentage": 21.55, "elapsed_time": "0:21:01", "remaining_time": "1:16:29", "throughput": 4255.87, "total_tokens": 5367200} {"current_steps": 8230, "total_steps": 38160, "loss": 0.5148, "lr": 0.0009598116370711805, "epoch": 4.313417190775682, "percentage": 21.57, "elapsed_time": "0:21:01", "remaining_time": "1:16:28", "throughput": 4255.9, "total_tokens": 5370272} {"current_steps": 8235, "total_steps": 38160, "loss": 0.4852, "lr": 0.0009597217608907447, "epoch": 4.316037735849057, "percentage": 21.58, "elapsed_time": "0:21:02", "remaining_time": "1:16:27", "throughput": 4255.79, "total_tokens": 5372896} {"current_steps": 8240, "total_steps": 38160, "loss": 0.5564, "lr": 0.0009596317885417614, "epoch": 4.318658280922432, "percentage": 21.59, "elapsed_time": "0:21:03", "remaining_time": "1:16:27", "throughput": 4256.15, "total_tokens": 5376800} {"current_steps": 8245, "total_steps": 38160, "loss": 0.6302, "lr": 0.0009595417200430516, "epoch": 4.321278825995807, "percentage": 21.61, "elapsed_time": "0:21:04", "remaining_time": "1:16:26", "throughput": 4256.35, "total_tokens": 5380288} {"current_steps": 8250, "total_steps": 38160, "loss": 0.4361, "lr": 0.0009594515554134568, "epoch": 4.323899371069182, "percentage": 21.62, "elapsed_time": "0:21:04", "remaining_time": "1:16:25", "throughput": 4256.27, "total_tokens": 5383072} {"current_steps": 8255, "total_steps": 38160, "loss": 0.6242, "lr": 0.0009593612946718384, "epoch": 4.326519916142558, "percentage": 21.63, "elapsed_time": "0:21:05", "remaining_time": "1:16:24", "throughput": 4256.44, "total_tokens": 5386400} {"current_steps": 8260, "total_steps": 38160, "loss": 0.5854, "lr": 0.0009592709378370778, "epoch": 4.329140461215933, "percentage": 21.65, "elapsed_time": "0:21:06", "remaining_time": "1:16:23", "throughput": 4256.24, "total_tokens": 5388832} {"current_steps": 8265, "total_steps": 38160, "loss": 0.4671, "lr": 0.0009591804849280766, "epoch": 4.331761006289308, "percentage": 21.66, "elapsed_time": "0:21:06", "remaining_time": "1:16:22", "throughput": 4256.28, "total_tokens": 5391968} {"current_steps": 8270, "total_steps": 38160, "loss": 0.3859, "lr": 0.0009590899359637564, "epoch": 4.334381551362683, "percentage": 21.67, "elapsed_time": "0:21:08", "remaining_time": "1:16:23", "throughput": 4257.41, "total_tokens": 5398624} {"current_steps": 8275, "total_steps": 38160, "loss": 0.4945, "lr": 0.0009589992909630594, "epoch": 4.337002096436059, "percentage": 21.69, "elapsed_time": "0:21:08", "remaining_time": "1:16:22", "throughput": 4257.5, "total_tokens": 5401824} {"current_steps": 8280, "total_steps": 38160, "loss": 0.4005, "lr": 0.0009589085499449471, "epoch": 4.339622641509434, "percentage": 21.7, "elapsed_time": "0:21:09", "remaining_time": "1:16:21", "throughput": 4257.56, "total_tokens": 5404928} {"current_steps": 8285, "total_steps": 38160, "loss": 0.4341, "lr": 0.0009588177129284017, "epoch": 4.3422431865828095, "percentage": 21.71, "elapsed_time": "0:21:10", "remaining_time": "1:16:20", "throughput": 4257.73, "total_tokens": 5408320} {"current_steps": 8290, "total_steps": 38160, "loss": 0.5305, "lr": 0.0009587267799324253, "epoch": 4.344863731656185, "percentage": 21.72, "elapsed_time": "0:21:10", "remaining_time": "1:16:19", "throughput": 4257.52, "total_tokens": 5410752} {"current_steps": 8295, "total_steps": 38160, "loss": 0.3988, "lr": 0.0009586357509760399, "epoch": 4.34748427672956, "percentage": 21.74, "elapsed_time": "0:21:11", "remaining_time": "1:16:17", "throughput": 4257.4, "total_tokens": 5413312} {"current_steps": 8300, "total_steps": 38160, "loss": 0.5219, "lr": 0.0009585446260782878, "epoch": 4.350104821802935, "percentage": 21.75, "elapsed_time": "0:21:12", "remaining_time": "1:16:17", "throughput": 4257.66, "total_tokens": 5416992} {"current_steps": 8305, "total_steps": 38160, "loss": 0.3567, "lr": 0.0009584534052582313, "epoch": 4.35272536687631, "percentage": 21.76, "elapsed_time": "0:21:13", "remaining_time": "1:16:16", "throughput": 4257.93, "total_tokens": 5420672} {"current_steps": 8310, "total_steps": 38160, "loss": 0.4016, "lr": 0.0009583620885349527, "epoch": 4.355345911949685, "percentage": 21.78, "elapsed_time": "0:21:13", "remaining_time": "1:16:15", "throughput": 4257.83, "total_tokens": 5423360} {"current_steps": 8315, "total_steps": 38160, "loss": 0.4424, "lr": 0.0009582706759275546, "epoch": 4.3579664570230605, "percentage": 21.79, "elapsed_time": "0:21:14", "remaining_time": "1:16:14", "throughput": 4257.83, "total_tokens": 5426336} {"current_steps": 8320, "total_steps": 38160, "loss": 0.5122, "lr": 0.0009581791674551592, "epoch": 4.360587002096436, "percentage": 21.8, "elapsed_time": "0:21:15", "remaining_time": "1:16:13", "throughput": 4257.94, "total_tokens": 5429632} {"current_steps": 8325, "total_steps": 38160, "loss": 0.4458, "lr": 0.000958087563136909, "epoch": 4.363207547169811, "percentage": 21.82, "elapsed_time": "0:21:15", "remaining_time": "1:16:12", "throughput": 4258.2, "total_tokens": 5433312} {"current_steps": 8330, "total_steps": 38160, "loss": 0.5215, "lr": 0.000957995862991967, "epoch": 4.365828092243187, "percentage": 21.83, "elapsed_time": "0:21:16", "remaining_time": "1:16:12", "throughput": 4258.53, "total_tokens": 5437248} {"current_steps": 8335, "total_steps": 38160, "loss": 0.3906, "lr": 0.0009579040670395154, "epoch": 4.368448637316562, "percentage": 21.84, "elapsed_time": "0:21:17", "remaining_time": "1:16:11", "throughput": 4258.63, "total_tokens": 5440384} {"current_steps": 8340, "total_steps": 38160, "loss": 0.5543, "lr": 0.000957812175298757, "epoch": 4.371069182389937, "percentage": 21.86, "elapsed_time": "0:21:18", "remaining_time": "1:16:10", "throughput": 4258.89, "total_tokens": 5444000} {"current_steps": 8345, "total_steps": 38160, "loss": 0.4722, "lr": 0.0009577201877889145, "epoch": 4.373689727463312, "percentage": 21.87, "elapsed_time": "0:21:19", "remaining_time": "1:16:09", "throughput": 4259.28, "total_tokens": 5447936} {"current_steps": 8350, "total_steps": 38160, "loss": 0.5375, "lr": 0.0009576281045292308, "epoch": 4.376310272536688, "percentage": 21.88, "elapsed_time": "0:21:19", "remaining_time": "1:16:09", "throughput": 4259.51, "total_tokens": 5451488} {"current_steps": 8355, "total_steps": 38160, "loss": 0.4727, "lr": 0.0009575359255389686, "epoch": 4.378930817610063, "percentage": 21.89, "elapsed_time": "0:21:20", "remaining_time": "1:16:08", "throughput": 4259.93, "total_tokens": 5455520} {"current_steps": 8360, "total_steps": 38160, "loss": 0.6311, "lr": 0.0009574436508374104, "epoch": 4.381551362683438, "percentage": 21.91, "elapsed_time": "0:21:21", "remaining_time": "1:16:07", "throughput": 4259.96, "total_tokens": 5458560} {"current_steps": 8365, "total_steps": 38160, "loss": 0.4555, "lr": 0.0009573512804438594, "epoch": 4.384171907756813, "percentage": 21.92, "elapsed_time": "0:21:22", "remaining_time": "1:16:06", "throughput": 4260.0, "total_tokens": 5461600} {"current_steps": 8370, "total_steps": 38160, "loss": 0.4022, "lr": 0.0009572588143776381, "epoch": 4.386792452830189, "percentage": 21.93, "elapsed_time": "0:21:22", "remaining_time": "1:16:05", "throughput": 4260.39, "total_tokens": 5465536} {"current_steps": 8375, "total_steps": 38160, "loss": 0.4393, "lr": 0.0009571662526580897, "epoch": 4.389412997903564, "percentage": 21.95, "elapsed_time": "0:21:23", "remaining_time": "1:16:04", "throughput": 4260.39, "total_tokens": 5468416} {"current_steps": 8380, "total_steps": 38160, "loss": 0.5431, "lr": 0.0009570735953045768, "epoch": 4.3920335429769395, "percentage": 21.96, "elapsed_time": "0:21:24", "remaining_time": "1:16:04", "throughput": 4260.63, "total_tokens": 5472000} {"current_steps": 8385, "total_steps": 38160, "loss": 0.3958, "lr": 0.0009569808423364823, "epoch": 4.394654088050315, "percentage": 21.97, "elapsed_time": "0:21:25", "remaining_time": "1:16:03", "throughput": 4260.71, "total_tokens": 5475168} {"current_steps": 8390, "total_steps": 38160, "loss": 0.4136, "lr": 0.0009568879937732091, "epoch": 4.39727463312369, "percentage": 21.99, "elapsed_time": "0:21:25", "remaining_time": "1:16:01", "throughput": 4260.59, "total_tokens": 5477760} {"current_steps": 8395, "total_steps": 38160, "loss": 0.4071, "lr": 0.0009567950496341802, "epoch": 4.399895178197065, "percentage": 22.0, "elapsed_time": "0:21:26", "remaining_time": "1:16:00", "throughput": 4260.55, "total_tokens": 5480544} {"current_steps": 8400, "total_steps": 38160, "loss": 0.3677, "lr": 0.0009567020099388382, "epoch": 4.40251572327044, "percentage": 22.01, "elapsed_time": "0:21:27", "remaining_time": "1:15:59", "throughput": 4260.64, "total_tokens": 5483776} {"current_steps": 8405, "total_steps": 38160, "loss": 0.436, "lr": 0.0009566088747066459, "epoch": 4.405136268343815, "percentage": 22.03, "elapsed_time": "0:21:27", "remaining_time": "1:15:58", "throughput": 4260.33, "total_tokens": 5485888} {"current_steps": 8410, "total_steps": 38160, "loss": 0.6117, "lr": 0.0009565156439570866, "epoch": 4.4077568134171905, "percentage": 22.04, "elapsed_time": "0:21:28", "remaining_time": "1:15:57", "throughput": 4260.4, "total_tokens": 5489056} {"current_steps": 8415, "total_steps": 38160, "loss": 0.5614, "lr": 0.0009564223177096625, "epoch": 4.410377358490566, "percentage": 22.05, "elapsed_time": "0:21:29", "remaining_time": "1:15:56", "throughput": 4260.48, "total_tokens": 5492224} {"current_steps": 8420, "total_steps": 38160, "loss": 0.4064, "lr": 0.0009563288959838969, "epoch": 4.412997903563941, "percentage": 22.06, "elapsed_time": "0:21:29", "remaining_time": "1:15:55", "throughput": 4260.76, "total_tokens": 5495872} {"current_steps": 8425, "total_steps": 38160, "loss": 0.365, "lr": 0.0009562353787993321, "epoch": 4.415618448637317, "percentage": 22.08, "elapsed_time": "0:21:30", "remaining_time": "1:15:55", "throughput": 4261.0, "total_tokens": 5499488} {"current_steps": 8430, "total_steps": 38160, "loss": 0.5166, "lr": 0.0009561417661755312, "epoch": 4.418238993710692, "percentage": 22.09, "elapsed_time": "0:21:31", "remaining_time": "1:15:54", "throughput": 4261.24, "total_tokens": 5503104} {"current_steps": 8435, "total_steps": 38160, "loss": 0.4738, "lr": 0.0009560480581320768, "epoch": 4.420859538784067, "percentage": 22.1, "elapsed_time": "0:21:32", "remaining_time": "1:15:53", "throughput": 4261.55, "total_tokens": 5506912} {"current_steps": 8440, "total_steps": 38160, "loss": 0.5446, "lr": 0.0009559542546885714, "epoch": 4.423480083857442, "percentage": 22.12, "elapsed_time": "0:21:32", "remaining_time": "1:15:52", "throughput": 4261.31, "total_tokens": 5509312} {"current_steps": 8445, "total_steps": 38160, "loss": 0.3778, "lr": 0.0009558603558646378, "epoch": 4.426100628930818, "percentage": 22.13, "elapsed_time": "0:21:33", "remaining_time": "1:15:51", "throughput": 4261.26, "total_tokens": 5512096} {"current_steps": 8450, "total_steps": 38160, "loss": 0.5273, "lr": 0.0009557663616799185, "epoch": 4.428721174004193, "percentage": 22.14, "elapsed_time": "0:21:34", "remaining_time": "1:15:50", "throughput": 4261.3, "total_tokens": 5515168} {"current_steps": 8455, "total_steps": 38160, "loss": 0.4961, "lr": 0.0009556722721540759, "epoch": 4.431341719077568, "percentage": 22.16, "elapsed_time": "0:21:34", "remaining_time": "1:15:49", "throughput": 4261.42, "total_tokens": 5518464} {"current_steps": 8460, "total_steps": 38160, "loss": 0.4526, "lr": 0.0009555780873067927, "epoch": 4.433962264150943, "percentage": 22.17, "elapsed_time": "0:21:35", "remaining_time": "1:15:48", "throughput": 4261.37, "total_tokens": 5521344} {"current_steps": 8465, "total_steps": 38160, "loss": 0.5036, "lr": 0.000955483807157771, "epoch": 4.436582809224318, "percentage": 22.18, "elapsed_time": "0:21:36", "remaining_time": "1:15:47", "throughput": 4261.42, "total_tokens": 5524416} {"current_steps": 8470, "total_steps": 38160, "loss": 0.5626, "lr": 0.0009553894317267333, "epoch": 4.439203354297694, "percentage": 22.2, "elapsed_time": "0:21:37", "remaining_time": "1:15:46", "throughput": 4261.46, "total_tokens": 5527488} {"current_steps": 8475, "total_steps": 38160, "loss": 0.4634, "lr": 0.0009552949610334219, "epoch": 4.4418238993710695, "percentage": 22.21, "elapsed_time": "0:21:37", "remaining_time": "1:15:45", "throughput": 4261.35, "total_tokens": 5530144} {"current_steps": 8480, "total_steps": 38160, "loss": 0.5941, "lr": 0.000955200395097599, "epoch": 4.444444444444445, "percentage": 22.22, "elapsed_time": "0:21:38", "remaining_time": "1:15:44", "throughput": 4261.51, "total_tokens": 5533536} {"current_steps": 8485, "total_steps": 38160, "loss": 0.504, "lr": 0.0009551057339390464, "epoch": 4.44706498951782, "percentage": 22.24, "elapsed_time": "0:21:39", "remaining_time": "1:15:43", "throughput": 4261.36, "total_tokens": 5536032} {"current_steps": 8490, "total_steps": 38160, "loss": 0.4364, "lr": 0.0009550109775775666, "epoch": 4.449685534591195, "percentage": 22.25, "elapsed_time": "0:21:39", "remaining_time": "1:15:42", "throughput": 4261.58, "total_tokens": 5539552} {"current_steps": 8495, "total_steps": 38160, "loss": 0.5009, "lr": 0.0009549161260329811, "epoch": 4.45230607966457, "percentage": 22.26, "elapsed_time": "0:21:40", "remaining_time": "1:15:41", "throughput": 4261.58, "total_tokens": 5542528} {"current_steps": 8500, "total_steps": 38160, "loss": 0.5861, "lr": 0.0009548211793251322, "epoch": 4.454926624737945, "percentage": 22.27, "elapsed_time": "0:21:41", "remaining_time": "1:15:40", "throughput": 4261.55, "total_tokens": 5545408} {"current_steps": 8505, "total_steps": 38160, "loss": 0.3781, "lr": 0.0009547261374738814, "epoch": 4.4575471698113205, "percentage": 22.29, "elapsed_time": "0:21:42", "remaining_time": "1:15:39", "throughput": 4261.82, "total_tokens": 5549120} {"current_steps": 8510, "total_steps": 38160, "loss": 0.5381, "lr": 0.0009546310004991105, "epoch": 4.460167714884696, "percentage": 22.3, "elapsed_time": "0:21:42", "remaining_time": "1:15:39", "throughput": 4261.9, "total_tokens": 5552352} {"current_steps": 8515, "total_steps": 38160, "loss": 0.3616, "lr": 0.000954535768420721, "epoch": 4.462788259958071, "percentage": 22.31, "elapsed_time": "0:21:43", "remaining_time": "1:15:38", "throughput": 4261.87, "total_tokens": 5555296} {"current_steps": 8520, "total_steps": 38160, "loss": 0.3445, "lr": 0.0009544404412586343, "epoch": 4.465408805031447, "percentage": 22.33, "elapsed_time": "0:21:44", "remaining_time": "1:15:37", "throughput": 4262.02, "total_tokens": 5558720} {"current_steps": 8525, "total_steps": 38160, "loss": 0.4878, "lr": 0.0009543450190327917, "epoch": 4.468029350104822, "percentage": 22.34, "elapsed_time": "0:21:45", "remaining_time": "1:15:36", "throughput": 4262.2, "total_tokens": 5562176} {"current_steps": 8530, "total_steps": 38160, "loss": 0.6273, "lr": 0.0009542495017631547, "epoch": 4.470649895178197, "percentage": 22.35, "elapsed_time": "0:21:45", "remaining_time": "1:15:35", "throughput": 4262.32, "total_tokens": 5565408} {"current_steps": 8535, "total_steps": 38160, "loss": 0.442, "lr": 0.0009541538894697043, "epoch": 4.473270440251572, "percentage": 22.37, "elapsed_time": "0:21:46", "remaining_time": "1:15:34", "throughput": 4262.29, "total_tokens": 5568288} {"current_steps": 8540, "total_steps": 38160, "loss": 0.7042, "lr": 0.0009540581821724414, "epoch": 4.475890985324948, "percentage": 22.38, "elapsed_time": "0:21:47", "remaining_time": "1:15:33", "throughput": 4262.42, "total_tokens": 5571744} {"current_steps": 8545, "total_steps": 38160, "loss": 0.5257, "lr": 0.000953962379891387, "epoch": 4.478511530398323, "percentage": 22.39, "elapsed_time": "0:21:47", "remaining_time": "1:15:32", "throughput": 4262.51, "total_tokens": 5575008} {"current_steps": 8550, "total_steps": 38160, "loss": 0.5989, "lr": 0.0009538664826465818, "epoch": 4.481132075471698, "percentage": 22.41, "elapsed_time": "0:21:48", "remaining_time": "1:15:31", "throughput": 4262.45, "total_tokens": 5577824} {"current_steps": 8555, "total_steps": 38160, "loss": 0.4643, "lr": 0.0009537704904580864, "epoch": 4.483752620545073, "percentage": 22.42, "elapsed_time": "0:21:49", "remaining_time": "1:15:31", "throughput": 4262.59, "total_tokens": 5581216} {"current_steps": 8560, "total_steps": 38160, "loss": 0.4837, "lr": 0.0009536744033459815, "epoch": 4.486373165618448, "percentage": 22.43, "elapsed_time": "0:21:50", "remaining_time": "1:15:31", "throughput": 4263.27, "total_tokens": 5586272} {"current_steps": 8565, "total_steps": 38160, "loss": 0.4891, "lr": 0.0009535782213303669, "epoch": 4.488993710691824, "percentage": 22.44, "elapsed_time": "0:21:50", "remaining_time": "1:15:29", "throughput": 4263.05, "total_tokens": 5588608} {"current_steps": 8570, "total_steps": 38160, "loss": 0.3478, "lr": 0.0009534819444313631, "epoch": 4.4916142557651995, "percentage": 22.46, "elapsed_time": "0:21:51", "remaining_time": "1:15:28", "throughput": 4262.95, "total_tokens": 5591296} {"current_steps": 8575, "total_steps": 38160, "loss": 0.4076, "lr": 0.0009533855726691103, "epoch": 4.494234800838575, "percentage": 22.47, "elapsed_time": "0:21:52", "remaining_time": "1:15:27", "throughput": 4262.7, "total_tokens": 5593568} {"current_steps": 8580, "total_steps": 38160, "loss": 0.4665, "lr": 0.0009532891060637681, "epoch": 4.49685534591195, "percentage": 22.48, "elapsed_time": "0:21:52", "remaining_time": "1:15:26", "throughput": 4262.7, "total_tokens": 5596480} {"current_steps": 8585, "total_steps": 38160, "loss": 0.5953, "lr": 0.0009531925446355163, "epoch": 4.499475890985325, "percentage": 22.5, "elapsed_time": "0:21:53", "remaining_time": "1:15:25", "throughput": 4262.85, "total_tokens": 5599968} {"current_steps": 8590, "total_steps": 38160, "loss": 0.464, "lr": 0.0009530958884045545, "epoch": 4.5020964360587, "percentage": 22.51, "elapsed_time": "0:21:54", "remaining_time": "1:15:24", "throughput": 4262.95, "total_tokens": 5603168} {"current_steps": 8595, "total_steps": 38160, "loss": 0.6224, "lr": 0.000952999137391102, "epoch": 4.504716981132075, "percentage": 22.52, "elapsed_time": "0:21:55", "remaining_time": "1:15:23", "throughput": 4263.06, "total_tokens": 5606464} {"current_steps": 8600, "total_steps": 38160, "loss": 0.5292, "lr": 0.0009529022916153982, "epoch": 4.5073375262054505, "percentage": 22.54, "elapsed_time": "0:21:55", "remaining_time": "1:15:22", "throughput": 4262.97, "total_tokens": 5609216} {"current_steps": 8605, "total_steps": 38160, "loss": 0.4374, "lr": 0.0009528053510977017, "epoch": 4.509958071278826, "percentage": 22.55, "elapsed_time": "0:21:56", "remaining_time": "1:15:21", "throughput": 4263.2, "total_tokens": 5612800} {"current_steps": 8610, "total_steps": 38160, "loss": 0.4316, "lr": 0.0009527083158582919, "epoch": 4.512578616352201, "percentage": 22.56, "elapsed_time": "0:21:57", "remaining_time": "1:15:20", "throughput": 4263.13, "total_tokens": 5615488} {"current_steps": 8615, "total_steps": 38160, "loss": 0.403, "lr": 0.0009526111859174671, "epoch": 4.515199161425577, "percentage": 22.58, "elapsed_time": "0:21:58", "remaining_time": "1:15:20", "throughput": 4263.43, "total_tokens": 5619264} {"current_steps": 8620, "total_steps": 38160, "loss": 0.401, "lr": 0.0009525139612955458, "epoch": 4.517819706498952, "percentage": 22.59, "elapsed_time": "0:21:58", "remaining_time": "1:15:19", "throughput": 4263.78, "total_tokens": 5623104} {"current_steps": 8625, "total_steps": 38160, "loss": 0.4837, "lr": 0.0009524166420128664, "epoch": 4.520440251572327, "percentage": 22.6, "elapsed_time": "0:21:59", "remaining_time": "1:15:18", "throughput": 4263.83, "total_tokens": 5626144} {"current_steps": 8630, "total_steps": 38160, "loss": 0.4715, "lr": 0.0009523192280897867, "epoch": 4.523060796645702, "percentage": 22.62, "elapsed_time": "0:22:00", "remaining_time": "1:15:17", "throughput": 4263.89, "total_tokens": 5629216} {"current_steps": 8635, "total_steps": 38160, "loss": 0.542, "lr": 0.0009522217195466851, "epoch": 4.5256813417190775, "percentage": 22.63, "elapsed_time": "0:22:00", "remaining_time": "1:15:16", "throughput": 4264.02, "total_tokens": 5632448} {"current_steps": 8640, "total_steps": 38160, "loss": 0.5417, "lr": 0.0009521241164039589, "epoch": 4.528301886792453, "percentage": 22.64, "elapsed_time": "0:22:01", "remaining_time": "1:15:16", "throughput": 4264.43, "total_tokens": 5636704} {"current_steps": 8645, "total_steps": 38160, "loss": 0.4429, "lr": 0.0009520264186820258, "epoch": 4.530922431865828, "percentage": 22.65, "elapsed_time": "0:22:02", "remaining_time": "1:15:15", "throughput": 4265.01, "total_tokens": 5641408} {"current_steps": 8650, "total_steps": 38160, "loss": 0.4601, "lr": 0.0009519286264013227, "epoch": 4.533542976939203, "percentage": 22.67, "elapsed_time": "0:22:03", "remaining_time": "1:15:14", "throughput": 4264.91, "total_tokens": 5644096} {"current_steps": 8655, "total_steps": 38160, "loss": 0.4132, "lr": 0.0009518307395823069, "epoch": 4.536163522012579, "percentage": 22.68, "elapsed_time": "0:22:04", "remaining_time": "1:15:13", "throughput": 4264.82, "total_tokens": 5646720} {"current_steps": 8660, "total_steps": 38160, "loss": 0.5571, "lr": 0.0009517327582454551, "epoch": 4.538784067085954, "percentage": 22.69, "elapsed_time": "0:22:04", "remaining_time": "1:15:12", "throughput": 4264.84, "total_tokens": 5649696} {"current_steps": 8665, "total_steps": 38160, "loss": 0.404, "lr": 0.000951634682411264, "epoch": 4.5414046121593294, "percentage": 22.71, "elapsed_time": "0:22:05", "remaining_time": "1:15:11", "throughput": 4265.14, "total_tokens": 5653504} {"current_steps": 8670, "total_steps": 38160, "loss": 0.4892, "lr": 0.0009515365121002498, "epoch": 4.544025157232705, "percentage": 22.72, "elapsed_time": "0:22:06", "remaining_time": "1:15:11", "throughput": 4265.27, "total_tokens": 5656896} {"current_steps": 8675, "total_steps": 38160, "loss": 0.4828, "lr": 0.0009514382473329487, "epoch": 4.54664570230608, "percentage": 22.73, "elapsed_time": "0:22:07", "remaining_time": "1:15:10", "throughput": 4265.68, "total_tokens": 5660928} {"current_steps": 8680, "total_steps": 38160, "loss": 0.495, "lr": 0.0009513398881299164, "epoch": 4.549266247379455, "percentage": 22.75, "elapsed_time": "0:22:07", "remaining_time": "1:15:09", "throughput": 4265.73, "total_tokens": 5664064} {"current_steps": 8685, "total_steps": 38160, "loss": 0.5457, "lr": 0.0009512414345117289, "epoch": 4.55188679245283, "percentage": 22.76, "elapsed_time": "0:22:08", "remaining_time": "1:15:08", "throughput": 4265.81, "total_tokens": 5667232} {"current_steps": 8690, "total_steps": 38160, "loss": 0.4865, "lr": 0.0009511428864989813, "epoch": 4.554507337526205, "percentage": 22.77, "elapsed_time": "0:22:09", "remaining_time": "1:15:07", "throughput": 4265.82, "total_tokens": 5670176} {"current_steps": 8695, "total_steps": 38160, "loss": 0.3779, "lr": 0.0009510442441122886, "epoch": 4.5571278825995805, "percentage": 22.79, "elapsed_time": "0:22:09", "remaining_time": "1:15:06", "throughput": 4265.81, "total_tokens": 5673120} {"current_steps": 8700, "total_steps": 38160, "loss": 0.4978, "lr": 0.0009509455073722859, "epoch": 4.559748427672956, "percentage": 22.8, "elapsed_time": "0:22:10", "remaining_time": "1:15:05", "throughput": 4265.73, "total_tokens": 5675936} {"current_steps": 8705, "total_steps": 38160, "loss": 0.3701, "lr": 0.0009508466762996277, "epoch": 4.562368972746331, "percentage": 22.81, "elapsed_time": "0:22:11", "remaining_time": "1:15:04", "throughput": 4265.78, "total_tokens": 5679072} {"current_steps": 8710, "total_steps": 38160, "loss": 0.473, "lr": 0.0009507477509149883, "epoch": 4.564989517819707, "percentage": 22.82, "elapsed_time": "0:22:12", "remaining_time": "1:15:03", "throughput": 4265.81, "total_tokens": 5682112} {"current_steps": 8715, "total_steps": 38160, "loss": 0.5915, "lr": 0.0009506487312390619, "epoch": 4.567610062893082, "percentage": 22.84, "elapsed_time": "0:22:12", "remaining_time": "1:15:03", "throughput": 4266.04, "total_tokens": 5685696} {"current_steps": 8720, "total_steps": 38160, "loss": 0.4709, "lr": 0.0009505496172925622, "epoch": 4.570230607966457, "percentage": 22.85, "elapsed_time": "0:22:13", "remaining_time": "1:15:01", "throughput": 4265.84, "total_tokens": 5688096} {"current_steps": 8725, "total_steps": 38160, "loss": 0.449, "lr": 0.0009504504090962226, "epoch": 4.572851153039832, "percentage": 22.86, "elapsed_time": "0:22:14", "remaining_time": "1:15:00", "throughput": 4265.81, "total_tokens": 5691072} {"current_steps": 8730, "total_steps": 38160, "loss": 0.499, "lr": 0.0009503511066707966, "epoch": 4.5754716981132075, "percentage": 22.88, "elapsed_time": "0:22:14", "remaining_time": "1:15:00", "throughput": 4265.98, "total_tokens": 5694592} {"current_steps": 8735, "total_steps": 38160, "loss": 0.3839, "lr": 0.0009502517100370568, "epoch": 4.578092243186583, "percentage": 22.89, "elapsed_time": "0:22:15", "remaining_time": "1:14:58", "throughput": 4265.9, "total_tokens": 5697312} {"current_steps": 8740, "total_steps": 38160, "loss": 0.3425, "lr": 0.0009501522192157961, "epoch": 4.580712788259958, "percentage": 22.9, "elapsed_time": "0:22:16", "remaining_time": "1:14:58", "throughput": 4266.2, "total_tokens": 5701088} {"current_steps": 8745, "total_steps": 38160, "loss": 0.536, "lr": 0.0009500526342278266, "epoch": 4.583333333333333, "percentage": 22.92, "elapsed_time": "0:22:17", "remaining_time": "1:14:57", "throughput": 4266.17, "total_tokens": 5703904} {"current_steps": 8750, "total_steps": 38160, "loss": 0.4891, "lr": 0.0009499529550939807, "epoch": 4.585953878406709, "percentage": 22.93, "elapsed_time": "0:22:17", "remaining_time": "1:14:56", "throughput": 4266.13, "total_tokens": 5706816} {"current_steps": 8755, "total_steps": 38160, "loss": 0.4834, "lr": 0.0009498531818351098, "epoch": 4.588574423480084, "percentage": 22.94, "elapsed_time": "0:22:18", "remaining_time": "1:14:55", "throughput": 4266.1, "total_tokens": 5709632} {"current_steps": 8760, "total_steps": 38160, "loss": 0.5069, "lr": 0.0009497533144720854, "epoch": 4.591194968553459, "percentage": 22.96, "elapsed_time": "0:22:19", "remaining_time": "1:14:54", "throughput": 4266.43, "total_tokens": 5713472} {"current_steps": 8765, "total_steps": 38160, "loss": 0.6281, "lr": 0.0009496533530257988, "epoch": 4.593815513626835, "percentage": 22.97, "elapsed_time": "0:22:19", "remaining_time": "1:14:53", "throughput": 4266.55, "total_tokens": 5716736} {"current_steps": 8770, "total_steps": 38160, "loss": 0.4181, "lr": 0.0009495532975171605, "epoch": 4.59643605870021, "percentage": 22.98, "elapsed_time": "0:22:20", "remaining_time": "1:14:53", "throughput": 4266.86, "total_tokens": 5720672} {"current_steps": 8775, "total_steps": 38160, "loss": 0.6879, "lr": 0.0009494531479671014, "epoch": 4.599056603773585, "percentage": 23.0, "elapsed_time": "0:22:21", "remaining_time": "1:14:52", "throughput": 4266.98, "total_tokens": 5724000} {"current_steps": 8780, "total_steps": 38160, "loss": 0.658, "lr": 0.0009493529043965712, "epoch": 4.60167714884696, "percentage": 23.01, "elapsed_time": "0:22:22", "remaining_time": "1:14:51", "throughput": 4266.93, "total_tokens": 5726784} {"current_steps": 8785, "total_steps": 38160, "loss": 0.4756, "lr": 0.00094925256682654, "epoch": 4.604297693920335, "percentage": 23.02, "elapsed_time": "0:22:22", "remaining_time": "1:14:50", "throughput": 4267.11, "total_tokens": 5730272} {"current_steps": 8790, "total_steps": 38160, "loss": 0.4768, "lr": 0.000949152135277997, "epoch": 4.6069182389937104, "percentage": 23.03, "elapsed_time": "0:22:23", "remaining_time": "1:14:49", "throughput": 4267.07, "total_tokens": 5733120} {"current_steps": 8795, "total_steps": 38160, "loss": 0.3087, "lr": 0.0009490516097719515, "epoch": 4.609538784067086, "percentage": 23.05, "elapsed_time": "0:22:24", "remaining_time": "1:14:49", "throughput": 4267.67, "total_tokens": 5737824} {"current_steps": 8800, "total_steps": 38160, "loss": 0.4023, "lr": 0.0009489509903294324, "epoch": 4.612159329140461, "percentage": 23.06, "elapsed_time": "0:22:25", "remaining_time": "1:14:47", "throughput": 4267.53, "total_tokens": 5740384} {"current_steps": 8805, "total_steps": 38160, "loss": 0.4432, "lr": 0.000948850276971488, "epoch": 4.614779874213837, "percentage": 23.07, "elapsed_time": "0:22:25", "remaining_time": "1:14:46", "throughput": 4267.45, "total_tokens": 5743232} {"current_steps": 8810, "total_steps": 38160, "loss": 0.5587, "lr": 0.0009487494697191864, "epoch": 4.617400419287212, "percentage": 23.09, "elapsed_time": "0:22:26", "remaining_time": "1:14:45", "throughput": 4267.51, "total_tokens": 5746432} {"current_steps": 8815, "total_steps": 38160, "loss": 0.5473, "lr": 0.0009486485685936154, "epoch": 4.620020964360587, "percentage": 23.1, "elapsed_time": "0:22:27", "remaining_time": "1:14:45", "throughput": 4267.63, "total_tokens": 5749696} {"current_steps": 8820, "total_steps": 38160, "loss": 0.4, "lr": 0.0009485475736158822, "epoch": 4.622641509433962, "percentage": 23.11, "elapsed_time": "0:22:28", "remaining_time": "1:14:44", "throughput": 4267.82, "total_tokens": 5753152} {"current_steps": 8825, "total_steps": 38160, "loss": 0.423, "lr": 0.000948446484807114, "epoch": 4.6252620545073375, "percentage": 23.13, "elapsed_time": "0:22:28", "remaining_time": "1:14:43", "throughput": 4267.69, "total_tokens": 5755712} {"current_steps": 8830, "total_steps": 38160, "loss": 0.4963, "lr": 0.0009483453021884572, "epoch": 4.627882599580713, "percentage": 23.14, "elapsed_time": "0:22:29", "remaining_time": "1:14:42", "throughput": 4267.84, "total_tokens": 5759040} {"current_steps": 8835, "total_steps": 38160, "loss": 0.5579, "lr": 0.0009482440257810782, "epoch": 4.630503144654088, "percentage": 23.15, "elapsed_time": "0:22:30", "remaining_time": "1:14:40", "throughput": 4267.66, "total_tokens": 5761408} {"current_steps": 8840, "total_steps": 38160, "loss": 0.5347, "lr": 0.000948142655606163, "epoch": 4.633123689727463, "percentage": 23.17, "elapsed_time": "0:22:30", "remaining_time": "1:14:40", "throughput": 4267.77, "total_tokens": 5764672} {"current_steps": 8845, "total_steps": 38160, "loss": 0.449, "lr": 0.0009480411916849168, "epoch": 4.635744234800838, "percentage": 23.18, "elapsed_time": "0:22:31", "remaining_time": "1:14:39", "throughput": 4267.94, "total_tokens": 5768160} {"current_steps": 8850, "total_steps": 38160, "loss": 0.461, "lr": 0.0009479396340385649, "epoch": 4.638364779874214, "percentage": 23.19, "elapsed_time": "0:22:32", "remaining_time": "1:14:38", "throughput": 4267.69, "total_tokens": 5770400} {"current_steps": 8855, "total_steps": 38160, "loss": 0.375, "lr": 0.0009478379826883519, "epoch": 4.640985324947589, "percentage": 23.2, "elapsed_time": "0:22:32", "remaining_time": "1:14:37", "throughput": 4267.94, "total_tokens": 5774080} {"current_steps": 8860, "total_steps": 38160, "loss": 0.5176, "lr": 0.0009477362376555421, "epoch": 4.643605870020965, "percentage": 23.22, "elapsed_time": "0:22:33", "remaining_time": "1:14:36", "throughput": 4267.98, "total_tokens": 5777184} {"current_steps": 8865, "total_steps": 38160, "loss": 0.5122, "lr": 0.0009476343989614194, "epoch": 4.64622641509434, "percentage": 23.23, "elapsed_time": "0:22:34", "remaining_time": "1:14:35", "throughput": 4268.19, "total_tokens": 5780736} {"current_steps": 8870, "total_steps": 38160, "loss": 0.5396, "lr": 0.0009475324666272873, "epoch": 4.648846960167715, "percentage": 23.24, "elapsed_time": "0:22:35", "remaining_time": "1:14:34", "throughput": 4268.39, "total_tokens": 5784320} {"current_steps": 8875, "total_steps": 38160, "loss": 0.4563, "lr": 0.0009474304406744689, "epoch": 4.65146750524109, "percentage": 23.26, "elapsed_time": "0:22:35", "remaining_time": "1:14:34", "throughput": 4268.58, "total_tokens": 5787840} {"current_steps": 8880, "total_steps": 38160, "loss": 0.6148, "lr": 0.0009473283211243069, "epoch": 4.654088050314465, "percentage": 23.27, "elapsed_time": "0:22:36", "remaining_time": "1:14:33", "throughput": 4268.68, "total_tokens": 5791040} {"current_steps": 8885, "total_steps": 38160, "loss": 0.7608, "lr": 0.0009472261079981637, "epoch": 4.65670859538784, "percentage": 23.28, "elapsed_time": "0:22:37", "remaining_time": "1:14:32", "throughput": 4268.89, "total_tokens": 5794560} {"current_steps": 8890, "total_steps": 38160, "loss": 0.4817, "lr": 0.0009471238013174206, "epoch": 4.659329140461216, "percentage": 23.3, "elapsed_time": "0:22:38", "remaining_time": "1:14:31", "throughput": 4268.87, "total_tokens": 5797504} {"current_steps": 8895, "total_steps": 38160, "loss": 0.456, "lr": 0.0009470214011034795, "epoch": 4.661949685534591, "percentage": 23.31, "elapsed_time": "0:22:38", "remaining_time": "1:14:30", "throughput": 4268.64, "total_tokens": 5799808} {"current_steps": 8900, "total_steps": 38160, "loss": 0.3519, "lr": 0.0009469189073777612, "epoch": 4.664570230607967, "percentage": 23.32, "elapsed_time": "0:22:39", "remaining_time": "1:14:29", "throughput": 4268.64, "total_tokens": 5802752} {"current_steps": 8905, "total_steps": 38160, "loss": 0.4803, "lr": 0.0009468163201617061, "epoch": 4.667190775681342, "percentage": 23.34, "elapsed_time": "0:22:40", "remaining_time": "1:14:28", "throughput": 4268.79, "total_tokens": 5806144} {"current_steps": 8910, "total_steps": 38160, "loss": 0.5767, "lr": 0.0009467136394767744, "epoch": 4.669811320754717, "percentage": 23.35, "elapsed_time": "0:22:40", "remaining_time": "1:14:27", "throughput": 4268.94, "total_tokens": 5809536} {"current_steps": 8915, "total_steps": 38160, "loss": 0.4619, "lr": 0.0009466108653444458, "epoch": 4.672431865828092, "percentage": 23.36, "elapsed_time": "0:22:41", "remaining_time": "1:14:26", "throughput": 4269.15, "total_tokens": 5813088} {"current_steps": 8920, "total_steps": 38160, "loss": 0.3398, "lr": 0.0009465079977862193, "epoch": 4.6750524109014675, "percentage": 23.38, "elapsed_time": "0:22:42", "remaining_time": "1:14:25", "throughput": 4268.97, "total_tokens": 5815488} {"current_steps": 8925, "total_steps": 38160, "loss": 0.5981, "lr": 0.0009464050368236137, "epoch": 4.677672955974843, "percentage": 23.39, "elapsed_time": "0:22:42", "remaining_time": "1:14:24", "throughput": 4268.98, "total_tokens": 5818528} {"current_steps": 8930, "total_steps": 38160, "loss": 0.5419, "lr": 0.0009463019824781674, "epoch": 4.680293501048218, "percentage": 23.4, "elapsed_time": "0:22:43", "remaining_time": "1:14:23", "throughput": 4269.2, "total_tokens": 5822016} {"current_steps": 8935, "total_steps": 38160, "loss": 0.635, "lr": 0.0009461988347714377, "epoch": 4.682914046121593, "percentage": 23.41, "elapsed_time": "0:22:44", "remaining_time": "1:14:23", "throughput": 4269.5, "total_tokens": 5825952} {"current_steps": 8940, "total_steps": 38160, "loss": 0.3659, "lr": 0.0009460955937250025, "epoch": 4.685534591194968, "percentage": 23.43, "elapsed_time": "0:22:45", "remaining_time": "1:14:22", "throughput": 4269.33, "total_tokens": 5828416} {"current_steps": 8945, "total_steps": 38160, "loss": 0.4585, "lr": 0.0009459922593604584, "epoch": 4.688155136268344, "percentage": 23.44, "elapsed_time": "0:22:45", "remaining_time": "1:14:21", "throughput": 4269.7, "total_tokens": 5832352} {"current_steps": 8950, "total_steps": 38160, "loss": 0.5489, "lr": 0.0009458888316994219, "epoch": 4.690775681341719, "percentage": 23.45, "elapsed_time": "0:22:46", "remaining_time": "1:14:20", "throughput": 4269.76, "total_tokens": 5835488} {"current_steps": 8955, "total_steps": 38160, "loss": 0.5086, "lr": 0.0009457853107635286, "epoch": 4.693396226415095, "percentage": 23.47, "elapsed_time": "0:22:47", "remaining_time": "1:14:19", "throughput": 4269.8, "total_tokens": 5838624} {"current_steps": 8960, "total_steps": 38160, "loss": 0.4696, "lr": 0.0009456816965744342, "epoch": 4.69601677148847, "percentage": 23.48, "elapsed_time": "0:22:48", "remaining_time": "1:14:18", "throughput": 4270.16, "total_tokens": 5842592} {"current_steps": 8965, "total_steps": 38160, "loss": 0.5095, "lr": 0.0009455779891538134, "epoch": 4.698637316561845, "percentage": 23.49, "elapsed_time": "0:22:48", "remaining_time": "1:14:18", "throughput": 4270.34, "total_tokens": 5846080} {"current_steps": 8970, "total_steps": 38160, "loss": 0.5181, "lr": 0.0009454741885233606, "epoch": 4.70125786163522, "percentage": 23.51, "elapsed_time": "0:22:49", "remaining_time": "1:14:17", "throughput": 4270.51, "total_tokens": 5849536} {"current_steps": 8975, "total_steps": 38160, "loss": 0.4274, "lr": 0.0009453702947047899, "epoch": 4.703878406708595, "percentage": 23.52, "elapsed_time": "0:22:50", "remaining_time": "1:14:16", "throughput": 4270.35, "total_tokens": 5852032} {"current_steps": 8980, "total_steps": 38160, "loss": 0.5701, "lr": 0.0009452663077198347, "epoch": 4.70649895178197, "percentage": 23.53, "elapsed_time": "0:22:51", "remaining_time": "1:14:15", "throughput": 4270.39, "total_tokens": 5855072} {"current_steps": 8985, "total_steps": 38160, "loss": 0.519, "lr": 0.0009451622275902477, "epoch": 4.709119496855346, "percentage": 23.55, "elapsed_time": "0:22:51", "remaining_time": "1:14:14", "throughput": 4270.5, "total_tokens": 5858272} {"current_steps": 8990, "total_steps": 38160, "loss": 0.4722, "lr": 0.0009450580543378013, "epoch": 4.711740041928721, "percentage": 23.56, "elapsed_time": "0:22:52", "remaining_time": "1:14:13", "throughput": 4270.72, "total_tokens": 5861856} {"current_steps": 8995, "total_steps": 38160, "loss": 0.4775, "lr": 0.0009449537879842875, "epoch": 4.714360587002097, "percentage": 23.57, "elapsed_time": "0:22:53", "remaining_time": "1:14:12", "throughput": 4270.61, "total_tokens": 5864448} {"current_steps": 9000, "total_steps": 38160, "loss": 0.4251, "lr": 0.0009448494285515177, "epoch": 4.716981132075472, "percentage": 23.58, "elapsed_time": "0:22:53", "remaining_time": "1:14:11", "throughput": 4270.73, "total_tokens": 5867744} {"current_steps": 9005, "total_steps": 38160, "loss": 0.3952, "lr": 0.0009447449760613222, "epoch": 4.719601677148847, "percentage": 23.6, "elapsed_time": "0:22:54", "remaining_time": "1:14:10", "throughput": 4270.59, "total_tokens": 5870336} {"current_steps": 9010, "total_steps": 38160, "loss": 0.47, "lr": 0.0009446404305355519, "epoch": 4.722222222222222, "percentage": 23.61, "elapsed_time": "0:22:55", "remaining_time": "1:14:09", "throughput": 4270.75, "total_tokens": 5873728} {"current_steps": 9015, "total_steps": 38160, "loss": 0.4263, "lr": 0.0009445357919960762, "epoch": 4.7248427672955975, "percentage": 23.62, "elapsed_time": "0:22:56", "remaining_time": "1:14:08", "throughput": 4270.57, "total_tokens": 5876320} {"current_steps": 9020, "total_steps": 38160, "loss": 0.4311, "lr": 0.0009444310604647844, "epoch": 4.727463312368973, "percentage": 23.64, "elapsed_time": "0:22:56", "remaining_time": "1:14:07", "throughput": 4270.66, "total_tokens": 5879552} {"current_steps": 9025, "total_steps": 38160, "loss": 0.4144, "lr": 0.000944326235963585, "epoch": 4.730083857442348, "percentage": 23.65, "elapsed_time": "0:22:57", "remaining_time": "1:14:06", "throughput": 4270.58, "total_tokens": 5882432} {"current_steps": 9030, "total_steps": 38160, "loss": 0.5067, "lr": 0.0009442213185144062, "epoch": 4.732704402515723, "percentage": 23.66, "elapsed_time": "0:22:58", "remaining_time": "1:14:05", "throughput": 4270.53, "total_tokens": 5885248} {"current_steps": 9035, "total_steps": 38160, "loss": 0.4637, "lr": 0.0009441163081391954, "epoch": 4.735324947589098, "percentage": 23.68, "elapsed_time": "0:22:58", "remaining_time": "1:14:04", "throughput": 4270.35, "total_tokens": 5887680} {"current_steps": 9040, "total_steps": 38160, "loss": 0.4707, "lr": 0.00094401120485992, "epoch": 4.737945492662474, "percentage": 23.69, "elapsed_time": "0:22:59", "remaining_time": "1:14:03", "throughput": 4270.4, "total_tokens": 5890848} {"current_steps": 9045, "total_steps": 38160, "loss": 0.4611, "lr": 0.0009439060086985658, "epoch": 4.740566037735849, "percentage": 23.7, "elapsed_time": "0:23:00", "remaining_time": "1:14:02", "throughput": 4270.39, "total_tokens": 5893664} {"current_steps": 9050, "total_steps": 38160, "loss": 0.5205, "lr": 0.000943800719677139, "epoch": 4.743186582809225, "percentage": 23.72, "elapsed_time": "0:23:00", "remaining_time": "1:14:01", "throughput": 4270.59, "total_tokens": 5897216} {"current_steps": 9055, "total_steps": 38160, "loss": 0.4797, "lr": 0.0009436953378176649, "epoch": 4.7458071278826, "percentage": 23.73, "elapsed_time": "0:23:01", "remaining_time": "1:14:01", "throughput": 4270.83, "total_tokens": 5900992} {"current_steps": 9060, "total_steps": 38160, "loss": 0.5713, "lr": 0.0009435898631421879, "epoch": 4.748427672955975, "percentage": 23.74, "elapsed_time": "0:23:02", "remaining_time": "1:14:00", "throughput": 4270.8, "total_tokens": 5903904} {"current_steps": 9065, "total_steps": 38160, "loss": 0.5627, "lr": 0.0009434842956727724, "epoch": 4.75104821802935, "percentage": 23.76, "elapsed_time": "0:23:03", "remaining_time": "1:13:59", "throughput": 4270.89, "total_tokens": 5907008} {"current_steps": 9070, "total_steps": 38160, "loss": 0.4188, "lr": 0.0009433786354315017, "epoch": 4.753668763102725, "percentage": 23.77, "elapsed_time": "0:23:03", "remaining_time": "1:13:58", "throughput": 4270.93, "total_tokens": 5910112} {"current_steps": 9075, "total_steps": 38160, "loss": 0.4362, "lr": 0.0009432728824404789, "epoch": 4.7562893081761, "percentage": 23.78, "elapsed_time": "0:23:04", "remaining_time": "1:13:57", "throughput": 4270.99, "total_tokens": 5913216} {"current_steps": 9080, "total_steps": 38160, "loss": 0.469, "lr": 0.0009431670367218262, "epoch": 4.758909853249476, "percentage": 23.79, "elapsed_time": "0:23:05", "remaining_time": "1:13:56", "throughput": 4271.02, "total_tokens": 5916256} {"current_steps": 9085, "total_steps": 38160, "loss": 0.4846, "lr": 0.0009430610982976852, "epoch": 4.761530398322851, "percentage": 23.81, "elapsed_time": "0:23:05", "remaining_time": "1:13:55", "throughput": 4270.99, "total_tokens": 5919040} {"current_steps": 9090, "total_steps": 38160, "loss": 0.4371, "lr": 0.0009429550671902171, "epoch": 4.764150943396227, "percentage": 23.82, "elapsed_time": "0:23:06", "remaining_time": "1:13:54", "throughput": 4271.3, "total_tokens": 5922944} {"current_steps": 9095, "total_steps": 38160, "loss": 0.3677, "lr": 0.0009428489434216028, "epoch": 4.766771488469602, "percentage": 23.83, "elapsed_time": "0:23:07", "remaining_time": "1:13:53", "throughput": 4271.42, "total_tokens": 5926368} {"current_steps": 9100, "total_steps": 38160, "loss": 0.4331, "lr": 0.0009427427270140415, "epoch": 4.769392033542977, "percentage": 23.85, "elapsed_time": "0:23:08", "remaining_time": "1:13:53", "throughput": 4271.53, "total_tokens": 5929632} {"current_steps": 9105, "total_steps": 38160, "loss": 0.4749, "lr": 0.0009426364179897529, "epoch": 4.772012578616352, "percentage": 23.86, "elapsed_time": "0:23:08", "remaining_time": "1:13:52", "throughput": 4271.6, "total_tokens": 5932832} {"current_steps": 9110, "total_steps": 38160, "loss": 0.4059, "lr": 0.0009425300163709756, "epoch": 4.7746331236897275, "percentage": 23.87, "elapsed_time": "0:23:09", "remaining_time": "1:13:51", "throughput": 4271.83, "total_tokens": 5936608} {"current_steps": 9115, "total_steps": 38160, "loss": 0.5857, "lr": 0.0009424235221799673, "epoch": 4.777253668763103, "percentage": 23.89, "elapsed_time": "0:23:10", "remaining_time": "1:13:50", "throughput": 4272.17, "total_tokens": 5940640} {"current_steps": 9120, "total_steps": 38160, "loss": 0.4211, "lr": 0.0009423169354390058, "epoch": 4.779874213836478, "percentage": 23.9, "elapsed_time": "0:23:11", "remaining_time": "1:13:50", "throughput": 4272.44, "total_tokens": 5944416} {"current_steps": 9125, "total_steps": 38160, "loss": 0.4813, "lr": 0.0009422102561703875, "epoch": 4.782494758909853, "percentage": 23.91, "elapsed_time": "0:23:12", "remaining_time": "1:13:49", "throughput": 4272.75, "total_tokens": 5948352} {"current_steps": 9130, "total_steps": 38160, "loss": 0.4096, "lr": 0.0009421034843964287, "epoch": 4.785115303983228, "percentage": 23.93, "elapsed_time": "0:23:12", "remaining_time": "1:13:49", "throughput": 4272.98, "total_tokens": 5952000} {"current_steps": 9135, "total_steps": 38160, "loss": 0.4705, "lr": 0.0009419966201394646, "epoch": 4.787735849056604, "percentage": 23.94, "elapsed_time": "0:23:13", "remaining_time": "1:13:47", "throughput": 4272.83, "total_tokens": 5954528} {"current_steps": 9140, "total_steps": 38160, "loss": 0.4446, "lr": 0.0009418896634218503, "epoch": 4.790356394129979, "percentage": 23.95, "elapsed_time": "0:23:14", "remaining_time": "1:13:46", "throughput": 4272.88, "total_tokens": 5957664} {"current_steps": 9145, "total_steps": 38160, "loss": 0.3677, "lr": 0.0009417826142659596, "epoch": 4.7929769392033545, "percentage": 23.96, "elapsed_time": "0:23:14", "remaining_time": "1:13:45", "throughput": 4272.83, "total_tokens": 5960448} {"current_steps": 9150, "total_steps": 38160, "loss": 0.4175, "lr": 0.0009416754726941863, "epoch": 4.79559748427673, "percentage": 23.98, "elapsed_time": "0:23:15", "remaining_time": "1:13:44", "throughput": 4272.71, "total_tokens": 5963072} {"current_steps": 9155, "total_steps": 38160, "loss": 0.3815, "lr": 0.0009415682387289428, "epoch": 4.798218029350105, "percentage": 23.99, "elapsed_time": "0:23:16", "remaining_time": "1:13:43", "throughput": 4272.79, "total_tokens": 5966240} {"current_steps": 9160, "total_steps": 38160, "loss": 0.3954, "lr": 0.0009414609123926616, "epoch": 4.80083857442348, "percentage": 24.0, "elapsed_time": "0:23:17", "remaining_time": "1:13:43", "throughput": 4272.93, "total_tokens": 5969664} {"current_steps": 9165, "total_steps": 38160, "loss": 0.4527, "lr": 0.000941353493707794, "epoch": 4.803459119496855, "percentage": 24.02, "elapsed_time": "0:23:17", "remaining_time": "1:13:42", "throughput": 4272.82, "total_tokens": 5972320} {"current_steps": 9170, "total_steps": 38160, "loss": 0.5375, "lr": 0.0009412459826968107, "epoch": 4.80607966457023, "percentage": 24.03, "elapsed_time": "0:23:18", "remaining_time": "1:13:40", "throughput": 4272.83, "total_tokens": 5975264} {"current_steps": 9175, "total_steps": 38160, "loss": 0.5284, "lr": 0.0009411383793822017, "epoch": 4.808700209643606, "percentage": 24.04, "elapsed_time": "0:23:19", "remaining_time": "1:13:40", "throughput": 4272.88, "total_tokens": 5978336} {"current_steps": 9180, "total_steps": 38160, "loss": 0.5014, "lr": 0.0009410306837864766, "epoch": 4.811320754716981, "percentage": 24.06, "elapsed_time": "0:23:19", "remaining_time": "1:13:39", "throughput": 4272.93, "total_tokens": 5981536} {"current_steps": 9185, "total_steps": 38160, "loss": 0.6028, "lr": 0.000940922895932164, "epoch": 4.813941299790356, "percentage": 24.07, "elapsed_time": "0:23:20", "remaining_time": "1:13:38", "throughput": 4272.98, "total_tokens": 5984640} {"current_steps": 9190, "total_steps": 38160, "loss": 0.5123, "lr": 0.0009408150158418119, "epoch": 4.816561844863732, "percentage": 24.08, "elapsed_time": "0:23:21", "remaining_time": "1:13:37", "throughput": 4272.84, "total_tokens": 5987168} {"current_steps": 9195, "total_steps": 38160, "loss": 0.5258, "lr": 0.0009407070435379876, "epoch": 4.819182389937107, "percentage": 24.1, "elapsed_time": "0:23:22", "remaining_time": "1:13:36", "throughput": 4273.09, "total_tokens": 5990880} {"current_steps": 9200, "total_steps": 38160, "loss": 0.4991, "lr": 0.0009405989790432776, "epoch": 4.821802935010482, "percentage": 24.11, "elapsed_time": "0:23:22", "remaining_time": "1:13:35", "throughput": 4273.03, "total_tokens": 5993664} {"current_steps": 9205, "total_steps": 38160, "loss": 0.5406, "lr": 0.0009404908223802877, "epoch": 4.8244234800838575, "percentage": 24.12, "elapsed_time": "0:23:23", "remaining_time": "1:13:34", "throughput": 4273.2, "total_tokens": 5997216} {"current_steps": 9210, "total_steps": 38160, "loss": 0.3222, "lr": 0.0009403825735716433, "epoch": 4.827044025157233, "percentage": 24.14, "elapsed_time": "0:23:24", "remaining_time": "1:13:33", "throughput": 4273.06, "total_tokens": 5999840} {"current_steps": 9215, "total_steps": 38160, "loss": 0.4543, "lr": 0.0009402742326399887, "epoch": 4.829664570230608, "percentage": 24.15, "elapsed_time": "0:23:24", "remaining_time": "1:13:32", "throughput": 4273.12, "total_tokens": 6003008} {"current_steps": 9220, "total_steps": 38160, "loss": 0.502, "lr": 0.0009401657996079873, "epoch": 4.832285115303983, "percentage": 24.16, "elapsed_time": "0:23:25", "remaining_time": "1:13:32", "throughput": 4273.62, "total_tokens": 6007552} {"current_steps": 9225, "total_steps": 38160, "loss": 0.5055, "lr": 0.0009400572744983224, "epoch": 4.834905660377358, "percentage": 24.17, "elapsed_time": "0:23:26", "remaining_time": "1:13:31", "throughput": 4273.79, "total_tokens": 6011040} {"current_steps": 9230, "total_steps": 38160, "loss": 0.385, "lr": 0.0009399486573336963, "epoch": 4.837526205450734, "percentage": 24.19, "elapsed_time": "0:23:27", "remaining_time": "1:13:30", "throughput": 4273.65, "total_tokens": 6013536} {"current_steps": 9235, "total_steps": 38160, "loss": 0.4104, "lr": 0.00093983994813683, "epoch": 4.840146750524109, "percentage": 24.2, "elapsed_time": "0:23:27", "remaining_time": "1:13:29", "throughput": 4273.4, "total_tokens": 6015808} {"current_steps": 9240, "total_steps": 38160, "loss": 0.3601, "lr": 0.0009397311469304648, "epoch": 4.8427672955974845, "percentage": 24.21, "elapsed_time": "0:23:28", "remaining_time": "1:13:28", "throughput": 4273.58, "total_tokens": 6019328} {"current_steps": 9245, "total_steps": 38160, "loss": 0.4222, "lr": 0.0009396222537373602, "epoch": 4.84538784067086, "percentage": 24.23, "elapsed_time": "0:23:29", "remaining_time": "1:13:27", "throughput": 4273.67, "total_tokens": 6022496} {"current_steps": 9250, "total_steps": 38160, "loss": 0.43, "lr": 0.0009395132685802956, "epoch": 4.848008385744235, "percentage": 24.24, "elapsed_time": "0:23:29", "remaining_time": "1:13:26", "throughput": 4273.65, "total_tokens": 6025408} {"current_steps": 9255, "total_steps": 38160, "loss": 0.5481, "lr": 0.0009394041914820695, "epoch": 4.85062893081761, "percentage": 24.25, "elapsed_time": "0:23:30", "remaining_time": "1:13:25", "throughput": 4273.84, "total_tokens": 6029056} {"current_steps": 9260, "total_steps": 38160, "loss": 0.3347, "lr": 0.0009392950224654994, "epoch": 4.853249475890985, "percentage": 24.27, "elapsed_time": "0:23:31", "remaining_time": "1:13:24", "throughput": 4273.69, "total_tokens": 6031584} {"current_steps": 9265, "total_steps": 38160, "loss": 0.5179, "lr": 0.0009391857615534225, "epoch": 4.85587002096436, "percentage": 24.28, "elapsed_time": "0:23:32", "remaining_time": "1:13:23", "throughput": 4273.66, "total_tokens": 6034432} {"current_steps": 9270, "total_steps": 38160, "loss": 0.4154, "lr": 0.0009390764087686948, "epoch": 4.8584905660377355, "percentage": 24.29, "elapsed_time": "0:23:32", "remaining_time": "1:13:22", "throughput": 4273.8, "total_tokens": 6037792} {"current_steps": 9275, "total_steps": 38160, "loss": 0.4852, "lr": 0.0009389669641341916, "epoch": 4.861111111111111, "percentage": 24.31, "elapsed_time": "0:23:33", "remaining_time": "1:13:21", "throughput": 4273.83, "total_tokens": 6040832} {"current_steps": 9280, "total_steps": 38160, "loss": 0.5968, "lr": 0.0009388574276728075, "epoch": 4.863731656184486, "percentage": 24.32, "elapsed_time": "0:23:34", "remaining_time": "1:13:21", "throughput": 4274.03, "total_tokens": 6044480} {"current_steps": 9285, "total_steps": 38160, "loss": 0.4293, "lr": 0.0009387477994074562, "epoch": 4.866352201257862, "percentage": 24.33, "elapsed_time": "0:23:34", "remaining_time": "1:13:20", "throughput": 4274.08, "total_tokens": 6047520} {"current_steps": 9290, "total_steps": 38160, "loss": 0.4375, "lr": 0.0009386380793610707, "epoch": 4.868972746331237, "percentage": 24.34, "elapsed_time": "0:23:35", "remaining_time": "1:13:19", "throughput": 4274.26, "total_tokens": 6051008} {"current_steps": 9295, "total_steps": 38160, "loss": 0.502, "lr": 0.0009385282675566034, "epoch": 4.871593291404612, "percentage": 24.36, "elapsed_time": "0:23:36", "remaining_time": "1:13:18", "throughput": 4273.98, "total_tokens": 6053216} {"current_steps": 9300, "total_steps": 38160, "loss": 0.5634, "lr": 0.0009384183640170255, "epoch": 4.8742138364779874, "percentage": 24.37, "elapsed_time": "0:23:37", "remaining_time": "1:13:17", "throughput": 4274.21, "total_tokens": 6056864} {"current_steps": 9305, "total_steps": 38160, "loss": 0.4259, "lr": 0.0009383083687653275, "epoch": 4.876834381551363, "percentage": 24.38, "elapsed_time": "0:23:37", "remaining_time": "1:13:16", "throughput": 4274.2, "total_tokens": 6059744} {"current_steps": 9310, "total_steps": 38160, "loss": 0.3996, "lr": 0.0009381982818245193, "epoch": 4.879454926624738, "percentage": 24.4, "elapsed_time": "0:23:38", "remaining_time": "1:13:15", "throughput": 4274.19, "total_tokens": 6062624} {"current_steps": 9315, "total_steps": 38160, "loss": 0.4641, "lr": 0.0009380881032176299, "epoch": 4.882075471698113, "percentage": 24.41, "elapsed_time": "0:23:39", "remaining_time": "1:13:14", "throughput": 4274.35, "total_tokens": 6066080} {"current_steps": 9320, "total_steps": 38160, "loss": 0.5504, "lr": 0.0009379778329677071, "epoch": 4.884696016771488, "percentage": 24.42, "elapsed_time": "0:23:39", "remaining_time": "1:13:13", "throughput": 4274.58, "total_tokens": 6069696} {"current_steps": 9325, "total_steps": 38160, "loss": 0.5805, "lr": 0.0009378674710978184, "epoch": 4.887316561844864, "percentage": 24.44, "elapsed_time": "0:23:40", "remaining_time": "1:13:13", "throughput": 4274.83, "total_tokens": 6073408} {"current_steps": 9330, "total_steps": 38160, "loss": 0.3156, "lr": 0.0009377570176310503, "epoch": 4.889937106918239, "percentage": 24.45, "elapsed_time": "0:23:41", "remaining_time": "1:13:13", "throughput": 4275.49, "total_tokens": 6078592} {"current_steps": 9335, "total_steps": 38160, "loss": 0.3487, "lr": 0.0009376464725905082, "epoch": 4.8925576519916145, "percentage": 24.46, "elapsed_time": "0:23:43", "remaining_time": "1:13:15", "throughput": 4277.33, "total_tokens": 6088128} {"current_steps": 9340, "total_steps": 38160, "loss": 0.5041, "lr": 0.000937535835999317, "epoch": 4.89517819706499, "percentage": 24.48, "elapsed_time": "0:23:44", "remaining_time": "1:13:14", "throughput": 4277.21, "total_tokens": 6090816} {"current_steps": 9345, "total_steps": 38160, "loss": 0.481, "lr": 0.0009374251078806206, "epoch": 4.897798742138365, "percentage": 24.49, "elapsed_time": "0:23:44", "remaining_time": "1:13:13", "throughput": 4277.23, "total_tokens": 6093856} {"current_steps": 9350, "total_steps": 38160, "loss": 0.4495, "lr": 0.000937314288257582, "epoch": 4.90041928721174, "percentage": 24.5, "elapsed_time": "0:23:45", "remaining_time": "1:13:12", "throughput": 4277.55, "total_tokens": 6097792} {"current_steps": 9355, "total_steps": 38160, "loss": 0.3237, "lr": 0.0009372033771533835, "epoch": 4.903039832285115, "percentage": 24.52, "elapsed_time": "0:23:46", "remaining_time": "1:13:11", "throughput": 4277.37, "total_tokens": 6100160} {"current_steps": 9360, "total_steps": 38160, "loss": 0.572, "lr": 0.0009370923745912264, "epoch": 4.90566037735849, "percentage": 24.53, "elapsed_time": "0:23:46", "remaining_time": "1:13:10", "throughput": 4277.42, "total_tokens": 6103264} {"current_steps": 9365, "total_steps": 38160, "loss": 0.5739, "lr": 0.000936981280594331, "epoch": 4.9082809224318655, "percentage": 24.54, "elapsed_time": "0:23:47", "remaining_time": "1:13:09", "throughput": 4277.29, "total_tokens": 6105856} {"current_steps": 9370, "total_steps": 38160, "loss": 0.5515, "lr": 0.0009368700951859371, "epoch": 4.910901467505241, "percentage": 24.55, "elapsed_time": "0:23:48", "remaining_time": "1:13:08", "throughput": 4277.27, "total_tokens": 6108800} {"current_steps": 9375, "total_steps": 38160, "loss": 0.4227, "lr": 0.0009367588183893035, "epoch": 4.913522012578616, "percentage": 24.57, "elapsed_time": "0:23:48", "remaining_time": "1:13:07", "throughput": 4277.21, "total_tokens": 6111552} {"current_steps": 9380, "total_steps": 38160, "loss": 0.5367, "lr": 0.0009366474502277076, "epoch": 4.916142557651992, "percentage": 24.58, "elapsed_time": "0:23:49", "remaining_time": "1:13:06", "throughput": 4277.51, "total_tokens": 6115488} {"current_steps": 9385, "total_steps": 38160, "loss": 0.3995, "lr": 0.0009365359907244469, "epoch": 4.918763102725367, "percentage": 24.59, "elapsed_time": "0:23:50", "remaining_time": "1:13:05", "throughput": 4277.74, "total_tokens": 6119136} {"current_steps": 9390, "total_steps": 38160, "loss": 0.594, "lr": 0.0009364244399028372, "epoch": 4.921383647798742, "percentage": 24.61, "elapsed_time": "0:23:51", "remaining_time": "1:13:04", "throughput": 4277.61, "total_tokens": 6121696} {"current_steps": 9395, "total_steps": 38160, "loss": 0.411, "lr": 0.0009363127977862136, "epoch": 4.924004192872117, "percentage": 24.62, "elapsed_time": "0:23:51", "remaining_time": "1:13:03", "throughput": 4277.56, "total_tokens": 6124480} {"current_steps": 9400, "total_steps": 38160, "loss": 0.4497, "lr": 0.0009362010643979304, "epoch": 4.926624737945493, "percentage": 24.63, "elapsed_time": "0:23:52", "remaining_time": "1:13:02", "throughput": 4277.38, "total_tokens": 6127008} {"current_steps": 9405, "total_steps": 38160, "loss": 0.299, "lr": 0.000936089239761361, "epoch": 4.929245283018868, "percentage": 24.65, "elapsed_time": "0:23:53", "remaining_time": "1:13:01", "throughput": 4277.4, "total_tokens": 6130080} {"current_steps": 9410, "total_steps": 38160, "loss": 0.4615, "lr": 0.0009359773238998978, "epoch": 4.931865828092243, "percentage": 24.66, "elapsed_time": "0:23:53", "remaining_time": "1:13:00", "throughput": 4277.62, "total_tokens": 6133632} {"current_steps": 9415, "total_steps": 38160, "loss": 0.4579, "lr": 0.0009358653168369524, "epoch": 4.934486373165618, "percentage": 24.67, "elapsed_time": "0:23:54", "remaining_time": "1:13:00", "throughput": 4277.76, "total_tokens": 6136992} {"current_steps": 9420, "total_steps": 38160, "loss": 0.3844, "lr": 0.0009357532185959554, "epoch": 4.937106918238994, "percentage": 24.69, "elapsed_time": "0:23:55", "remaining_time": "1:12:59", "throughput": 4277.72, "total_tokens": 6139776} {"current_steps": 9425, "total_steps": 38160, "loss": 0.5224, "lr": 0.0009356410292003562, "epoch": 4.939727463312369, "percentage": 24.7, "elapsed_time": "0:23:55", "remaining_time": "1:12:58", "throughput": 4277.78, "total_tokens": 6142880} {"current_steps": 9430, "total_steps": 38160, "loss": 0.4508, "lr": 0.0009355287486736239, "epoch": 4.9423480083857445, "percentage": 24.71, "elapsed_time": "0:23:56", "remaining_time": "1:12:57", "throughput": 4278.26, "total_tokens": 6147200} {"current_steps": 9435, "total_steps": 38160, "loss": 0.4614, "lr": 0.0009354163770392461, "epoch": 4.94496855345912, "percentage": 24.72, "elapsed_time": "0:23:57", "remaining_time": "1:12:56", "throughput": 4278.21, "total_tokens": 6150016} {"current_steps": 9440, "total_steps": 38160, "loss": 0.3989, "lr": 0.0009353039143207295, "epoch": 4.947589098532495, "percentage": 24.74, "elapsed_time": "0:23:58", "remaining_time": "1:12:55", "throughput": 4278.18, "total_tokens": 6152960} {"current_steps": 9445, "total_steps": 38160, "loss": 0.3747, "lr": 0.0009351913605416007, "epoch": 4.95020964360587, "percentage": 24.75, "elapsed_time": "0:23:58", "remaining_time": "1:12:54", "throughput": 4278.37, "total_tokens": 6156544} {"current_steps": 9450, "total_steps": 38160, "loss": 0.4762, "lr": 0.000935078715725404, "epoch": 4.952830188679245, "percentage": 24.76, "elapsed_time": "0:23:59", "remaining_time": "1:12:53", "throughput": 4278.41, "total_tokens": 6159584} {"current_steps": 9455, "total_steps": 38160, "loss": 0.4701, "lr": 0.0009349659798957034, "epoch": 4.95545073375262, "percentage": 24.78, "elapsed_time": "0:24:00", "remaining_time": "1:12:53", "throughput": 4278.48, "total_tokens": 6162752} {"current_steps": 9460, "total_steps": 38160, "loss": 0.3267, "lr": 0.0009348531530760823, "epoch": 4.9580712788259955, "percentage": 24.79, "elapsed_time": "0:24:01", "remaining_time": "1:12:52", "throughput": 4278.59, "total_tokens": 6166016} {"current_steps": 9465, "total_steps": 38160, "loss": 0.4365, "lr": 0.0009347402352901426, "epoch": 4.960691823899371, "percentage": 24.8, "elapsed_time": "0:24:01", "remaining_time": "1:12:51", "throughput": 4278.65, "total_tokens": 6169184} {"current_steps": 9470, "total_steps": 38160, "loss": 0.4662, "lr": 0.0009346272265615057, "epoch": 4.963312368972746, "percentage": 24.82, "elapsed_time": "0:24:02", "remaining_time": "1:12:50", "throughput": 4278.93, "total_tokens": 6172960} {"current_steps": 9475, "total_steps": 38160, "loss": 0.4414, "lr": 0.0009345141269138112, "epoch": 4.965932914046122, "percentage": 24.83, "elapsed_time": "0:24:03", "remaining_time": "1:12:49", "throughput": 4279.23, "total_tokens": 6176832} {"current_steps": 9480, "total_steps": 38160, "loss": 0.4619, "lr": 0.0009344009363707186, "epoch": 4.968553459119497, "percentage": 24.84, "elapsed_time": "0:24:04", "remaining_time": "1:12:48", "throughput": 4279.07, "total_tokens": 6179392} {"current_steps": 9485, "total_steps": 38160, "loss": 0.4093, "lr": 0.000934287654955906, "epoch": 4.971174004192872, "percentage": 24.86, "elapsed_time": "0:24:04", "remaining_time": "1:12:47", "throughput": 4278.99, "total_tokens": 6182208} {"current_steps": 9490, "total_steps": 38160, "loss": 0.5652, "lr": 0.0009341742826930708, "epoch": 4.973794549266247, "percentage": 24.87, "elapsed_time": "0:24:05", "remaining_time": "1:12:46", "throughput": 4279.07, "total_tokens": 6185376} {"current_steps": 9495, "total_steps": 38160, "loss": 0.3707, "lr": 0.0009340608196059289, "epoch": 4.976415094339623, "percentage": 24.88, "elapsed_time": "0:24:06", "remaining_time": "1:12:46", "throughput": 4279.24, "total_tokens": 6188896} {"current_steps": 9500, "total_steps": 38160, "loss": 0.4863, "lr": 0.0009339472657182155, "epoch": 4.979035639412998, "percentage": 24.9, "elapsed_time": "0:24:06", "remaining_time": "1:12:45", "throughput": 4279.24, "total_tokens": 6191840} {"current_steps": 9505, "total_steps": 38160, "loss": 0.4113, "lr": 0.0009338336210536848, "epoch": 4.981656184486373, "percentage": 24.91, "elapsed_time": "0:24:07", "remaining_time": "1:12:44", "throughput": 4279.2, "total_tokens": 6194784} {"current_steps": 9510, "total_steps": 38160, "loss": 0.362, "lr": 0.0009337198856361102, "epoch": 4.984276729559748, "percentage": 24.92, "elapsed_time": "0:24:08", "remaining_time": "1:12:43", "throughput": 4279.32, "total_tokens": 6198048} {"current_steps": 9515, "total_steps": 38160, "loss": 0.4549, "lr": 0.0009336060594892834, "epoch": 4.986897274633124, "percentage": 24.93, "elapsed_time": "0:24:09", "remaining_time": "1:12:43", "throughput": 4279.83, "total_tokens": 6202688} {"current_steps": 9520, "total_steps": 38160, "loss": 0.6448, "lr": 0.000933492142637016, "epoch": 4.989517819706499, "percentage": 24.95, "elapsed_time": "0:24:10", "remaining_time": "1:12:42", "throughput": 4279.92, "total_tokens": 6205952} {"current_steps": 9525, "total_steps": 38160, "loss": 0.3792, "lr": 0.0009333781351031379, "epoch": 4.9921383647798745, "percentage": 24.96, "elapsed_time": "0:24:10", "remaining_time": "1:12:41", "throughput": 4280.1, "total_tokens": 6209504} {"current_steps": 9530, "total_steps": 38160, "loss": 0.5207, "lr": 0.0009332640369114981, "epoch": 4.99475890985325, "percentage": 24.97, "elapsed_time": "0:24:11", "remaining_time": "1:12:40", "throughput": 4280.24, "total_tokens": 6212928} {"current_steps": 9535, "total_steps": 38160, "loss": 0.4182, "lr": 0.0009331498480859647, "epoch": 4.997379454926625, "percentage": 24.99, "elapsed_time": "0:24:12", "remaining_time": "1:12:40", "throughput": 4280.5, "total_tokens": 6216672} {"current_steps": 9540, "total_steps": 38160, "loss": 0.5856, "lr": 0.0009330355686504247, "epoch": 5.0, "percentage": 25.0, "elapsed_time": "0:24:13", "remaining_time": "1:12:39", "throughput": 4280.03, "total_tokens": 6219592} {"current_steps": 9540, "total_steps": 38160, "eval_loss": 0.4563165307044983, "epoch": 5.0, "percentage": 25.0, "elapsed_time": "0:24:26", "remaining_time": "1:13:20", "throughput": 4240.24, "total_tokens": 6219592} {"current_steps": 9545, "total_steps": 38160, "loss": 0.4495, "lr": 0.0009329211986287842, "epoch": 5.002620545073375, "percentage": 25.01, "elapsed_time": "0:24:29", "remaining_time": "1:13:24", "throughput": 4235.17, "total_tokens": 6222216} {"current_steps": 9550, "total_steps": 38160, "loss": 0.4668, "lr": 0.0009328067380449678, "epoch": 5.00524109014675, "percentage": 25.03, "elapsed_time": "0:24:29", "remaining_time": "1:13:23", "throughput": 4235.07, "total_tokens": 6224872} {"current_steps": 9555, "total_steps": 38160, "loss": 0.4595, "lr": 0.0009326921869229197, "epoch": 5.0078616352201255, "percentage": 25.04, "elapsed_time": "0:24:30", "remaining_time": "1:13:22", "throughput": 4235.15, "total_tokens": 6228072} {"current_steps": 9560, "total_steps": 38160, "loss": 0.5466, "lr": 0.0009325775452866023, "epoch": 5.010482180293501, "percentage": 25.05, "elapsed_time": "0:24:31", "remaining_time": "1:13:21", "throughput": 4235.12, "total_tokens": 6230984} {"current_steps": 9565, "total_steps": 38160, "loss": 0.5312, "lr": 0.0009324628131599977, "epoch": 5.013102725366877, "percentage": 25.07, "elapsed_time": "0:24:31", "remaining_time": "1:13:20", "throughput": 4235.16, "total_tokens": 6234056} {"current_steps": 9570, "total_steps": 38160, "loss": 0.3146, "lr": 0.0009323479905671064, "epoch": 5.015723270440252, "percentage": 25.08, "elapsed_time": "0:24:32", "remaining_time": "1:13:19", "throughput": 4235.44, "total_tokens": 6237800} {"current_steps": 9575, "total_steps": 38160, "loss": 0.6394, "lr": 0.0009322330775319479, "epoch": 5.018343815513627, "percentage": 25.09, "elapsed_time": "0:24:33", "remaining_time": "1:13:18", "throughput": 4235.48, "total_tokens": 6240808} {"current_steps": 9580, "total_steps": 38160, "loss": 0.5262, "lr": 0.0009321180740785607, "epoch": 5.020964360587002, "percentage": 25.1, "elapsed_time": "0:24:34", "remaining_time": "1:13:17", "throughput": 4235.57, "total_tokens": 6244040} {"current_steps": 9585, "total_steps": 38160, "loss": 0.5418, "lr": 0.0009320029802310023, "epoch": 5.023584905660377, "percentage": 25.12, "elapsed_time": "0:24:34", "remaining_time": "1:13:16", "throughput": 4235.58, "total_tokens": 6246952} {"current_steps": 9590, "total_steps": 38160, "loss": 0.4981, "lr": 0.0009318877960133489, "epoch": 5.026205450733753, "percentage": 25.13, "elapsed_time": "0:24:35", "remaining_time": "1:13:16", "throughput": 4235.79, "total_tokens": 6250472} {"current_steps": 9595, "total_steps": 38160, "loss": 0.428, "lr": 0.0009317725214496959, "epoch": 5.028825995807128, "percentage": 25.14, "elapsed_time": "0:24:36", "remaining_time": "1:13:15", "throughput": 4235.9, "total_tokens": 6253640} {"current_steps": 9600, "total_steps": 38160, "loss": 0.4619, "lr": 0.0009316571565641574, "epoch": 5.031446540880503, "percentage": 25.16, "elapsed_time": "0:24:37", "remaining_time": "1:13:14", "throughput": 4236.1, "total_tokens": 6257160} {"current_steps": 9605, "total_steps": 38160, "loss": 0.4198, "lr": 0.0009315417013808663, "epoch": 5.034067085953878, "percentage": 25.17, "elapsed_time": "0:24:37", "remaining_time": "1:13:13", "throughput": 4235.96, "total_tokens": 6259688} {"current_steps": 9610, "total_steps": 38160, "loss": 0.444, "lr": 0.0009314261559239745, "epoch": 5.036687631027253, "percentage": 25.18, "elapsed_time": "0:24:38", "remaining_time": "1:13:12", "throughput": 4236.11, "total_tokens": 6263080} {"current_steps": 9615, "total_steps": 38160, "loss": 0.2929, "lr": 0.000931310520217653, "epoch": 5.039308176100629, "percentage": 25.2, "elapsed_time": "0:24:39", "remaining_time": "1:13:12", "throughput": 4237.0, "total_tokens": 6269320} {"current_steps": 9620, "total_steps": 38160, "loss": 0.4562, "lr": 0.0009311947942860912, "epoch": 5.0419287211740045, "percentage": 25.21, "elapsed_time": "0:24:40", "remaining_time": "1:13:11", "throughput": 4237.07, "total_tokens": 6272392} {"current_steps": 9625, "total_steps": 38160, "loss": 0.5658, "lr": 0.0009310789781534979, "epoch": 5.04454926624738, "percentage": 25.22, "elapsed_time": "0:24:41", "remaining_time": "1:13:10", "throughput": 4237.07, "total_tokens": 6275496} {"current_steps": 9630, "total_steps": 38160, "loss": 0.4048, "lr": 0.0009309630718441003, "epoch": 5.047169811320755, "percentage": 25.24, "elapsed_time": "0:24:41", "remaining_time": "1:13:09", "throughput": 4236.85, "total_tokens": 6277960} {"current_steps": 9635, "total_steps": 38160, "loss": 0.8634, "lr": 0.0009308470753821445, "epoch": 5.04979035639413, "percentage": 25.25, "elapsed_time": "0:24:42", "remaining_time": "1:13:08", "throughput": 4236.66, "total_tokens": 6280520} {"current_steps": 9640, "total_steps": 38160, "loss": 0.4665, "lr": 0.0009307309887918962, "epoch": 5.052410901467505, "percentage": 25.26, "elapsed_time": "0:24:43", "remaining_time": "1:13:07", "throughput": 4236.63, "total_tokens": 6283304} {"current_steps": 9645, "total_steps": 38160, "loss": 0.5956, "lr": 0.000930614812097639, "epoch": 5.05503144654088, "percentage": 25.28, "elapsed_time": "0:24:43", "remaining_time": "1:13:06", "throughput": 4236.73, "total_tokens": 6286536} {"current_steps": 9650, "total_steps": 38160, "loss": 0.4682, "lr": 0.0009304985453236758, "epoch": 5.0576519916142555, "percentage": 25.29, "elapsed_time": "0:24:44", "remaining_time": "1:13:06", "throughput": 4236.84, "total_tokens": 6289928} {"current_steps": 9655, "total_steps": 38160, "loss": 0.5219, "lr": 0.0009303821884943284, "epoch": 5.060272536687631, "percentage": 25.3, "elapsed_time": "0:24:45", "remaining_time": "1:13:05", "throughput": 4237.02, "total_tokens": 6293416} {"current_steps": 9660, "total_steps": 38160, "loss": 0.5118, "lr": 0.0009302657416339371, "epoch": 5.062893081761007, "percentage": 25.31, "elapsed_time": "0:24:46", "remaining_time": "1:13:04", "throughput": 4237.31, "total_tokens": 6297320} {"current_steps": 9665, "total_steps": 38160, "loss": 0.4236, "lr": 0.0009301492047668615, "epoch": 5.065513626834382, "percentage": 25.33, "elapsed_time": "0:24:46", "remaining_time": "1:13:03", "throughput": 4237.23, "total_tokens": 6300008} {"current_steps": 9670, "total_steps": 38160, "loss": 0.4153, "lr": 0.0009300325779174796, "epoch": 5.068134171907757, "percentage": 25.34, "elapsed_time": "0:24:47", "remaining_time": "1:13:02", "throughput": 4237.6, "total_tokens": 6304136} {"current_steps": 9675, "total_steps": 38160, "loss": 0.5683, "lr": 0.0009299158611101885, "epoch": 5.070754716981132, "percentage": 25.35, "elapsed_time": "0:24:48", "remaining_time": "1:13:01", "throughput": 4237.52, "total_tokens": 6306792} {"current_steps": 9680, "total_steps": 38160, "loss": 0.529, "lr": 0.000929799054369404, "epoch": 5.073375262054507, "percentage": 25.37, "elapsed_time": "0:24:49", "remaining_time": "1:13:00", "throughput": 4237.55, "total_tokens": 6309800} {"current_steps": 9685, "total_steps": 38160, "loss": 0.5332, "lr": 0.0009296821577195606, "epoch": 5.075995807127883, "percentage": 25.38, "elapsed_time": "0:24:49", "remaining_time": "1:12:59", "throughput": 4237.41, "total_tokens": 6312360} {"current_steps": 9690, "total_steps": 38160, "loss": 0.516, "lr": 0.000929565171185112, "epoch": 5.078616352201258, "percentage": 25.39, "elapsed_time": "0:24:50", "remaining_time": "1:12:59", "throughput": 4237.58, "total_tokens": 6316008} {"current_steps": 9695, "total_steps": 38160, "loss": 0.4436, "lr": 0.0009294480947905304, "epoch": 5.081236897274633, "percentage": 25.41, "elapsed_time": "0:24:51", "remaining_time": "1:12:58", "throughput": 4237.53, "total_tokens": 6318952} {"current_steps": 9700, "total_steps": 38160, "loss": 0.4908, "lr": 0.0009293309285603067, "epoch": 5.083857442348008, "percentage": 25.42, "elapsed_time": "0:24:51", "remaining_time": "1:12:57", "throughput": 4237.58, "total_tokens": 6322056} {"current_steps": 9705, "total_steps": 38160, "loss": 0.4345, "lr": 0.0009292136725189506, "epoch": 5.086477987421383, "percentage": 25.43, "elapsed_time": "0:24:52", "remaining_time": "1:12:56", "throughput": 4237.55, "total_tokens": 6325000} {"current_steps": 9710, "total_steps": 38160, "loss": 0.4089, "lr": 0.0009290963266909912, "epoch": 5.089098532494759, "percentage": 25.45, "elapsed_time": "0:24:53", "remaining_time": "1:12:56", "throughput": 4238.19, "total_tokens": 6329960} {"current_steps": 9715, "total_steps": 38160, "loss": 0.3689, "lr": 0.0009289788911009756, "epoch": 5.0917190775681345, "percentage": 25.46, "elapsed_time": "0:24:54", "remaining_time": "1:12:55", "throughput": 4238.41, "total_tokens": 6333640} {"current_steps": 9720, "total_steps": 38160, "loss": 0.3953, "lr": 0.0009288613657734699, "epoch": 5.09433962264151, "percentage": 25.47, "elapsed_time": "0:24:55", "remaining_time": "1:12:54", "throughput": 4238.37, "total_tokens": 6336488} {"current_steps": 9725, "total_steps": 38160, "loss": 0.4734, "lr": 0.0009287437507330594, "epoch": 5.096960167714885, "percentage": 25.48, "elapsed_time": "0:24:55", "remaining_time": "1:12:53", "throughput": 4238.65, "total_tokens": 6340328} {"current_steps": 9730, "total_steps": 38160, "loss": 0.5456, "lr": 0.0009286260460043475, "epoch": 5.09958071278826, "percentage": 25.5, "elapsed_time": "0:24:56", "remaining_time": "1:12:52", "throughput": 4238.72, "total_tokens": 6343464} {"current_steps": 9735, "total_steps": 38160, "loss": 0.6591, "lr": 0.0009285082516119567, "epoch": 5.102201257861635, "percentage": 25.51, "elapsed_time": "0:24:57", "remaining_time": "1:12:52", "throughput": 4239.6, "total_tokens": 6349352} {"current_steps": 9740, "total_steps": 38160, "loss": 0.3976, "lr": 0.0009283903675805285, "epoch": 5.10482180293501, "percentage": 25.52, "elapsed_time": "0:24:58", "remaining_time": "1:12:51", "throughput": 4239.45, "total_tokens": 6351784} {"current_steps": 9745, "total_steps": 38160, "loss": 0.6016, "lr": 0.0009282723939347227, "epoch": 5.1074423480083855, "percentage": 25.54, "elapsed_time": "0:24:59", "remaining_time": "1:12:50", "throughput": 4239.66, "total_tokens": 6355368} {"current_steps": 9750, "total_steps": 38160, "loss": 0.5144, "lr": 0.0009281543306992181, "epoch": 5.110062893081761, "percentage": 25.55, "elapsed_time": "0:24:59", "remaining_time": "1:12:49", "throughput": 4239.65, "total_tokens": 6358312} {"current_steps": 9755, "total_steps": 38160, "loss": 0.4948, "lr": 0.0009280361778987121, "epoch": 5.112683438155136, "percentage": 25.56, "elapsed_time": "0:25:00", "remaining_time": "1:12:48", "throughput": 4239.53, "total_tokens": 6360776} {"current_steps": 9760, "total_steps": 38160, "loss": 0.5832, "lr": 0.0009279179355579211, "epoch": 5.115303983228512, "percentage": 25.58, "elapsed_time": "0:25:01", "remaining_time": "1:12:48", "throughput": 4239.72, "total_tokens": 6364424} {"current_steps": 9765, "total_steps": 38160, "loss": 0.4463, "lr": 0.0009277996037015798, "epoch": 5.117924528301887, "percentage": 25.59, "elapsed_time": "0:25:01", "remaining_time": "1:12:47", "throughput": 4239.77, "total_tokens": 6367496} {"current_steps": 9770, "total_steps": 38160, "loss": 0.4318, "lr": 0.000927681182354442, "epoch": 5.120545073375262, "percentage": 25.6, "elapsed_time": "0:25:02", "remaining_time": "1:12:46", "throughput": 4239.8, "total_tokens": 6370472} {"current_steps": 9775, "total_steps": 38160, "loss": 0.3693, "lr": 0.0009275626715412802, "epoch": 5.123165618448637, "percentage": 25.62, "elapsed_time": "0:25:03", "remaining_time": "1:12:45", "throughput": 4239.93, "total_tokens": 6373832} {"current_steps": 9780, "total_steps": 38160, "loss": 0.4469, "lr": 0.0009274440712868853, "epoch": 5.1257861635220126, "percentage": 25.63, "elapsed_time": "0:25:04", "remaining_time": "1:12:44", "throughput": 4240.22, "total_tokens": 6377672} {"current_steps": 9785, "total_steps": 38160, "loss": 0.4597, "lr": 0.0009273253816160673, "epoch": 5.128406708595388, "percentage": 25.64, "elapsed_time": "0:25:04", "remaining_time": "1:12:43", "throughput": 4240.24, "total_tokens": 6380712} {"current_steps": 9790, "total_steps": 38160, "loss": 0.4846, "lr": 0.0009272066025536545, "epoch": 5.131027253668763, "percentage": 25.66, "elapsed_time": "0:25:05", "remaining_time": "1:12:43", "throughput": 4240.59, "total_tokens": 6384776} {"current_steps": 9795, "total_steps": 38160, "loss": 0.4885, "lr": 0.0009270877341244945, "epoch": 5.133647798742138, "percentage": 25.67, "elapsed_time": "0:25:06", "remaining_time": "1:12:42", "throughput": 4240.55, "total_tokens": 6387560} {"current_steps": 9800, "total_steps": 38160, "loss": 0.601, "lr": 0.0009269687763534529, "epoch": 5.136268343815513, "percentage": 25.68, "elapsed_time": "0:25:07", "remaining_time": "1:12:41", "throughput": 4240.69, "total_tokens": 6390952} {"current_steps": 9805, "total_steps": 38160, "loss": 0.5004, "lr": 0.0009268497292654143, "epoch": 5.138888888888889, "percentage": 25.69, "elapsed_time": "0:25:07", "remaining_time": "1:12:40", "throughput": 4240.75, "total_tokens": 6394088} {"current_steps": 9810, "total_steps": 38160, "loss": 0.3887, "lr": 0.0009267305928852823, "epoch": 5.1415094339622645, "percentage": 25.71, "elapsed_time": "0:25:08", "remaining_time": "1:12:39", "throughput": 4240.79, "total_tokens": 6397064} {"current_steps": 9815, "total_steps": 38160, "loss": 0.6636, "lr": 0.0009266113672379786, "epoch": 5.14412997903564, "percentage": 25.72, "elapsed_time": "0:25:09", "remaining_time": "1:12:38", "throughput": 4241.0, "total_tokens": 6400584} {"current_steps": 9820, "total_steps": 38160, "loss": 0.3665, "lr": 0.0009264920523484437, "epoch": 5.146750524109015, "percentage": 25.73, "elapsed_time": "0:25:09", "remaining_time": "1:12:37", "throughput": 4241.15, "total_tokens": 6403976} {"current_steps": 9825, "total_steps": 38160, "loss": 0.4856, "lr": 0.0009263726482416374, "epoch": 5.14937106918239, "percentage": 25.75, "elapsed_time": "0:25:10", "remaining_time": "1:12:36", "throughput": 4241.02, "total_tokens": 6406536} {"current_steps": 9830, "total_steps": 38160, "loss": 0.4755, "lr": 0.0009262531549425372, "epoch": 5.151991614255765, "percentage": 25.76, "elapsed_time": "0:25:11", "remaining_time": "1:12:35", "throughput": 4241.31, "total_tokens": 6410312} {"current_steps": 9835, "total_steps": 38160, "loss": 0.4242, "lr": 0.0009261335724761402, "epoch": 5.15461215932914, "percentage": 25.77, "elapsed_time": "0:25:12", "remaining_time": "1:12:35", "throughput": 4241.62, "total_tokens": 6414184} {"current_steps": 9840, "total_steps": 38160, "loss": 0.6985, "lr": 0.0009260139008674612, "epoch": 5.1572327044025155, "percentage": 25.79, "elapsed_time": "0:25:12", "remaining_time": "1:12:34", "throughput": 4241.67, "total_tokens": 6417224} {"current_steps": 9845, "total_steps": 38160, "loss": 0.558, "lr": 0.0009258941401415344, "epoch": 5.159853249475891, "percentage": 25.8, "elapsed_time": "0:25:13", "remaining_time": "1:12:33", "throughput": 4241.97, "total_tokens": 6421128} {"current_steps": 9850, "total_steps": 38160, "loss": 0.4453, "lr": 0.0009257742903234123, "epoch": 5.162473794549266, "percentage": 25.81, "elapsed_time": "0:25:14", "remaining_time": "1:12:32", "throughput": 4242.05, "total_tokens": 6424232} {"current_steps": 9855, "total_steps": 38160, "loss": 0.4519, "lr": 0.0009256543514381664, "epoch": 5.165094339622642, "percentage": 25.83, "elapsed_time": "0:25:15", "remaining_time": "1:12:31", "throughput": 4242.17, "total_tokens": 6427464} {"current_steps": 9860, "total_steps": 38160, "loss": 0.4032, "lr": 0.0009255343235108859, "epoch": 5.167714884696017, "percentage": 25.84, "elapsed_time": "0:25:15", "remaining_time": "1:12:30", "throughput": 4242.19, "total_tokens": 6430504} {"current_steps": 9865, "total_steps": 38160, "loss": 0.5041, "lr": 0.00092541420656668, "epoch": 5.170335429769392, "percentage": 25.85, "elapsed_time": "0:25:16", "remaining_time": "1:12:30", "throughput": 4242.36, "total_tokens": 6434056} {"current_steps": 9870, "total_steps": 38160, "loss": 0.6509, "lr": 0.0009252940006306753, "epoch": 5.172955974842767, "percentage": 25.86, "elapsed_time": "0:25:17", "remaining_time": "1:12:29", "throughput": 4242.43, "total_tokens": 6437256} {"current_steps": 9875, "total_steps": 38160, "loss": 0.474, "lr": 0.0009251737057280179, "epoch": 5.1755765199161425, "percentage": 25.88, "elapsed_time": "0:25:18", "remaining_time": "1:12:28", "throughput": 4242.68, "total_tokens": 6441064} {"current_steps": 9880, "total_steps": 38160, "loss": 0.4038, "lr": 0.0009250533218838717, "epoch": 5.178197064989518, "percentage": 25.89, "elapsed_time": "0:25:18", "remaining_time": "1:12:27", "throughput": 4242.88, "total_tokens": 6444648} {"current_steps": 9885, "total_steps": 38160, "loss": 0.5103, "lr": 0.0009249328491234199, "epoch": 5.180817610062893, "percentage": 25.9, "elapsed_time": "0:25:19", "remaining_time": "1:12:26", "throughput": 4242.96, "total_tokens": 6447880} {"current_steps": 9890, "total_steps": 38160, "loss": 0.4401, "lr": 0.0009248122874718638, "epoch": 5.183438155136268, "percentage": 25.92, "elapsed_time": "0:25:20", "remaining_time": "1:12:25", "throughput": 4242.93, "total_tokens": 6450728} {"current_steps": 9895, "total_steps": 38160, "loss": 0.3819, "lr": 0.0009246916369544238, "epoch": 5.186058700209643, "percentage": 25.93, "elapsed_time": "0:25:21", "remaining_time": "1:12:24", "throughput": 4242.94, "total_tokens": 6453640} {"current_steps": 9900, "total_steps": 38160, "loss": 0.3705, "lr": 0.0009245708975963386, "epoch": 5.188679245283019, "percentage": 25.94, "elapsed_time": "0:25:21", "remaining_time": "1:12:23", "throughput": 4243.05, "total_tokens": 6456840} {"current_steps": 9905, "total_steps": 38160, "loss": 0.4282, "lr": 0.0009244500694228653, "epoch": 5.191299790356394, "percentage": 25.96, "elapsed_time": "0:25:22", "remaining_time": "1:12:22", "throughput": 4243.06, "total_tokens": 6459848} {"current_steps": 9910, "total_steps": 38160, "loss": 0.5484, "lr": 0.0009243291524592799, "epoch": 5.19392033542977, "percentage": 25.97, "elapsed_time": "0:25:23", "remaining_time": "1:12:22", "throughput": 4243.29, "total_tokens": 6463624} {"current_steps": 9915, "total_steps": 38160, "loss": 0.411, "lr": 0.0009242081467308766, "epoch": 5.196540880503145, "percentage": 25.98, "elapsed_time": "0:25:24", "remaining_time": "1:12:21", "throughput": 4243.49, "total_tokens": 6467176} {"current_steps": 9920, "total_steps": 38160, "loss": 0.4835, "lr": 0.0009240870522629688, "epoch": 5.19916142557652, "percentage": 26.0, "elapsed_time": "0:25:24", "remaining_time": "1:12:20", "throughput": 4243.44, "total_tokens": 6469896} {"current_steps": 9925, "total_steps": 38160, "loss": 0.5816, "lr": 0.0009239658690808879, "epoch": 5.201781970649895, "percentage": 26.01, "elapsed_time": "0:25:25", "remaining_time": "1:12:19", "throughput": 4243.47, "total_tokens": 6472904} {"current_steps": 9930, "total_steps": 38160, "loss": 0.5077, "lr": 0.000923844597209984, "epoch": 5.20440251572327, "percentage": 26.02, "elapsed_time": "0:25:26", "remaining_time": "1:12:18", "throughput": 4243.91, "total_tokens": 6477288} {"current_steps": 9935, "total_steps": 38160, "loss": 0.4665, "lr": 0.0009237232366756258, "epoch": 5.2070230607966455, "percentage": 26.04, "elapsed_time": "0:25:26", "remaining_time": "1:12:18", "throughput": 4244.01, "total_tokens": 6480488} {"current_steps": 9940, "total_steps": 38160, "loss": 0.3621, "lr": 0.0009236017875032007, "epoch": 5.209643605870021, "percentage": 26.05, "elapsed_time": "0:25:27", "remaining_time": "1:12:17", "throughput": 4244.0, "total_tokens": 6483368} {"current_steps": 9945, "total_steps": 38160, "loss": 0.5165, "lr": 0.0009234802497181143, "epoch": 5.212264150943396, "percentage": 26.06, "elapsed_time": "0:25:28", "remaining_time": "1:12:15", "throughput": 4243.88, "total_tokens": 6485928} {"current_steps": 9950, "total_steps": 38160, "loss": 0.5012, "lr": 0.0009233586233457909, "epoch": 5.214884696016772, "percentage": 26.07, "elapsed_time": "0:25:29", "remaining_time": "1:12:15", "throughput": 4244.12, "total_tokens": 6489768} {"current_steps": 9955, "total_steps": 38160, "loss": 0.4877, "lr": 0.0009232369084116736, "epoch": 5.217505241090147, "percentage": 26.09, "elapsed_time": "0:25:29", "remaining_time": "1:12:14", "throughput": 4244.31, "total_tokens": 6493352} {"current_steps": 9960, "total_steps": 38160, "loss": 0.4799, "lr": 0.0009231151049412234, "epoch": 5.220125786163522, "percentage": 26.1, "elapsed_time": "0:25:30", "remaining_time": "1:12:13", "throughput": 4244.19, "total_tokens": 6495944} {"current_steps": 9965, "total_steps": 38160, "loss": 0.4407, "lr": 0.0009229932129599205, "epoch": 5.222746331236897, "percentage": 26.11, "elapsed_time": "0:25:31", "remaining_time": "1:12:12", "throughput": 4244.09, "total_tokens": 6498472} {"current_steps": 9970, "total_steps": 38160, "loss": 0.5053, "lr": 0.0009228712324932634, "epoch": 5.2253668763102725, "percentage": 26.13, "elapsed_time": "0:25:31", "remaining_time": "1:12:11", "throughput": 4244.32, "total_tokens": 6502088} {"current_steps": 9975, "total_steps": 38160, "loss": 0.3549, "lr": 0.0009227491635667685, "epoch": 5.227987421383648, "percentage": 26.14, "elapsed_time": "0:25:32", "remaining_time": "1:12:10", "throughput": 4244.32, "total_tokens": 6505032} {"current_steps": 9980, "total_steps": 38160, "loss": 0.3512, "lr": 0.0009226270062059717, "epoch": 5.230607966457023, "percentage": 26.15, "elapsed_time": "0:25:33", "remaining_time": "1:12:09", "throughput": 4244.48, "total_tokens": 6508488} {"current_steps": 9985, "total_steps": 38160, "loss": 0.4555, "lr": 0.0009225047604364267, "epoch": 5.233228511530398, "percentage": 26.17, "elapsed_time": "0:25:34", "remaining_time": "1:12:08", "throughput": 4244.34, "total_tokens": 6510984} {"current_steps": 9990, "total_steps": 38160, "loss": 0.543, "lr": 0.0009223824262837062, "epoch": 5.235849056603773, "percentage": 26.18, "elapsed_time": "0:25:34", "remaining_time": "1:12:07", "throughput": 4244.48, "total_tokens": 6514376} {"current_steps": 9995, "total_steps": 38160, "loss": 0.5671, "lr": 0.0009222600037734008, "epoch": 5.238469601677149, "percentage": 26.19, "elapsed_time": "0:25:35", "remaining_time": "1:12:06", "throughput": 4244.47, "total_tokens": 6517192} {"current_steps": 10000, "total_steps": 38160, "loss": 0.3985, "lr": 0.00092213749293112, "epoch": 5.241090146750524, "percentage": 26.21, "elapsed_time": "0:25:36", "remaining_time": "1:12:05", "throughput": 4244.58, "total_tokens": 6520424} {"current_steps": 10005, "total_steps": 38160, "loss": 0.2486, "lr": 0.0009220148937824917, "epoch": 5.2437106918239, "percentage": 26.22, "elapsed_time": "0:25:36", "remaining_time": "1:12:05", "throughput": 4244.8, "total_tokens": 6523976} {"current_steps": 10010, "total_steps": 38160, "loss": 0.3861, "lr": 0.0009218922063531623, "epoch": 5.246331236897275, "percentage": 26.23, "elapsed_time": "0:25:37", "remaining_time": "1:12:03", "throughput": 4244.64, "total_tokens": 6526408} {"current_steps": 10015, "total_steps": 38160, "loss": 0.4884, "lr": 0.0009217694306687963, "epoch": 5.24895178197065, "percentage": 26.24, "elapsed_time": "0:25:38", "remaining_time": "1:12:02", "throughput": 4244.6, "total_tokens": 6529288} {"current_steps": 10020, "total_steps": 38160, "loss": 0.4861, "lr": 0.0009216465667550774, "epoch": 5.251572327044025, "percentage": 26.26, "elapsed_time": "0:25:38", "remaining_time": "1:12:01", "throughput": 4244.6, "total_tokens": 6532072} {"current_steps": 10025, "total_steps": 38160, "loss": 0.4291, "lr": 0.0009215236146377071, "epoch": 5.2541928721174, "percentage": 26.27, "elapsed_time": "0:25:39", "remaining_time": "1:12:01", "throughput": 4245.06, "total_tokens": 6536520} {"current_steps": 10030, "total_steps": 38160, "loss": 0.504, "lr": 0.0009214005743424056, "epoch": 5.256813417190775, "percentage": 26.28, "elapsed_time": "0:25:40", "remaining_time": "1:12:00", "throughput": 4245.19, "total_tokens": 6539880} {"current_steps": 10035, "total_steps": 38160, "loss": 0.472, "lr": 0.0009212774458949116, "epoch": 5.259433962264151, "percentage": 26.3, "elapsed_time": "0:25:41", "remaining_time": "1:11:59", "throughput": 4245.16, "total_tokens": 6542632} {"current_steps": 10040, "total_steps": 38160, "loss": 0.4172, "lr": 0.000921154229320982, "epoch": 5.262054507337526, "percentage": 26.31, "elapsed_time": "0:25:41", "remaining_time": "1:11:58", "throughput": 4245.15, "total_tokens": 6545416} {"current_steps": 10045, "total_steps": 38160, "loss": 0.3985, "lr": 0.0009210309246463924, "epoch": 5.264675052410902, "percentage": 26.32, "elapsed_time": "0:25:42", "remaining_time": "1:11:57", "throughput": 4245.27, "total_tokens": 6548680} {"current_steps": 10050, "total_steps": 38160, "loss": 0.4183, "lr": 0.0009209075318969369, "epoch": 5.267295597484277, "percentage": 26.34, "elapsed_time": "0:25:43", "remaining_time": "1:11:56", "throughput": 4245.6, "total_tokens": 6552744} {"current_steps": 10055, "total_steps": 38160, "loss": 0.381, "lr": 0.0009207840510984276, "epoch": 5.269916142557652, "percentage": 26.35, "elapsed_time": "0:25:44", "remaining_time": "1:11:56", "throughput": 4246.06, "total_tokens": 6557128} {"current_steps": 10060, "total_steps": 38160, "loss": 0.4698, "lr": 0.0009206604822766953, "epoch": 5.272536687631027, "percentage": 26.36, "elapsed_time": "0:25:45", "remaining_time": "1:11:57", "throughput": 4247.48, "total_tokens": 6565352} {"current_steps": 10065, "total_steps": 38160, "loss": 0.4991, "lr": 0.0009205368254575892, "epoch": 5.2751572327044025, "percentage": 26.38, "elapsed_time": "0:25:46", "remaining_time": "1:11:56", "throughput": 4247.62, "total_tokens": 6568680} {"current_steps": 10070, "total_steps": 38160, "loss": 0.4317, "lr": 0.000920413080666977, "epoch": 5.277777777777778, "percentage": 26.39, "elapsed_time": "0:25:47", "remaining_time": "1:11:55", "throughput": 4247.93, "total_tokens": 6572520} {"current_steps": 10075, "total_steps": 38160, "loss": 0.5117, "lr": 0.0009202892479307448, "epoch": 5.280398322851153, "percentage": 26.4, "elapsed_time": "0:25:48", "remaining_time": "1:11:55", "throughput": 4248.18, "total_tokens": 6576232} {"current_steps": 10080, "total_steps": 38160, "loss": 0.4328, "lr": 0.0009201653272747967, "epoch": 5.283018867924528, "percentage": 26.42, "elapsed_time": "0:25:48", "remaining_time": "1:11:54", "throughput": 4248.14, "total_tokens": 6579016} {"current_steps": 10085, "total_steps": 38160, "loss": 0.4604, "lr": 0.0009200413187250558, "epoch": 5.285639412997903, "percentage": 26.43, "elapsed_time": "0:25:49", "remaining_time": "1:11:53", "throughput": 4248.15, "total_tokens": 6581864} {"current_steps": 10090, "total_steps": 38160, "loss": 0.5584, "lr": 0.000919917222307463, "epoch": 5.288259958071279, "percentage": 26.44, "elapsed_time": "0:25:50", "remaining_time": "1:11:52", "throughput": 4248.3, "total_tokens": 6585256} {"current_steps": 10095, "total_steps": 38160, "loss": 0.5544, "lr": 0.000919793038047978, "epoch": 5.290880503144654, "percentage": 26.45, "elapsed_time": "0:25:50", "remaining_time": "1:11:51", "throughput": 4248.26, "total_tokens": 6587976} {"current_steps": 10100, "total_steps": 38160, "loss": 0.6123, "lr": 0.0009196687659725787, "epoch": 5.29350104821803, "percentage": 26.47, "elapsed_time": "0:25:51", "remaining_time": "1:11:50", "throughput": 4248.33, "total_tokens": 6591080} {"current_steps": 10105, "total_steps": 38160, "loss": 0.5077, "lr": 0.0009195444061072612, "epoch": 5.296121593291405, "percentage": 26.48, "elapsed_time": "0:25:52", "remaining_time": "1:11:49", "throughput": 4248.36, "total_tokens": 6594088} {"current_steps": 10110, "total_steps": 38160, "loss": 0.3958, "lr": 0.0009194199584780405, "epoch": 5.29874213836478, "percentage": 26.49, "elapsed_time": "0:25:52", "remaining_time": "1:11:48", "throughput": 4248.53, "total_tokens": 6597544} {"current_steps": 10115, "total_steps": 38160, "loss": 0.4619, "lr": 0.0009192954231109496, "epoch": 5.301362683438155, "percentage": 26.51, "elapsed_time": "0:25:53", "remaining_time": "1:11:47", "throughput": 4248.58, "total_tokens": 6600552} {"current_steps": 10120, "total_steps": 38160, "loss": 0.5052, "lr": 0.0009191708000320396, "epoch": 5.30398322851153, "percentage": 26.52, "elapsed_time": "0:25:54", "remaining_time": "1:11:46", "throughput": 4248.42, "total_tokens": 6602888} {"current_steps": 10125, "total_steps": 38160, "loss": 0.4318, "lr": 0.0009190460892673805, "epoch": 5.306603773584905, "percentage": 26.53, "elapsed_time": "0:25:54", "remaining_time": "1:11:45", "throughput": 4248.58, "total_tokens": 6606344} {"current_steps": 10130, "total_steps": 38160, "loss": 0.5541, "lr": 0.0009189212908430601, "epoch": 5.309224318658281, "percentage": 26.55, "elapsed_time": "0:25:55", "remaining_time": "1:11:44", "throughput": 4248.72, "total_tokens": 6609864} {"current_steps": 10135, "total_steps": 38160, "loss": 0.3992, "lr": 0.0009187964047851851, "epoch": 5.311844863731656, "percentage": 26.56, "elapsed_time": "0:25:56", "remaining_time": "1:11:43", "throughput": 4248.66, "total_tokens": 6612616} {"current_steps": 10140, "total_steps": 38160, "loss": 0.41, "lr": 0.0009186714311198801, "epoch": 5.314465408805032, "percentage": 26.57, "elapsed_time": "0:25:57", "remaining_time": "1:11:42", "throughput": 4248.86, "total_tokens": 6616072} {"current_steps": 10145, "total_steps": 38160, "loss": 0.6494, "lr": 0.000918546369873288, "epoch": 5.317085953878407, "percentage": 26.59, "elapsed_time": "0:25:57", "remaining_time": "1:11:42", "throughput": 4249.03, "total_tokens": 6619528} {"current_steps": 10150, "total_steps": 38160, "loss": 0.4586, "lr": 0.0009184212210715704, "epoch": 5.319706498951782, "percentage": 26.6, "elapsed_time": "0:25:58", "remaining_time": "1:11:41", "throughput": 4249.15, "total_tokens": 6622824} {"current_steps": 10155, "total_steps": 38160, "loss": 0.5121, "lr": 0.0009182959847409072, "epoch": 5.322327044025157, "percentage": 26.61, "elapsed_time": "0:25:59", "remaining_time": "1:11:40", "throughput": 4249.28, "total_tokens": 6626152} {"current_steps": 10160, "total_steps": 38160, "loss": 0.4909, "lr": 0.0009181706609074959, "epoch": 5.3249475890985325, "percentage": 26.62, "elapsed_time": "0:26:00", "remaining_time": "1:11:39", "throughput": 4249.2, "total_tokens": 6628808} {"current_steps": 10165, "total_steps": 38160, "loss": 0.4692, "lr": 0.0009180452495975531, "epoch": 5.327568134171908, "percentage": 26.64, "elapsed_time": "0:26:00", "remaining_time": "1:11:38", "throughput": 4249.38, "total_tokens": 6632296} {"current_steps": 10170, "total_steps": 38160, "loss": 0.5079, "lr": 0.0009179197508373134, "epoch": 5.330188679245283, "percentage": 26.65, "elapsed_time": "0:26:01", "remaining_time": "1:11:37", "throughput": 4249.42, "total_tokens": 6635400} {"current_steps": 10175, "total_steps": 38160, "loss": 0.5115, "lr": 0.0009177941646530299, "epoch": 5.332809224318658, "percentage": 26.66, "elapsed_time": "0:26:02", "remaining_time": "1:11:36", "throughput": 4249.74, "total_tokens": 6639432} {"current_steps": 10180, "total_steps": 38160, "loss": 0.4979, "lr": 0.0009176684910709733, "epoch": 5.335429769392033, "percentage": 26.68, "elapsed_time": "0:26:03", "remaining_time": "1:11:36", "throughput": 4250.06, "total_tokens": 6643336} {"current_steps": 10185, "total_steps": 38160, "loss": 0.5011, "lr": 0.0009175427301174338, "epoch": 5.338050314465409, "percentage": 26.69, "elapsed_time": "0:26:03", "remaining_time": "1:11:35", "throughput": 4250.01, "total_tokens": 6646088} {"current_steps": 10190, "total_steps": 38160, "loss": 0.3204, "lr": 0.0009174168818187183, "epoch": 5.340670859538784, "percentage": 26.7, "elapsed_time": "0:26:04", "remaining_time": "1:11:34", "throughput": 4250.15, "total_tokens": 6649384} {"current_steps": 10195, "total_steps": 38160, "loss": 0.4406, "lr": 0.0009172909462011536, "epoch": 5.34329140461216, "percentage": 26.72, "elapsed_time": "0:26:05", "remaining_time": "1:11:33", "throughput": 4250.19, "total_tokens": 6652424} {"current_steps": 10200, "total_steps": 38160, "loss": 0.4578, "lr": 0.0009171649232910835, "epoch": 5.345911949685535, "percentage": 26.73, "elapsed_time": "0:26:05", "remaining_time": "1:11:32", "throughput": 4250.24, "total_tokens": 6655464} {"current_steps": 10205, "total_steps": 38160, "loss": 0.5131, "lr": 0.0009170388131148707, "epoch": 5.34853249475891, "percentage": 26.74, "elapsed_time": "0:26:06", "remaining_time": "1:11:31", "throughput": 4250.46, "total_tokens": 6659112} {"current_steps": 10210, "total_steps": 38160, "loss": 0.5255, "lr": 0.000916912615698896, "epoch": 5.351153039832285, "percentage": 26.76, "elapsed_time": "0:26:07", "remaining_time": "1:11:31", "throughput": 4250.83, "total_tokens": 6663304} {"current_steps": 10215, "total_steps": 38160, "loss": 0.3428, "lr": 0.0009167863310695585, "epoch": 5.35377358490566, "percentage": 26.77, "elapsed_time": "0:26:08", "remaining_time": "1:11:30", "throughput": 4251.04, "total_tokens": 6666888} {"current_steps": 10220, "total_steps": 38160, "loss": 0.445, "lr": 0.0009166599592532756, "epoch": 5.356394129979035, "percentage": 26.78, "elapsed_time": "0:26:09", "remaining_time": "1:11:29", "throughput": 4251.28, "total_tokens": 6670504} {"current_steps": 10225, "total_steps": 38160, "loss": 0.4037, "lr": 0.0009165335002764828, "epoch": 5.359014675052411, "percentage": 26.8, "elapsed_time": "0:26:09", "remaining_time": "1:11:28", "throughput": 4251.42, "total_tokens": 6673832} {"current_steps": 10230, "total_steps": 38160, "loss": 0.4534, "lr": 0.0009164069541656337, "epoch": 5.361635220125786, "percentage": 26.81, "elapsed_time": "0:26:10", "remaining_time": "1:11:27", "throughput": 4251.54, "total_tokens": 6677160} {"current_steps": 10235, "total_steps": 38160, "loss": 0.4561, "lr": 0.0009162803209472004, "epoch": 5.364255765199162, "percentage": 26.82, "elapsed_time": "0:26:11", "remaining_time": "1:11:27", "throughput": 4251.86, "total_tokens": 6681160} {"current_steps": 10240, "total_steps": 38160, "loss": 0.4473, "lr": 0.000916153600647673, "epoch": 5.366876310272537, "percentage": 26.83, "elapsed_time": "0:26:12", "remaining_time": "1:11:26", "throughput": 4251.99, "total_tokens": 6684424} {"current_steps": 10245, "total_steps": 38160, "loss": 0.4511, "lr": 0.0009160267932935602, "epoch": 5.369496855345912, "percentage": 26.85, "elapsed_time": "0:26:12", "remaining_time": "1:11:25", "throughput": 4252.07, "total_tokens": 6687528} {"current_steps": 10250, "total_steps": 38160, "loss": 0.5175, "lr": 0.0009158998989113885, "epoch": 5.372117400419287, "percentage": 26.86, "elapsed_time": "0:26:13", "remaining_time": "1:11:24", "throughput": 4251.99, "total_tokens": 6690120} {"current_steps": 10255, "total_steps": 38160, "loss": 0.5177, "lr": 0.0009157729175277028, "epoch": 5.3747379454926625, "percentage": 26.87, "elapsed_time": "0:26:14", "remaining_time": "1:11:23", "throughput": 4252.27, "total_tokens": 6693992} {"current_steps": 10260, "total_steps": 38160, "loss": 0.4517, "lr": 0.0009156458491690662, "epoch": 5.377358490566038, "percentage": 26.89, "elapsed_time": "0:26:15", "remaining_time": "1:11:23", "throughput": 4252.78, "total_tokens": 6698568} {"current_steps": 10265, "total_steps": 38160, "loss": 0.4792, "lr": 0.0009155186938620599, "epoch": 5.379979035639413, "percentage": 26.9, "elapsed_time": "0:26:15", "remaining_time": "1:11:22", "throughput": 4252.75, "total_tokens": 6701320} {"current_steps": 10270, "total_steps": 38160, "loss": 0.4477, "lr": 0.0009153914516332833, "epoch": 5.382599580712788, "percentage": 26.91, "elapsed_time": "0:26:16", "remaining_time": "1:11:21", "throughput": 4252.74, "total_tokens": 6704168} {"current_steps": 10275, "total_steps": 38160, "loss": 0.4924, "lr": 0.000915264122509354, "epoch": 5.385220125786163, "percentage": 26.93, "elapsed_time": "0:26:17", "remaining_time": "1:11:20", "throughput": 4252.92, "total_tokens": 6707688} {"current_steps": 10280, "total_steps": 38160, "loss": 0.43, "lr": 0.0009151367065169078, "epoch": 5.387840670859539, "percentage": 26.94, "elapsed_time": "0:26:17", "remaining_time": "1:11:19", "throughput": 4253.04, "total_tokens": 6711048} {"current_steps": 10285, "total_steps": 38160, "loss": 0.4936, "lr": 0.0009150092036825989, "epoch": 5.390461215932914, "percentage": 26.95, "elapsed_time": "0:26:18", "remaining_time": "1:11:18", "throughput": 4253.34, "total_tokens": 6715016} {"current_steps": 10290, "total_steps": 38160, "loss": 0.4604, "lr": 0.0009148816140330991, "epoch": 5.3930817610062896, "percentage": 26.97, "elapsed_time": "0:26:19", "remaining_time": "1:11:17", "throughput": 4253.19, "total_tokens": 6717448} {"current_steps": 10295, "total_steps": 38160, "loss": 0.3304, "lr": 0.000914753937595099, "epoch": 5.395702306079665, "percentage": 26.98, "elapsed_time": "0:26:20", "remaining_time": "1:11:16", "throughput": 4253.41, "total_tokens": 6721032} {"current_steps": 10300, "total_steps": 38160, "loss": 0.4551, "lr": 0.0009146261743953068, "epoch": 5.39832285115304, "percentage": 26.99, "elapsed_time": "0:26:20", "remaining_time": "1:11:15", "throughput": 4253.22, "total_tokens": 6723304} {"current_steps": 10305, "total_steps": 38160, "loss": 0.4522, "lr": 0.0009144983244604493, "epoch": 5.400943396226415, "percentage": 27.0, "elapsed_time": "0:26:21", "remaining_time": "1:11:14", "throughput": 4253.27, "total_tokens": 6726344} {"current_steps": 10310, "total_steps": 38160, "loss": 0.4791, "lr": 0.0009143703878172712, "epoch": 5.40356394129979, "percentage": 27.02, "elapsed_time": "0:26:22", "remaining_time": "1:11:14", "throughput": 4253.57, "total_tokens": 6730248} {"current_steps": 10315, "total_steps": 38160, "loss": 0.5017, "lr": 0.0009142423644925353, "epoch": 5.406184486373165, "percentage": 27.03, "elapsed_time": "0:26:22", "remaining_time": "1:11:13", "throughput": 4253.61, "total_tokens": 6733352} {"current_steps": 10320, "total_steps": 38160, "loss": 0.3537, "lr": 0.0009141142545130228, "epoch": 5.408805031446541, "percentage": 27.04, "elapsed_time": "0:26:23", "remaining_time": "1:11:12", "throughput": 4253.54, "total_tokens": 6736104} {"current_steps": 10325, "total_steps": 38160, "loss": 0.4525, "lr": 0.0009139860579055326, "epoch": 5.411425576519916, "percentage": 27.06, "elapsed_time": "0:26:24", "remaining_time": "1:11:11", "throughput": 4253.64, "total_tokens": 6739336} {"current_steps": 10330, "total_steps": 38160, "loss": 0.4934, "lr": 0.0009138577746968821, "epoch": 5.414046121593292, "percentage": 27.07, "elapsed_time": "0:26:25", "remaining_time": "1:11:10", "throughput": 4253.64, "total_tokens": 6742216} {"current_steps": 10335, "total_steps": 38160, "loss": 0.3772, "lr": 0.0009137294049139066, "epoch": 5.416666666666667, "percentage": 27.08, "elapsed_time": "0:26:25", "remaining_time": "1:11:09", "throughput": 4253.69, "total_tokens": 6745320} {"current_steps": 10340, "total_steps": 38160, "loss": 0.3665, "lr": 0.0009136009485834598, "epoch": 5.419287211740042, "percentage": 27.1, "elapsed_time": "0:26:26", "remaining_time": "1:11:08", "throughput": 4253.72, "total_tokens": 6748328} {"current_steps": 10345, "total_steps": 38160, "loss": 0.4354, "lr": 0.0009134724057324131, "epoch": 5.421907756813417, "percentage": 27.11, "elapsed_time": "0:26:27", "remaining_time": "1:11:07", "throughput": 4253.75, "total_tokens": 6751240} {"current_steps": 10350, "total_steps": 38160, "loss": 0.3864, "lr": 0.0009133437763876562, "epoch": 5.4245283018867925, "percentage": 27.12, "elapsed_time": "0:26:27", "remaining_time": "1:11:06", "throughput": 4253.79, "total_tokens": 6754344} {"current_steps": 10355, "total_steps": 38160, "loss": 0.4776, "lr": 0.000913215060576097, "epoch": 5.427148846960168, "percentage": 27.14, "elapsed_time": "0:26:28", "remaining_time": "1:11:05", "throughput": 4253.82, "total_tokens": 6757320} {"current_steps": 10360, "total_steps": 38160, "loss": 0.3887, "lr": 0.0009130862583246613, "epoch": 5.429769392033543, "percentage": 27.15, "elapsed_time": "0:26:29", "remaining_time": "1:11:04", "throughput": 4253.95, "total_tokens": 6760744} {"current_steps": 10365, "total_steps": 38160, "loss": 0.5245, "lr": 0.0009129573696602932, "epoch": 5.432389937106918, "percentage": 27.16, "elapsed_time": "0:26:30", "remaining_time": "1:11:03", "throughput": 4253.99, "total_tokens": 6763848} {"current_steps": 10370, "total_steps": 38160, "loss": 0.5376, "lr": 0.0009128283946099546, "epoch": 5.435010482180293, "percentage": 27.18, "elapsed_time": "0:26:30", "remaining_time": "1:11:02", "throughput": 4253.99, "total_tokens": 6766792} {"current_steps": 10375, "total_steps": 38160, "loss": 0.4155, "lr": 0.0009126993332006256, "epoch": 5.437631027253669, "percentage": 27.19, "elapsed_time": "0:26:31", "remaining_time": "1:11:01", "throughput": 4254.09, "total_tokens": 6770024} {"current_steps": 10380, "total_steps": 38160, "loss": 0.4799, "lr": 0.0009125701854593045, "epoch": 5.440251572327044, "percentage": 27.2, "elapsed_time": "0:26:32", "remaining_time": "1:11:00", "throughput": 4253.99, "total_tokens": 6772584} {"current_steps": 10385, "total_steps": 38160, "loss": 0.4307, "lr": 0.0009124409514130073, "epoch": 5.4428721174004195, "percentage": 27.21, "elapsed_time": "0:26:32", "remaining_time": "1:11:00", "throughput": 4254.13, "total_tokens": 6776040} {"current_steps": 10390, "total_steps": 38160, "loss": 0.4464, "lr": 0.0009123116310887686, "epoch": 5.445492662473795, "percentage": 27.23, "elapsed_time": "0:26:33", "remaining_time": "1:10:59", "throughput": 4254.61, "total_tokens": 6780616} {"current_steps": 10395, "total_steps": 38160, "loss": 0.5346, "lr": 0.0009121822245136404, "epoch": 5.44811320754717, "percentage": 27.24, "elapsed_time": "0:26:34", "remaining_time": "1:10:58", "throughput": 4254.66, "total_tokens": 6783720} {"current_steps": 10400, "total_steps": 38160, "loss": 0.4638, "lr": 0.0009120527317146934, "epoch": 5.450733752620545, "percentage": 27.25, "elapsed_time": "0:26:35", "remaining_time": "1:10:57", "throughput": 4254.7, "total_tokens": 6786824} {"current_steps": 10405, "total_steps": 38160, "loss": 0.5359, "lr": 0.0009119231527190158, "epoch": 5.45335429769392, "percentage": 27.27, "elapsed_time": "0:26:35", "remaining_time": "1:10:57", "throughput": 4255.0, "total_tokens": 6790696} {"current_steps": 10410, "total_steps": 38160, "loss": 0.4444, "lr": 0.0009117934875537141, "epoch": 5.455974842767295, "percentage": 27.28, "elapsed_time": "0:26:36", "remaining_time": "1:10:56", "throughput": 4255.2, "total_tokens": 6794408} {"current_steps": 10415, "total_steps": 38160, "loss": 0.4738, "lr": 0.0009116637362459129, "epoch": 5.4585953878406706, "percentage": 27.29, "elapsed_time": "0:26:37", "remaining_time": "1:10:55", "throughput": 4255.43, "total_tokens": 6798184} {"current_steps": 10420, "total_steps": 38160, "loss": 0.4221, "lr": 0.0009115338988227546, "epoch": 5.461215932914046, "percentage": 27.31, "elapsed_time": "0:26:38", "remaining_time": "1:10:55", "throughput": 4255.64, "total_tokens": 6801928} {"current_steps": 10425, "total_steps": 38160, "loss": 0.4152, "lr": 0.0009114039753113997, "epoch": 5.463836477987422, "percentage": 27.32, "elapsed_time": "0:26:39", "remaining_time": "1:10:54", "throughput": 4255.85, "total_tokens": 6805640} {"current_steps": 10430, "total_steps": 38160, "loss": 0.3503, "lr": 0.0009112739657390265, "epoch": 5.466457023060797, "percentage": 27.33, "elapsed_time": "0:26:39", "remaining_time": "1:10:53", "throughput": 4255.9, "total_tokens": 6808680} {"current_steps": 10435, "total_steps": 38160, "loss": 0.4651, "lr": 0.0009111438701328319, "epoch": 5.469077568134172, "percentage": 27.35, "elapsed_time": "0:26:40", "remaining_time": "1:10:52", "throughput": 4255.95, "total_tokens": 6811752} {"current_steps": 10440, "total_steps": 38160, "loss": 0.5068, "lr": 0.0009110136885200302, "epoch": 5.471698113207547, "percentage": 27.36, "elapsed_time": "0:26:41", "remaining_time": "1:10:51", "throughput": 4256.02, "total_tokens": 6814888} {"current_steps": 10445, "total_steps": 38160, "loss": 0.4504, "lr": 0.000910883420927854, "epoch": 5.4743186582809225, "percentage": 27.37, "elapsed_time": "0:26:42", "remaining_time": "1:10:50", "throughput": 4256.39, "total_tokens": 6819048} {"current_steps": 10450, "total_steps": 38160, "loss": 0.3449, "lr": 0.0009107530673835536, "epoch": 5.476939203354298, "percentage": 27.38, "elapsed_time": "0:26:42", "remaining_time": "1:10:50", "throughput": 4256.63, "total_tokens": 6822792} {"current_steps": 10455, "total_steps": 38160, "loss": 0.5606, "lr": 0.0009106226279143979, "epoch": 5.479559748427673, "percentage": 27.4, "elapsed_time": "0:26:43", "remaining_time": "1:10:49", "throughput": 4256.8, "total_tokens": 6826248} {"current_steps": 10460, "total_steps": 38160, "loss": 0.4173, "lr": 0.0009104921025476728, "epoch": 5.482180293501048, "percentage": 27.41, "elapsed_time": "0:26:44", "remaining_time": "1:10:48", "throughput": 4257.1, "total_tokens": 6830248} {"current_steps": 10465, "total_steps": 38160, "loss": 0.3953, "lr": 0.0009103614913106832, "epoch": 5.484800838574423, "percentage": 27.42, "elapsed_time": "0:26:45", "remaining_time": "1:10:47", "throughput": 4257.12, "total_tokens": 6833160} {"current_steps": 10470, "total_steps": 38160, "loss": 0.6306, "lr": 0.0009102307942307511, "epoch": 5.487421383647799, "percentage": 27.44, "elapsed_time": "0:26:45", "remaining_time": "1:10:46", "throughput": 4257.24, "total_tokens": 6836392} {"current_steps": 10475, "total_steps": 38160, "loss": 0.4849, "lr": 0.000910100011335217, "epoch": 5.490041928721174, "percentage": 27.45, "elapsed_time": "0:26:46", "remaining_time": "1:10:46", "throughput": 4257.7, "total_tokens": 6840872} {"current_steps": 10480, "total_steps": 38160, "loss": 0.4711, "lr": 0.0009099691426514392, "epoch": 5.4926624737945495, "percentage": 27.46, "elapsed_time": "0:26:47", "remaining_time": "1:10:45", "throughput": 4257.63, "total_tokens": 6843432} {"current_steps": 10485, "total_steps": 38160, "loss": 0.3772, "lr": 0.0009098381882067941, "epoch": 5.495283018867925, "percentage": 27.48, "elapsed_time": "0:26:48", "remaining_time": "1:10:44", "throughput": 4257.71, "total_tokens": 6846760} {"current_steps": 10490, "total_steps": 38160, "loss": 0.6064, "lr": 0.0009097071480286756, "epoch": 5.4979035639413, "percentage": 27.49, "elapsed_time": "0:26:48", "remaining_time": "1:10:43", "throughput": 4257.58, "total_tokens": 6849256} {"current_steps": 10495, "total_steps": 38160, "loss": 0.3687, "lr": 0.0009095760221444959, "epoch": 5.500524109014675, "percentage": 27.5, "elapsed_time": "0:26:49", "remaining_time": "1:10:42", "throughput": 4257.9, "total_tokens": 6853256} {"current_steps": 10500, "total_steps": 38160, "loss": 0.5559, "lr": 0.000909444810581685, "epoch": 5.50314465408805, "percentage": 27.52, "elapsed_time": "0:26:50", "remaining_time": "1:10:43", "throughput": 4258.78, "total_tokens": 6859688} {"current_steps": 10505, "total_steps": 38160, "loss": 0.4111, "lr": 0.000909313513367691, "epoch": 5.505765199161425, "percentage": 27.53, "elapsed_time": "0:26:51", "remaining_time": "1:10:42", "throughput": 4258.95, "total_tokens": 6863080} {"current_steps": 10510, "total_steps": 38160, "loss": 0.4143, "lr": 0.0009091821305299798, "epoch": 5.5083857442348005, "percentage": 27.54, "elapsed_time": "0:26:52", "remaining_time": "1:10:41", "throughput": 4258.86, "total_tokens": 6865704} {"current_steps": 10515, "total_steps": 38160, "loss": 0.5288, "lr": 0.000909050662096035, "epoch": 5.511006289308176, "percentage": 27.56, "elapsed_time": "0:26:52", "remaining_time": "1:10:40", "throughput": 4258.78, "total_tokens": 6868392} {"current_steps": 10520, "total_steps": 38160, "loss": 0.4456, "lr": 0.0009089191080933583, "epoch": 5.513626834381551, "percentage": 27.57, "elapsed_time": "0:26:53", "remaining_time": "1:10:39", "throughput": 4258.83, "total_tokens": 6871624} {"current_steps": 10525, "total_steps": 38160, "loss": 0.4149, "lr": 0.0009087874685494695, "epoch": 5.516247379454927, "percentage": 27.58, "elapsed_time": "0:26:54", "remaining_time": "1:10:38", "throughput": 4259.16, "total_tokens": 6875752} {"current_steps": 10530, "total_steps": 38160, "loss": 0.6435, "lr": 0.0009086557434919059, "epoch": 5.518867924528302, "percentage": 27.59, "elapsed_time": "0:26:55", "remaining_time": "1:10:37", "throughput": 4259.17, "total_tokens": 6878728} {"current_steps": 10535, "total_steps": 38160, "loss": 0.5396, "lr": 0.0009085239329482231, "epoch": 5.521488469601677, "percentage": 27.61, "elapsed_time": "0:26:55", "remaining_time": "1:10:37", "throughput": 4259.4, "total_tokens": 6882408} {"current_steps": 10540, "total_steps": 38160, "loss": 0.6065, "lr": 0.0009083920369459941, "epoch": 5.524109014675052, "percentage": 27.62, "elapsed_time": "0:26:56", "remaining_time": "1:10:36", "throughput": 4259.45, "total_tokens": 6885448} {"current_steps": 10545, "total_steps": 38160, "loss": 0.5129, "lr": 0.00090826005551281, "epoch": 5.526729559748428, "percentage": 27.63, "elapsed_time": "0:26:57", "remaining_time": "1:10:35", "throughput": 4259.69, "total_tokens": 6889192} {"current_steps": 10550, "total_steps": 38160, "loss": 0.5354, "lr": 0.0009081279886762802, "epoch": 5.529350104821803, "percentage": 27.65, "elapsed_time": "0:26:58", "remaining_time": "1:10:34", "throughput": 4259.81, "total_tokens": 6892424} {"current_steps": 10555, "total_steps": 38160, "loss": 0.4358, "lr": 0.0009079958364640313, "epoch": 5.531970649895178, "percentage": 27.66, "elapsed_time": "0:26:58", "remaining_time": "1:10:33", "throughput": 4259.82, "total_tokens": 6895368} {"current_steps": 10560, "total_steps": 38160, "loss": 0.4621, "lr": 0.0009078635989037081, "epoch": 5.534591194968553, "percentage": 27.67, "elapsed_time": "0:26:59", "remaining_time": "1:10:32", "throughput": 4260.25, "total_tokens": 6899784} {"current_steps": 10565, "total_steps": 38160, "loss": 0.4768, "lr": 0.000907731276022973, "epoch": 5.537211740041929, "percentage": 27.69, "elapsed_time": "0:27:00", "remaining_time": "1:10:31", "throughput": 4260.19, "total_tokens": 6902504} {"current_steps": 10570, "total_steps": 38160, "loss": 0.4833, "lr": 0.0009075988678495066, "epoch": 5.539832285115304, "percentage": 27.7, "elapsed_time": "0:27:01", "remaining_time": "1:10:31", "throughput": 4260.43, "total_tokens": 6906184} {"current_steps": 10575, "total_steps": 38160, "loss": 0.4664, "lr": 0.0009074663744110073, "epoch": 5.5424528301886795, "percentage": 27.71, "elapsed_time": "0:27:01", "remaining_time": "1:10:30", "throughput": 4260.46, "total_tokens": 6909320} {"current_steps": 10580, "total_steps": 38160, "loss": 0.5179, "lr": 0.0009073337957351911, "epoch": 5.545073375262055, "percentage": 27.73, "elapsed_time": "0:27:02", "remaining_time": "1:10:29", "throughput": 4260.45, "total_tokens": 6912168} {"current_steps": 10585, "total_steps": 38160, "loss": 0.4882, "lr": 0.0009072011318497919, "epoch": 5.54769392033543, "percentage": 27.74, "elapsed_time": "0:27:03", "remaining_time": "1:10:28", "throughput": 4260.63, "total_tokens": 6915784} {"current_steps": 10590, "total_steps": 38160, "loss": 0.5077, "lr": 0.0009070683827825615, "epoch": 5.550314465408805, "percentage": 27.75, "elapsed_time": "0:27:03", "remaining_time": "1:10:27", "throughput": 4260.7, "total_tokens": 6918920} {"current_steps": 10595, "total_steps": 38160, "loss": 0.4326, "lr": 0.0009069355485612695, "epoch": 5.55293501048218, "percentage": 27.76, "elapsed_time": "0:27:04", "remaining_time": "1:10:26", "throughput": 4260.71, "total_tokens": 6921992} {"current_steps": 10600, "total_steps": 38160, "loss": 0.4204, "lr": 0.0009068026292137034, "epoch": 5.555555555555555, "percentage": 27.78, "elapsed_time": "0:27:05", "remaining_time": "1:10:25", "throughput": 4260.68, "total_tokens": 6924840} {"current_steps": 10605, "total_steps": 38160, "loss": 0.4159, "lr": 0.0009066696247676682, "epoch": 5.5581761006289305, "percentage": 27.79, "elapsed_time": "0:27:05", "remaining_time": "1:10:24", "throughput": 4260.7, "total_tokens": 6927848} {"current_steps": 10610, "total_steps": 38160, "loss": 0.5864, "lr": 0.0009065365352509871, "epoch": 5.560796645702306, "percentage": 27.8, "elapsed_time": "0:27:06", "remaining_time": "1:10:23", "throughput": 4260.63, "total_tokens": 6930568} {"current_steps": 10615, "total_steps": 38160, "loss": 0.3766, "lr": 0.0009064033606915008, "epoch": 5.563417190775681, "percentage": 27.82, "elapsed_time": "0:27:07", "remaining_time": "1:10:23", "throughput": 4260.74, "total_tokens": 6933992} {"current_steps": 10620, "total_steps": 38160, "loss": 0.4264, "lr": 0.000906270101117068, "epoch": 5.566037735849057, "percentage": 27.83, "elapsed_time": "0:27:08", "remaining_time": "1:10:21", "throughput": 4260.67, "total_tokens": 6936680} {"current_steps": 10625, "total_steps": 38160, "loss": 0.4794, "lr": 0.0009061367565555649, "epoch": 5.568658280922432, "percentage": 27.84, "elapsed_time": "0:27:08", "remaining_time": "1:10:20", "throughput": 4260.44, "total_tokens": 6938792} {"current_steps": 10630, "total_steps": 38160, "loss": 0.425, "lr": 0.000906003327034886, "epoch": 5.571278825995807, "percentage": 27.86, "elapsed_time": "0:27:09", "remaining_time": "1:10:20", "throughput": 4260.72, "total_tokens": 6942664} {"current_steps": 10635, "total_steps": 38160, "loss": 0.4929, "lr": 0.0009058698125829428, "epoch": 5.573899371069182, "percentage": 27.87, "elapsed_time": "0:27:10", "remaining_time": "1:10:18", "throughput": 4260.54, "total_tokens": 6944968} {"current_steps": 10640, "total_steps": 38160, "loss": 0.4848, "lr": 0.0009057362132276653, "epoch": 5.576519916142558, "percentage": 27.88, "elapsed_time": "0:27:10", "remaining_time": "1:10:18", "throughput": 4260.63, "total_tokens": 6948264} {"current_steps": 10645, "total_steps": 38160, "loss": 0.3961, "lr": 0.0009056025289970009, "epoch": 5.579140461215933, "percentage": 27.9, "elapsed_time": "0:27:11", "remaining_time": "1:10:17", "throughput": 4260.66, "total_tokens": 6951304} {"current_steps": 10650, "total_steps": 38160, "loss": 0.414, "lr": 0.0009054687599189148, "epoch": 5.581761006289308, "percentage": 27.91, "elapsed_time": "0:27:12", "remaining_time": "1:10:16", "throughput": 4260.66, "total_tokens": 6954184} {"current_steps": 10655, "total_steps": 38160, "loss": 0.6058, "lr": 0.0009053349060213899, "epoch": 5.584381551362683, "percentage": 27.92, "elapsed_time": "0:27:12", "remaining_time": "1:10:14", "throughput": 4260.5, "total_tokens": 6956552} {"current_steps": 10660, "total_steps": 38160, "loss": 0.5398, "lr": 0.0009052009673324269, "epoch": 5.587002096436059, "percentage": 27.94, "elapsed_time": "0:27:13", "remaining_time": "1:10:13", "throughput": 4260.48, "total_tokens": 6959496} {"current_steps": 10665, "total_steps": 38160, "loss": 0.6328, "lr": 0.0009050669438800445, "epoch": 5.589622641509434, "percentage": 27.95, "elapsed_time": "0:27:14", "remaining_time": "1:10:13", "throughput": 4260.54, "total_tokens": 6962600} {"current_steps": 10670, "total_steps": 38160, "loss": 0.4769, "lr": 0.0009049328356922786, "epoch": 5.5922431865828095, "percentage": 27.96, "elapsed_time": "0:27:14", "remaining_time": "1:10:11", "throughput": 4260.45, "total_tokens": 6965160} {"current_steps": 10675, "total_steps": 38160, "loss": 0.45, "lr": 0.0009047986427971831, "epoch": 5.594863731656185, "percentage": 27.97, "elapsed_time": "0:27:15", "remaining_time": "1:10:10", "throughput": 4260.39, "total_tokens": 6967880} {"current_steps": 10680, "total_steps": 38160, "loss": 0.4558, "lr": 0.0009046643652228297, "epoch": 5.59748427672956, "percentage": 27.99, "elapsed_time": "0:27:16", "remaining_time": "1:10:10", "throughput": 4260.65, "total_tokens": 6971624} {"current_steps": 10685, "total_steps": 38160, "loss": 0.4963, "lr": 0.0009045300029973079, "epoch": 5.600104821802935, "percentage": 28.0, "elapsed_time": "0:27:16", "remaining_time": "1:10:09", "throughput": 4260.7, "total_tokens": 6974696} {"current_steps": 10690, "total_steps": 38160, "loss": 0.6451, "lr": 0.0009043955561487245, "epoch": 5.60272536687631, "percentage": 28.01, "elapsed_time": "0:27:17", "remaining_time": "1:10:08", "throughput": 4260.64, "total_tokens": 6977544} {"current_steps": 10695, "total_steps": 38160, "loss": 0.2922, "lr": 0.0009042610247052044, "epoch": 5.605345911949685, "percentage": 28.03, "elapsed_time": "0:27:18", "remaining_time": "1:10:08", "throughput": 4261.46, "total_tokens": 6983688} {"current_steps": 10700, "total_steps": 38160, "loss": 0.4446, "lr": 0.0009041264086948899, "epoch": 5.6079664570230605, "percentage": 28.04, "elapsed_time": "0:27:19", "remaining_time": "1:10:07", "throughput": 4261.61, "total_tokens": 6987112} {"current_steps": 10705, "total_steps": 38160, "loss": 0.6183, "lr": 0.0009039917081459414, "epoch": 5.610587002096436, "percentage": 28.05, "elapsed_time": "0:27:20", "remaining_time": "1:10:06", "throughput": 4261.69, "total_tokens": 6990312} {"current_steps": 10710, "total_steps": 38160, "loss": 0.4, "lr": 0.0009038569230865363, "epoch": 5.613207547169811, "percentage": 28.07, "elapsed_time": "0:27:20", "remaining_time": "1:10:05", "throughput": 4261.47, "total_tokens": 6992456} {"current_steps": 10715, "total_steps": 38160, "loss": 0.422, "lr": 0.0009037220535448705, "epoch": 5.615828092243187, "percentage": 28.08, "elapsed_time": "0:27:21", "remaining_time": "1:10:04", "throughput": 4261.28, "total_tokens": 6994792} {"current_steps": 10720, "total_steps": 38160, "loss": 0.4809, "lr": 0.0009035870995491571, "epoch": 5.618448637316562, "percentage": 28.09, "elapsed_time": "0:27:22", "remaining_time": "1:10:03", "throughput": 4261.32, "total_tokens": 6997960} {"current_steps": 10725, "total_steps": 38160, "loss": 0.5777, "lr": 0.0009034520611276265, "epoch": 5.621069182389937, "percentage": 28.11, "elapsed_time": "0:27:22", "remaining_time": "1:10:02", "throughput": 4261.52, "total_tokens": 7001640} {"current_steps": 10730, "total_steps": 38160, "loss": 0.4384, "lr": 0.0009033169383085278, "epoch": 5.623689727463312, "percentage": 28.12, "elapsed_time": "0:27:23", "remaining_time": "1:10:01", "throughput": 4261.5, "total_tokens": 7004456} {"current_steps": 10735, "total_steps": 38160, "loss": 0.5145, "lr": 0.0009031817311201268, "epoch": 5.626310272536688, "percentage": 28.13, "elapsed_time": "0:27:24", "remaining_time": "1:10:00", "throughput": 4261.38, "total_tokens": 7006888} {"current_steps": 10740, "total_steps": 38160, "loss": 0.4246, "lr": 0.0009030464395907074, "epoch": 5.628930817610063, "percentage": 28.14, "elapsed_time": "0:27:25", "remaining_time": "1:09:59", "throughput": 4261.58, "total_tokens": 7010600} {"current_steps": 10745, "total_steps": 38160, "loss": 0.4609, "lr": 0.0009029110637485711, "epoch": 5.631551362683438, "percentage": 28.16, "elapsed_time": "0:27:25", "remaining_time": "1:09:59", "throughput": 4261.79, "total_tokens": 7014312} {"current_steps": 10750, "total_steps": 38160, "loss": 0.3997, "lr": 0.0009027756036220368, "epoch": 5.634171907756813, "percentage": 28.17, "elapsed_time": "0:27:26", "remaining_time": "1:09:58", "throughput": 4261.99, "total_tokens": 7017896} {"current_steps": 10755, "total_steps": 38160, "loss": 0.5173, "lr": 0.0009026400592394415, "epoch": 5.636792452830189, "percentage": 28.18, "elapsed_time": "0:27:27", "remaining_time": "1:09:57", "throughput": 4262.11, "total_tokens": 7021256} {"current_steps": 10760, "total_steps": 38160, "loss": 0.4666, "lr": 0.0009025044306291393, "epoch": 5.639412997903564, "percentage": 28.2, "elapsed_time": "0:27:28", "remaining_time": "1:09:56", "throughput": 4262.32, "total_tokens": 7024968} {"current_steps": 10765, "total_steps": 38160, "loss": 0.535, "lr": 0.0009023687178195022, "epoch": 5.6420335429769395, "percentage": 28.21, "elapsed_time": "0:27:28", "remaining_time": "1:09:55", "throughput": 4262.21, "total_tokens": 7027528} {"current_steps": 10770, "total_steps": 38160, "loss": 0.4437, "lr": 0.0009022329208389196, "epoch": 5.644654088050315, "percentage": 28.22, "elapsed_time": "0:27:29", "remaining_time": "1:09:55", "throughput": 4262.23, "total_tokens": 7030632} {"current_steps": 10775, "total_steps": 38160, "loss": 0.4171, "lr": 0.000902097039715799, "epoch": 5.64727463312369, "percentage": 28.24, "elapsed_time": "0:27:30", "remaining_time": "1:09:54", "throughput": 4262.49, "total_tokens": 7034568} {"current_steps": 10780, "total_steps": 38160, "loss": 0.5121, "lr": 0.0009019610744785651, "epoch": 5.649895178197065, "percentage": 28.25, "elapsed_time": "0:27:31", "remaining_time": "1:09:53", "throughput": 4262.5, "total_tokens": 7037544} {"current_steps": 10785, "total_steps": 38160, "loss": 0.4691, "lr": 0.0009018250251556603, "epoch": 5.65251572327044, "percentage": 28.26, "elapsed_time": "0:27:31", "remaining_time": "1:09:52", "throughput": 4262.69, "total_tokens": 7041256} {"current_steps": 10790, "total_steps": 38160, "loss": 0.3817, "lr": 0.0009016888917755445, "epoch": 5.655136268343815, "percentage": 28.28, "elapsed_time": "0:27:32", "remaining_time": "1:09:51", "throughput": 4262.5, "total_tokens": 7043528} {"current_steps": 10795, "total_steps": 38160, "loss": 0.4573, "lr": 0.0009015526743666951, "epoch": 5.6577568134171905, "percentage": 28.29, "elapsed_time": "0:27:33", "remaining_time": "1:09:50", "throughput": 4262.57, "total_tokens": 7046696} {"current_steps": 10800, "total_steps": 38160, "loss": 0.5839, "lr": 0.0009014163729576074, "epoch": 5.660377358490566, "percentage": 28.3, "elapsed_time": "0:27:33", "remaining_time": "1:09:49", "throughput": 4262.75, "total_tokens": 7050216} {"current_steps": 10805, "total_steps": 38160, "loss": 0.6432, "lr": 0.0009012799875767943, "epoch": 5.662997903563941, "percentage": 28.31, "elapsed_time": "0:27:34", "remaining_time": "1:09:49", "throughput": 4262.95, "total_tokens": 7053832} {"current_steps": 10810, "total_steps": 38160, "loss": 0.4565, "lr": 0.0009011435182527856, "epoch": 5.665618448637317, "percentage": 28.33, "elapsed_time": "0:27:35", "remaining_time": "1:09:48", "throughput": 4262.92, "total_tokens": 7056584} {"current_steps": 10815, "total_steps": 38160, "loss": 0.354, "lr": 0.0009010069650141295, "epoch": 5.668238993710692, "percentage": 28.34, "elapsed_time": "0:27:36", "remaining_time": "1:09:47", "throughput": 4262.82, "total_tokens": 7059240} {"current_steps": 10820, "total_steps": 38160, "loss": 0.5406, "lr": 0.0009008703278893913, "epoch": 5.670859538784067, "percentage": 28.35, "elapsed_time": "0:27:36", "remaining_time": "1:09:46", "throughput": 4262.88, "total_tokens": 7062280} {"current_steps": 10825, "total_steps": 38160, "loss": 0.5165, "lr": 0.0009007336069071537, "epoch": 5.673480083857442, "percentage": 28.37, "elapsed_time": "0:27:37", "remaining_time": "1:09:45", "throughput": 4262.9, "total_tokens": 7065288} {"current_steps": 10830, "total_steps": 38160, "loss": 0.5141, "lr": 0.0009005968020960175, "epoch": 5.676100628930818, "percentage": 28.38, "elapsed_time": "0:27:38", "remaining_time": "1:09:44", "throughput": 4263.15, "total_tokens": 7069160} {"current_steps": 10835, "total_steps": 38160, "loss": 0.5069, "lr": 0.0009004599134846004, "epoch": 5.678721174004193, "percentage": 28.39, "elapsed_time": "0:27:38", "remaining_time": "1:09:43", "throughput": 4263.28, "total_tokens": 7072552} {"current_steps": 10840, "total_steps": 38160, "loss": 0.3626, "lr": 0.0009003229411015382, "epoch": 5.681341719077568, "percentage": 28.41, "elapsed_time": "0:27:39", "remaining_time": "1:09:42", "throughput": 4263.44, "total_tokens": 7076040} {"current_steps": 10845, "total_steps": 38160, "loss": 0.5555, "lr": 0.0009001858849754838, "epoch": 5.683962264150943, "percentage": 28.42, "elapsed_time": "0:27:40", "remaining_time": "1:09:42", "throughput": 4263.54, "total_tokens": 7079368} {"current_steps": 10850, "total_steps": 38160, "loss": 0.3895, "lr": 0.0009000487451351078, "epoch": 5.686582809224319, "percentage": 28.43, "elapsed_time": "0:27:41", "remaining_time": "1:09:41", "throughput": 4263.62, "total_tokens": 7082632} {"current_steps": 10855, "total_steps": 38160, "loss": 0.4962, "lr": 0.0008999115216090985, "epoch": 5.689203354297694, "percentage": 28.45, "elapsed_time": "0:27:41", "remaining_time": "1:09:40", "throughput": 4263.52, "total_tokens": 7085192} {"current_steps": 10860, "total_steps": 38160, "loss": 0.3954, "lr": 0.0008997742144261612, "epoch": 5.6918238993710695, "percentage": 28.46, "elapsed_time": "0:27:42", "remaining_time": "1:09:39", "throughput": 4263.52, "total_tokens": 7088040} {"current_steps": 10865, "total_steps": 38160, "loss": 0.5083, "lr": 0.000899636823615019, "epoch": 5.694444444444445, "percentage": 28.47, "elapsed_time": "0:27:43", "remaining_time": "1:09:38", "throughput": 4263.46, "total_tokens": 7090664} {"current_steps": 10870, "total_steps": 38160, "loss": 0.4523, "lr": 0.0008994993492044127, "epoch": 5.69706498951782, "percentage": 28.49, "elapsed_time": "0:27:43", "remaining_time": "1:09:37", "throughput": 4263.35, "total_tokens": 7093224} {"current_steps": 10875, "total_steps": 38160, "loss": 0.4764, "lr": 0.0008993617912231003, "epoch": 5.699685534591195, "percentage": 28.5, "elapsed_time": "0:27:44", "remaining_time": "1:09:35", "throughput": 4263.33, "total_tokens": 7096008} {"current_steps": 10880, "total_steps": 38160, "loss": 0.4381, "lr": 0.0008992241496998572, "epoch": 5.70230607966457, "percentage": 28.51, "elapsed_time": "0:27:45", "remaining_time": "1:09:35", "throughput": 4263.25, "total_tokens": 7098760} {"current_steps": 10885, "total_steps": 38160, "loss": 0.5294, "lr": 0.0008990864246634767, "epoch": 5.704926624737945, "percentage": 28.52, "elapsed_time": "0:27:45", "remaining_time": "1:09:34", "throughput": 4263.38, "total_tokens": 7102120} {"current_steps": 10890, "total_steps": 38160, "loss": 0.4552, "lr": 0.0008989486161427691, "epoch": 5.7075471698113205, "percentage": 28.54, "elapsed_time": "0:27:46", "remaining_time": "1:09:33", "throughput": 4263.53, "total_tokens": 7105672} {"current_steps": 10895, "total_steps": 38160, "loss": 0.4505, "lr": 0.0008988107241665624, "epoch": 5.710167714884696, "percentage": 28.55, "elapsed_time": "0:27:47", "remaining_time": "1:09:32", "throughput": 4263.75, "total_tokens": 7109288} {"current_steps": 10900, "total_steps": 38160, "loss": 0.3771, "lr": 0.0008986727487637022, "epoch": 5.712788259958071, "percentage": 28.56, "elapsed_time": "0:27:48", "remaining_time": "1:09:31", "throughput": 4263.77, "total_tokens": 7112264} {"current_steps": 10905, "total_steps": 38160, "loss": 0.4049, "lr": 0.0008985346899630513, "epoch": 5.715408805031447, "percentage": 28.58, "elapsed_time": "0:27:48", "remaining_time": "1:09:30", "throughput": 4263.72, "total_tokens": 7114984} {"current_steps": 10910, "total_steps": 38160, "loss": 0.4605, "lr": 0.0008983965477934899, "epoch": 5.718029350104822, "percentage": 28.59, "elapsed_time": "0:27:49", "remaining_time": "1:09:29", "throughput": 4263.73, "total_tokens": 7117896} {"current_steps": 10915, "total_steps": 38160, "loss": 0.3843, "lr": 0.0008982583222839158, "epoch": 5.720649895178197, "percentage": 28.6, "elapsed_time": "0:27:50", "remaining_time": "1:09:28", "throughput": 4263.84, "total_tokens": 7121192} {"current_steps": 10920, "total_steps": 38160, "loss": 0.4532, "lr": 0.0008981200134632444, "epoch": 5.723270440251572, "percentage": 28.62, "elapsed_time": "0:27:50", "remaining_time": "1:09:28", "throughput": 4263.99, "total_tokens": 7124680} {"current_steps": 10925, "total_steps": 38160, "loss": 0.4396, "lr": 0.000897981621360408, "epoch": 5.725890985324948, "percentage": 28.63, "elapsed_time": "0:27:51", "remaining_time": "1:09:27", "throughput": 4264.01, "total_tokens": 7127624} {"current_steps": 10930, "total_steps": 38160, "loss": 0.4346, "lr": 0.0008978431460043569, "epoch": 5.728511530398323, "percentage": 28.64, "elapsed_time": "0:27:52", "remaining_time": "1:09:27", "throughput": 4265.0, "total_tokens": 7134792} {"current_steps": 10935, "total_steps": 38160, "loss": 0.3616, "lr": 0.0008977045874240585, "epoch": 5.731132075471698, "percentage": 28.66, "elapsed_time": "0:27:53", "remaining_time": "1:09:26", "throughput": 4264.89, "total_tokens": 7137448} {"current_steps": 10940, "total_steps": 38160, "loss": 0.5137, "lr": 0.0008975659456484977, "epoch": 5.733752620545073, "percentage": 28.67, "elapsed_time": "0:27:54", "remaining_time": "1:09:25", "throughput": 4265.15, "total_tokens": 7141384} {"current_steps": 10945, "total_steps": 38160, "loss": 0.5386, "lr": 0.0008974272207066767, "epoch": 5.736373165618449, "percentage": 28.68, "elapsed_time": "0:27:55", "remaining_time": "1:09:25", "throughput": 4265.11, "total_tokens": 7144296} {"current_steps": 10950, "total_steps": 38160, "loss": 0.5761, "lr": 0.0008972884126276152, "epoch": 5.738993710691824, "percentage": 28.69, "elapsed_time": "0:27:55", "remaining_time": "1:09:24", "throughput": 4265.41, "total_tokens": 7148328} {"current_steps": 10955, "total_steps": 38160, "loss": 0.5339, "lr": 0.0008971495214403502, "epoch": 5.7416142557651995, "percentage": 28.71, "elapsed_time": "0:27:56", "remaining_time": "1:09:23", "throughput": 4265.4, "total_tokens": 7151304} {"current_steps": 10960, "total_steps": 38160, "loss": 0.4166, "lr": 0.0008970105471739364, "epoch": 5.744234800838575, "percentage": 28.72, "elapsed_time": "0:27:57", "remaining_time": "1:09:22", "throughput": 4265.69, "total_tokens": 7155240} {"current_steps": 10965, "total_steps": 38160, "loss": 0.3637, "lr": 0.0008968714898574454, "epoch": 5.74685534591195, "percentage": 28.73, "elapsed_time": "0:27:58", "remaining_time": "1:09:22", "throughput": 4266.04, "total_tokens": 7159496} {"current_steps": 10970, "total_steps": 38160, "loss": 0.3857, "lr": 0.0008967323495199665, "epoch": 5.749475890985325, "percentage": 28.75, "elapsed_time": "0:27:59", "remaining_time": "1:09:21", "throughput": 4266.34, "total_tokens": 7163688} {"current_steps": 10975, "total_steps": 38160, "loss": 0.3779, "lr": 0.0008965931261906061, "epoch": 5.7520964360587, "percentage": 28.76, "elapsed_time": "0:27:59", "remaining_time": "1:09:20", "throughput": 4266.36, "total_tokens": 7166728} {"current_steps": 10980, "total_steps": 38160, "loss": 0.5295, "lr": 0.0008964538198984885, "epoch": 5.754716981132075, "percentage": 28.77, "elapsed_time": "0:28:00", "remaining_time": "1:09:20", "throughput": 4266.43, "total_tokens": 7169928} {"current_steps": 10985, "total_steps": 38160, "loss": 0.5413, "lr": 0.0008963144306727547, "epoch": 5.7573375262054505, "percentage": 28.79, "elapsed_time": "0:28:01", "remaining_time": "1:09:19", "throughput": 4266.43, "total_tokens": 7172936} {"current_steps": 10990, "total_steps": 38160, "loss": 0.4003, "lr": 0.0008961749585425634, "epoch": 5.759958071278826, "percentage": 28.8, "elapsed_time": "0:28:01", "remaining_time": "1:09:18", "throughput": 4266.22, "total_tokens": 7175240} {"current_steps": 10995, "total_steps": 38160, "loss": 0.4606, "lr": 0.0008960354035370905, "epoch": 5.762578616352201, "percentage": 28.81, "elapsed_time": "0:28:02", "remaining_time": "1:09:17", "throughput": 4266.23, "total_tokens": 7178216} {"current_steps": 11000, "total_steps": 38160, "loss": 0.502, "lr": 0.0008958957656855294, "epoch": 5.765199161425577, "percentage": 28.83, "elapsed_time": "0:28:03", "remaining_time": "1:09:16", "throughput": 4266.47, "total_tokens": 7182056} {"current_steps": 11005, "total_steps": 38160, "loss": 0.4518, "lr": 0.0008957560450170907, "epoch": 5.767819706498952, "percentage": 28.84, "elapsed_time": "0:28:04", "remaining_time": "1:09:15", "throughput": 4266.79, "total_tokens": 7186056} {"current_steps": 11010, "total_steps": 38160, "loss": 0.5896, "lr": 0.0008956162415610025, "epoch": 5.770440251572327, "percentage": 28.85, "elapsed_time": "0:28:04", "remaining_time": "1:09:14", "throughput": 4266.73, "total_tokens": 7188808} {"current_steps": 11015, "total_steps": 38160, "loss": 0.4643, "lr": 0.00089547635534651, "epoch": 5.773060796645702, "percentage": 28.87, "elapsed_time": "0:28:05", "remaining_time": "1:09:13", "throughput": 4266.89, "total_tokens": 7192328} {"current_steps": 11020, "total_steps": 38160, "loss": 0.5348, "lr": 0.0008953363864028758, "epoch": 5.7756813417190775, "percentage": 28.88, "elapsed_time": "0:28:06", "remaining_time": "1:09:13", "throughput": 4266.92, "total_tokens": 7195368} {"current_steps": 11025, "total_steps": 38160, "loss": 0.4765, "lr": 0.0008951963347593796, "epoch": 5.778301886792453, "percentage": 28.89, "elapsed_time": "0:28:07", "remaining_time": "1:09:12", "throughput": 4267.32, "total_tokens": 7199752} {"current_steps": 11030, "total_steps": 38160, "loss": 0.6353, "lr": 0.0008950562004453191, "epoch": 5.780922431865828, "percentage": 28.9, "elapsed_time": "0:28:07", "remaining_time": "1:09:11", "throughput": 4267.51, "total_tokens": 7203432} {"current_steps": 11035, "total_steps": 38160, "loss": 0.4104, "lr": 0.0008949159834900082, "epoch": 5.783542976939203, "percentage": 28.92, "elapsed_time": "0:28:08", "remaining_time": "1:09:10", "throughput": 4267.36, "total_tokens": 7205864} {"current_steps": 11040, "total_steps": 38160, "loss": 0.4322, "lr": 0.0008947756839227792, "epoch": 5.786163522012579, "percentage": 28.93, "elapsed_time": "0:28:09", "remaining_time": "1:09:09", "throughput": 4267.26, "total_tokens": 7208424} {"current_steps": 11045, "total_steps": 38160, "loss": 0.7984, "lr": 0.0008946353017729809, "epoch": 5.788784067085954, "percentage": 28.94, "elapsed_time": "0:28:09", "remaining_time": "1:09:08", "throughput": 4267.28, "total_tokens": 7211464} {"current_steps": 11050, "total_steps": 38160, "loss": 0.5371, "lr": 0.0008944948370699798, "epoch": 5.7914046121593294, "percentage": 28.96, "elapsed_time": "0:28:10", "remaining_time": "1:09:07", "throughput": 4267.29, "total_tokens": 7214472} {"current_steps": 11055, "total_steps": 38160, "loss": 0.4932, "lr": 0.0008943542898431593, "epoch": 5.794025157232705, "percentage": 28.97, "elapsed_time": "0:28:11", "remaining_time": "1:09:07", "throughput": 4267.49, "total_tokens": 7218184} {"current_steps": 11060, "total_steps": 38160, "loss": 0.4376, "lr": 0.0008942136601219205, "epoch": 5.79664570230608, "percentage": 28.98, "elapsed_time": "0:28:12", "remaining_time": "1:09:06", "throughput": 4267.59, "total_tokens": 7221480} {"current_steps": 11065, "total_steps": 38160, "loss": 0.3608, "lr": 0.0008940729479356813, "epoch": 5.799266247379455, "percentage": 29.0, "elapsed_time": "0:28:12", "remaining_time": "1:09:05", "throughput": 4267.61, "total_tokens": 7224424} {"current_steps": 11070, "total_steps": 38160, "loss": 0.5063, "lr": 0.0008939321533138774, "epoch": 5.80188679245283, "percentage": 29.01, "elapsed_time": "0:28:13", "remaining_time": "1:09:04", "throughput": 4267.54, "total_tokens": 7227144} {"current_steps": 11075, "total_steps": 38160, "loss": 0.4675, "lr": 0.0008937912762859611, "epoch": 5.804507337526205, "percentage": 29.02, "elapsed_time": "0:28:14", "remaining_time": "1:09:03", "throughput": 4267.45, "total_tokens": 7229768} {"current_steps": 11080, "total_steps": 38160, "loss": 0.3752, "lr": 0.0008936503168814024, "epoch": 5.8071278825995805, "percentage": 29.04, "elapsed_time": "0:28:14", "remaining_time": "1:09:02", "throughput": 4267.64, "total_tokens": 7233352} {"current_steps": 11085, "total_steps": 38160, "loss": 0.4638, "lr": 0.0008935092751296885, "epoch": 5.809748427672956, "percentage": 29.05, "elapsed_time": "0:28:15", "remaining_time": "1:09:01", "throughput": 4267.63, "total_tokens": 7236328} {"current_steps": 11090, "total_steps": 38160, "loss": 0.5808, "lr": 0.0008933681510603235, "epoch": 5.812368972746331, "percentage": 29.06, "elapsed_time": "0:28:16", "remaining_time": "1:09:00", "throughput": 4267.55, "total_tokens": 7238952} {"current_steps": 11095, "total_steps": 38160, "loss": 0.4309, "lr": 0.0008932269447028292, "epoch": 5.814989517819707, "percentage": 29.07, "elapsed_time": "0:28:17", "remaining_time": "1:08:59", "throughput": 4267.73, "total_tokens": 7242568} {"current_steps": 11100, "total_steps": 38160, "loss": 0.5837, "lr": 0.0008930856560867442, "epoch": 5.817610062893082, "percentage": 29.09, "elapsed_time": "0:28:17", "remaining_time": "1:08:58", "throughput": 4267.7, "total_tokens": 7245320} {"current_steps": 11105, "total_steps": 38160, "loss": 0.4109, "lr": 0.0008929442852416245, "epoch": 5.820230607966457, "percentage": 29.1, "elapsed_time": "0:28:18", "remaining_time": "1:08:57", "throughput": 4267.7, "total_tokens": 7248264} {"current_steps": 11110, "total_steps": 38160, "loss": 0.5823, "lr": 0.0008928028321970433, "epoch": 5.822851153039832, "percentage": 29.11, "elapsed_time": "0:28:19", "remaining_time": "1:08:56", "throughput": 4267.71, "total_tokens": 7251176} {"current_steps": 11115, "total_steps": 38160, "loss": 0.5001, "lr": 0.0008926612969825909, "epoch": 5.8254716981132075, "percentage": 29.13, "elapsed_time": "0:28:19", "remaining_time": "1:08:55", "throughput": 4267.64, "total_tokens": 7253864} {"current_steps": 11120, "total_steps": 38160, "loss": 0.3716, "lr": 0.000892519679627875, "epoch": 5.828092243186583, "percentage": 29.14, "elapsed_time": "0:28:20", "remaining_time": "1:08:55", "throughput": 4267.9, "total_tokens": 7257704} {"current_steps": 11125, "total_steps": 38160, "loss": 0.4161, "lr": 0.00089237798016252, "epoch": 5.830712788259958, "percentage": 29.15, "elapsed_time": "0:28:21", "remaining_time": "1:08:54", "throughput": 4267.98, "total_tokens": 7260936} {"current_steps": 11130, "total_steps": 38160, "loss": 0.4924, "lr": 0.0008922361986161682, "epoch": 5.833333333333333, "percentage": 29.17, "elapsed_time": "0:28:22", "remaining_time": "1:08:53", "throughput": 4268.14, "total_tokens": 7264456} {"current_steps": 11135, "total_steps": 38160, "loss": 0.6527, "lr": 0.0008920943350184785, "epoch": 5.835953878406709, "percentage": 29.18, "elapsed_time": "0:28:22", "remaining_time": "1:08:52", "throughput": 4268.2, "total_tokens": 7267624} {"current_steps": 11140, "total_steps": 38160, "loss": 0.4372, "lr": 0.0008919523893991271, "epoch": 5.838574423480084, "percentage": 29.19, "elapsed_time": "0:28:23", "remaining_time": "1:08:51", "throughput": 4268.25, "total_tokens": 7270760} {"current_steps": 11145, "total_steps": 38160, "loss": 0.461, "lr": 0.0008918103617878075, "epoch": 5.841194968553459, "percentage": 29.21, "elapsed_time": "0:28:24", "remaining_time": "1:08:50", "throughput": 4268.23, "total_tokens": 7273608} {"current_steps": 11150, "total_steps": 38160, "loss": 0.5293, "lr": 0.0008916682522142302, "epoch": 5.843815513626835, "percentage": 29.22, "elapsed_time": "0:28:24", "remaining_time": "1:08:49", "throughput": 4268.16, "total_tokens": 7276264} {"current_steps": 11155, "total_steps": 38160, "loss": 0.4686, "lr": 0.000891526060708123, "epoch": 5.84643605870021, "percentage": 29.23, "elapsed_time": "0:28:25", "remaining_time": "1:08:48", "throughput": 4268.21, "total_tokens": 7279336} {"current_steps": 11160, "total_steps": 38160, "loss": 0.4798, "lr": 0.0008913837872992306, "epoch": 5.849056603773585, "percentage": 29.25, "elapsed_time": "0:28:26", "remaining_time": "1:08:47", "throughput": 4268.25, "total_tokens": 7282376} {"current_steps": 11165, "total_steps": 38160, "loss": 0.4315, "lr": 0.000891241432017315, "epoch": 5.85167714884696, "percentage": 29.26, "elapsed_time": "0:28:26", "remaining_time": "1:08:46", "throughput": 4268.3, "total_tokens": 7285448} {"current_steps": 11170, "total_steps": 38160, "loss": 0.5128, "lr": 0.0008910989948921555, "epoch": 5.854297693920335, "percentage": 29.27, "elapsed_time": "0:28:27", "remaining_time": "1:08:46", "throughput": 4268.38, "total_tokens": 7288648} {"current_steps": 11175, "total_steps": 38160, "loss": 0.3978, "lr": 0.000890956475953548, "epoch": 5.8569182389937104, "percentage": 29.28, "elapsed_time": "0:28:28", "remaining_time": "1:08:45", "throughput": 4268.35, "total_tokens": 7291432} {"current_steps": 11180, "total_steps": 38160, "loss": 0.312, "lr": 0.0008908138752313061, "epoch": 5.859538784067086, "percentage": 29.3, "elapsed_time": "0:28:29", "remaining_time": "1:08:44", "throughput": 4268.96, "total_tokens": 7296744} {"current_steps": 11185, "total_steps": 38160, "loss": 0.3891, "lr": 0.0008906711927552601, "epoch": 5.862159329140461, "percentage": 29.31, "elapsed_time": "0:28:29", "remaining_time": "1:08:43", "throughput": 4268.92, "total_tokens": 7299496} {"current_steps": 11190, "total_steps": 38160, "loss": 0.4399, "lr": 0.0008905284285552575, "epoch": 5.864779874213837, "percentage": 29.32, "elapsed_time": "0:28:30", "remaining_time": "1:08:42", "throughput": 4268.91, "total_tokens": 7302440} {"current_steps": 11195, "total_steps": 38160, "loss": 0.3457, "lr": 0.0008903855826611631, "epoch": 5.867400419287212, "percentage": 29.34, "elapsed_time": "0:28:31", "remaining_time": "1:08:42", "throughput": 4269.03, "total_tokens": 7305864} {"current_steps": 11200, "total_steps": 38160, "loss": 0.4865, "lr": 0.0008902426551028586, "epoch": 5.870020964360587, "percentage": 29.35, "elapsed_time": "0:28:32", "remaining_time": "1:08:41", "throughput": 4269.1, "total_tokens": 7309096} {"current_steps": 11205, "total_steps": 38160, "loss": 0.6475, "lr": 0.0008900996459102428, "epoch": 5.872641509433962, "percentage": 29.36, "elapsed_time": "0:28:32", "remaining_time": "1:08:40", "throughput": 4269.28, "total_tokens": 7312648} {"current_steps": 11210, "total_steps": 38160, "loss": 0.4452, "lr": 0.0008899565551132315, "epoch": 5.8752620545073375, "percentage": 29.38, "elapsed_time": "0:28:33", "remaining_time": "1:08:39", "throughput": 4269.47, "total_tokens": 7316264} {"current_steps": 11215, "total_steps": 38160, "loss": 0.5072, "lr": 0.0008898133827417578, "epoch": 5.877882599580713, "percentage": 29.39, "elapsed_time": "0:28:34", "remaining_time": "1:08:39", "throughput": 4269.85, "total_tokens": 7320584} {"current_steps": 11220, "total_steps": 38160, "loss": 0.6705, "lr": 0.0008896701288257716, "epoch": 5.880503144654088, "percentage": 29.4, "elapsed_time": "0:28:35", "remaining_time": "1:08:38", "throughput": 4269.93, "total_tokens": 7323880} {"current_steps": 11225, "total_steps": 38160, "loss": 0.4695, "lr": 0.00088952679339524, "epoch": 5.883123689727463, "percentage": 29.42, "elapsed_time": "0:28:35", "remaining_time": "1:08:37", "throughput": 4269.97, "total_tokens": 7326984} {"current_steps": 11230, "total_steps": 38160, "loss": 0.4332, "lr": 0.0008893833764801473, "epoch": 5.885744234800838, "percentage": 29.43, "elapsed_time": "0:28:36", "remaining_time": "1:08:36", "throughput": 4270.13, "total_tokens": 7330504} {"current_steps": 11235, "total_steps": 38160, "loss": 0.4837, "lr": 0.0008892398781104945, "epoch": 5.888364779874214, "percentage": 29.44, "elapsed_time": "0:28:37", "remaining_time": "1:08:35", "throughput": 4270.14, "total_tokens": 7333480} {"current_steps": 11240, "total_steps": 38160, "loss": 0.3579, "lr": 0.0008890962983162997, "epoch": 5.890985324947589, "percentage": 29.45, "elapsed_time": "0:28:38", "remaining_time": "1:08:34", "throughput": 4270.08, "total_tokens": 7336232} {"current_steps": 11245, "total_steps": 38160, "loss": 0.3555, "lr": 0.0008889526371275987, "epoch": 5.893605870020965, "percentage": 29.47, "elapsed_time": "0:28:38", "remaining_time": "1:08:33", "throughput": 4269.99, "total_tokens": 7338920} {"current_steps": 11250, "total_steps": 38160, "loss": 0.4063, "lr": 0.0008888088945744432, "epoch": 5.89622641509434, "percentage": 29.48, "elapsed_time": "0:28:39", "remaining_time": "1:08:32", "throughput": 4269.93, "total_tokens": 7341512} {"current_steps": 11255, "total_steps": 38160, "loss": 0.5801, "lr": 0.0008886650706869027, "epoch": 5.898846960167715, "percentage": 29.49, "elapsed_time": "0:28:40", "remaining_time": "1:08:31", "throughput": 4270.12, "total_tokens": 7345128} {"current_steps": 11260, "total_steps": 38160, "loss": 0.4342, "lr": 0.0008885211654950636, "epoch": 5.90146750524109, "percentage": 29.51, "elapsed_time": "0:28:40", "remaining_time": "1:08:31", "throughput": 4270.19, "total_tokens": 7348328} {"current_steps": 11265, "total_steps": 38160, "loss": 0.6321, "lr": 0.0008883771790290291, "epoch": 5.904088050314465, "percentage": 29.52, "elapsed_time": "0:28:41", "remaining_time": "1:08:30", "throughput": 4270.22, "total_tokens": 7351336} {"current_steps": 11270, "total_steps": 38160, "loss": 0.5116, "lr": 0.0008882331113189197, "epoch": 5.90670859538784, "percentage": 29.53, "elapsed_time": "0:28:42", "remaining_time": "1:08:29", "throughput": 4270.46, "total_tokens": 7355208} {"current_steps": 11275, "total_steps": 38160, "loss": 0.3714, "lr": 0.0008880889623948724, "epoch": 5.909329140461216, "percentage": 29.55, "elapsed_time": "0:28:42", "remaining_time": "1:08:28", "throughput": 4270.36, "total_tokens": 7357768} {"current_steps": 11280, "total_steps": 38160, "loss": 0.4762, "lr": 0.000887944732287042, "epoch": 5.911949685534591, "percentage": 29.56, "elapsed_time": "0:28:43", "remaining_time": "1:08:27", "throughput": 4270.4, "total_tokens": 7360808} {"current_steps": 11285, "total_steps": 38160, "loss": 0.4397, "lr": 0.0008878004210255995, "epoch": 5.914570230607967, "percentage": 29.57, "elapsed_time": "0:28:44", "remaining_time": "1:08:26", "throughput": 4270.26, "total_tokens": 7363208} {"current_steps": 11290, "total_steps": 38160, "loss": 0.378, "lr": 0.0008876560286407329, "epoch": 5.917190775681342, "percentage": 29.59, "elapsed_time": "0:28:45", "remaining_time": "1:08:25", "throughput": 4270.36, "total_tokens": 7366504} {"current_steps": 11295, "total_steps": 38160, "loss": 0.4209, "lr": 0.000887511555162648, "epoch": 5.919811320754717, "percentage": 29.6, "elapsed_time": "0:28:45", "remaining_time": "1:08:24", "throughput": 4270.45, "total_tokens": 7369800} {"current_steps": 11300, "total_steps": 38160, "loss": 0.4679, "lr": 0.0008873670006215666, "epoch": 5.922431865828092, "percentage": 29.61, "elapsed_time": "0:28:46", "remaining_time": "1:08:23", "throughput": 4270.45, "total_tokens": 7372680} {"current_steps": 11305, "total_steps": 38160, "loss": 0.4905, "lr": 0.0008872223650477281, "epoch": 5.9250524109014675, "percentage": 29.63, "elapsed_time": "0:28:47", "remaining_time": "1:08:23", "throughput": 4270.93, "total_tokens": 7377480} {"current_steps": 11310, "total_steps": 38160, "loss": 0.4177, "lr": 0.0008870776484713882, "epoch": 5.927672955974843, "percentage": 29.64, "elapsed_time": "0:28:48", "remaining_time": "1:08:22", "throughput": 4270.96, "total_tokens": 7380456} {"current_steps": 11315, "total_steps": 38160, "loss": 0.5529, "lr": 0.0008869328509228205, "epoch": 5.930293501048218, "percentage": 29.65, "elapsed_time": "0:28:48", "remaining_time": "1:08:21", "throughput": 4270.93, "total_tokens": 7383208} {"current_steps": 11320, "total_steps": 38160, "loss": 0.4184, "lr": 0.0008867879724323147, "epoch": 5.932914046121593, "percentage": 29.66, "elapsed_time": "0:28:49", "remaining_time": "1:08:20", "throughput": 4270.78, "total_tokens": 7385576} {"current_steps": 11325, "total_steps": 38160, "loss": 0.4013, "lr": 0.0008866430130301777, "epoch": 5.935534591194968, "percentage": 29.68, "elapsed_time": "0:28:49", "remaining_time": "1:08:19", "throughput": 4270.69, "total_tokens": 7388296} {"current_steps": 11330, "total_steps": 38160, "loss": 0.575, "lr": 0.0008864979727467335, "epoch": 5.938155136268344, "percentage": 29.69, "elapsed_time": "0:28:50", "remaining_time": "1:08:18", "throughput": 4270.85, "total_tokens": 7391784} {"current_steps": 11335, "total_steps": 38160, "loss": 0.4394, "lr": 0.000886352851612323, "epoch": 5.940775681341719, "percentage": 29.7, "elapsed_time": "0:28:51", "remaining_time": "1:08:17", "throughput": 4270.93, "total_tokens": 7395016} {"current_steps": 11340, "total_steps": 38160, "loss": 0.3806, "lr": 0.0008862076496573034, "epoch": 5.943396226415095, "percentage": 29.72, "elapsed_time": "0:28:52", "remaining_time": "1:08:17", "throughput": 4271.14, "total_tokens": 7398856} {"current_steps": 11345, "total_steps": 38160, "loss": 0.5034, "lr": 0.0008860623669120496, "epoch": 5.94601677148847, "percentage": 29.73, "elapsed_time": "0:28:52", "remaining_time": "1:08:16", "throughput": 4271.16, "total_tokens": 7401864} {"current_steps": 11350, "total_steps": 38160, "loss": 0.649, "lr": 0.0008859170034069533, "epoch": 5.948637316561845, "percentage": 29.74, "elapsed_time": "0:28:53", "remaining_time": "1:08:14", "throughput": 4271.05, "total_tokens": 7404360} {"current_steps": 11355, "total_steps": 38160, "loss": 0.5093, "lr": 0.0008857715591724225, "epoch": 5.95125786163522, "percentage": 29.76, "elapsed_time": "0:28:54", "remaining_time": "1:08:14", "throughput": 4271.08, "total_tokens": 7407464} {"current_steps": 11360, "total_steps": 38160, "loss": 0.5114, "lr": 0.0008856260342388827, "epoch": 5.953878406708595, "percentage": 29.77, "elapsed_time": "0:28:55", "remaining_time": "1:08:13", "throughput": 4271.29, "total_tokens": 7411144} {"current_steps": 11365, "total_steps": 38160, "loss": 0.4748, "lr": 0.0008854804286367758, "epoch": 5.95649895178197, "percentage": 29.78, "elapsed_time": "0:28:55", "remaining_time": "1:08:12", "throughput": 4271.38, "total_tokens": 7414376} {"current_steps": 11370, "total_steps": 38160, "loss": 0.5426, "lr": 0.0008853347423965612, "epoch": 5.959119496855346, "percentage": 29.8, "elapsed_time": "0:28:56", "remaining_time": "1:08:11", "throughput": 4271.47, "total_tokens": 7417672} {"current_steps": 11375, "total_steps": 38160, "loss": 0.4396, "lr": 0.0008851889755487146, "epoch": 5.961740041928721, "percentage": 29.81, "elapsed_time": "0:28:57", "remaining_time": "1:08:10", "throughput": 4271.43, "total_tokens": 7420392} {"current_steps": 11380, "total_steps": 38160, "loss": 0.4144, "lr": 0.0008850431281237288, "epoch": 5.964360587002097, "percentage": 29.82, "elapsed_time": "0:28:57", "remaining_time": "1:08:09", "throughput": 4271.58, "total_tokens": 7423880} {"current_steps": 11385, "total_steps": 38160, "loss": 0.5231, "lr": 0.0008848972001521134, "epoch": 5.966981132075472, "percentage": 29.83, "elapsed_time": "0:28:58", "remaining_time": "1:08:09", "throughput": 4271.81, "total_tokens": 7427624} {"current_steps": 11390, "total_steps": 38160, "loss": 0.4042, "lr": 0.0008847511916643948, "epoch": 5.969601677148847, "percentage": 29.85, "elapsed_time": "0:28:59", "remaining_time": "1:08:08", "throughput": 4271.82, "total_tokens": 7430536} {"current_steps": 11395, "total_steps": 38160, "loss": 0.5766, "lr": 0.0008846051026911164, "epoch": 5.972222222222222, "percentage": 29.86, "elapsed_time": "0:29:00", "remaining_time": "1:08:07", "throughput": 4271.73, "total_tokens": 7433192} {"current_steps": 11400, "total_steps": 38160, "loss": 0.4277, "lr": 0.0008844589332628383, "epoch": 5.9748427672955975, "percentage": 29.87, "elapsed_time": "0:29:00", "remaining_time": "1:08:06", "throughput": 4271.72, "total_tokens": 7436104} {"current_steps": 11405, "total_steps": 38160, "loss": 0.4061, "lr": 0.0008843126834101376, "epoch": 5.977463312368973, "percentage": 29.89, "elapsed_time": "0:29:01", "remaining_time": "1:08:05", "throughput": 4271.83, "total_tokens": 7439432} {"current_steps": 11410, "total_steps": 38160, "loss": 0.4266, "lr": 0.000884166353163608, "epoch": 5.980083857442348, "percentage": 29.9, "elapsed_time": "0:29:02", "remaining_time": "1:08:04", "throughput": 4271.72, "total_tokens": 7441960} {"current_steps": 11415, "total_steps": 38160, "loss": 0.3853, "lr": 0.0008840199425538599, "epoch": 5.982704402515723, "percentage": 29.91, "elapsed_time": "0:29:02", "remaining_time": "1:08:03", "throughput": 4271.9, "total_tokens": 7445576} {"current_steps": 11420, "total_steps": 38160, "loss": 0.4575, "lr": 0.0008838734516115213, "epoch": 5.985324947589098, "percentage": 29.93, "elapsed_time": "0:29:03", "remaining_time": "1:08:02", "throughput": 4271.8, "total_tokens": 7448104} {"current_steps": 11425, "total_steps": 38160, "loss": 0.5107, "lr": 0.0008837268803672359, "epoch": 5.987945492662474, "percentage": 29.94, "elapsed_time": "0:29:04", "remaining_time": "1:08:01", "throughput": 4272.04, "total_tokens": 7451976} {"current_steps": 11430, "total_steps": 38160, "loss": 0.4347, "lr": 0.0008835802288516647, "epoch": 5.990566037735849, "percentage": 29.95, "elapsed_time": "0:29:05", "remaining_time": "1:08:01", "throughput": 4272.51, "total_tokens": 7456744} {"current_steps": 11435, "total_steps": 38160, "loss": 0.5367, "lr": 0.0008834334970954861, "epoch": 5.993186582809225, "percentage": 29.97, "elapsed_time": "0:29:06", "remaining_time": "1:08:00", "throughput": 4272.69, "total_tokens": 7460392} {"current_steps": 11440, "total_steps": 38160, "loss": 0.4959, "lr": 0.0008832866851293941, "epoch": 5.9958071278826, "percentage": 29.98, "elapsed_time": "0:29:06", "remaining_time": "1:07:59", "throughput": 4272.74, "total_tokens": 7463496} {"current_steps": 11445, "total_steps": 38160, "loss": 0.5946, "lr": 0.0008831397929841005, "epoch": 5.998427672955975, "percentage": 29.99, "elapsed_time": "0:29:07", "remaining_time": "1:07:58", "throughput": 4272.75, "total_tokens": 7466376} {"current_steps": 11448, "total_steps": 38160, "eval_loss": 0.454883873462677, "epoch": 6.0, "percentage": 30.0, "elapsed_time": "0:29:21", "remaining_time": "1:08:30", "throughput": 4239.48, "total_tokens": 7467968} {"current_steps": 11450, "total_steps": 38160, "loss": 0.5258, "lr": 0.0008829928206903333, "epoch": 6.00104821802935, "percentage": 30.01, "elapsed_time": "0:29:23", "remaining_time": "1:08:33", "throughput": 4235.38, "total_tokens": 7468896} {"current_steps": 11455, "total_steps": 38160, "loss": 0.4819, "lr": 0.0008828457682788373, "epoch": 6.003668763102725, "percentage": 30.02, "elapsed_time": "0:29:24", "remaining_time": "1:08:32", "throughput": 4235.62, "total_tokens": 7472640} {"current_steps": 11460, "total_steps": 38160, "loss": 0.434, "lr": 0.0008826986357803743, "epoch": 6.0062893081761, "percentage": 30.03, "elapsed_time": "0:29:24", "remaining_time": "1:08:32", "throughput": 4235.81, "total_tokens": 7476192} {"current_steps": 11465, "total_steps": 38160, "loss": 0.3968, "lr": 0.0008825514232257228, "epoch": 6.008909853249476, "percentage": 30.04, "elapsed_time": "0:29:25", "remaining_time": "1:08:31", "throughput": 4235.98, "total_tokens": 7479712} {"current_steps": 11470, "total_steps": 38160, "loss": 0.4481, "lr": 0.000882404130645678, "epoch": 6.011530398322851, "percentage": 30.06, "elapsed_time": "0:29:26", "remaining_time": "1:08:30", "throughput": 4236.04, "total_tokens": 7482816} {"current_steps": 11475, "total_steps": 38160, "loss": 0.5462, "lr": 0.0008822567580710518, "epoch": 6.014150943396227, "percentage": 30.07, "elapsed_time": "0:29:27", "remaining_time": "1:08:29", "throughput": 4236.08, "total_tokens": 7485760} {"current_steps": 11480, "total_steps": 38160, "loss": 0.5274, "lr": 0.0008821093055326728, "epoch": 6.016771488469602, "percentage": 30.08, "elapsed_time": "0:29:27", "remaining_time": "1:08:28", "throughput": 4236.28, "total_tokens": 7489440} {"current_steps": 11485, "total_steps": 38160, "loss": 0.2983, "lr": 0.0008819617730613863, "epoch": 6.019392033542977, "percentage": 30.1, "elapsed_time": "0:29:28", "remaining_time": "1:08:27", "throughput": 4236.38, "total_tokens": 7492704} {"current_steps": 11490, "total_steps": 38160, "loss": 0.4871, "lr": 0.0008818141606880545, "epoch": 6.022012578616352, "percentage": 30.11, "elapsed_time": "0:29:29", "remaining_time": "1:08:26", "throughput": 4236.46, "total_tokens": 7495776} {"current_steps": 11495, "total_steps": 38160, "loss": 0.4376, "lr": 0.0008816664684435564, "epoch": 6.0246331236897275, "percentage": 30.12, "elapsed_time": "0:29:30", "remaining_time": "1:08:25", "throughput": 4236.42, "total_tokens": 7498560} {"current_steps": 11500, "total_steps": 38160, "loss": 0.443, "lr": 0.0008815186963587873, "epoch": 6.027253668763103, "percentage": 30.14, "elapsed_time": "0:29:30", "remaining_time": "1:08:24", "throughput": 4236.29, "total_tokens": 7500992} {"current_steps": 11505, "total_steps": 38160, "loss": 0.5716, "lr": 0.0008813708444646596, "epoch": 6.029874213836478, "percentage": 30.15, "elapsed_time": "0:29:31", "remaining_time": "1:08:23", "throughput": 4236.38, "total_tokens": 7504192} {"current_steps": 11510, "total_steps": 38160, "loss": 0.4538, "lr": 0.0008812229127921021, "epoch": 6.032494758909853, "percentage": 30.16, "elapsed_time": "0:29:32", "remaining_time": "1:08:23", "throughput": 4236.52, "total_tokens": 7507552} {"current_steps": 11515, "total_steps": 38160, "loss": 0.5338, "lr": 0.0008810749013720605, "epoch": 6.035115303983228, "percentage": 30.18, "elapsed_time": "0:29:32", "remaining_time": "1:08:22", "throughput": 4236.56, "total_tokens": 7510592} {"current_steps": 11520, "total_steps": 38160, "loss": 0.549, "lr": 0.0008809268102354969, "epoch": 6.037735849056604, "percentage": 30.19, "elapsed_time": "0:29:33", "remaining_time": "1:08:21", "throughput": 4236.61, "total_tokens": 7513664} {"current_steps": 11525, "total_steps": 38160, "loss": 0.4802, "lr": 0.0008807786394133905, "epoch": 6.040356394129979, "percentage": 30.2, "elapsed_time": "0:29:34", "remaining_time": "1:08:20", "throughput": 4236.53, "total_tokens": 7516320} {"current_steps": 11530, "total_steps": 38160, "loss": 0.385, "lr": 0.0008806303889367371, "epoch": 6.0429769392033545, "percentage": 30.21, "elapsed_time": "0:29:34", "remaining_time": "1:08:19", "throughput": 4236.43, "total_tokens": 7518944} {"current_steps": 11535, "total_steps": 38160, "loss": 0.4541, "lr": 0.0008804820588365485, "epoch": 6.04559748427673, "percentage": 30.23, "elapsed_time": "0:29:35", "remaining_time": "1:08:18", "throughput": 4236.31, "total_tokens": 7521376} {"current_steps": 11540, "total_steps": 38160, "loss": 0.4641, "lr": 0.0008803336491438543, "epoch": 6.048218029350105, "percentage": 30.24, "elapsed_time": "0:29:36", "remaining_time": "1:08:17", "throughput": 4236.87, "total_tokens": 7526432} {"current_steps": 11545, "total_steps": 38160, "loss": 0.3714, "lr": 0.0008801851598896995, "epoch": 6.05083857442348, "percentage": 30.25, "elapsed_time": "0:29:37", "remaining_time": "1:08:17", "throughput": 4237.52, "total_tokens": 7532064} {"current_steps": 11550, "total_steps": 38160, "loss": 0.4291, "lr": 0.0008800365911051467, "epoch": 6.053459119496855, "percentage": 30.27, "elapsed_time": "0:29:38", "remaining_time": "1:08:16", "throughput": 4237.62, "total_tokens": 7535360} {"current_steps": 11555, "total_steps": 38160, "loss": 0.3585, "lr": 0.0008798879428212747, "epoch": 6.05607966457023, "percentage": 30.28, "elapsed_time": "0:29:39", "remaining_time": "1:08:16", "throughput": 4237.87, "total_tokens": 7539232} {"current_steps": 11560, "total_steps": 38160, "loss": 0.5719, "lr": 0.0008797392150691792, "epoch": 6.058700209643606, "percentage": 30.29, "elapsed_time": "0:29:39", "remaining_time": "1:08:15", "throughput": 4237.98, "total_tokens": 7542464} {"current_steps": 11565, "total_steps": 38160, "loss": 0.3821, "lr": 0.000879590407879972, "epoch": 6.061320754716981, "percentage": 30.31, "elapsed_time": "0:29:40", "remaining_time": "1:08:14", "throughput": 4238.18, "total_tokens": 7546176} {"current_steps": 11570, "total_steps": 38160, "loss": 0.5764, "lr": 0.0008794415212847822, "epoch": 6.063941299790357, "percentage": 30.32, "elapsed_time": "0:29:41", "remaining_time": "1:08:13", "throughput": 4238.35, "total_tokens": 7549696} {"current_steps": 11575, "total_steps": 38160, "loss": 0.3708, "lr": 0.000879292555314755, "epoch": 6.066561844863732, "percentage": 30.33, "elapsed_time": "0:29:41", "remaining_time": "1:08:12", "throughput": 4238.33, "total_tokens": 7552544} {"current_steps": 11580, "total_steps": 38160, "loss": 0.374, "lr": 0.0008791435100010524, "epoch": 6.069182389937107, "percentage": 30.35, "elapsed_time": "0:29:42", "remaining_time": "1:08:11", "throughput": 4238.26, "total_tokens": 7555168} {"current_steps": 11585, "total_steps": 38160, "loss": 0.6497, "lr": 0.000878994385374853, "epoch": 6.071802935010482, "percentage": 30.36, "elapsed_time": "0:29:43", "remaining_time": "1:08:10", "throughput": 4238.38, "total_tokens": 7558528} {"current_steps": 11590, "total_steps": 38160, "loss": 0.5115, "lr": 0.0008788451814673521, "epoch": 6.0744234800838575, "percentage": 30.37, "elapsed_time": "0:29:44", "remaining_time": "1:08:09", "throughput": 4238.47, "total_tokens": 7561760} {"current_steps": 11595, "total_steps": 38160, "loss": 0.5464, "lr": 0.0008786958983097613, "epoch": 6.077044025157233, "percentage": 30.39, "elapsed_time": "0:29:44", "remaining_time": "1:08:09", "throughput": 4238.63, "total_tokens": 7565312} {"current_steps": 11600, "total_steps": 38160, "loss": 0.5093, "lr": 0.0008785465359333088, "epoch": 6.079664570230608, "percentage": 30.4, "elapsed_time": "0:29:45", "remaining_time": "1:08:08", "throughput": 4238.75, "total_tokens": 7568640} {"current_steps": 11605, "total_steps": 38160, "loss": 0.5056, "lr": 0.0008783970943692398, "epoch": 6.082285115303983, "percentage": 30.41, "elapsed_time": "0:29:46", "remaining_time": "1:08:07", "throughput": 4238.89, "total_tokens": 7572096} {"current_steps": 11610, "total_steps": 38160, "loss": 0.4786, "lr": 0.0008782475736488156, "epoch": 6.084905660377358, "percentage": 30.42, "elapsed_time": "0:29:47", "remaining_time": "1:08:06", "throughput": 4238.86, "total_tokens": 7574944} {"current_steps": 11615, "total_steps": 38160, "loss": 0.6351, "lr": 0.0008780979738033142, "epoch": 6.087526205450734, "percentage": 30.44, "elapsed_time": "0:29:47", "remaining_time": "1:08:05", "throughput": 4238.94, "total_tokens": 7578080} {"current_steps": 11620, "total_steps": 38160, "loss": 0.4412, "lr": 0.0008779482948640305, "epoch": 6.090146750524109, "percentage": 30.45, "elapsed_time": "0:29:48", "remaining_time": "1:08:04", "throughput": 4238.7, "total_tokens": 7580128} {"current_steps": 11625, "total_steps": 38160, "loss": 0.5, "lr": 0.0008777985368622752, "epoch": 6.0927672955974845, "percentage": 30.46, "elapsed_time": "0:29:49", "remaining_time": "1:08:03", "throughput": 4238.92, "total_tokens": 7583968} {"current_steps": 11630, "total_steps": 38160, "loss": 0.3776, "lr": 0.0008776486998293762, "epoch": 6.09538784067086, "percentage": 30.48, "elapsed_time": "0:29:49", "remaining_time": "1:08:02", "throughput": 4238.78, "total_tokens": 7586368} {"current_steps": 11635, "total_steps": 38160, "loss": 0.4767, "lr": 0.0008774987837966775, "epoch": 6.098008385744235, "percentage": 30.49, "elapsed_time": "0:29:50", "remaining_time": "1:08:01", "throughput": 4238.91, "total_tokens": 7589728} {"current_steps": 11640, "total_steps": 38160, "loss": 0.5784, "lr": 0.0008773487887955401, "epoch": 6.10062893081761, "percentage": 30.5, "elapsed_time": "0:29:51", "remaining_time": "1:08:00", "throughput": 4238.82, "total_tokens": 7592224} {"current_steps": 11645, "total_steps": 38160, "loss": 0.6193, "lr": 0.000877198714857341, "epoch": 6.103249475890985, "percentage": 30.52, "elapsed_time": "0:29:51", "remaining_time": "1:07:59", "throughput": 4238.94, "total_tokens": 7595648} {"current_steps": 11650, "total_steps": 38160, "loss": 0.3699, "lr": 0.000877048562013474, "epoch": 6.10587002096436, "percentage": 30.53, "elapsed_time": "0:29:52", "remaining_time": "1:07:59", "throughput": 4238.99, "total_tokens": 7598784} {"current_steps": 11655, "total_steps": 38160, "loss": 0.3931, "lr": 0.0008768983302953498, "epoch": 6.1084905660377355, "percentage": 30.54, "elapsed_time": "0:29:53", "remaining_time": "1:07:58", "throughput": 4239.11, "total_tokens": 7602112} {"current_steps": 11660, "total_steps": 38160, "loss": 0.4241, "lr": 0.0008767480197343945, "epoch": 6.111111111111111, "percentage": 30.56, "elapsed_time": "0:29:54", "remaining_time": "1:07:58", "throughput": 4239.94, "total_tokens": 7608768} {"current_steps": 11665, "total_steps": 38160, "loss": 0.5998, "lr": 0.0008765976303620515, "epoch": 6.113731656184487, "percentage": 30.57, "elapsed_time": "0:29:55", "remaining_time": "1:07:57", "throughput": 4240.09, "total_tokens": 7612224} {"current_steps": 11670, "total_steps": 38160, "loss": 0.3795, "lr": 0.0008764471622097809, "epoch": 6.116352201257862, "percentage": 30.58, "elapsed_time": "0:29:56", "remaining_time": "1:07:57", "throughput": 4240.51, "total_tokens": 7616768} {"current_steps": 11675, "total_steps": 38160, "loss": 0.4578, "lr": 0.0008762966153090588, "epoch": 6.118972746331237, "percentage": 30.59, "elapsed_time": "0:29:56", "remaining_time": "1:07:56", "throughput": 4240.54, "total_tokens": 7619840} {"current_steps": 11680, "total_steps": 38160, "loss": 0.4886, "lr": 0.0008761459896913776, "epoch": 6.121593291404612, "percentage": 30.61, "elapsed_time": "0:29:57", "remaining_time": "1:07:55", "throughput": 4240.63, "total_tokens": 7623104} {"current_steps": 11685, "total_steps": 38160, "loss": 0.5043, "lr": 0.0008759952853882466, "epoch": 6.1242138364779874, "percentage": 30.62, "elapsed_time": "0:29:58", "remaining_time": "1:07:54", "throughput": 4240.59, "total_tokens": 7625856} {"current_steps": 11690, "total_steps": 38160, "loss": 0.3367, "lr": 0.0008758445024311917, "epoch": 6.126834381551363, "percentage": 30.63, "elapsed_time": "0:29:59", "remaining_time": "1:07:53", "throughput": 4240.81, "total_tokens": 7629600} {"current_steps": 11695, "total_steps": 38160, "loss": 0.5205, "lr": 0.0008756936408517547, "epoch": 6.129454926624738, "percentage": 30.65, "elapsed_time": "0:29:59", "remaining_time": "1:07:52", "throughput": 4240.93, "total_tokens": 7632960} {"current_steps": 11700, "total_steps": 38160, "loss": 0.506, "lr": 0.000875542700681494, "epoch": 6.132075471698113, "percentage": 30.66, "elapsed_time": "0:30:00", "remaining_time": "1:07:51", "throughput": 4240.92, "total_tokens": 7635840} {"current_steps": 11705, "total_steps": 38160, "loss": 0.591, "lr": 0.0008753916819519849, "epoch": 6.134696016771488, "percentage": 30.67, "elapsed_time": "0:30:01", "remaining_time": "1:07:51", "throughput": 4241.05, "total_tokens": 7639232} {"current_steps": 11710, "total_steps": 38160, "loss": 0.4359, "lr": 0.0008752405846948186, "epoch": 6.137316561844864, "percentage": 30.69, "elapsed_time": "0:30:02", "remaining_time": "1:07:51", "throughput": 4241.9, "total_tokens": 7645888} {"current_steps": 11715, "total_steps": 38160, "loss": 0.3697, "lr": 0.0008750894089416029, "epoch": 6.139937106918239, "percentage": 30.7, "elapsed_time": "0:30:03", "remaining_time": "1:07:50", "throughput": 4241.87, "total_tokens": 7648608} {"current_steps": 11720, "total_steps": 38160, "loss": 0.5461, "lr": 0.0008749381547239621, "epoch": 6.1425576519916145, "percentage": 30.71, "elapsed_time": "0:30:03", "remaining_time": "1:07:49", "throughput": 4241.76, "total_tokens": 7651072} {"current_steps": 11725, "total_steps": 38160, "loss": 0.649, "lr": 0.000874786822073537, "epoch": 6.14517819706499, "percentage": 30.73, "elapsed_time": "0:30:04", "remaining_time": "1:07:48", "throughput": 4241.86, "total_tokens": 7654304} {"current_steps": 11730, "total_steps": 38160, "loss": 0.4655, "lr": 0.0008746354110219843, "epoch": 6.147798742138365, "percentage": 30.74, "elapsed_time": "0:30:05", "remaining_time": "1:07:47", "throughput": 4241.96, "total_tokens": 7657568} {"current_steps": 11735, "total_steps": 38160, "loss": 0.3936, "lr": 0.0008744839216009779, "epoch": 6.15041928721174, "percentage": 30.75, "elapsed_time": "0:30:05", "remaining_time": "1:07:46", "throughput": 4242.11, "total_tokens": 7661056} {"current_steps": 11740, "total_steps": 38160, "loss": 0.3983, "lr": 0.0008743323538422072, "epoch": 6.153039832285115, "percentage": 30.77, "elapsed_time": "0:30:07", "remaining_time": "1:07:46", "throughput": 4242.87, "total_tokens": 7667360} {"current_steps": 11745, "total_steps": 38160, "loss": 0.4151, "lr": 0.0008741807077773789, "epoch": 6.15566037735849, "percentage": 30.78, "elapsed_time": "0:30:07", "remaining_time": "1:07:46", "throughput": 4243.12, "total_tokens": 7671200} {"current_steps": 11750, "total_steps": 38160, "loss": 0.6407, "lr": 0.0008740289834382153, "epoch": 6.1582809224318655, "percentage": 30.79, "elapsed_time": "0:30:08", "remaining_time": "1:07:45", "throughput": 4243.15, "total_tokens": 7674144} {"current_steps": 11755, "total_steps": 38160, "loss": 0.4225, "lr": 0.0008738771808564555, "epoch": 6.160901467505241, "percentage": 30.8, "elapsed_time": "0:30:09", "remaining_time": "1:07:44", "throughput": 4243.26, "total_tokens": 7677408} {"current_steps": 11760, "total_steps": 38160, "loss": 0.6041, "lr": 0.000873725300063855, "epoch": 6.163522012578617, "percentage": 30.82, "elapsed_time": "0:30:09", "remaining_time": "1:07:43", "throughput": 4243.23, "total_tokens": 7680160} {"current_steps": 11765, "total_steps": 38160, "loss": 0.4923, "lr": 0.0008735733410921853, "epoch": 6.166142557651992, "percentage": 30.83, "elapsed_time": "0:30:10", "remaining_time": "1:07:42", "throughput": 4243.21, "total_tokens": 7682848} {"current_steps": 11770, "total_steps": 38160, "loss": 0.481, "lr": 0.0008734213039732346, "epoch": 6.168763102725367, "percentage": 30.84, "elapsed_time": "0:30:11", "remaining_time": "1:07:41", "throughput": 4243.22, "total_tokens": 7685728} {"current_steps": 11775, "total_steps": 38160, "loss": 0.424, "lr": 0.0008732691887388073, "epoch": 6.171383647798742, "percentage": 30.86, "elapsed_time": "0:30:12", "remaining_time": "1:07:40", "throughput": 4243.34, "total_tokens": 7688960} {"current_steps": 11780, "total_steps": 38160, "loss": 0.5266, "lr": 0.0008731169954207243, "epoch": 6.174004192872117, "percentage": 30.87, "elapsed_time": "0:30:12", "remaining_time": "1:07:39", "throughput": 4243.35, "total_tokens": 7691872} {"current_steps": 11785, "total_steps": 38160, "loss": 0.4943, "lr": 0.0008729647240508225, "epoch": 6.176624737945493, "percentage": 30.88, "elapsed_time": "0:30:13", "remaining_time": "1:07:38", "throughput": 4243.23, "total_tokens": 7694336} {"current_steps": 11790, "total_steps": 38160, "loss": 0.4882, "lr": 0.0008728123746609555, "epoch": 6.179245283018868, "percentage": 30.9, "elapsed_time": "0:30:14", "remaining_time": "1:07:37", "throughput": 4243.25, "total_tokens": 7697280} {"current_steps": 11795, "total_steps": 38160, "loss": 0.5042, "lr": 0.000872659947282993, "epoch": 6.181865828092243, "percentage": 30.91, "elapsed_time": "0:30:14", "remaining_time": "1:07:36", "throughput": 4243.36, "total_tokens": 7700640} {"current_steps": 11800, "total_steps": 38160, "loss": 0.463, "lr": 0.000872507441948821, "epoch": 6.184486373165618, "percentage": 30.92, "elapsed_time": "0:30:15", "remaining_time": "1:07:35", "throughput": 4243.46, "total_tokens": 7704064} {"current_steps": 11805, "total_steps": 38160, "loss": 0.4987, "lr": 0.0008723548586903418, "epoch": 6.187106918238993, "percentage": 30.94, "elapsed_time": "0:30:16", "remaining_time": "1:07:34", "throughput": 4243.65, "total_tokens": 7707712} {"current_steps": 11810, "total_steps": 38160, "loss": 0.5091, "lr": 0.0008722021975394745, "epoch": 6.189727463312369, "percentage": 30.95, "elapsed_time": "0:30:16", "remaining_time": "1:07:33", "throughput": 4243.67, "total_tokens": 7710656} {"current_steps": 11815, "total_steps": 38160, "loss": 0.5585, "lr": 0.0008720494585281536, "epoch": 6.1923480083857445, "percentage": 30.96, "elapsed_time": "0:30:17", "remaining_time": "1:07:33", "throughput": 4243.71, "total_tokens": 7713664} {"current_steps": 11820, "total_steps": 38160, "loss": 0.4969, "lr": 0.0008718966416883306, "epoch": 6.19496855345912, "percentage": 30.97, "elapsed_time": "0:30:18", "remaining_time": "1:07:31", "throughput": 4243.55, "total_tokens": 7716000} {"current_steps": 11825, "total_steps": 38160, "loss": 0.5014, "lr": 0.0008717437470519729, "epoch": 6.197589098532495, "percentage": 30.99, "elapsed_time": "0:30:18", "remaining_time": "1:07:30", "throughput": 4243.44, "total_tokens": 7718432} {"current_steps": 11830, "total_steps": 38160, "loss": 0.4404, "lr": 0.0008715907746510645, "epoch": 6.20020964360587, "percentage": 31.0, "elapsed_time": "0:30:19", "remaining_time": "1:07:29", "throughput": 4243.41, "total_tokens": 7721216} {"current_steps": 11835, "total_steps": 38160, "loss": 0.4312, "lr": 0.0008714377245176054, "epoch": 6.202830188679245, "percentage": 31.01, "elapsed_time": "0:30:20", "remaining_time": "1:07:28", "throughput": 4243.44, "total_tokens": 7724128} {"current_steps": 11840, "total_steps": 38160, "loss": 0.369, "lr": 0.0008712845966836119, "epoch": 6.20545073375262, "percentage": 31.03, "elapsed_time": "0:30:21", "remaining_time": "1:07:28", "throughput": 4243.64, "total_tokens": 7727744} {"current_steps": 11845, "total_steps": 38160, "loss": 0.5373, "lr": 0.0008711313911811165, "epoch": 6.2080712788259955, "percentage": 31.04, "elapsed_time": "0:30:21", "remaining_time": "1:07:27", "throughput": 4243.71, "total_tokens": 7730880} {"current_steps": 11850, "total_steps": 38160, "loss": 0.4952, "lr": 0.0008709781080421681, "epoch": 6.210691823899371, "percentage": 31.05, "elapsed_time": "0:30:22", "remaining_time": "1:07:26", "throughput": 4243.77, "total_tokens": 7734048} {"current_steps": 11855, "total_steps": 38160, "loss": 0.4092, "lr": 0.0008708247472988319, "epoch": 6.213312368972747, "percentage": 31.07, "elapsed_time": "0:30:23", "remaining_time": "1:07:25", "throughput": 4243.73, "total_tokens": 7736832} {"current_steps": 11860, "total_steps": 38160, "loss": 0.4648, "lr": 0.0008706713089831893, "epoch": 6.215932914046122, "percentage": 31.08, "elapsed_time": "0:30:23", "remaining_time": "1:07:24", "throughput": 4243.75, "total_tokens": 7739808} {"current_steps": 11865, "total_steps": 38160, "loss": 0.4229, "lr": 0.0008705177931273377, "epoch": 6.218553459119497, "percentage": 31.09, "elapsed_time": "0:30:24", "remaining_time": "1:07:23", "throughput": 4243.86, "total_tokens": 7743072} {"current_steps": 11870, "total_steps": 38160, "loss": 0.4816, "lr": 0.0008703641997633907, "epoch": 6.221174004192872, "percentage": 31.11, "elapsed_time": "0:30:25", "remaining_time": "1:07:22", "throughput": 4243.95, "total_tokens": 7746336} {"current_steps": 11875, "total_steps": 38160, "loss": 0.5304, "lr": 0.0008702105289234786, "epoch": 6.223794549266247, "percentage": 31.12, "elapsed_time": "0:30:25", "remaining_time": "1:07:21", "throughput": 4243.86, "total_tokens": 7748864} {"current_steps": 11880, "total_steps": 38160, "loss": 0.3853, "lr": 0.0008700567806397473, "epoch": 6.226415094339623, "percentage": 31.13, "elapsed_time": "0:30:26", "remaining_time": "1:07:20", "throughput": 4243.77, "total_tokens": 7751424} {"current_steps": 11885, "total_steps": 38160, "loss": 0.5361, "lr": 0.0008699029549443595, "epoch": 6.229035639412998, "percentage": 31.15, "elapsed_time": "0:30:27", "remaining_time": "1:07:19", "throughput": 4243.79, "total_tokens": 7754272} {"current_steps": 11890, "total_steps": 38160, "loss": 0.4135, "lr": 0.0008697490518694935, "epoch": 6.231656184486373, "percentage": 31.16, "elapsed_time": "0:30:27", "remaining_time": "1:07:18", "throughput": 4243.99, "total_tokens": 7757920} {"current_steps": 11895, "total_steps": 38160, "loss": 0.4202, "lr": 0.0008695950714473442, "epoch": 6.234276729559748, "percentage": 31.17, "elapsed_time": "0:30:28", "remaining_time": "1:07:18", "throughput": 4244.21, "total_tokens": 7761792} {"current_steps": 11900, "total_steps": 38160, "loss": 0.3798, "lr": 0.0008694410137101224, "epoch": 6.236897274633123, "percentage": 31.18, "elapsed_time": "0:30:29", "remaining_time": "1:07:17", "throughput": 4244.25, "total_tokens": 7764832} {"current_steps": 11905, "total_steps": 38160, "loss": 0.4562, "lr": 0.0008692868786900554, "epoch": 6.239517819706499, "percentage": 31.2, "elapsed_time": "0:30:30", "remaining_time": "1:07:16", "throughput": 4244.51, "total_tokens": 7768640} {"current_steps": 11910, "total_steps": 38160, "loss": 0.351, "lr": 0.0008691326664193865, "epoch": 6.2421383647798745, "percentage": 31.21, "elapsed_time": "0:30:30", "remaining_time": "1:07:15", "throughput": 4244.47, "total_tokens": 7771360} {"current_steps": 11915, "total_steps": 38160, "loss": 0.3572, "lr": 0.000868978376930375, "epoch": 6.24475890985325, "percentage": 31.22, "elapsed_time": "0:30:31", "remaining_time": "1:07:14", "throughput": 4244.69, "total_tokens": 7775104} {"current_steps": 11920, "total_steps": 38160, "loss": 0.4327, "lr": 0.0008688240102552965, "epoch": 6.247379454926625, "percentage": 31.24, "elapsed_time": "0:30:33", "remaining_time": "1:07:15", "throughput": 4245.74, "total_tokens": 7782720} {"current_steps": 11925, "total_steps": 38160, "loss": 0.4042, "lr": 0.000868669566426443, "epoch": 6.25, "percentage": 31.25, "elapsed_time": "0:30:33", "remaining_time": "1:07:14", "throughput": 4245.75, "total_tokens": 7785568} {"current_steps": 11930, "total_steps": 38160, "loss": 0.49, "lr": 0.0008685150454761222, "epoch": 6.252620545073375, "percentage": 31.26, "elapsed_time": "0:30:34", "remaining_time": "1:07:13", "throughput": 4245.96, "total_tokens": 7789248} {"current_steps": 11935, "total_steps": 38160, "loss": 0.4147, "lr": 0.000868360447436658, "epoch": 6.25524109014675, "percentage": 31.28, "elapsed_time": "0:30:35", "remaining_time": "1:07:12", "throughput": 4245.88, "total_tokens": 7791744} {"current_steps": 11940, "total_steps": 38160, "loss": 0.5974, "lr": 0.0008682057723403907, "epoch": 6.2578616352201255, "percentage": 31.29, "elapsed_time": "0:30:35", "remaining_time": "1:07:11", "throughput": 4245.97, "total_tokens": 7795008} {"current_steps": 11945, "total_steps": 38160, "loss": 0.5317, "lr": 0.0008680510202196765, "epoch": 6.260482180293501, "percentage": 31.3, "elapsed_time": "0:30:36", "remaining_time": "1:07:10", "throughput": 4246.03, "total_tokens": 7798144} {"current_steps": 11950, "total_steps": 38160, "loss": 0.3955, "lr": 0.0008678961911068879, "epoch": 6.263102725366876, "percentage": 31.32, "elapsed_time": "0:30:37", "remaining_time": "1:07:09", "throughput": 4245.95, "total_tokens": 7800608} {"current_steps": 11955, "total_steps": 38160, "loss": 0.5911, "lr": 0.0008677412850344133, "epoch": 6.265723270440252, "percentage": 31.33, "elapsed_time": "0:30:37", "remaining_time": "1:07:08", "throughput": 4246.1, "total_tokens": 7804000} {"current_steps": 11960, "total_steps": 38160, "loss": 0.4244, "lr": 0.0008675863020346573, "epoch": 6.268343815513627, "percentage": 31.34, "elapsed_time": "0:30:38", "remaining_time": "1:07:07", "throughput": 4246.21, "total_tokens": 7807296} {"current_steps": 11965, "total_steps": 38160, "loss": 0.4356, "lr": 0.0008674312421400405, "epoch": 6.270964360587002, "percentage": 31.35, "elapsed_time": "0:30:39", "remaining_time": "1:07:07", "throughput": 4246.37, "total_tokens": 7810816} {"current_steps": 11970, "total_steps": 38160, "loss": 0.5008, "lr": 0.0008672761053829997, "epoch": 6.273584905660377, "percentage": 31.37, "elapsed_time": "0:30:40", "remaining_time": "1:07:06", "throughput": 4246.7, "total_tokens": 7814976} {"current_steps": 11975, "total_steps": 38160, "loss": 0.7242, "lr": 0.0008671208917959878, "epoch": 6.276205450733753, "percentage": 31.38, "elapsed_time": "0:30:41", "remaining_time": "1:07:05", "throughput": 4246.9, "total_tokens": 7818656} {"current_steps": 11980, "total_steps": 38160, "loss": 0.493, "lr": 0.0008669656014114737, "epoch": 6.278825995807128, "percentage": 31.39, "elapsed_time": "0:30:41", "remaining_time": "1:07:04", "throughput": 4246.91, "total_tokens": 7821664} {"current_steps": 11985, "total_steps": 38160, "loss": 0.3606, "lr": 0.0008668102342619424, "epoch": 6.281446540880503, "percentage": 31.41, "elapsed_time": "0:30:42", "remaining_time": "1:07:03", "throughput": 4246.98, "total_tokens": 7824800} {"current_steps": 11990, "total_steps": 38160, "loss": 0.5086, "lr": 0.0008666547903798947, "epoch": 6.284067085953878, "percentage": 31.42, "elapsed_time": "0:30:43", "remaining_time": "1:07:02", "throughput": 4246.9, "total_tokens": 7827456} {"current_steps": 11995, "total_steps": 38160, "loss": 0.4613, "lr": 0.000866499269797848, "epoch": 6.286687631027253, "percentage": 31.43, "elapsed_time": "0:30:43", "remaining_time": "1:07:02", "throughput": 4247.35, "total_tokens": 7832064} {"current_steps": 12000, "total_steps": 38160, "loss": 0.4913, "lr": 0.0008663436725483354, "epoch": 6.289308176100629, "percentage": 31.45, "elapsed_time": "0:30:44", "remaining_time": "1:07:01", "throughput": 4247.36, "total_tokens": 7834976} {"current_steps": 12005, "total_steps": 38160, "loss": 0.4015, "lr": 0.0008661879986639058, "epoch": 6.2919287211740045, "percentage": 31.46, "elapsed_time": "0:30:45", "remaining_time": "1:07:00", "throughput": 4247.38, "total_tokens": 7837920} {"current_steps": 12010, "total_steps": 38160, "loss": 0.4642, "lr": 0.0008660322481771246, "epoch": 6.29454926624738, "percentage": 31.47, "elapsed_time": "0:30:45", "remaining_time": "1:06:59", "throughput": 4247.3, "total_tokens": 7840448} {"current_steps": 12015, "total_steps": 38160, "loss": 0.4557, "lr": 0.0008658764211205731, "epoch": 6.297169811320755, "percentage": 31.49, "elapsed_time": "0:30:46", "remaining_time": "1:06:58", "throughput": 4247.38, "total_tokens": 7843680} {"current_steps": 12020, "total_steps": 38160, "loss": 0.451, "lr": 0.0008657205175268484, "epoch": 6.29979035639413, "percentage": 31.5, "elapsed_time": "0:30:47", "remaining_time": "1:06:57", "throughput": 4247.54, "total_tokens": 7847264} {"current_steps": 12025, "total_steps": 38160, "loss": 0.4006, "lr": 0.0008655645374285637, "epoch": 6.302410901467505, "percentage": 31.51, "elapsed_time": "0:30:48", "remaining_time": "1:06:56", "throughput": 4247.53, "total_tokens": 7850144} {"current_steps": 12030, "total_steps": 38160, "loss": 0.4147, "lr": 0.0008654084808583485, "epoch": 6.30503144654088, "percentage": 31.53, "elapsed_time": "0:30:48", "remaining_time": "1:06:56", "throughput": 4247.69, "total_tokens": 7853696} {"current_steps": 12035, "total_steps": 38160, "loss": 0.4479, "lr": 0.0008652523478488478, "epoch": 6.3076519916142555, "percentage": 31.54, "elapsed_time": "0:30:49", "remaining_time": "1:06:55", "throughput": 4247.72, "total_tokens": 7856736} {"current_steps": 12040, "total_steps": 38160, "loss": 0.454, "lr": 0.000865096138432723, "epoch": 6.310272536687631, "percentage": 31.55, "elapsed_time": "0:30:50", "remaining_time": "1:06:54", "throughput": 4247.98, "total_tokens": 7860640} {"current_steps": 12045, "total_steps": 38160, "loss": 0.3651, "lr": 0.0008649398526426512, "epoch": 6.312893081761006, "percentage": 31.56, "elapsed_time": "0:30:51", "remaining_time": "1:06:53", "throughput": 4248.02, "total_tokens": 7863680} {"current_steps": 12050, "total_steps": 38160, "loss": 0.5772, "lr": 0.0008647834905113256, "epoch": 6.315513626834382, "percentage": 31.58, "elapsed_time": "0:30:51", "remaining_time": "1:06:52", "throughput": 4248.05, "total_tokens": 7866688} {"current_steps": 12055, "total_steps": 38160, "loss": 0.3919, "lr": 0.0008646270520714556, "epoch": 6.318134171907757, "percentage": 31.59, "elapsed_time": "0:30:52", "remaining_time": "1:06:51", "throughput": 4248.09, "total_tokens": 7869824} {"current_steps": 12060, "total_steps": 38160, "loss": 0.4257, "lr": 0.0008644705373557663, "epoch": 6.320754716981132, "percentage": 31.6, "elapsed_time": "0:30:53", "remaining_time": "1:06:50", "throughput": 4248.1, "total_tokens": 7872640} {"current_steps": 12065, "total_steps": 38160, "loss": 0.5007, "lr": 0.0008643139463969985, "epoch": 6.323375262054507, "percentage": 31.62, "elapsed_time": "0:30:53", "remaining_time": "1:06:49", "throughput": 4248.09, "total_tokens": 7875424} {"current_steps": 12070, "total_steps": 38160, "loss": 0.4794, "lr": 0.0008641572792279095, "epoch": 6.325995807127883, "percentage": 31.63, "elapsed_time": "0:30:54", "remaining_time": "1:06:49", "throughput": 4248.36, "total_tokens": 7879360} {"current_steps": 12075, "total_steps": 38160, "loss": 0.4035, "lr": 0.0008640005358812723, "epoch": 6.328616352201258, "percentage": 31.64, "elapsed_time": "0:30:55", "remaining_time": "1:06:48", "throughput": 4248.33, "total_tokens": 7882144} {"current_steps": 12080, "total_steps": 38160, "loss": 0.4214, "lr": 0.0008638437163898756, "epoch": 6.331236897274633, "percentage": 31.66, "elapsed_time": "0:30:56", "remaining_time": "1:06:47", "throughput": 4248.61, "total_tokens": 7886176} {"current_steps": 12085, "total_steps": 38160, "loss": 0.4354, "lr": 0.0008636868207865244, "epoch": 6.333857442348008, "percentage": 31.67, "elapsed_time": "0:30:56", "remaining_time": "1:06:46", "throughput": 4248.8, "total_tokens": 7889760} {"current_steps": 12090, "total_steps": 38160, "loss": 0.5271, "lr": 0.0008635298491040394, "epoch": 6.336477987421383, "percentage": 31.68, "elapsed_time": "0:30:57", "remaining_time": "1:06:45", "throughput": 4248.75, "total_tokens": 7892448} {"current_steps": 12095, "total_steps": 38160, "loss": 0.43, "lr": 0.0008633728013752574, "epoch": 6.339098532494759, "percentage": 31.7, "elapsed_time": "0:30:58", "remaining_time": "1:06:44", "throughput": 4249.06, "total_tokens": 7896608} {"current_steps": 12100, "total_steps": 38160, "loss": 0.4722, "lr": 0.000863215677633031, "epoch": 6.3417190775681345, "percentage": 31.71, "elapsed_time": "0:30:59", "remaining_time": "1:06:44", "throughput": 4249.1, "total_tokens": 7899584} {"current_steps": 12105, "total_steps": 38160, "loss": 0.5179, "lr": 0.0008630584779102285, "epoch": 6.34433962264151, "percentage": 31.72, "elapsed_time": "0:30:59", "remaining_time": "1:06:43", "throughput": 4249.21, "total_tokens": 7903008} {"current_steps": 12110, "total_steps": 38160, "loss": 0.4946, "lr": 0.0008629012022397344, "epoch": 6.346960167714885, "percentage": 31.73, "elapsed_time": "0:31:00", "remaining_time": "1:06:42", "throughput": 4249.15, "total_tokens": 7905696} {"current_steps": 12115, "total_steps": 38160, "loss": 0.5467, "lr": 0.0008627438506544491, "epoch": 6.34958071278826, "percentage": 31.75, "elapsed_time": "0:31:01", "remaining_time": "1:06:41", "throughput": 4249.19, "total_tokens": 7908832} {"current_steps": 12120, "total_steps": 38160, "loss": 0.4859, "lr": 0.0008625864231872886, "epoch": 6.352201257861635, "percentage": 31.76, "elapsed_time": "0:31:01", "remaining_time": "1:06:40", "throughput": 4249.15, "total_tokens": 7911520} {"current_steps": 12125, "total_steps": 38160, "loss": 0.5447, "lr": 0.000862428919871185, "epoch": 6.35482180293501, "percentage": 31.77, "elapsed_time": "0:31:02", "remaining_time": "1:06:39", "throughput": 4249.26, "total_tokens": 7914848} {"current_steps": 12130, "total_steps": 38160, "loss": 0.4779, "lr": 0.0008622713407390861, "epoch": 6.3574423480083855, "percentage": 31.79, "elapsed_time": "0:31:03", "remaining_time": "1:06:38", "throughput": 4249.45, "total_tokens": 7918400} {"current_steps": 12135, "total_steps": 38160, "loss": 0.7211, "lr": 0.0008621136858239557, "epoch": 6.360062893081761, "percentage": 31.8, "elapsed_time": "0:31:04", "remaining_time": "1:06:37", "throughput": 4249.41, "total_tokens": 7921248} {"current_steps": 12140, "total_steps": 38160, "loss": 0.5338, "lr": 0.0008619559551587736, "epoch": 6.362683438155136, "percentage": 31.81, "elapsed_time": "0:31:05", "remaining_time": "1:06:37", "throughput": 4249.92, "total_tokens": 7926240} {"current_steps": 12145, "total_steps": 38160, "loss": 0.4684, "lr": 0.0008617981487765349, "epoch": 6.365303983228512, "percentage": 31.83, "elapsed_time": "0:31:05", "remaining_time": "1:06:36", "throughput": 4250.2, "total_tokens": 7930176} {"current_steps": 12150, "total_steps": 38160, "loss": 0.4651, "lr": 0.0008616402667102512, "epoch": 6.367924528301887, "percentage": 31.84, "elapsed_time": "0:31:06", "remaining_time": "1:06:35", "throughput": 4250.21, "total_tokens": 7933120} {"current_steps": 12155, "total_steps": 38160, "loss": 0.5498, "lr": 0.0008614823089929495, "epoch": 6.370545073375262, "percentage": 31.85, "elapsed_time": "0:31:07", "remaining_time": "1:06:34", "throughput": 4250.1, "total_tokens": 7935552} {"current_steps": 12160, "total_steps": 38160, "loss": 0.3325, "lr": 0.0008613242756576728, "epoch": 6.373165618448637, "percentage": 31.87, "elapsed_time": "0:31:07", "remaining_time": "1:06:33", "throughput": 4249.95, "total_tokens": 7937824} {"current_steps": 12165, "total_steps": 38160, "loss": 0.5816, "lr": 0.0008611661667374798, "epoch": 6.3757861635220126, "percentage": 31.88, "elapsed_time": "0:31:08", "remaining_time": "1:06:32", "throughput": 4249.79, "total_tokens": 7940128} {"current_steps": 12170, "total_steps": 38160, "loss": 0.2921, "lr": 0.0008610079822654451, "epoch": 6.378406708595388, "percentage": 31.89, "elapsed_time": "0:31:09", "remaining_time": "1:06:31", "throughput": 4249.8, "total_tokens": 7943008} {"current_steps": 12175, "total_steps": 38160, "loss": 0.4181, "lr": 0.0008608497222746591, "epoch": 6.381027253668763, "percentage": 31.91, "elapsed_time": "0:31:09", "remaining_time": "1:06:30", "throughput": 4249.69, "total_tokens": 7945472} {"current_steps": 12180, "total_steps": 38160, "loss": 0.4193, "lr": 0.000860691386798228, "epoch": 6.383647798742138, "percentage": 31.92, "elapsed_time": "0:31:10", "remaining_time": "1:06:29", "throughput": 4249.75, "total_tokens": 7948608} {"current_steps": 12185, "total_steps": 38160, "loss": 0.3705, "lr": 0.000860532975869274, "epoch": 6.386268343815513, "percentage": 31.93, "elapsed_time": "0:31:11", "remaining_time": "1:06:28", "throughput": 4249.69, "total_tokens": 7951296} {"current_steps": 12190, "total_steps": 38160, "loss": 0.3677, "lr": 0.0008603744895209342, "epoch": 6.388888888888889, "percentage": 31.94, "elapsed_time": "0:31:11", "remaining_time": "1:06:27", "throughput": 4250.02, "total_tokens": 7955488} {"current_steps": 12195, "total_steps": 38160, "loss": 0.4384, "lr": 0.0008602159277863628, "epoch": 6.3915094339622645, "percentage": 31.96, "elapsed_time": "0:31:12", "remaining_time": "1:06:27", "throughput": 4250.15, "total_tokens": 7958880} {"current_steps": 12200, "total_steps": 38160, "loss": 0.4718, "lr": 0.0008600572906987289, "epoch": 6.39412997903564, "percentage": 31.97, "elapsed_time": "0:31:13", "remaining_time": "1:06:26", "throughput": 4250.14, "total_tokens": 7961888} {"current_steps": 12205, "total_steps": 38160, "loss": 0.4611, "lr": 0.0008598985782912174, "epoch": 6.396750524109015, "percentage": 31.98, "elapsed_time": "0:31:14", "remaining_time": "1:06:25", "throughput": 4250.17, "total_tokens": 7964896} {"current_steps": 12210, "total_steps": 38160, "loss": 0.4752, "lr": 0.0008597397905970293, "epoch": 6.39937106918239, "percentage": 32.0, "elapsed_time": "0:31:14", "remaining_time": "1:06:24", "throughput": 4250.24, "total_tokens": 7968032} {"current_steps": 12215, "total_steps": 38160, "loss": 0.3763, "lr": 0.0008595809276493812, "epoch": 6.401991614255765, "percentage": 32.01, "elapsed_time": "0:31:15", "remaining_time": "1:06:23", "throughput": 4250.28, "total_tokens": 7971040} {"current_steps": 12220, "total_steps": 38160, "loss": 0.4012, "lr": 0.0008594219894815054, "epoch": 6.40461215932914, "percentage": 32.02, "elapsed_time": "0:31:16", "remaining_time": "1:06:22", "throughput": 4250.47, "total_tokens": 7974560} {"current_steps": 12225, "total_steps": 38160, "loss": 0.3975, "lr": 0.0008592629761266497, "epoch": 6.4072327044025155, "percentage": 32.04, "elapsed_time": "0:31:16", "remaining_time": "1:06:21", "throughput": 4250.64, "total_tokens": 7978144} {"current_steps": 12230, "total_steps": 38160, "loss": 0.3665, "lr": 0.0008591038876180784, "epoch": 6.409853249475891, "percentage": 32.05, "elapsed_time": "0:31:17", "remaining_time": "1:06:20", "throughput": 4250.65, "total_tokens": 7981024} {"current_steps": 12235, "total_steps": 38160, "loss": 0.4919, "lr": 0.0008589447239890705, "epoch": 6.412473794549266, "percentage": 32.06, "elapsed_time": "0:31:18", "remaining_time": "1:06:20", "throughput": 4250.75, "total_tokens": 7984448} {"current_steps": 12240, "total_steps": 38160, "loss": 0.4948, "lr": 0.0008587854852729213, "epoch": 6.415094339622642, "percentage": 32.08, "elapsed_time": "0:31:19", "remaining_time": "1:06:19", "throughput": 4250.8, "total_tokens": 7987520} {"current_steps": 12245, "total_steps": 38160, "loss": 0.4648, "lr": 0.000858626171502942, "epoch": 6.417714884696017, "percentage": 32.09, "elapsed_time": "0:31:19", "remaining_time": "1:06:18", "throughput": 4250.87, "total_tokens": 7990784} {"current_steps": 12250, "total_steps": 38160, "loss": 0.4822, "lr": 0.0008584667827124589, "epoch": 6.420335429769392, "percentage": 32.1, "elapsed_time": "0:31:20", "remaining_time": "1:06:17", "throughput": 4250.9, "total_tokens": 7993792} {"current_steps": 12255, "total_steps": 38160, "loss": 0.4911, "lr": 0.0008583073189348145, "epoch": 6.422955974842767, "percentage": 32.11, "elapsed_time": "0:31:21", "remaining_time": "1:06:16", "throughput": 4250.89, "total_tokens": 7996768} {"current_steps": 12260, "total_steps": 38160, "loss": 0.3561, "lr": 0.0008581477802033668, "epoch": 6.4255765199161425, "percentage": 32.13, "elapsed_time": "0:31:21", "remaining_time": "1:06:15", "throughput": 4250.83, "total_tokens": 7999424} {"current_steps": 12265, "total_steps": 38160, "loss": 0.3708, "lr": 0.0008579881665514895, "epoch": 6.428197064989518, "percentage": 32.14, "elapsed_time": "0:31:22", "remaining_time": "1:06:14", "throughput": 4251.12, "total_tokens": 8003456} {"current_steps": 12270, "total_steps": 38160, "loss": 0.3894, "lr": 0.0008578284780125718, "epoch": 6.430817610062893, "percentage": 32.15, "elapsed_time": "0:31:23", "remaining_time": "1:06:14", "throughput": 4251.33, "total_tokens": 8007360} {"current_steps": 12275, "total_steps": 38160, "loss": 0.3258, "lr": 0.0008576687146200189, "epoch": 6.433438155136268, "percentage": 32.17, "elapsed_time": "0:31:24", "remaining_time": "1:06:13", "throughput": 4251.3, "total_tokens": 8010112} {"current_steps": 12280, "total_steps": 38160, "loss": 0.4395, "lr": 0.0008575088764072511, "epoch": 6.436058700209643, "percentage": 32.18, "elapsed_time": "0:31:24", "remaining_time": "1:06:12", "throughput": 4251.32, "total_tokens": 8013024} {"current_steps": 12285, "total_steps": 38160, "loss": 0.5921, "lr": 0.0008573489634077054, "epoch": 6.438679245283019, "percentage": 32.19, "elapsed_time": "0:31:25", "remaining_time": "1:06:11", "throughput": 4251.24, "total_tokens": 8015584} {"current_steps": 12290, "total_steps": 38160, "loss": 0.4583, "lr": 0.0008571889756548333, "epoch": 6.441299790356394, "percentage": 32.21, "elapsed_time": "0:31:26", "remaining_time": "1:06:10", "throughput": 4251.32, "total_tokens": 8018720} {"current_steps": 12295, "total_steps": 38160, "loss": 0.3981, "lr": 0.0008570289131821025, "epoch": 6.44392033542977, "percentage": 32.22, "elapsed_time": "0:31:26", "remaining_time": "1:06:09", "throughput": 4251.2, "total_tokens": 8021184} {"current_steps": 12300, "total_steps": 38160, "loss": 0.5335, "lr": 0.0008568687760229963, "epoch": 6.446540880503145, "percentage": 32.23, "elapsed_time": "0:31:27", "remaining_time": "1:06:08", "throughput": 4251.3, "total_tokens": 8024416} {"current_steps": 12305, "total_steps": 38160, "loss": 0.3656, "lr": 0.0008567085642110135, "epoch": 6.44916142557652, "percentage": 32.25, "elapsed_time": "0:31:28", "remaining_time": "1:06:07", "throughput": 4251.48, "total_tokens": 8028160} {"current_steps": 12310, "total_steps": 38160, "loss": 0.3174, "lr": 0.0008565482777796687, "epoch": 6.451781970649895, "percentage": 32.26, "elapsed_time": "0:31:29", "remaining_time": "1:06:06", "throughput": 4251.53, "total_tokens": 8031296} {"current_steps": 12315, "total_steps": 38160, "loss": 0.5499, "lr": 0.0008563879167624919, "epoch": 6.45440251572327, "percentage": 32.27, "elapsed_time": "0:31:29", "remaining_time": "1:06:05", "throughput": 4251.63, "total_tokens": 8034624} {"current_steps": 12320, "total_steps": 38160, "loss": 0.439, "lr": 0.0008562274811930287, "epoch": 6.4570230607966455, "percentage": 32.29, "elapsed_time": "0:31:30", "remaining_time": "1:06:05", "throughput": 4251.82, "total_tokens": 8038176} {"current_steps": 12325, "total_steps": 38160, "loss": 0.4652, "lr": 0.0008560669711048406, "epoch": 6.459643605870021, "percentage": 32.3, "elapsed_time": "0:31:31", "remaining_time": "1:06:04", "throughput": 4252.04, "total_tokens": 8041920} {"current_steps": 12330, "total_steps": 38160, "loss": 0.4552, "lr": 0.0008559063865315042, "epoch": 6.462264150943396, "percentage": 32.31, "elapsed_time": "0:31:32", "remaining_time": "1:06:03", "throughput": 4252.08, "total_tokens": 8044992} {"current_steps": 12335, "total_steps": 38160, "loss": 0.4647, "lr": 0.0008557457275066122, "epoch": 6.464884696016772, "percentage": 32.32, "elapsed_time": "0:31:32", "remaining_time": "1:06:02", "throughput": 4252.18, "total_tokens": 8048352} {"current_steps": 12340, "total_steps": 38160, "loss": 0.56, "lr": 0.0008555849940637725, "epoch": 6.467505241090147, "percentage": 32.34, "elapsed_time": "0:31:33", "remaining_time": "1:06:01", "throughput": 4252.16, "total_tokens": 8051168} {"current_steps": 12345, "total_steps": 38160, "loss": 0.4892, "lr": 0.000855424186236609, "epoch": 6.470125786163522, "percentage": 32.35, "elapsed_time": "0:31:34", "remaining_time": "1:06:01", "throughput": 4252.35, "total_tokens": 8054848} {"current_steps": 12350, "total_steps": 38160, "loss": 0.4054, "lr": 0.0008552633040587605, "epoch": 6.472746331236897, "percentage": 32.36, "elapsed_time": "0:31:34", "remaining_time": "1:06:00", "throughput": 4252.41, "total_tokens": 8057952} {"current_steps": 12355, "total_steps": 38160, "loss": 0.4657, "lr": 0.0008551023475638819, "epoch": 6.4753668763102725, "percentage": 32.38, "elapsed_time": "0:31:35", "remaining_time": "1:05:59", "throughput": 4252.53, "total_tokens": 8061344} {"current_steps": 12360, "total_steps": 38160, "loss": 0.4734, "lr": 0.0008549413167856432, "epoch": 6.477987421383648, "percentage": 32.39, "elapsed_time": "0:31:36", "remaining_time": "1:05:58", "throughput": 4252.64, "total_tokens": 8064704} {"current_steps": 12365, "total_steps": 38160, "loss": 0.5329, "lr": 0.0008547802117577307, "epoch": 6.480607966457023, "percentage": 32.4, "elapsed_time": "0:31:37", "remaining_time": "1:05:57", "throughput": 4252.59, "total_tokens": 8067360} {"current_steps": 12370, "total_steps": 38160, "loss": 0.5293, "lr": 0.0008546190325138454, "epoch": 6.483228511530398, "percentage": 32.42, "elapsed_time": "0:31:37", "remaining_time": "1:05:56", "throughput": 4252.88, "total_tokens": 8071520} {"current_steps": 12375, "total_steps": 38160, "loss": 0.4592, "lr": 0.000854457779087704, "epoch": 6.485849056603773, "percentage": 32.43, "elapsed_time": "0:31:38", "remaining_time": "1:05:56", "throughput": 4253.18, "total_tokens": 8075680} {"current_steps": 12380, "total_steps": 38160, "loss": 0.8798, "lr": 0.0008542964515130392, "epoch": 6.488469601677149, "percentage": 32.44, "elapsed_time": "0:31:39", "remaining_time": "1:05:55", "throughput": 4252.93, "total_tokens": 8077600} {"current_steps": 12385, "total_steps": 38160, "loss": 0.4477, "lr": 0.0008541350498235989, "epoch": 6.491090146750524, "percentage": 32.46, "elapsed_time": "0:31:39", "remaining_time": "1:05:53", "throughput": 4252.76, "total_tokens": 8079872} {"current_steps": 12390, "total_steps": 38160, "loss": 0.4257, "lr": 0.0008539735740531462, "epoch": 6.4937106918239, "percentage": 32.47, "elapsed_time": "0:31:40", "remaining_time": "1:05:53", "throughput": 4252.75, "total_tokens": 8082720} {"current_steps": 12395, "total_steps": 38160, "loss": 0.5171, "lr": 0.0008538120242354602, "epoch": 6.496331236897275, "percentage": 32.48, "elapsed_time": "0:31:41", "remaining_time": "1:05:52", "throughput": 4252.79, "total_tokens": 8085728} {"current_steps": 12400, "total_steps": 38160, "loss": 0.4551, "lr": 0.0008536504004043353, "epoch": 6.49895178197065, "percentage": 32.49, "elapsed_time": "0:31:42", "remaining_time": "1:05:51", "throughput": 4252.94, "total_tokens": 8089280} {"current_steps": 12405, "total_steps": 38160, "loss": 0.4527, "lr": 0.0008534887025935811, "epoch": 6.501572327044025, "percentage": 32.51, "elapsed_time": "0:31:42", "remaining_time": "1:05:50", "throughput": 4253.04, "total_tokens": 8092576} {"current_steps": 12410, "total_steps": 38160, "loss": 0.5061, "lr": 0.0008533269308370233, "epoch": 6.5041928721174, "percentage": 32.52, "elapsed_time": "0:31:43", "remaining_time": "1:05:49", "throughput": 4253.15, "total_tokens": 8096032} {"current_steps": 12415, "total_steps": 38160, "loss": 0.5204, "lr": 0.0008531650851685025, "epoch": 6.506813417190775, "percentage": 32.53, "elapsed_time": "0:31:44", "remaining_time": "1:05:48", "throughput": 4253.27, "total_tokens": 8099424} {"current_steps": 12420, "total_steps": 38160, "loss": 0.4263, "lr": 0.000853003165621875, "epoch": 6.509433962264151, "percentage": 32.55, "elapsed_time": "0:31:44", "remaining_time": "1:05:47", "throughput": 4253.19, "total_tokens": 8101952} {"current_steps": 12425, "total_steps": 38160, "loss": 0.4507, "lr": 0.0008528411722310126, "epoch": 6.512054507337526, "percentage": 32.56, "elapsed_time": "0:31:45", "remaining_time": "1:05:47", "throughput": 4253.33, "total_tokens": 8105472} {"current_steps": 12430, "total_steps": 38160, "loss": 0.5952, "lr": 0.0008526791050298022, "epoch": 6.514675052410902, "percentage": 32.57, "elapsed_time": "0:31:46", "remaining_time": "1:05:46", "throughput": 4253.3, "total_tokens": 8108256} {"current_steps": 12435, "total_steps": 38160, "loss": 0.4012, "lr": 0.0008525169640521467, "epoch": 6.517295597484277, "percentage": 32.59, "elapsed_time": "0:31:47", "remaining_time": "1:05:45", "throughput": 4253.26, "total_tokens": 8111008} {"current_steps": 12440, "total_steps": 38160, "loss": 0.5125, "lr": 0.0008523547493319641, "epoch": 6.519916142557652, "percentage": 32.6, "elapsed_time": "0:31:47", "remaining_time": "1:05:44", "throughput": 4253.34, "total_tokens": 8114208} {"current_steps": 12445, "total_steps": 38160, "loss": 0.3581, "lr": 0.0008521924609031877, "epoch": 6.522536687631027, "percentage": 32.61, "elapsed_time": "0:31:48", "remaining_time": "1:05:43", "throughput": 4253.41, "total_tokens": 8117376} {"current_steps": 12450, "total_steps": 38160, "loss": 0.552, "lr": 0.0008520300987997667, "epoch": 6.5251572327044025, "percentage": 32.63, "elapsed_time": "0:31:49", "remaining_time": "1:05:42", "throughput": 4253.41, "total_tokens": 8120256} {"current_steps": 12455, "total_steps": 38160, "loss": 0.3039, "lr": 0.000851867663055665, "epoch": 6.527777777777778, "percentage": 32.64, "elapsed_time": "0:31:49", "remaining_time": "1:05:41", "throughput": 4253.32, "total_tokens": 8122848} {"current_steps": 12460, "total_steps": 38160, "loss": 0.4057, "lr": 0.0008517051537048625, "epoch": 6.530398322851153, "percentage": 32.65, "elapsed_time": "0:31:50", "remaining_time": "1:05:40", "throughput": 4253.48, "total_tokens": 8126336} {"current_steps": 12465, "total_steps": 38160, "loss": 0.2915, "lr": 0.0008515425707813544, "epoch": 6.533018867924528, "percentage": 32.67, "elapsed_time": "0:31:51", "remaining_time": "1:05:39", "throughput": 4253.6, "total_tokens": 8129760} {"current_steps": 12470, "total_steps": 38160, "loss": 0.4261, "lr": 0.0008513799143191512, "epoch": 6.535639412997903, "percentage": 32.68, "elapsed_time": "0:31:52", "remaining_time": "1:05:39", "throughput": 4253.75, "total_tokens": 8133248} {"current_steps": 12475, "total_steps": 38160, "loss": 0.5014, "lr": 0.0008512171843522786, "epoch": 6.538259958071279, "percentage": 32.69, "elapsed_time": "0:31:52", "remaining_time": "1:05:38", "throughput": 4253.73, "total_tokens": 8136032} {"current_steps": 12480, "total_steps": 38160, "loss": 0.3864, "lr": 0.000851054380914778, "epoch": 6.540880503144654, "percentage": 32.7, "elapsed_time": "0:31:53", "remaining_time": "1:05:37", "throughput": 4254.03, "total_tokens": 8140224} {"current_steps": 12485, "total_steps": 38160, "loss": 0.4901, "lr": 0.0008508915040407057, "epoch": 6.54350104821803, "percentage": 32.72, "elapsed_time": "0:31:54", "remaining_time": "1:05:36", "throughput": 4254.08, "total_tokens": 8143424} {"current_steps": 12490, "total_steps": 38160, "loss": 0.4258, "lr": 0.0008507285537641342, "epoch": 6.546121593291405, "percentage": 32.73, "elapsed_time": "0:31:54", "remaining_time": "1:05:35", "throughput": 4254.09, "total_tokens": 8146336} {"current_steps": 12495, "total_steps": 38160, "loss": 0.5317, "lr": 0.0008505655301191504, "epoch": 6.54874213836478, "percentage": 32.74, "elapsed_time": "0:31:55", "remaining_time": "1:05:34", "throughput": 4253.96, "total_tokens": 8148768} {"current_steps": 12500, "total_steps": 38160, "loss": 0.3388, "lr": 0.0008504024331398572, "epoch": 6.551362683438155, "percentage": 32.76, "elapsed_time": "0:31:56", "remaining_time": "1:05:33", "throughput": 4254.01, "total_tokens": 8151840} {"current_steps": 12505, "total_steps": 38160, "loss": 0.4166, "lr": 0.0008502392628603727, "epoch": 6.55398322851153, "percentage": 32.77, "elapsed_time": "0:31:56", "remaining_time": "1:05:32", "throughput": 4253.97, "total_tokens": 8154560} {"current_steps": 12510, "total_steps": 38160, "loss": 0.4563, "lr": 0.0008500760193148301, "epoch": 6.556603773584905, "percentage": 32.78, "elapsed_time": "0:31:57", "remaining_time": "1:05:31", "throughput": 4254.13, "total_tokens": 8158144} {"current_steps": 12515, "total_steps": 38160, "loss": 0.578, "lr": 0.0008499127025373781, "epoch": 6.559224318658281, "percentage": 32.8, "elapsed_time": "0:31:58", "remaining_time": "1:05:30", "throughput": 4254.04, "total_tokens": 8160672} {"current_steps": 12520, "total_steps": 38160, "loss": 0.435, "lr": 0.0008497493125621807, "epoch": 6.561844863731656, "percentage": 32.81, "elapsed_time": "0:31:59", "remaining_time": "1:05:30", "throughput": 4254.09, "total_tokens": 8163744} {"current_steps": 12525, "total_steps": 38160, "loss": 0.6367, "lr": 0.0008495858494234173, "epoch": 6.564465408805032, "percentage": 32.82, "elapsed_time": "0:31:59", "remaining_time": "1:05:29", "throughput": 4254.22, "total_tokens": 8167104} {"current_steps": 12530, "total_steps": 38160, "loss": 0.4019, "lr": 0.0008494223131552825, "epoch": 6.567085953878407, "percentage": 32.84, "elapsed_time": "0:32:00", "remaining_time": "1:05:28", "throughput": 4254.29, "total_tokens": 8170304} {"current_steps": 12535, "total_steps": 38160, "loss": 0.4366, "lr": 0.0008492587037919864, "epoch": 6.569706498951782, "percentage": 32.85, "elapsed_time": "0:32:01", "remaining_time": "1:05:27", "throughput": 4254.28, "total_tokens": 8173184} {"current_steps": 12540, "total_steps": 38160, "loss": 0.4857, "lr": 0.0008490950213677537, "epoch": 6.572327044025157, "percentage": 32.86, "elapsed_time": "0:32:02", "remaining_time": "1:05:26", "throughput": 4254.62, "total_tokens": 8177472} {"current_steps": 12545, "total_steps": 38160, "loss": 0.42, "lr": 0.0008489312659168254, "epoch": 6.5749475890985325, "percentage": 32.87, "elapsed_time": "0:32:02", "remaining_time": "1:05:25", "throughput": 4254.63, "total_tokens": 8180480} {"current_steps": 12550, "total_steps": 38160, "loss": 0.3848, "lr": 0.0008487674374734569, "epoch": 6.577568134171908, "percentage": 32.89, "elapsed_time": "0:32:03", "remaining_time": "1:05:25", "throughput": 4255.04, "total_tokens": 8185088} {"current_steps": 12555, "total_steps": 38160, "loss": 0.5492, "lr": 0.0008486035360719197, "epoch": 6.580188679245283, "percentage": 32.9, "elapsed_time": "0:32:04", "remaining_time": "1:05:24", "throughput": 4255.13, "total_tokens": 8188384} {"current_steps": 12560, "total_steps": 38160, "loss": 0.5095, "lr": 0.0008484395617464997, "epoch": 6.582809224318658, "percentage": 32.91, "elapsed_time": "0:32:05", "remaining_time": "1:05:23", "throughput": 4255.15, "total_tokens": 8191360} {"current_steps": 12565, "total_steps": 38160, "loss": 0.3772, "lr": 0.0008482755145314986, "epoch": 6.585429769392033, "percentage": 32.93, "elapsed_time": "0:32:05", "remaining_time": "1:05:22", "throughput": 4255.27, "total_tokens": 8194816} {"current_steps": 12570, "total_steps": 38160, "loss": 0.3541, "lr": 0.0008481113944612331, "epoch": 6.588050314465409, "percentage": 32.94, "elapsed_time": "0:32:06", "remaining_time": "1:05:22", "throughput": 4255.34, "total_tokens": 8198016} {"current_steps": 12575, "total_steps": 38160, "loss": 0.464, "lr": 0.0008479472015700356, "epoch": 6.590670859538784, "percentage": 32.95, "elapsed_time": "0:32:07", "remaining_time": "1:05:20", "throughput": 4255.21, "total_tokens": 8200448} {"current_steps": 12580, "total_steps": 38160, "loss": 0.6162, "lr": 0.0008477829358922529, "epoch": 6.59329140461216, "percentage": 32.97, "elapsed_time": "0:32:07", "remaining_time": "1:05:20", "throughput": 4255.24, "total_tokens": 8203488} {"current_steps": 12585, "total_steps": 38160, "loss": 0.4729, "lr": 0.0008476185974622477, "epoch": 6.595911949685535, "percentage": 32.98, "elapsed_time": "0:32:08", "remaining_time": "1:05:19", "throughput": 4255.25, "total_tokens": 8206464} {"current_steps": 12590, "total_steps": 38160, "loss": 0.3953, "lr": 0.0008474541863143978, "epoch": 6.59853249475891, "percentage": 32.99, "elapsed_time": "0:32:09", "remaining_time": "1:05:19", "throughput": 4256.1, "total_tokens": 8212928} {"current_steps": 12595, "total_steps": 38160, "loss": 0.466, "lr": 0.0008472897024830961, "epoch": 6.601153039832285, "percentage": 33.01, "elapsed_time": "0:32:10", "remaining_time": "1:05:18", "throughput": 4256.14, "total_tokens": 8216128} {"current_steps": 12600, "total_steps": 38160, "loss": 0.5521, "lr": 0.0008471251460027508, "epoch": 6.60377358490566, "percentage": 33.02, "elapsed_time": "0:32:11", "remaining_time": "1:05:17", "throughput": 4256.0, "total_tokens": 8218496} {"current_steps": 12605, "total_steps": 38160, "loss": 0.2868, "lr": 0.0008469605169077852, "epoch": 6.606394129979035, "percentage": 33.03, "elapsed_time": "0:32:11", "remaining_time": "1:05:16", "throughput": 4256.1, "total_tokens": 8221824} {"current_steps": 12610, "total_steps": 38160, "loss": 0.3995, "lr": 0.0008467958152326377, "epoch": 6.609014675052411, "percentage": 33.05, "elapsed_time": "0:32:12", "remaining_time": "1:05:15", "throughput": 4256.25, "total_tokens": 8225376} {"current_steps": 12615, "total_steps": 38160, "loss": 0.5321, "lr": 0.0008466310410117622, "epoch": 6.611635220125786, "percentage": 33.06, "elapsed_time": "0:32:13", "remaining_time": "1:05:14", "throughput": 4256.21, "total_tokens": 8228224} {"current_steps": 12620, "total_steps": 38160, "loss": 0.5081, "lr": 0.0008464661942796275, "epoch": 6.614255765199162, "percentage": 33.07, "elapsed_time": "0:32:13", "remaining_time": "1:05:13", "throughput": 4256.09, "total_tokens": 8230656} {"current_steps": 12625, "total_steps": 38160, "loss": 0.3925, "lr": 0.0008463012750707175, "epoch": 6.616876310272537, "percentage": 33.08, "elapsed_time": "0:32:14", "remaining_time": "1:05:12", "throughput": 4256.06, "total_tokens": 8233408} {"current_steps": 12630, "total_steps": 38160, "loss": 0.5182, "lr": 0.0008461362834195316, "epoch": 6.619496855345912, "percentage": 33.1, "elapsed_time": "0:32:15", "remaining_time": "1:05:12", "throughput": 4256.25, "total_tokens": 8237216} {"current_steps": 12635, "total_steps": 38160, "loss": 0.5346, "lr": 0.0008459712193605842, "epoch": 6.622117400419287, "percentage": 33.11, "elapsed_time": "0:32:15", "remaining_time": "1:05:11", "throughput": 4256.22, "total_tokens": 8240000} {"current_steps": 12640, "total_steps": 38160, "loss": 0.4752, "lr": 0.0008458060829284048, "epoch": 6.6247379454926625, "percentage": 33.12, "elapsed_time": "0:32:16", "remaining_time": "1:05:10", "throughput": 4256.2, "total_tokens": 8242848} {"current_steps": 12645, "total_steps": 38160, "loss": 0.4139, "lr": 0.0008456408741575378, "epoch": 6.627358490566038, "percentage": 33.14, "elapsed_time": "0:32:17", "remaining_time": "1:05:09", "throughput": 4256.33, "total_tokens": 8246304} {"current_steps": 12650, "total_steps": 38160, "loss": 0.4318, "lr": 0.0008454755930825435, "epoch": 6.629979035639413, "percentage": 33.15, "elapsed_time": "0:32:18", "remaining_time": "1:05:08", "throughput": 4256.51, "total_tokens": 8249984} {"current_steps": 12655, "total_steps": 38160, "loss": 0.5294, "lr": 0.0008453102397379963, "epoch": 6.632599580712788, "percentage": 33.16, "elapsed_time": "0:32:19", "remaining_time": "1:05:08", "throughput": 4256.81, "total_tokens": 8254240} {"current_steps": 12660, "total_steps": 38160, "loss": 0.401, "lr": 0.0008451448141584868, "epoch": 6.635220125786163, "percentage": 33.18, "elapsed_time": "0:32:19", "remaining_time": "1:05:07", "throughput": 4256.84, "total_tokens": 8257312} {"current_steps": 12665, "total_steps": 38160, "loss": 0.4558, "lr": 0.0008449793163786194, "epoch": 6.637840670859539, "percentage": 33.19, "elapsed_time": "0:32:20", "remaining_time": "1:05:06", "throughput": 4257.05, "total_tokens": 8261216} {"current_steps": 12670, "total_steps": 38160, "loss": 0.4347, "lr": 0.0008448137464330149, "epoch": 6.640461215932914, "percentage": 33.2, "elapsed_time": "0:32:21", "remaining_time": "1:05:05", "throughput": 4257.16, "total_tokens": 8264608} {"current_steps": 12675, "total_steps": 38160, "loss": 0.4949, "lr": 0.0008446481043563086, "epoch": 6.6430817610062896, "percentage": 33.22, "elapsed_time": "0:32:22", "remaining_time": "1:05:04", "throughput": 4257.34, "total_tokens": 8268384} {"current_steps": 12680, "total_steps": 38160, "loss": 0.4476, "lr": 0.0008444823901831507, "epoch": 6.645702306079665, "percentage": 33.23, "elapsed_time": "0:32:22", "remaining_time": "1:05:04", "throughput": 4257.52, "total_tokens": 8272000} {"current_steps": 12685, "total_steps": 38160, "loss": 0.3707, "lr": 0.0008443166039482067, "epoch": 6.64832285115304, "percentage": 33.24, "elapsed_time": "0:32:23", "remaining_time": "1:05:03", "throughput": 4257.75, "total_tokens": 8275776} {"current_steps": 12690, "total_steps": 38160, "loss": 0.4095, "lr": 0.0008441507456861575, "epoch": 6.650943396226415, "percentage": 33.25, "elapsed_time": "0:32:24", "remaining_time": "1:05:02", "throughput": 4257.84, "total_tokens": 8279008} {"current_steps": 12695, "total_steps": 38160, "loss": 0.4693, "lr": 0.0008439848154316985, "epoch": 6.65356394129979, "percentage": 33.27, "elapsed_time": "0:32:25", "remaining_time": "1:05:01", "throughput": 4257.85, "total_tokens": 8281952} {"current_steps": 12700, "total_steps": 38160, "loss": 0.3935, "lr": 0.0008438188132195406, "epoch": 6.656184486373165, "percentage": 33.28, "elapsed_time": "0:32:25", "remaining_time": "1:05:00", "throughput": 4257.98, "total_tokens": 8285472} {"current_steps": 12705, "total_steps": 38160, "loss": 0.5488, "lr": 0.0008436527390844094, "epoch": 6.658805031446541, "percentage": 33.29, "elapsed_time": "0:32:26", "remaining_time": "1:05:00", "throughput": 4257.99, "total_tokens": 8288416} {"current_steps": 12710, "total_steps": 38160, "loss": 0.4886, "lr": 0.0008434865930610458, "epoch": 6.661425576519916, "percentage": 33.31, "elapsed_time": "0:32:27", "remaining_time": "1:04:59", "throughput": 4258.17, "total_tokens": 8292064} {"current_steps": 12715, "total_steps": 38160, "loss": 0.4834, "lr": 0.0008433203751842057, "epoch": 6.664046121593291, "percentage": 33.32, "elapsed_time": "0:32:28", "remaining_time": "1:04:58", "throughput": 4258.18, "total_tokens": 8295008} {"current_steps": 12720, "total_steps": 38160, "loss": 0.4277, "lr": 0.0008431540854886598, "epoch": 6.666666666666667, "percentage": 33.33, "elapsed_time": "0:32:28", "remaining_time": "1:04:57", "throughput": 4258.29, "total_tokens": 8298432} {"current_steps": 12725, "total_steps": 38160, "loss": 0.4358, "lr": 0.0008429877240091941, "epoch": 6.669287211740042, "percentage": 33.35, "elapsed_time": "0:32:29", "remaining_time": "1:04:56", "throughput": 4258.47, "total_tokens": 8302240} {"current_steps": 12730, "total_steps": 38160, "loss": 0.5249, "lr": 0.0008428212907806097, "epoch": 6.671907756813417, "percentage": 33.36, "elapsed_time": "0:32:30", "remaining_time": "1:04:55", "throughput": 4258.43, "total_tokens": 8304960} {"current_steps": 12735, "total_steps": 38160, "loss": 0.3754, "lr": 0.0008426547858377222, "epoch": 6.6745283018867925, "percentage": 33.37, "elapsed_time": "0:32:30", "remaining_time": "1:04:55", "throughput": 4258.52, "total_tokens": 8308320} {"current_steps": 12740, "total_steps": 38160, "loss": 0.4585, "lr": 0.0008424882092153629, "epoch": 6.677148846960168, "percentage": 33.39, "elapsed_time": "0:32:31", "remaining_time": "1:04:54", "throughput": 4258.55, "total_tokens": 8311360} {"current_steps": 12745, "total_steps": 38160, "loss": 0.4932, "lr": 0.0008423215609483774, "epoch": 6.679769392033543, "percentage": 33.4, "elapsed_time": "0:32:32", "remaining_time": "1:04:53", "throughput": 4258.87, "total_tokens": 8315680} {"current_steps": 12750, "total_steps": 38160, "loss": 0.5664, "lr": 0.0008421548410716269, "epoch": 6.682389937106918, "percentage": 33.41, "elapsed_time": "0:32:33", "remaining_time": "1:04:52", "throughput": 4259.02, "total_tokens": 8319200} {"current_steps": 12755, "total_steps": 38160, "loss": 0.4498, "lr": 0.0008419880496199869, "epoch": 6.685010482180293, "percentage": 33.43, "elapsed_time": "0:32:34", "remaining_time": "1:04:52", "throughput": 4259.19, "total_tokens": 8322816} {"current_steps": 12760, "total_steps": 38160, "loss": 0.4765, "lr": 0.0008418211866283488, "epoch": 6.687631027253669, "percentage": 33.44, "elapsed_time": "0:32:34", "remaining_time": "1:04:51", "throughput": 4259.11, "total_tokens": 8325408} {"current_steps": 12765, "total_steps": 38160, "loss": 0.3864, "lr": 0.0008416542521316182, "epoch": 6.690251572327044, "percentage": 33.45, "elapsed_time": "0:32:35", "remaining_time": "1:04:50", "throughput": 4259.36, "total_tokens": 8329408} {"current_steps": 12770, "total_steps": 38160, "loss": 0.6115, "lr": 0.0008414872461647156, "epoch": 6.6928721174004195, "percentage": 33.46, "elapsed_time": "0:32:36", "remaining_time": "1:04:49", "throughput": 4259.44, "total_tokens": 8332736} {"current_steps": 12775, "total_steps": 38160, "loss": 0.2981, "lr": 0.0008413201687625772, "epoch": 6.695492662473795, "percentage": 33.48, "elapsed_time": "0:32:37", "remaining_time": "1:04:49", "throughput": 4260.02, "total_tokens": 8338272} {"current_steps": 12780, "total_steps": 38160, "loss": 0.6451, "lr": 0.0008411530199601534, "epoch": 6.69811320754717, "percentage": 33.49, "elapsed_time": "0:32:38", "remaining_time": "1:04:48", "throughput": 4260.09, "total_tokens": 8341472} {"current_steps": 12785, "total_steps": 38160, "loss": 0.4336, "lr": 0.0008409857997924097, "epoch": 6.700733752620545, "percentage": 33.5, "elapsed_time": "0:32:38", "remaining_time": "1:04:47", "throughput": 4260.05, "total_tokens": 8344288} {"current_steps": 12790, "total_steps": 38160, "loss": 0.4324, "lr": 0.0008408185082943271, "epoch": 6.70335429769392, "percentage": 33.52, "elapsed_time": "0:32:39", "remaining_time": "1:04:46", "throughput": 4260.1, "total_tokens": 8347392} {"current_steps": 12795, "total_steps": 38160, "loss": 0.4294, "lr": 0.0008406511455009007, "epoch": 6.705974842767295, "percentage": 33.53, "elapsed_time": "0:32:40", "remaining_time": "1:04:45", "throughput": 4260.16, "total_tokens": 8350656} {"current_steps": 12800, "total_steps": 38160, "loss": 0.4348, "lr": 0.000840483711447141, "epoch": 6.7085953878406706, "percentage": 33.54, "elapsed_time": "0:32:40", "remaining_time": "1:04:45", "throughput": 4260.25, "total_tokens": 8353888} {"current_steps": 12805, "total_steps": 38160, "loss": 0.4652, "lr": 0.0008403162061680736, "epoch": 6.711215932914046, "percentage": 33.56, "elapsed_time": "0:32:41", "remaining_time": "1:04:44", "throughput": 4260.22, "total_tokens": 8356736} {"current_steps": 12810, "total_steps": 38160, "loss": 0.4642, "lr": 0.0008401486296987382, "epoch": 6.713836477987421, "percentage": 33.57, "elapsed_time": "0:32:42", "remaining_time": "1:04:43", "throughput": 4260.5, "total_tokens": 8360992} {"current_steps": 12815, "total_steps": 38160, "loss": 0.4635, "lr": 0.0008399809820741901, "epoch": 6.716457023060797, "percentage": 33.58, "elapsed_time": "0:32:43", "remaining_time": "1:04:42", "throughput": 4260.53, "total_tokens": 8364000} {"current_steps": 12820, "total_steps": 38160, "loss": 0.3957, "lr": 0.0008398132633294993, "epoch": 6.719077568134172, "percentage": 33.6, "elapsed_time": "0:32:43", "remaining_time": "1:04:41", "throughput": 4260.39, "total_tokens": 8366304} {"current_steps": 12825, "total_steps": 38160, "loss": 0.3767, "lr": 0.0008396454734997506, "epoch": 6.721698113207547, "percentage": 33.61, "elapsed_time": "0:32:44", "remaining_time": "1:04:40", "throughput": 4260.53, "total_tokens": 8369792} {"current_steps": 12830, "total_steps": 38160, "loss": 0.4095, "lr": 0.0008394776126200436, "epoch": 6.7243186582809225, "percentage": 33.62, "elapsed_time": "0:32:45", "remaining_time": "1:04:39", "throughput": 4260.47, "total_tokens": 8372384} {"current_steps": 12835, "total_steps": 38160, "loss": 0.4371, "lr": 0.0008393096807254931, "epoch": 6.726939203354298, "percentage": 33.63, "elapsed_time": "0:32:45", "remaining_time": "1:04:38", "throughput": 4260.33, "total_tokens": 8374720} {"current_steps": 12840, "total_steps": 38160, "loss": 0.5546, "lr": 0.0008391416778512284, "epoch": 6.729559748427673, "percentage": 33.65, "elapsed_time": "0:32:46", "remaining_time": "1:04:37", "throughput": 4260.46, "total_tokens": 8378144} {"current_steps": 12845, "total_steps": 38160, "loss": 0.4281, "lr": 0.0008389736040323939, "epoch": 6.732180293501048, "percentage": 33.66, "elapsed_time": "0:32:47", "remaining_time": "1:04:37", "throughput": 4260.56, "total_tokens": 8381536} {"current_steps": 12850, "total_steps": 38160, "loss": 0.4457, "lr": 0.0008388054593041485, "epoch": 6.734800838574423, "percentage": 33.67, "elapsed_time": "0:32:47", "remaining_time": "1:04:36", "throughput": 4260.56, "total_tokens": 8384416} {"current_steps": 12855, "total_steps": 38160, "loss": 0.3916, "lr": 0.0008386372437016665, "epoch": 6.737421383647799, "percentage": 33.69, "elapsed_time": "0:32:48", "remaining_time": "1:04:35", "throughput": 4260.62, "total_tokens": 8387616} {"current_steps": 12860, "total_steps": 38160, "loss": 0.4568, "lr": 0.0008384689572601364, "epoch": 6.740041928721174, "percentage": 33.7, "elapsed_time": "0:32:49", "remaining_time": "1:04:34", "throughput": 4260.56, "total_tokens": 8390208} {"current_steps": 12865, "total_steps": 38160, "loss": 0.4068, "lr": 0.000838300600014762, "epoch": 6.7426624737945495, "percentage": 33.71, "elapsed_time": "0:32:50", "remaining_time": "1:04:33", "throughput": 4260.71, "total_tokens": 8393792} {"current_steps": 12870, "total_steps": 38160, "loss": 0.5482, "lr": 0.0008381321720007613, "epoch": 6.745283018867925, "percentage": 33.73, "elapsed_time": "0:32:50", "remaining_time": "1:04:32", "throughput": 4260.8, "total_tokens": 8397120} {"current_steps": 12875, "total_steps": 38160, "loss": 0.5794, "lr": 0.0008379636732533681, "epoch": 6.7479035639413, "percentage": 33.74, "elapsed_time": "0:32:51", "remaining_time": "1:04:31", "throughput": 4260.82, "total_tokens": 8400160} {"current_steps": 12880, "total_steps": 38160, "loss": 0.6804, "lr": 0.0008377951038078302, "epoch": 6.750524109014675, "percentage": 33.75, "elapsed_time": "0:32:52", "remaining_time": "1:04:31", "throughput": 4261.05, "total_tokens": 8404032} {"current_steps": 12885, "total_steps": 38160, "loss": 0.4872, "lr": 0.0008376264636994102, "epoch": 6.75314465408805, "percentage": 33.77, "elapsed_time": "0:32:53", "remaining_time": "1:04:30", "throughput": 4261.18, "total_tokens": 8407392} {"current_steps": 12890, "total_steps": 38160, "loss": 0.495, "lr": 0.000837457752963386, "epoch": 6.755765199161425, "percentage": 33.78, "elapsed_time": "0:32:53", "remaining_time": "1:04:29", "throughput": 4261.24, "total_tokens": 8410656} {"current_steps": 12895, "total_steps": 38160, "loss": 0.5307, "lr": 0.0008372889716350496, "epoch": 6.7583857442348005, "percentage": 33.79, "elapsed_time": "0:32:54", "remaining_time": "1:04:28", "throughput": 4261.19, "total_tokens": 8413344} {"current_steps": 12900, "total_steps": 38160, "loss": 0.4827, "lr": 0.0008371201197497084, "epoch": 6.761006289308176, "percentage": 33.81, "elapsed_time": "0:32:55", "remaining_time": "1:04:27", "throughput": 4261.36, "total_tokens": 8416960} {"current_steps": 12905, "total_steps": 38160, "loss": 0.5753, "lr": 0.0008369511973426842, "epoch": 6.763626834381551, "percentage": 33.82, "elapsed_time": "0:32:55", "remaining_time": "1:04:26", "throughput": 4261.45, "total_tokens": 8420352} {"current_steps": 12910, "total_steps": 38160, "loss": 0.4976, "lr": 0.0008367822044493138, "epoch": 6.766247379454927, "percentage": 33.83, "elapsed_time": "0:32:56", "remaining_time": "1:04:25", "throughput": 4261.47, "total_tokens": 8423360} {"current_steps": 12915, "total_steps": 38160, "loss": 0.306, "lr": 0.0008366131411049483, "epoch": 6.768867924528302, "percentage": 33.84, "elapsed_time": "0:32:57", "remaining_time": "1:04:25", "throughput": 4261.61, "total_tokens": 8426816} {"current_steps": 12920, "total_steps": 38160, "loss": 0.5961, "lr": 0.000836444007344954, "epoch": 6.771488469601677, "percentage": 33.86, "elapsed_time": "0:32:58", "remaining_time": "1:04:24", "throughput": 4261.66, "total_tokens": 8429856} {"current_steps": 12925, "total_steps": 38160, "loss": 0.601, "lr": 0.0008362748032047119, "epoch": 6.774109014675052, "percentage": 33.87, "elapsed_time": "0:32:58", "remaining_time": "1:04:23", "throughput": 4261.7, "total_tokens": 8433056} {"current_steps": 12930, "total_steps": 38160, "loss": 0.5084, "lr": 0.0008361055287196171, "epoch": 6.776729559748428, "percentage": 33.88, "elapsed_time": "0:32:59", "remaining_time": "1:04:22", "throughput": 4261.83, "total_tokens": 8436448} {"current_steps": 12935, "total_steps": 38160, "loss": 0.3257, "lr": 0.0008359361839250803, "epoch": 6.779350104821803, "percentage": 33.9, "elapsed_time": "0:33:00", "remaining_time": "1:04:21", "throughput": 4261.78, "total_tokens": 8439200} {"current_steps": 12940, "total_steps": 38160, "loss": 0.4871, "lr": 0.0008357667688565265, "epoch": 6.781970649895178, "percentage": 33.91, "elapsed_time": "0:33:01", "remaining_time": "1:04:20", "throughput": 4262.01, "total_tokens": 8443072} {"current_steps": 12945, "total_steps": 38160, "loss": 0.4065, "lr": 0.0008355972835493951, "epoch": 6.784591194968553, "percentage": 33.92, "elapsed_time": "0:33:01", "remaining_time": "1:04:20", "throughput": 4262.03, "total_tokens": 8445952} {"current_steps": 12950, "total_steps": 38160, "loss": 0.5755, "lr": 0.0008354277280391408, "epoch": 6.787211740041929, "percentage": 33.94, "elapsed_time": "0:33:02", "remaining_time": "1:04:19", "throughput": 4262.03, "total_tokens": 8448768} {"current_steps": 12955, "total_steps": 38160, "loss": 0.33, "lr": 0.0008352581023612324, "epoch": 6.789832285115304, "percentage": 33.95, "elapsed_time": "0:33:02", "remaining_time": "1:04:18", "throughput": 4261.92, "total_tokens": 8451232} {"current_steps": 12960, "total_steps": 38160, "loss": 0.4144, "lr": 0.0008350884065511541, "epoch": 6.7924528301886795, "percentage": 33.96, "elapsed_time": "0:33:03", "remaining_time": "1:04:17", "throughput": 4262.06, "total_tokens": 8454688} {"current_steps": 12965, "total_steps": 38160, "loss": 0.3353, "lr": 0.0008349186406444038, "epoch": 6.795073375262055, "percentage": 33.98, "elapsed_time": "0:33:04", "remaining_time": "1:04:16", "throughput": 4262.16, "total_tokens": 8458048} {"current_steps": 12970, "total_steps": 38160, "loss": 0.5017, "lr": 0.0008347488046764949, "epoch": 6.79769392033543, "percentage": 33.99, "elapsed_time": "0:33:05", "remaining_time": "1:04:15", "throughput": 4262.15, "total_tokens": 8460960} {"current_steps": 12975, "total_steps": 38160, "loss": 0.5133, "lr": 0.0008345788986829551, "epoch": 6.800314465408805, "percentage": 34.0, "elapsed_time": "0:33:05", "remaining_time": "1:04:14", "throughput": 4262.29, "total_tokens": 8464448} {"current_steps": 12980, "total_steps": 38160, "loss": 0.3469, "lr": 0.0008344089226993268, "epoch": 6.80293501048218, "percentage": 34.01, "elapsed_time": "0:33:06", "remaining_time": "1:04:13", "throughput": 4262.45, "total_tokens": 8468000} {"current_steps": 12985, "total_steps": 38160, "loss": 0.4938, "lr": 0.000834238876761167, "epoch": 6.805555555555555, "percentage": 34.03, "elapsed_time": "0:33:07", "remaining_time": "1:04:13", "throughput": 4262.74, "total_tokens": 8472288} {"current_steps": 12990, "total_steps": 38160, "loss": 0.3875, "lr": 0.0008340687609040473, "epoch": 6.8081761006289305, "percentage": 34.04, "elapsed_time": "0:33:08", "remaining_time": "1:04:12", "throughput": 4262.83, "total_tokens": 8475616} {"current_steps": 12995, "total_steps": 38160, "loss": 0.6011, "lr": 0.0008338985751635542, "epoch": 6.810796645702306, "percentage": 34.05, "elapsed_time": "0:33:08", "remaining_time": "1:04:11", "throughput": 4262.71, "total_tokens": 8477984} {"current_steps": 13000, "total_steps": 38160, "loss": 0.472, "lr": 0.0008337283195752883, "epoch": 6.813417190775681, "percentage": 34.07, "elapsed_time": "0:33:09", "remaining_time": "1:04:10", "throughput": 4262.71, "total_tokens": 8480864} {"current_steps": 13005, "total_steps": 38160, "loss": 0.5079, "lr": 0.0008335579941748654, "epoch": 6.816037735849057, "percentage": 34.08, "elapsed_time": "0:33:10", "remaining_time": "1:04:09", "throughput": 4262.68, "total_tokens": 8483680} {"current_steps": 13010, "total_steps": 38160, "loss": 0.4217, "lr": 0.0008333875989979156, "epoch": 6.818658280922432, "percentage": 34.09, "elapsed_time": "0:33:10", "remaining_time": "1:04:08", "throughput": 4262.85, "total_tokens": 8487296} {"current_steps": 13015, "total_steps": 38160, "loss": 0.3954, "lr": 0.0008332171340800835, "epoch": 6.821278825995807, "percentage": 34.11, "elapsed_time": "0:33:11", "remaining_time": "1:04:08", "throughput": 4262.91, "total_tokens": 8490528} {"current_steps": 13020, "total_steps": 38160, "loss": 0.4765, "lr": 0.0008330465994570287, "epoch": 6.823899371069182, "percentage": 34.12, "elapsed_time": "0:33:12", "remaining_time": "1:04:07", "throughput": 4262.93, "total_tokens": 8493536} {"current_steps": 13025, "total_steps": 38160, "loss": 0.5643, "lr": 0.0008328759951644247, "epoch": 6.826519916142558, "percentage": 34.13, "elapsed_time": "0:33:13", "remaining_time": "1:04:06", "throughput": 4263.13, "total_tokens": 8497472} {"current_steps": 13030, "total_steps": 38160, "loss": 0.5276, "lr": 0.0008327053212379603, "epoch": 6.829140461215933, "percentage": 34.15, "elapsed_time": "0:33:13", "remaining_time": "1:04:05", "throughput": 4263.11, "total_tokens": 8500288} {"current_steps": 13035, "total_steps": 38160, "loss": 0.4773, "lr": 0.0008325345777133382, "epoch": 6.831761006289308, "percentage": 34.16, "elapsed_time": "0:33:14", "remaining_time": "1:04:04", "throughput": 4263.08, "total_tokens": 8503136} {"current_steps": 13040, "total_steps": 38160, "loss": 0.3163, "lr": 0.0008323637646262763, "epoch": 6.834381551362683, "percentage": 34.17, "elapsed_time": "0:33:15", "remaining_time": "1:04:03", "throughput": 4263.33, "total_tokens": 8507168} {"current_steps": 13045, "total_steps": 38160, "loss": 0.4946, "lr": 0.0008321928820125067, "epoch": 6.837002096436059, "percentage": 34.19, "elapsed_time": "0:33:16", "remaining_time": "1:04:02", "throughput": 4263.25, "total_tokens": 8509760} {"current_steps": 13050, "total_steps": 38160, "loss": 0.352, "lr": 0.000832021929907776, "epoch": 6.839622641509434, "percentage": 34.2, "elapsed_time": "0:33:16", "remaining_time": "1:04:02", "throughput": 4263.22, "total_tokens": 8512672} {"current_steps": 13055, "total_steps": 38160, "loss": 0.4384, "lr": 0.0008318509083478454, "epoch": 6.8422431865828095, "percentage": 34.21, "elapsed_time": "0:33:17", "remaining_time": "1:04:01", "throughput": 4263.38, "total_tokens": 8516320} {"current_steps": 13060, "total_steps": 38160, "loss": 0.4656, "lr": 0.0008316798173684907, "epoch": 6.844863731656185, "percentage": 34.22, "elapsed_time": "0:33:18", "remaining_time": "1:04:00", "throughput": 4263.42, "total_tokens": 8519456} {"current_steps": 13065, "total_steps": 38160, "loss": 0.5708, "lr": 0.0008315086570055024, "epoch": 6.84748427672956, "percentage": 34.24, "elapsed_time": "0:33:18", "remaining_time": "1:03:59", "throughput": 4263.46, "total_tokens": 8522560} {"current_steps": 13070, "total_steps": 38160, "loss": 0.4366, "lr": 0.000831337427294685, "epoch": 6.850104821802935, "percentage": 34.25, "elapsed_time": "0:33:19", "remaining_time": "1:03:58", "throughput": 4263.53, "total_tokens": 8525792} {"current_steps": 13075, "total_steps": 38160, "loss": 0.4427, "lr": 0.0008311661282718579, "epoch": 6.85272536687631, "percentage": 34.26, "elapsed_time": "0:33:20", "remaining_time": "1:03:57", "throughput": 4263.53, "total_tokens": 8528704} {"current_steps": 13080, "total_steps": 38160, "loss": 0.4338, "lr": 0.0008309947599728549, "epoch": 6.855345911949685, "percentage": 34.28, "elapsed_time": "0:33:21", "remaining_time": "1:03:57", "throughput": 4263.61, "total_tokens": 8532000} {"current_steps": 13085, "total_steps": 38160, "loss": 0.5273, "lr": 0.0008308233224335243, "epoch": 6.8579664570230605, "percentage": 34.29, "elapsed_time": "0:33:21", "remaining_time": "1:03:56", "throughput": 4263.64, "total_tokens": 8535136} {"current_steps": 13090, "total_steps": 38160, "loss": 0.5353, "lr": 0.0008306518156897289, "epoch": 6.860587002096436, "percentage": 34.3, "elapsed_time": "0:33:22", "remaining_time": "1:03:55", "throughput": 4263.76, "total_tokens": 8538592} {"current_steps": 13095, "total_steps": 38160, "loss": 0.5044, "lr": 0.0008304802397773459, "epoch": 6.863207547169811, "percentage": 34.32, "elapsed_time": "0:33:23", "remaining_time": "1:03:54", "throughput": 4263.7, "total_tokens": 8541344} {"current_steps": 13100, "total_steps": 38160, "loss": 0.4897, "lr": 0.0008303085947322672, "epoch": 6.865828092243187, "percentage": 34.33, "elapsed_time": "0:33:23", "remaining_time": "1:03:53", "throughput": 4263.78, "total_tokens": 8544576} {"current_steps": 13105, "total_steps": 38160, "loss": 0.4547, "lr": 0.0008301368805903988, "epoch": 6.868448637316562, "percentage": 34.34, "elapsed_time": "0:33:24", "remaining_time": "1:03:52", "throughput": 4263.81, "total_tokens": 8547680} {"current_steps": 13110, "total_steps": 38160, "loss": 0.5323, "lr": 0.0008299650973876611, "epoch": 6.871069182389937, "percentage": 34.36, "elapsed_time": "0:33:25", "remaining_time": "1:03:51", "throughput": 4263.81, "total_tokens": 8550720} {"current_steps": 13115, "total_steps": 38160, "loss": 0.4107, "lr": 0.0008297932451599898, "epoch": 6.873689727463312, "percentage": 34.37, "elapsed_time": "0:33:26", "remaining_time": "1:03:51", "throughput": 4263.91, "total_tokens": 8554112} {"current_steps": 13120, "total_steps": 38160, "loss": 0.3433, "lr": 0.0008296213239433339, "epoch": 6.876310272536688, "percentage": 34.38, "elapsed_time": "0:33:26", "remaining_time": "1:03:50", "throughput": 4264.12, "total_tokens": 8557856} {"current_steps": 13125, "total_steps": 38160, "loss": 0.4905, "lr": 0.0008294493337736577, "epoch": 6.878930817610063, "percentage": 34.39, "elapsed_time": "0:33:27", "remaining_time": "1:03:49", "throughput": 4264.16, "total_tokens": 8560960} {"current_steps": 13130, "total_steps": 38160, "loss": 0.4376, "lr": 0.0008292772746869392, "epoch": 6.881551362683438, "percentage": 34.41, "elapsed_time": "0:33:28", "remaining_time": "1:03:48", "throughput": 4264.26, "total_tokens": 8564288} {"current_steps": 13135, "total_steps": 38160, "loss": 0.4508, "lr": 0.0008291051467191717, "epoch": 6.884171907756813, "percentage": 34.42, "elapsed_time": "0:33:29", "remaining_time": "1:03:48", "throughput": 4264.57, "total_tokens": 8568608} {"current_steps": 13140, "total_steps": 38160, "loss": 0.4379, "lr": 0.000828932949906362, "epoch": 6.886792452830189, "percentage": 34.43, "elapsed_time": "0:33:29", "remaining_time": "1:03:47", "throughput": 4264.64, "total_tokens": 8571872} {"current_steps": 13145, "total_steps": 38160, "loss": 0.5778, "lr": 0.0008287606842845319, "epoch": 6.889412997903564, "percentage": 34.45, "elapsed_time": "0:33:30", "remaining_time": "1:03:46", "throughput": 4264.52, "total_tokens": 8574336} {"current_steps": 13150, "total_steps": 38160, "loss": 0.4574, "lr": 0.0008285883498897174, "epoch": 6.8920335429769395, "percentage": 34.46, "elapsed_time": "0:33:31", "remaining_time": "1:03:45", "throughput": 4264.53, "total_tokens": 8577248} {"current_steps": 13155, "total_steps": 38160, "loss": 0.4605, "lr": 0.0008284159467579686, "epoch": 6.894654088050315, "percentage": 34.47, "elapsed_time": "0:33:32", "remaining_time": "1:03:44", "throughput": 4264.75, "total_tokens": 8581120} {"current_steps": 13160, "total_steps": 38160, "loss": 0.3867, "lr": 0.0008282434749253507, "epoch": 6.89727463312369, "percentage": 34.49, "elapsed_time": "0:33:32", "remaining_time": "1:03:43", "throughput": 4265.03, "total_tokens": 8585280} {"current_steps": 13165, "total_steps": 38160, "loss": 0.4382, "lr": 0.0008280709344279426, "epoch": 6.899895178197065, "percentage": 34.5, "elapsed_time": "0:33:33", "remaining_time": "1:03:43", "throughput": 4265.52, "total_tokens": 8590464} {"current_steps": 13170, "total_steps": 38160, "loss": 0.4316, "lr": 0.0008278983253018377, "epoch": 6.90251572327044, "percentage": 34.51, "elapsed_time": "0:33:34", "remaining_time": "1:03:42", "throughput": 4265.53, "total_tokens": 8593408} {"current_steps": 13175, "total_steps": 38160, "loss": 0.4278, "lr": 0.0008277256475831443, "epoch": 6.905136268343815, "percentage": 34.53, "elapsed_time": "0:33:35", "remaining_time": "1:03:41", "throughput": 4265.66, "total_tokens": 8596832} {"current_steps": 13180, "total_steps": 38160, "loss": 0.3475, "lr": 0.0008275529013079841, "epoch": 6.9077568134171905, "percentage": 34.54, "elapsed_time": "0:33:36", "remaining_time": "1:03:41", "throughput": 4265.69, "total_tokens": 8600000} {"current_steps": 13185, "total_steps": 38160, "loss": 0.4878, "lr": 0.0008273800865124941, "epoch": 6.910377358490566, "percentage": 34.55, "elapsed_time": "0:33:36", "remaining_time": "1:03:40", "throughput": 4265.6, "total_tokens": 8602560} {"current_steps": 13190, "total_steps": 38160, "loss": 0.5999, "lr": 0.0008272072032328246, "epoch": 6.912997903563941, "percentage": 34.56, "elapsed_time": "0:33:37", "remaining_time": "1:03:39", "throughput": 4265.5, "total_tokens": 8605088} {"current_steps": 13195, "total_steps": 38160, "loss": 0.5354, "lr": 0.0008270342515051414, "epoch": 6.915618448637317, "percentage": 34.58, "elapsed_time": "0:33:38", "remaining_time": "1:03:38", "throughput": 4265.66, "total_tokens": 8608704} {"current_steps": 13200, "total_steps": 38160, "loss": 0.4455, "lr": 0.0008268612313656238, "epoch": 6.918238993710692, "percentage": 34.59, "elapsed_time": "0:33:38", "remaining_time": "1:03:37", "throughput": 4265.81, "total_tokens": 8612320} {"current_steps": 13205, "total_steps": 38160, "loss": 0.5224, "lr": 0.0008266881428504655, "epoch": 6.920859538784067, "percentage": 34.6, "elapsed_time": "0:33:39", "remaining_time": "1:03:36", "throughput": 4265.83, "total_tokens": 8615360} {"current_steps": 13210, "total_steps": 38160, "loss": 0.3791, "lr": 0.000826514985995875, "epoch": 6.923480083857442, "percentage": 34.62, "elapsed_time": "0:33:40", "remaining_time": "1:03:35", "throughput": 4265.89, "total_tokens": 8618464} {"current_steps": 13215, "total_steps": 38160, "loss": 0.2977, "lr": 0.0008263417608380743, "epoch": 6.926100628930818, "percentage": 34.63, "elapsed_time": "0:33:41", "remaining_time": "1:03:34", "throughput": 4265.97, "total_tokens": 8621664} {"current_steps": 13220, "total_steps": 38160, "loss": 0.3941, "lr": 0.0008261684674133003, "epoch": 6.928721174004193, "percentage": 34.64, "elapsed_time": "0:33:41", "remaining_time": "1:03:34", "throughput": 4265.98, "total_tokens": 8624608} {"current_steps": 13225, "total_steps": 38160, "loss": 0.382, "lr": 0.0008259951057578041, "epoch": 6.931341719077568, "percentage": 34.66, "elapsed_time": "0:33:42", "remaining_time": "1:03:32", "throughput": 4265.83, "total_tokens": 8626880} {"current_steps": 13230, "total_steps": 38160, "loss": 0.5649, "lr": 0.000825821675907851, "epoch": 6.933962264150943, "percentage": 34.67, "elapsed_time": "0:33:43", "remaining_time": "1:03:32", "throughput": 4266.09, "total_tokens": 8630880} {"current_steps": 13235, "total_steps": 38160, "loss": 0.5179, "lr": 0.0008256481778997205, "epoch": 6.936582809224319, "percentage": 34.68, "elapsed_time": "0:33:43", "remaining_time": "1:03:31", "throughput": 4266.1, "total_tokens": 8633856} {"current_steps": 13240, "total_steps": 38160, "loss": 0.5288, "lr": 0.0008254746117697062, "epoch": 6.939203354297694, "percentage": 34.7, "elapsed_time": "0:33:44", "remaining_time": "1:03:30", "throughput": 4265.99, "total_tokens": 8636288} {"current_steps": 13245, "total_steps": 38160, "loss": 0.6388, "lr": 0.0008253009775541165, "epoch": 6.9418238993710695, "percentage": 34.71, "elapsed_time": "0:33:45", "remaining_time": "1:03:29", "throughput": 4265.92, "total_tokens": 8638880} {"current_steps": 13250, "total_steps": 38160, "loss": 0.5228, "lr": 0.0008251272752892733, "epoch": 6.944444444444445, "percentage": 34.72, "elapsed_time": "0:33:45", "remaining_time": "1:03:28", "throughput": 4265.98, "total_tokens": 8642080} {"current_steps": 13255, "total_steps": 38160, "loss": 0.4319, "lr": 0.0008249535050115135, "epoch": 6.94706498951782, "percentage": 34.74, "elapsed_time": "0:33:46", "remaining_time": "1:03:27", "throughput": 4265.89, "total_tokens": 8644672} {"current_steps": 13260, "total_steps": 38160, "loss": 0.3994, "lr": 0.0008247796667571879, "epoch": 6.949685534591195, "percentage": 34.75, "elapsed_time": "0:33:47", "remaining_time": "1:03:26", "throughput": 4266.01, "total_tokens": 8648160} {"current_steps": 13265, "total_steps": 38160, "loss": 0.4164, "lr": 0.000824605760562661, "epoch": 6.95230607966457, "percentage": 34.76, "elapsed_time": "0:33:47", "remaining_time": "1:03:25", "throughput": 4266.03, "total_tokens": 8651168} {"current_steps": 13270, "total_steps": 38160, "loss": 0.4114, "lr": 0.0008244317864643125, "epoch": 6.954926624737945, "percentage": 34.77, "elapsed_time": "0:33:48", "remaining_time": "1:03:24", "throughput": 4266.02, "total_tokens": 8653984} {"current_steps": 13275, "total_steps": 38160, "loss": 0.3767, "lr": 0.0008242577444985355, "epoch": 6.9575471698113205, "percentage": 34.79, "elapsed_time": "0:33:49", "remaining_time": "1:03:23", "throughput": 4265.93, "total_tokens": 8656544} {"current_steps": 13280, "total_steps": 38160, "loss": 0.4178, "lr": 0.0008240836347017375, "epoch": 6.960167714884696, "percentage": 34.8, "elapsed_time": "0:33:49", "remaining_time": "1:03:23", "throughput": 4265.93, "total_tokens": 8659456} {"current_steps": 13285, "total_steps": 38160, "loss": 0.3962, "lr": 0.0008239094571103408, "epoch": 6.962788259958071, "percentage": 34.81, "elapsed_time": "0:33:50", "remaining_time": "1:03:22", "throughput": 4265.87, "total_tokens": 8662112} {"current_steps": 13290, "total_steps": 38160, "loss": 0.5381, "lr": 0.0008237352117607808, "epoch": 6.965408805031447, "percentage": 34.83, "elapsed_time": "0:33:51", "remaining_time": "1:03:21", "throughput": 4266.03, "total_tokens": 8665760} {"current_steps": 13295, "total_steps": 38160, "loss": 0.5083, "lr": 0.000823560898689508, "epoch": 6.968029350104822, "percentage": 34.84, "elapsed_time": "0:33:52", "remaining_time": "1:03:20", "throughput": 4266.15, "total_tokens": 8669152} {"current_steps": 13300, "total_steps": 38160, "loss": 0.4564, "lr": 0.0008233865179329865, "epoch": 6.970649895178197, "percentage": 34.85, "elapsed_time": "0:33:52", "remaining_time": "1:03:19", "throughput": 4266.05, "total_tokens": 8671648} {"current_steps": 13305, "total_steps": 38160, "loss": 0.5372, "lr": 0.0008232120695276948, "epoch": 6.973270440251572, "percentage": 34.87, "elapsed_time": "0:33:53", "remaining_time": "1:03:18", "throughput": 4266.38, "total_tokens": 8676192} {"current_steps": 13310, "total_steps": 38160, "loss": 0.5555, "lr": 0.0008230375535101255, "epoch": 6.975890985324948, "percentage": 34.88, "elapsed_time": "0:33:54", "remaining_time": "1:03:18", "throughput": 4266.36, "total_tokens": 8679008} {"current_steps": 13315, "total_steps": 38160, "loss": 0.4376, "lr": 0.0008228629699167855, "epoch": 6.978511530398323, "percentage": 34.89, "elapsed_time": "0:33:55", "remaining_time": "1:03:17", "throughput": 4266.57, "total_tokens": 8682848} {"current_steps": 13320, "total_steps": 38160, "loss": 0.3494, "lr": 0.0008226883187841957, "epoch": 6.981132075471698, "percentage": 34.91, "elapsed_time": "0:33:55", "remaining_time": "1:03:16", "throughput": 4266.48, "total_tokens": 8685376} {"current_steps": 13325, "total_steps": 38160, "loss": 0.6178, "lr": 0.0008225136001488908, "epoch": 6.983752620545073, "percentage": 34.92, "elapsed_time": "0:33:56", "remaining_time": "1:03:15", "throughput": 4266.56, "total_tokens": 8688672} {"current_steps": 13330, "total_steps": 38160, "loss": 0.5177, "lr": 0.0008223388140474205, "epoch": 6.986373165618449, "percentage": 34.93, "elapsed_time": "0:33:57", "remaining_time": "1:03:14", "throughput": 4266.73, "total_tokens": 8692256} {"current_steps": 13335, "total_steps": 38160, "loss": 0.57, "lr": 0.0008221639605163476, "epoch": 6.988993710691824, "percentage": 34.94, "elapsed_time": "0:33:58", "remaining_time": "1:03:14", "throughput": 4266.91, "total_tokens": 8695968} {"current_steps": 13340, "total_steps": 38160, "loss": 0.4332, "lr": 0.0008219890395922495, "epoch": 6.9916142557651995, "percentage": 34.96, "elapsed_time": "0:33:58", "remaining_time": "1:03:13", "throughput": 4267.13, "total_tokens": 8699808} {"current_steps": 13345, "total_steps": 38160, "loss": 0.53, "lr": 0.0008218140513117178, "epoch": 6.994234800838575, "percentage": 34.97, "elapsed_time": "0:33:59", "remaining_time": "1:03:12", "throughput": 4267.07, "total_tokens": 8702432} {"current_steps": 13350, "total_steps": 38160, "loss": 0.5606, "lr": 0.0008216389957113582, "epoch": 6.99685534591195, "percentage": 34.98, "elapsed_time": "0:34:00", "remaining_time": "1:03:11", "throughput": 4267.16, "total_tokens": 8705792} {"current_steps": 13355, "total_steps": 38160, "loss": 0.4937, "lr": 0.0008214638728277899, "epoch": 6.999475890985325, "percentage": 35.0, "elapsed_time": "0:34:00", "remaining_time": "1:03:10", "throughput": 4267.24, "total_tokens": 8709056} {"current_steps": 13356, "total_steps": 38160, "eval_loss": 0.45616984367370605, "epoch": 7.0, "percentage": 35.0, "elapsed_time": "0:34:14", "remaining_time": "1:03:35", "throughput": 4238.69, "total_tokens": 8709168} {"current_steps": 13360, "total_steps": 38160, "loss": 0.5044, "lr": 0.0008212886826976469, "epoch": 7.0020964360587, "percentage": 35.01, "elapsed_time": "0:34:16", "remaining_time": "1:03:37", "throughput": 4235.55, "total_tokens": 8711536} {"current_steps": 13365, "total_steps": 38160, "loss": 0.5529, "lr": 0.0008211134253575769, "epoch": 7.004716981132075, "percentage": 35.02, "elapsed_time": "0:34:17", "remaining_time": "1:03:37", "throughput": 4235.83, "total_tokens": 8715728} {"current_steps": 13370, "total_steps": 38160, "loss": 0.4851, "lr": 0.000820938100844242, "epoch": 7.0073375262054505, "percentage": 35.04, "elapsed_time": "0:34:18", "remaining_time": "1:03:36", "throughput": 4235.96, "total_tokens": 8719216} {"current_steps": 13375, "total_steps": 38160, "loss": 0.3688, "lr": 0.0008207627091943177, "epoch": 7.009958071278826, "percentage": 35.05, "elapsed_time": "0:34:19", "remaining_time": "1:03:35", "throughput": 4235.97, "total_tokens": 8722160} {"current_steps": 13380, "total_steps": 38160, "loss": 0.3595, "lr": 0.000820587250444494, "epoch": 7.012578616352202, "percentage": 35.06, "elapsed_time": "0:34:19", "remaining_time": "1:03:34", "throughput": 4236.09, "total_tokens": 8725584} {"current_steps": 13385, "total_steps": 38160, "loss": 0.4327, "lr": 0.0008204117246314752, "epoch": 7.015199161425577, "percentage": 35.08, "elapsed_time": "0:34:20", "remaining_time": "1:03:33", "throughput": 4236.04, "total_tokens": 8728272} {"current_steps": 13390, "total_steps": 38160, "loss": 0.4537, "lr": 0.0008202361317919788, "epoch": 7.017819706498952, "percentage": 35.09, "elapsed_time": "0:34:21", "remaining_time": "1:03:33", "throughput": 4236.13, "total_tokens": 8731568} {"current_steps": 13395, "total_steps": 38160, "loss": 0.4914, "lr": 0.0008200604719627373, "epoch": 7.020440251572327, "percentage": 35.1, "elapsed_time": "0:34:21", "remaining_time": "1:03:32", "throughput": 4236.24, "total_tokens": 8735120} {"current_steps": 13400, "total_steps": 38160, "loss": 0.3515, "lr": 0.0008198847451804964, "epoch": 7.023060796645702, "percentage": 35.12, "elapsed_time": "0:34:22", "remaining_time": "1:03:31", "throughput": 4236.12, "total_tokens": 8737552} {"current_steps": 13405, "total_steps": 38160, "loss": 0.4118, "lr": 0.0008197089514820162, "epoch": 7.0256813417190775, "percentage": 35.13, "elapsed_time": "0:34:23", "remaining_time": "1:03:30", "throughput": 4236.39, "total_tokens": 8741712} {"current_steps": 13410, "total_steps": 38160, "loss": 0.5109, "lr": 0.0008195330909040708, "epoch": 7.028301886792453, "percentage": 35.14, "elapsed_time": "0:34:24", "remaining_time": "1:03:29", "throughput": 4236.33, "total_tokens": 8744464} {"current_steps": 13415, "total_steps": 38160, "loss": 0.4089, "lr": 0.0008193571634834483, "epoch": 7.030922431865828, "percentage": 35.15, "elapsed_time": "0:34:24", "remaining_time": "1:03:28", "throughput": 4236.47, "total_tokens": 8748048} {"current_steps": 13420, "total_steps": 38160, "loss": 0.3926, "lr": 0.0008191811692569506, "epoch": 7.033542976939203, "percentage": 35.17, "elapsed_time": "0:34:25", "remaining_time": "1:03:28", "throughput": 4236.49, "total_tokens": 8751024} {"current_steps": 13425, "total_steps": 38160, "loss": 0.4449, "lr": 0.0008190051082613936, "epoch": 7.036163522012578, "percentage": 35.18, "elapsed_time": "0:34:26", "remaining_time": "1:03:26", "throughput": 4236.34, "total_tokens": 8753264} {"current_steps": 13430, "total_steps": 38160, "loss": 0.47, "lr": 0.0008188289805336074, "epoch": 7.038784067085954, "percentage": 35.19, "elapsed_time": "0:34:26", "remaining_time": "1:03:26", "throughput": 4236.35, "total_tokens": 8756240} {"current_steps": 13435, "total_steps": 38160, "loss": 0.3895, "lr": 0.0008186527861104359, "epoch": 7.0414046121593294, "percentage": 35.21, "elapsed_time": "0:34:27", "remaining_time": "1:03:25", "throughput": 4236.37, "total_tokens": 8759184} {"current_steps": 13440, "total_steps": 38160, "loss": 0.5598, "lr": 0.0008184765250287369, "epoch": 7.044025157232705, "percentage": 35.22, "elapsed_time": "0:34:28", "remaining_time": "1:03:24", "throughput": 4236.55, "total_tokens": 8762864} {"current_steps": 13445, "total_steps": 38160, "loss": 0.3384, "lr": 0.0008183001973253823, "epoch": 7.04664570230608, "percentage": 35.23, "elapsed_time": "0:34:29", "remaining_time": "1:03:23", "throughput": 4236.99, "total_tokens": 8767856} {"current_steps": 13450, "total_steps": 38160, "loss": 0.5116, "lr": 0.0008181238030372576, "epoch": 7.049266247379455, "percentage": 35.25, "elapsed_time": "0:34:30", "remaining_time": "1:03:23", "throughput": 4237.12, "total_tokens": 8771344} {"current_steps": 13455, "total_steps": 38160, "loss": 0.4563, "lr": 0.0008179473422012628, "epoch": 7.05188679245283, "percentage": 35.26, "elapsed_time": "0:34:30", "remaining_time": "1:03:22", "throughput": 4237.35, "total_tokens": 8775216} {"current_steps": 13460, "total_steps": 38160, "loss": 0.514, "lr": 0.0008177708148543114, "epoch": 7.054507337526205, "percentage": 35.27, "elapsed_time": "0:34:31", "remaining_time": "1:03:21", "throughput": 4237.64, "total_tokens": 8779536} {"current_steps": 13465, "total_steps": 38160, "loss": 0.5847, "lr": 0.0008175942210333307, "epoch": 7.0571278825995805, "percentage": 35.29, "elapsed_time": "0:34:32", "remaining_time": "1:03:21", "throughput": 4237.69, "total_tokens": 8782640} {"current_steps": 13470, "total_steps": 38160, "loss": 0.6584, "lr": 0.0008174175607752626, "epoch": 7.059748427672956, "percentage": 35.3, "elapsed_time": "0:34:33", "remaining_time": "1:03:20", "throughput": 4237.89, "total_tokens": 8786384} {"current_steps": 13475, "total_steps": 38160, "loss": 0.4124, "lr": 0.0008172408341170617, "epoch": 7.062368972746331, "percentage": 35.31, "elapsed_time": "0:34:34", "remaining_time": "1:03:19", "throughput": 4237.95, "total_tokens": 8789616} {"current_steps": 13480, "total_steps": 38160, "loss": 0.4984, "lr": 0.0008170640410956976, "epoch": 7.064989517819707, "percentage": 35.32, "elapsed_time": "0:34:34", "remaining_time": "1:03:18", "throughput": 4238.0, "total_tokens": 8792816} {"current_steps": 13485, "total_steps": 38160, "loss": 0.4206, "lr": 0.0008168871817481536, "epoch": 7.067610062893082, "percentage": 35.34, "elapsed_time": "0:34:35", "remaining_time": "1:03:17", "throughput": 4238.23, "total_tokens": 8796784} {"current_steps": 13490, "total_steps": 38160, "loss": 0.4806, "lr": 0.0008167102561114261, "epoch": 7.070230607966457, "percentage": 35.35, "elapsed_time": "0:34:36", "remaining_time": "1:03:17", "throughput": 4238.29, "total_tokens": 8800016} {"current_steps": 13495, "total_steps": 38160, "loss": 0.491, "lr": 0.0008165332642225265, "epoch": 7.072851153039832, "percentage": 35.36, "elapsed_time": "0:34:37", "remaining_time": "1:03:16", "throughput": 4238.31, "total_tokens": 8803088} {"current_steps": 13500, "total_steps": 38160, "loss": 0.3977, "lr": 0.0008163562061184791, "epoch": 7.0754716981132075, "percentage": 35.38, "elapsed_time": "0:34:37", "remaining_time": "1:03:15", "throughput": 4238.34, "total_tokens": 8806096} {"current_steps": 13505, "total_steps": 38160, "loss": 0.5086, "lr": 0.0008161790818363227, "epoch": 7.078092243186583, "percentage": 35.39, "elapsed_time": "0:34:38", "remaining_time": "1:03:14", "throughput": 4238.28, "total_tokens": 8808624} {"current_steps": 13510, "total_steps": 38160, "loss": 0.5875, "lr": 0.0008160018914131094, "epoch": 7.080712788259958, "percentage": 35.4, "elapsed_time": "0:34:39", "remaining_time": "1:03:13", "throughput": 4238.39, "total_tokens": 8811920} {"current_steps": 13515, "total_steps": 38160, "loss": 0.303, "lr": 0.0008158246348859057, "epoch": 7.083333333333333, "percentage": 35.42, "elapsed_time": "0:34:40", "remaining_time": "1:03:13", "throughput": 4239.04, "total_tokens": 8817904} {"current_steps": 13520, "total_steps": 38160, "loss": 0.4137, "lr": 0.0008156473122917913, "epoch": 7.085953878406708, "percentage": 35.43, "elapsed_time": "0:34:40", "remaining_time": "1:03:12", "throughput": 4238.97, "total_tokens": 8820496} {"current_steps": 13525, "total_steps": 38160, "loss": 0.5168, "lr": 0.0008154699236678604, "epoch": 7.088574423480084, "percentage": 35.44, "elapsed_time": "0:34:41", "remaining_time": "1:03:11", "throughput": 4238.91, "total_tokens": 8823120} {"current_steps": 13530, "total_steps": 38160, "loss": 0.4433, "lr": 0.0008152924690512205, "epoch": 7.091194968553459, "percentage": 35.46, "elapsed_time": "0:34:42", "remaining_time": "1:03:10", "throughput": 4238.97, "total_tokens": 8826192} {"current_steps": 13535, "total_steps": 38160, "loss": 0.4837, "lr": 0.0008151149484789932, "epoch": 7.093815513626835, "percentage": 35.47, "elapsed_time": "0:34:42", "remaining_time": "1:03:09", "throughput": 4239.05, "total_tokens": 8829456} {"current_steps": 13540, "total_steps": 38160, "loss": 0.5701, "lr": 0.0008149373619883136, "epoch": 7.09643605870021, "percentage": 35.48, "elapsed_time": "0:34:43", "remaining_time": "1:03:08", "throughput": 4238.98, "total_tokens": 8832112} {"current_steps": 13545, "total_steps": 38160, "loss": 0.5487, "lr": 0.0008147597096163308, "epoch": 7.099056603773585, "percentage": 35.5, "elapsed_time": "0:34:44", "remaining_time": "1:03:07", "throughput": 4238.95, "total_tokens": 8834832} {"current_steps": 13550, "total_steps": 38160, "loss": 0.5138, "lr": 0.0008145819914002079, "epoch": 7.10167714884696, "percentage": 35.51, "elapsed_time": "0:34:44", "remaining_time": "1:03:06", "throughput": 4239.11, "total_tokens": 8838480} {"current_steps": 13555, "total_steps": 38160, "loss": 0.3967, "lr": 0.0008144042073771214, "epoch": 7.104297693920335, "percentage": 35.52, "elapsed_time": "0:34:45", "remaining_time": "1:03:06", "throughput": 4239.29, "total_tokens": 8842128} {"current_steps": 13560, "total_steps": 38160, "loss": 0.3805, "lr": 0.0008142263575842615, "epoch": 7.1069182389937104, "percentage": 35.53, "elapsed_time": "0:34:46", "remaining_time": "1:03:05", "throughput": 4239.47, "total_tokens": 8845872} {"current_steps": 13565, "total_steps": 38160, "loss": 0.4291, "lr": 0.0008140484420588323, "epoch": 7.109538784067086, "percentage": 35.55, "elapsed_time": "0:34:47", "remaining_time": "1:03:04", "throughput": 4239.47, "total_tokens": 8848720} {"current_steps": 13570, "total_steps": 38160, "loss": 0.3817, "lr": 0.000813870460838052, "epoch": 7.112159329140461, "percentage": 35.56, "elapsed_time": "0:34:48", "remaining_time": "1:03:03", "throughput": 4239.79, "total_tokens": 8853072} {"current_steps": 13575, "total_steps": 38160, "loss": 0.4459, "lr": 0.0008136924139591522, "epoch": 7.114779874213837, "percentage": 35.57, "elapsed_time": "0:34:48", "remaining_time": "1:03:02", "throughput": 4239.85, "total_tokens": 8856208} {"current_steps": 13580, "total_steps": 38160, "loss": 0.4896, "lr": 0.0008135143014593782, "epoch": 7.117400419287212, "percentage": 35.59, "elapsed_time": "0:34:49", "remaining_time": "1:03:02", "throughput": 4239.95, "total_tokens": 8859600} {"current_steps": 13585, "total_steps": 38160, "loss": 0.4631, "lr": 0.000813336123375989, "epoch": 7.120020964360587, "percentage": 35.6, "elapsed_time": "0:34:50", "remaining_time": "1:03:01", "throughput": 4239.94, "total_tokens": 8862576} {"current_steps": 13590, "total_steps": 38160, "loss": 0.4266, "lr": 0.0008131578797462575, "epoch": 7.122641509433962, "percentage": 35.61, "elapsed_time": "0:34:51", "remaining_time": "1:03:00", "throughput": 4240.21, "total_tokens": 8866704} {"current_steps": 13595, "total_steps": 38160, "loss": 0.3733, "lr": 0.0008129795706074703, "epoch": 7.1252620545073375, "percentage": 35.63, "elapsed_time": "0:34:51", "remaining_time": "1:02:59", "throughput": 4240.19, "total_tokens": 8869584} {"current_steps": 13600, "total_steps": 38160, "loss": 0.4099, "lr": 0.0008128011959969277, "epoch": 7.127882599580713, "percentage": 35.64, "elapsed_time": "0:34:52", "remaining_time": "1:02:58", "throughput": 4240.31, "total_tokens": 8873040} {"current_steps": 13605, "total_steps": 38160, "loss": 0.5118, "lr": 0.0008126227559519434, "epoch": 7.130503144654088, "percentage": 35.65, "elapsed_time": "0:34:53", "remaining_time": "1:02:58", "throughput": 4240.36, "total_tokens": 8876208} {"current_steps": 13610, "total_steps": 38160, "loss": 0.4171, "lr": 0.0008124442505098452, "epoch": 7.133123689727463, "percentage": 35.67, "elapsed_time": "0:34:54", "remaining_time": "1:02:57", "throughput": 4240.6, "total_tokens": 8880240} {"current_steps": 13615, "total_steps": 38160, "loss": 0.4278, "lr": 0.0008122656797079744, "epoch": 7.135744234800838, "percentage": 35.68, "elapsed_time": "0:34:54", "remaining_time": "1:02:56", "throughput": 4240.63, "total_tokens": 8883280} {"current_steps": 13620, "total_steps": 38160, "loss": 0.4942, "lr": 0.0008120870435836858, "epoch": 7.138364779874214, "percentage": 35.69, "elapsed_time": "0:34:55", "remaining_time": "1:02:55", "throughput": 4240.64, "total_tokens": 8886192} {"current_steps": 13625, "total_steps": 38160, "loss": 0.3903, "lr": 0.0008119083421743481, "epoch": 7.140985324947589, "percentage": 35.7, "elapsed_time": "0:34:56", "remaining_time": "1:02:54", "throughput": 4240.72, "total_tokens": 8889456} {"current_steps": 13630, "total_steps": 38160, "loss": 0.3926, "lr": 0.0008117295755173437, "epoch": 7.143605870020965, "percentage": 35.72, "elapsed_time": "0:34:56", "remaining_time": "1:02:53", "throughput": 4240.76, "total_tokens": 8892528} {"current_steps": 13635, "total_steps": 38160, "loss": 0.4672, "lr": 0.0008115507436500687, "epoch": 7.14622641509434, "percentage": 35.73, "elapsed_time": "0:34:57", "remaining_time": "1:02:52", "throughput": 4240.86, "total_tokens": 8895824} {"current_steps": 13640, "total_steps": 38160, "loss": 0.4712, "lr": 0.0008113718466099322, "epoch": 7.148846960167715, "percentage": 35.74, "elapsed_time": "0:34:58", "remaining_time": "1:02:52", "throughput": 4240.79, "total_tokens": 8898544} {"current_steps": 13645, "total_steps": 38160, "loss": 0.577, "lr": 0.0008111928844343579, "epoch": 7.15146750524109, "percentage": 35.76, "elapsed_time": "0:34:59", "remaining_time": "1:02:51", "throughput": 4241.02, "total_tokens": 8902480} {"current_steps": 13650, "total_steps": 38160, "loss": 0.5884, "lr": 0.0008110138571607823, "epoch": 7.154088050314465, "percentage": 35.77, "elapsed_time": "0:34:59", "remaining_time": "1:02:50", "throughput": 4241.13, "total_tokens": 8905968} {"current_steps": 13655, "total_steps": 38160, "loss": 0.4214, "lr": 0.0008108347648266563, "epoch": 7.15670859538784, "percentage": 35.78, "elapsed_time": "0:35:00", "remaining_time": "1:02:49", "throughput": 4241.22, "total_tokens": 8909296} {"current_steps": 13660, "total_steps": 38160, "loss": 0.4116, "lr": 0.0008106556074694434, "epoch": 7.159329140461216, "percentage": 35.8, "elapsed_time": "0:35:01", "remaining_time": "1:02:48", "throughput": 4241.11, "total_tokens": 8911792} {"current_steps": 13665, "total_steps": 38160, "loss": 0.4895, "lr": 0.0008104763851266216, "epoch": 7.161949685534591, "percentage": 35.81, "elapsed_time": "0:35:02", "remaining_time": "1:02:48", "throughput": 4241.22, "total_tokens": 8915280} {"current_steps": 13670, "total_steps": 38160, "loss": 0.3875, "lr": 0.0008102970978356822, "epoch": 7.164570230607967, "percentage": 35.82, "elapsed_time": "0:35:02", "remaining_time": "1:02:47", "throughput": 4241.34, "total_tokens": 8918736} {"current_steps": 13675, "total_steps": 38160, "loss": 0.517, "lr": 0.00081011774563413, "epoch": 7.167190775681342, "percentage": 35.84, "elapsed_time": "0:35:03", "remaining_time": "1:02:46", "throughput": 4241.37, "total_tokens": 8921776} {"current_steps": 13680, "total_steps": 38160, "loss": 0.5473, "lr": 0.0008099383285594835, "epoch": 7.169811320754717, "percentage": 35.85, "elapsed_time": "0:35:04", "remaining_time": "1:02:45", "throughput": 4241.47, "total_tokens": 8925264} {"current_steps": 13685, "total_steps": 38160, "loss": 0.5019, "lr": 0.0008097588466492746, "epoch": 7.172431865828092, "percentage": 35.86, "elapsed_time": "0:35:05", "remaining_time": "1:02:44", "throughput": 4241.5, "total_tokens": 8928400} {"current_steps": 13690, "total_steps": 38160, "loss": 0.5617, "lr": 0.0008095792999410487, "epoch": 7.1750524109014675, "percentage": 35.88, "elapsed_time": "0:35:05", "remaining_time": "1:02:43", "throughput": 4241.58, "total_tokens": 8931792} {"current_steps": 13695, "total_steps": 38160, "loss": 0.3799, "lr": 0.0008093996884723653, "epoch": 7.177672955974843, "percentage": 35.89, "elapsed_time": "0:35:06", "remaining_time": "1:02:43", "throughput": 4241.58, "total_tokens": 8934768} {"current_steps": 13700, "total_steps": 38160, "loss": 0.2672, "lr": 0.0008092200122807969, "epoch": 7.180293501048218, "percentage": 35.9, "elapsed_time": "0:35:07", "remaining_time": "1:02:42", "throughput": 4241.56, "total_tokens": 8937552} {"current_steps": 13705, "total_steps": 38160, "loss": 0.5046, "lr": 0.0008090402714039295, "epoch": 7.182914046121593, "percentage": 35.91, "elapsed_time": "0:35:07", "remaining_time": "1:02:41", "throughput": 4241.8, "total_tokens": 8941520} {"current_steps": 13710, "total_steps": 38160, "loss": 0.3223, "lr": 0.0008088604658793632, "epoch": 7.185534591194968, "percentage": 35.93, "elapsed_time": "0:35:08", "remaining_time": "1:02:40", "throughput": 4242.06, "total_tokens": 8945616} {"current_steps": 13715, "total_steps": 38160, "loss": 0.5364, "lr": 0.0008086805957447111, "epoch": 7.188155136268344, "percentage": 35.94, "elapsed_time": "0:35:09", "remaining_time": "1:02:39", "throughput": 4242.07, "total_tokens": 8948592} {"current_steps": 13720, "total_steps": 38160, "loss": 0.4536, "lr": 0.0008085006610376, "epoch": 7.190775681341719, "percentage": 35.95, "elapsed_time": "0:35:10", "remaining_time": "1:02:38", "throughput": 4242.04, "total_tokens": 8951344} {"current_steps": 13725, "total_steps": 38160, "loss": 0.4619, "lr": 0.0008083206617956702, "epoch": 7.193396226415095, "percentage": 35.97, "elapsed_time": "0:35:10", "remaining_time": "1:02:38", "throughput": 4242.22, "total_tokens": 8955056} {"current_steps": 13730, "total_steps": 38160, "loss": 0.3745, "lr": 0.0008081405980565755, "epoch": 7.19601677148847, "percentage": 35.98, "elapsed_time": "0:35:11", "remaining_time": "1:02:37", "throughput": 4242.25, "total_tokens": 8958128} {"current_steps": 13735, "total_steps": 38160, "loss": 0.4136, "lr": 0.0008079604698579829, "epoch": 7.198637316561845, "percentage": 35.99, "elapsed_time": "0:35:12", "remaining_time": "1:02:36", "throughput": 4242.43, "total_tokens": 8961840} {"current_steps": 13740, "total_steps": 38160, "loss": 0.5137, "lr": 0.0008077802772375736, "epoch": 7.20125786163522, "percentage": 36.01, "elapsed_time": "0:35:13", "remaining_time": "1:02:35", "throughput": 4242.51, "total_tokens": 8965040} {"current_steps": 13745, "total_steps": 38160, "loss": 0.4618, "lr": 0.0008076000202330416, "epoch": 7.203878406708595, "percentage": 36.02, "elapsed_time": "0:35:13", "remaining_time": "1:02:35", "throughput": 4242.79, "total_tokens": 8969200} {"current_steps": 13750, "total_steps": 38160, "loss": 0.6347, "lr": 0.0008074196988820945, "epoch": 7.20649895178197, "percentage": 36.03, "elapsed_time": "0:35:14", "remaining_time": "1:02:34", "throughput": 4242.9, "total_tokens": 8972624} {"current_steps": 13755, "total_steps": 38160, "loss": 0.4528, "lr": 0.0008072393132224539, "epoch": 7.209119496855346, "percentage": 36.05, "elapsed_time": "0:35:15", "remaining_time": "1:02:33", "throughput": 4242.94, "total_tokens": 8975728} {"current_steps": 13760, "total_steps": 38160, "loss": 0.5816, "lr": 0.0008070588632918541, "epoch": 7.211740041928721, "percentage": 36.06, "elapsed_time": "0:35:16", "remaining_time": "1:02:32", "throughput": 4243.08, "total_tokens": 8979312} {"current_steps": 13765, "total_steps": 38160, "loss": 0.4455, "lr": 0.000806878349128043, "epoch": 7.214360587002097, "percentage": 36.07, "elapsed_time": "0:35:16", "remaining_time": "1:02:31", "throughput": 4243.04, "total_tokens": 8982032} {"current_steps": 13770, "total_steps": 38160, "loss": 0.4512, "lr": 0.0008066977707687826, "epoch": 7.216981132075472, "percentage": 36.08, "elapsed_time": "0:35:17", "remaining_time": "1:02:30", "throughput": 4242.93, "total_tokens": 8984432} {"current_steps": 13775, "total_steps": 38160, "loss": 0.5145, "lr": 0.0008065171282518473, "epoch": 7.219601677148847, "percentage": 36.1, "elapsed_time": "0:35:18", "remaining_time": "1:02:29", "throughput": 4243.23, "total_tokens": 8988624} {"current_steps": 13780, "total_steps": 38160, "loss": 0.6847, "lr": 0.0008063364216150257, "epoch": 7.222222222222222, "percentage": 36.11, "elapsed_time": "0:35:19", "remaining_time": "1:02:29", "throughput": 4243.27, "total_tokens": 8991664} {"current_steps": 13785, "total_steps": 38160, "loss": 0.4462, "lr": 0.0008061556508961199, "epoch": 7.2248427672955975, "percentage": 36.12, "elapsed_time": "0:35:19", "remaining_time": "1:02:28", "throughput": 4243.37, "total_tokens": 8994928} {"current_steps": 13790, "total_steps": 38160, "loss": 0.613, "lr": 0.0008059748161329443, "epoch": 7.227463312368973, "percentage": 36.14, "elapsed_time": "0:35:20", "remaining_time": "1:02:27", "throughput": 4243.37, "total_tokens": 8997872} {"current_steps": 13795, "total_steps": 38160, "loss": 0.4907, "lr": 0.0008057939173633282, "epoch": 7.230083857442348, "percentage": 36.15, "elapsed_time": "0:35:21", "remaining_time": "1:02:26", "throughput": 4243.69, "total_tokens": 9002384} {"current_steps": 13800, "total_steps": 38160, "loss": 0.3982, "lr": 0.0008056129546251132, "epoch": 7.232704402515723, "percentage": 36.16, "elapsed_time": "0:35:22", "remaining_time": "1:02:25", "throughput": 4243.7, "total_tokens": 9005296} {"current_steps": 13805, "total_steps": 38160, "loss": 0.515, "lr": 0.0008054319279561546, "epoch": 7.235324947589098, "percentage": 36.18, "elapsed_time": "0:35:22", "remaining_time": "1:02:25", "throughput": 4244.12, "total_tokens": 9009968} {"current_steps": 13810, "total_steps": 38160, "loss": 0.5005, "lr": 0.0008052508373943214, "epoch": 7.237945492662474, "percentage": 36.19, "elapsed_time": "0:35:23", "remaining_time": "1:02:24", "throughput": 4244.33, "total_tokens": 9013776} {"current_steps": 13815, "total_steps": 38160, "loss": 0.3898, "lr": 0.0008050696829774954, "epoch": 7.240566037735849, "percentage": 36.2, "elapsed_time": "0:35:24", "remaining_time": "1:02:23", "throughput": 4244.42, "total_tokens": 9017072} {"current_steps": 13820, "total_steps": 38160, "loss": 0.7093, "lr": 0.0008048884647435721, "epoch": 7.243186582809225, "percentage": 36.22, "elapsed_time": "0:35:25", "remaining_time": "1:02:22", "throughput": 4244.47, "total_tokens": 9020272} {"current_steps": 13825, "total_steps": 38160, "loss": 0.4195, "lr": 0.0008047071827304604, "epoch": 7.2458071278826, "percentage": 36.23, "elapsed_time": "0:35:26", "remaining_time": "1:02:22", "throughput": 4244.74, "total_tokens": 9024528} {"current_steps": 13830, "total_steps": 38160, "loss": 0.3952, "lr": 0.0008045258369760824, "epoch": 7.248427672955975, "percentage": 36.24, "elapsed_time": "0:35:26", "remaining_time": "1:02:21", "throughput": 4244.74, "total_tokens": 9027376} {"current_steps": 13835, "total_steps": 38160, "loss": 0.5103, "lr": 0.0008043444275183735, "epoch": 7.25104821802935, "percentage": 36.26, "elapsed_time": "0:35:27", "remaining_time": "1:02:20", "throughput": 4244.85, "total_tokens": 9030832} {"current_steps": 13840, "total_steps": 38160, "loss": 0.5963, "lr": 0.0008041629543952824, "epoch": 7.253668763102725, "percentage": 36.27, "elapsed_time": "0:35:28", "remaining_time": "1:02:19", "throughput": 4244.91, "total_tokens": 9034064} {"current_steps": 13845, "total_steps": 38160, "loss": 0.4463, "lr": 0.0008039814176447714, "epoch": 7.2562893081761, "percentage": 36.28, "elapsed_time": "0:35:28", "remaining_time": "1:02:18", "throughput": 4244.94, "total_tokens": 9037072} {"current_steps": 13850, "total_steps": 38160, "loss": 0.3723, "lr": 0.0008037998173048157, "epoch": 7.258909853249476, "percentage": 36.29, "elapsed_time": "0:35:29", "remaining_time": "1:02:18", "throughput": 4245.06, "total_tokens": 9040624} {"current_steps": 13855, "total_steps": 38160, "loss": 0.4349, "lr": 0.0008036181534134044, "epoch": 7.261530398322851, "percentage": 36.31, "elapsed_time": "0:35:30", "remaining_time": "1:02:17", "throughput": 4245.11, "total_tokens": 9043792} {"current_steps": 13860, "total_steps": 38160, "loss": 0.4474, "lr": 0.0008034364260085391, "epoch": 7.264150943396227, "percentage": 36.32, "elapsed_time": "0:35:31", "remaining_time": "1:02:16", "throughput": 4245.08, "total_tokens": 9046640} {"current_steps": 13865, "total_steps": 38160, "loss": 0.4617, "lr": 0.0008032546351282353, "epoch": 7.266771488469602, "percentage": 36.33, "elapsed_time": "0:35:31", "remaining_time": "1:02:15", "throughput": 4245.02, "total_tokens": 9049328} {"current_steps": 13870, "total_steps": 38160, "loss": 0.4862, "lr": 0.0008030727808105215, "epoch": 7.269392033542977, "percentage": 36.35, "elapsed_time": "0:35:32", "remaining_time": "1:02:14", "throughput": 4245.16, "total_tokens": 9052944} {"current_steps": 13875, "total_steps": 38160, "loss": 0.3041, "lr": 0.0008028908630934397, "epoch": 7.272012578616352, "percentage": 36.36, "elapsed_time": "0:35:33", "remaining_time": "1:02:13", "throughput": 4245.03, "total_tokens": 9055344} {"current_steps": 13880, "total_steps": 38160, "loss": 0.4101, "lr": 0.0008027088820150447, "epoch": 7.2746331236897275, "percentage": 36.37, "elapsed_time": "0:35:33", "remaining_time": "1:02:12", "throughput": 4245.17, "total_tokens": 9058928} {"current_steps": 13885, "total_steps": 38160, "loss": 0.558, "lr": 0.0008025268376134054, "epoch": 7.277253668763103, "percentage": 36.39, "elapsed_time": "0:35:34", "remaining_time": "1:02:12", "throughput": 4245.3, "total_tokens": 9062384} {"current_steps": 13890, "total_steps": 38160, "loss": 0.4016, "lr": 0.0008023447299266027, "epoch": 7.279874213836478, "percentage": 36.4, "elapsed_time": "0:35:35", "remaining_time": "1:02:11", "throughput": 4245.52, "total_tokens": 9066288} {"current_steps": 13895, "total_steps": 38160, "loss": 0.483, "lr": 0.0008021625589927321, "epoch": 7.282494758909853, "percentage": 36.41, "elapsed_time": "0:35:36", "remaining_time": "1:02:10", "throughput": 4245.67, "total_tokens": 9070000} {"current_steps": 13900, "total_steps": 38160, "loss": 0.4258, "lr": 0.0008019803248499013, "epoch": 7.285115303983228, "percentage": 36.43, "elapsed_time": "0:35:36", "remaining_time": "1:02:09", "throughput": 4245.67, "total_tokens": 9072784} {"current_steps": 13905, "total_steps": 38160, "loss": 0.3632, "lr": 0.0008017980275362318, "epoch": 7.287735849056604, "percentage": 36.44, "elapsed_time": "0:35:37", "remaining_time": "1:02:08", "throughput": 4245.66, "total_tokens": 9075632} {"current_steps": 13910, "total_steps": 38160, "loss": 0.5909, "lr": 0.000801615667089858, "epoch": 7.290356394129979, "percentage": 36.45, "elapsed_time": "0:35:38", "remaining_time": "1:02:07", "throughput": 4245.65, "total_tokens": 9078448} {"current_steps": 13915, "total_steps": 38160, "loss": 0.4789, "lr": 0.0008014332435489275, "epoch": 7.2929769392033545, "percentage": 36.46, "elapsed_time": "0:35:39", "remaining_time": "1:02:07", "throughput": 4245.87, "total_tokens": 9082352} {"current_steps": 13920, "total_steps": 38160, "loss": 0.5357, "lr": 0.0008012507569516016, "epoch": 7.29559748427673, "percentage": 36.48, "elapsed_time": "0:35:39", "remaining_time": "1:02:06", "throughput": 4245.86, "total_tokens": 9085104} {"current_steps": 13925, "total_steps": 38160, "loss": 0.4528, "lr": 0.0008010682073360541, "epoch": 7.298218029350105, "percentage": 36.49, "elapsed_time": "0:35:40", "remaining_time": "1:02:05", "throughput": 4245.82, "total_tokens": 9087856} {"current_steps": 13930, "total_steps": 38160, "loss": 0.3554, "lr": 0.0008008855947404724, "epoch": 7.30083857442348, "percentage": 36.5, "elapsed_time": "0:35:41", "remaining_time": "1:02:04", "throughput": 4245.93, "total_tokens": 9091216} {"current_steps": 13935, "total_steps": 38160, "loss": 0.4548, "lr": 0.000800702919203057, "epoch": 7.303459119496855, "percentage": 36.52, "elapsed_time": "0:35:41", "remaining_time": "1:02:03", "throughput": 4245.97, "total_tokens": 9094256} {"current_steps": 13940, "total_steps": 38160, "loss": 0.3648, "lr": 0.0008005201807620214, "epoch": 7.30607966457023, "percentage": 36.53, "elapsed_time": "0:35:42", "remaining_time": "1:02:02", "throughput": 4246.21, "total_tokens": 9098192} {"current_steps": 13945, "total_steps": 38160, "loss": 0.4895, "lr": 0.0008003373794555926, "epoch": 7.308700209643606, "percentage": 36.54, "elapsed_time": "0:35:43", "remaining_time": "1:02:01", "throughput": 4246.06, "total_tokens": 9100432} {"current_steps": 13950, "total_steps": 38160, "loss": 0.4409, "lr": 0.0008001545153220104, "epoch": 7.311320754716981, "percentage": 36.56, "elapsed_time": "0:35:44", "remaining_time": "1:02:00", "throughput": 4246.2, "total_tokens": 9104016} {"current_steps": 13955, "total_steps": 38160, "loss": 0.8389, "lr": 0.000799971588399528, "epoch": 7.313941299790357, "percentage": 36.57, "elapsed_time": "0:35:44", "remaining_time": "1:02:00", "throughput": 4246.24, "total_tokens": 9107088} {"current_steps": 13960, "total_steps": 38160, "loss": 0.55, "lr": 0.0007997885987264115, "epoch": 7.316561844863732, "percentage": 36.58, "elapsed_time": "0:35:45", "remaining_time": "1:01:59", "throughput": 4246.27, "total_tokens": 9110064} {"current_steps": 13965, "total_steps": 38160, "loss": 0.5204, "lr": 0.0007996055463409403, "epoch": 7.319182389937107, "percentage": 36.6, "elapsed_time": "0:35:46", "remaining_time": "1:01:58", "throughput": 4246.28, "total_tokens": 9113040} {"current_steps": 13970, "total_steps": 38160, "loss": 0.4462, "lr": 0.000799422431281407, "epoch": 7.321802935010482, "percentage": 36.61, "elapsed_time": "0:35:46", "remaining_time": "1:01:57", "throughput": 4246.32, "total_tokens": 9116208} {"current_steps": 13975, "total_steps": 38160, "loss": 0.4334, "lr": 0.000799239253586117, "epoch": 7.3244234800838575, "percentage": 36.62, "elapsed_time": "0:35:47", "remaining_time": "1:01:56", "throughput": 4246.35, "total_tokens": 9119280} {"current_steps": 13980, "total_steps": 38160, "loss": 0.4759, "lr": 0.0007990560132933891, "epoch": 7.327044025157233, "percentage": 36.64, "elapsed_time": "0:35:48", "remaining_time": "1:01:56", "throughput": 4246.75, "total_tokens": 9124048} {"current_steps": 13985, "total_steps": 38160, "loss": 0.4615, "lr": 0.0007988727104415549, "epoch": 7.329664570230608, "percentage": 36.65, "elapsed_time": "0:35:49", "remaining_time": "1:01:55", "throughput": 4246.99, "total_tokens": 9128080} {"current_steps": 13990, "total_steps": 38160, "loss": 0.4807, "lr": 0.0007986893450689594, "epoch": 7.332285115303983, "percentage": 36.66, "elapsed_time": "0:35:50", "remaining_time": "1:01:54", "throughput": 4247.02, "total_tokens": 9131120} {"current_steps": 13995, "total_steps": 38160, "loss": 0.5207, "lr": 0.0007985059172139606, "epoch": 7.334905660377358, "percentage": 36.67, "elapsed_time": "0:35:50", "remaining_time": "1:01:53", "throughput": 4246.97, "total_tokens": 9133776} {"current_steps": 14000, "total_steps": 38160, "loss": 0.5255, "lr": 0.0007983224269149296, "epoch": 7.337526205450734, "percentage": 36.69, "elapsed_time": "0:35:51", "remaining_time": "1:01:52", "throughput": 4247.19, "total_tokens": 9137680} {"current_steps": 14005, "total_steps": 38160, "loss": 0.4007, "lr": 0.00079813887421025, "epoch": 7.340146750524109, "percentage": 36.7, "elapsed_time": "0:35:52", "remaining_time": "1:01:51", "throughput": 4247.29, "total_tokens": 9140912} {"current_steps": 14010, "total_steps": 38160, "loss": 0.432, "lr": 0.0007979552591383195, "epoch": 7.3427672955974845, "percentage": 36.71, "elapsed_time": "0:35:52", "remaining_time": "1:01:51", "throughput": 4247.41, "total_tokens": 9144432} {"current_steps": 14015, "total_steps": 38160, "loss": 0.5337, "lr": 0.0007977715817375481, "epoch": 7.34538784067086, "percentage": 36.73, "elapsed_time": "0:35:53", "remaining_time": "1:01:50", "throughput": 4247.45, "total_tokens": 9147504} {"current_steps": 14020, "total_steps": 38160, "loss": 0.4339, "lr": 0.0007975878420463588, "epoch": 7.348008385744235, "percentage": 36.74, "elapsed_time": "0:35:54", "remaining_time": "1:01:49", "throughput": 4247.42, "total_tokens": 9150256} {"current_steps": 14025, "total_steps": 38160, "loss": 0.4559, "lr": 0.0007974040401031882, "epoch": 7.35062893081761, "percentage": 36.75, "elapsed_time": "0:35:55", "remaining_time": "1:01:48", "throughput": 4247.5, "total_tokens": 9153552} {"current_steps": 14030, "total_steps": 38160, "loss": 0.3517, "lr": 0.0007972201759464851, "epoch": 7.353249475890985, "percentage": 36.77, "elapsed_time": "0:35:55", "remaining_time": "1:01:47", "throughput": 4247.55, "total_tokens": 9156624} {"current_steps": 14035, "total_steps": 38160, "loss": 0.4204, "lr": 0.0007970362496147121, "epoch": 7.35587002096436, "percentage": 36.78, "elapsed_time": "0:35:56", "remaining_time": "1:01:46", "throughput": 4247.62, "total_tokens": 9159792} {"current_steps": 14040, "total_steps": 38160, "loss": 0.4115, "lr": 0.0007968522611463447, "epoch": 7.3584905660377355, "percentage": 36.79, "elapsed_time": "0:35:57", "remaining_time": "1:01:45", "throughput": 4247.7, "total_tokens": 9162960} {"current_steps": 14045, "total_steps": 38160, "loss": 0.4692, "lr": 0.0007966682105798708, "epoch": 7.361111111111111, "percentage": 36.81, "elapsed_time": "0:35:57", "remaining_time": "1:01:45", "throughput": 4247.82, "total_tokens": 9166416} {"current_steps": 14050, "total_steps": 38160, "loss": 0.5502, "lr": 0.0007964840979537918, "epoch": 7.363731656184487, "percentage": 36.82, "elapsed_time": "0:35:58", "remaining_time": "1:01:44", "throughput": 4247.91, "total_tokens": 9169712} {"current_steps": 14055, "total_steps": 38160, "loss": 0.4286, "lr": 0.0007962999233066219, "epoch": 7.366352201257862, "percentage": 36.83, "elapsed_time": "0:35:59", "remaining_time": "1:01:43", "throughput": 4247.82, "total_tokens": 9172208} {"current_steps": 14060, "total_steps": 38160, "loss": 0.4556, "lr": 0.0007961156866768885, "epoch": 7.368972746331237, "percentage": 36.84, "elapsed_time": "0:35:59", "remaining_time": "1:01:42", "throughput": 4247.73, "total_tokens": 9174640} {"current_steps": 14065, "total_steps": 38160, "loss": 0.4601, "lr": 0.0007959313881031317, "epoch": 7.371593291404612, "percentage": 36.86, "elapsed_time": "0:36:00", "remaining_time": "1:01:41", "throughput": 4247.91, "total_tokens": 9178416} {"current_steps": 14070, "total_steps": 38160, "loss": 0.4582, "lr": 0.0007957470276239048, "epoch": 7.3742138364779874, "percentage": 36.87, "elapsed_time": "0:36:01", "remaining_time": "1:01:40", "throughput": 4247.85, "total_tokens": 9181040} {"current_steps": 14075, "total_steps": 38160, "loss": 0.4726, "lr": 0.0007955626052777735, "epoch": 7.376834381551363, "percentage": 36.88, "elapsed_time": "0:36:02", "remaining_time": "1:01:39", "throughput": 4247.88, "total_tokens": 9184048} {"current_steps": 14080, "total_steps": 38160, "loss": 0.3861, "lr": 0.0007953781211033173, "epoch": 7.379454926624738, "percentage": 36.9, "elapsed_time": "0:36:02", "remaining_time": "1:01:38", "throughput": 4247.98, "total_tokens": 9187344} {"current_steps": 14085, "total_steps": 38160, "loss": 0.3606, "lr": 0.000795193575139128, "epoch": 7.382075471698113, "percentage": 36.91, "elapsed_time": "0:36:03", "remaining_time": "1:01:37", "throughput": 4248.07, "total_tokens": 9190608} {"current_steps": 14090, "total_steps": 38160, "loss": 0.414, "lr": 0.0007950089674238106, "epoch": 7.384696016771488, "percentage": 36.92, "elapsed_time": "0:36:04", "remaining_time": "1:01:37", "throughput": 4248.2, "total_tokens": 9194160} {"current_steps": 14095, "total_steps": 38160, "loss": 0.4101, "lr": 0.0007948242979959828, "epoch": 7.387316561844864, "percentage": 36.94, "elapsed_time": "0:36:04", "remaining_time": "1:01:36", "throughput": 4248.13, "total_tokens": 9196688} {"current_steps": 14100, "total_steps": 38160, "loss": 0.4712, "lr": 0.0007946395668942754, "epoch": 7.389937106918239, "percentage": 36.95, "elapsed_time": "0:36:05", "remaining_time": "1:01:35", "throughput": 4248.43, "total_tokens": 9200880} {"current_steps": 14105, "total_steps": 38160, "loss": 0.4208, "lr": 0.0007944547741573319, "epoch": 7.3925576519916145, "percentage": 36.96, "elapsed_time": "0:36:06", "remaining_time": "1:01:34", "throughput": 4248.61, "total_tokens": 9204720} {"current_steps": 14110, "total_steps": 38160, "loss": 0.4418, "lr": 0.0007942699198238091, "epoch": 7.39517819706499, "percentage": 36.98, "elapsed_time": "0:36:07", "remaining_time": "1:01:33", "throughput": 4248.52, "total_tokens": 9207184} {"current_steps": 14115, "total_steps": 38160, "loss": 0.4567, "lr": 0.0007940850039323763, "epoch": 7.397798742138365, "percentage": 36.99, "elapsed_time": "0:36:07", "remaining_time": "1:01:32", "throughput": 4248.54, "total_tokens": 9210224} {"current_steps": 14120, "total_steps": 38160, "loss": 0.3753, "lr": 0.0007939000265217156, "epoch": 7.40041928721174, "percentage": 37.0, "elapsed_time": "0:36:08", "remaining_time": "1:01:32", "throughput": 4248.69, "total_tokens": 9213776} {"current_steps": 14125, "total_steps": 38160, "loss": 0.474, "lr": 0.0007937149876305226, "epoch": 7.403039832285115, "percentage": 37.02, "elapsed_time": "0:36:09", "remaining_time": "1:01:31", "throughput": 4248.61, "total_tokens": 9216368} {"current_steps": 14130, "total_steps": 38160, "loss": 0.69, "lr": 0.000793529887297505, "epoch": 7.40566037735849, "percentage": 37.03, "elapsed_time": "0:36:10", "remaining_time": "1:01:30", "throughput": 4248.8, "total_tokens": 9220112} {"current_steps": 14135, "total_steps": 38160, "loss": 0.4839, "lr": 0.0007933447255613835, "epoch": 7.4082809224318655, "percentage": 37.04, "elapsed_time": "0:36:10", "remaining_time": "1:01:29", "throughput": 4248.81, "total_tokens": 9223120} {"current_steps": 14140, "total_steps": 38160, "loss": 0.5661, "lr": 0.0007931595024608924, "epoch": 7.410901467505241, "percentage": 37.05, "elapsed_time": "0:36:11", "remaining_time": "1:01:28", "throughput": 4248.75, "total_tokens": 9225744} {"current_steps": 14145, "total_steps": 38160, "loss": 0.4063, "lr": 0.0007929742180347776, "epoch": 7.413522012578617, "percentage": 37.07, "elapsed_time": "0:36:12", "remaining_time": "1:01:27", "throughput": 4248.89, "total_tokens": 9229200} {"current_steps": 14150, "total_steps": 38160, "loss": 0.4953, "lr": 0.0007927888723217991, "epoch": 7.416142557651992, "percentage": 37.08, "elapsed_time": "0:36:12", "remaining_time": "1:01:27", "throughput": 4249.02, "total_tokens": 9232752} {"current_steps": 14155, "total_steps": 38160, "loss": 0.3778, "lr": 0.0007926034653607288, "epoch": 7.418763102725367, "percentage": 37.09, "elapsed_time": "0:36:14", "remaining_time": "1:01:26", "throughput": 4249.56, "total_tokens": 9238704} {"current_steps": 14160, "total_steps": 38160, "loss": 0.6838, "lr": 0.0007924179971903516, "epoch": 7.421383647798742, "percentage": 37.11, "elapsed_time": "0:36:14", "remaining_time": "1:01:25", "throughput": 4249.57, "total_tokens": 9241648} {"current_steps": 14165, "total_steps": 38160, "loss": 0.4638, "lr": 0.0007922324678494655, "epoch": 7.424004192872117, "percentage": 37.12, "elapsed_time": "0:36:15", "remaining_time": "1:01:25", "throughput": 4249.65, "total_tokens": 9244944} {"current_steps": 14170, "total_steps": 38160, "loss": 0.4263, "lr": 0.0007920468773768811, "epoch": 7.426624737945493, "percentage": 37.13, "elapsed_time": "0:36:16", "remaining_time": "1:01:24", "throughput": 4249.72, "total_tokens": 9248144} {"current_steps": 14175, "total_steps": 38160, "loss": 0.5039, "lr": 0.0007918612258114217, "epoch": 7.429245283018868, "percentage": 37.15, "elapsed_time": "0:36:16", "remaining_time": "1:01:23", "throughput": 4249.86, "total_tokens": 9251792} {"current_steps": 14180, "total_steps": 38160, "loss": 0.527, "lr": 0.0007916755131919238, "epoch": 7.431865828092243, "percentage": 37.16, "elapsed_time": "0:36:17", "remaining_time": "1:01:22", "throughput": 4249.98, "total_tokens": 9255248} {"current_steps": 14185, "total_steps": 38160, "loss": 0.4411, "lr": 0.000791489739557236, "epoch": 7.434486373165618, "percentage": 37.17, "elapsed_time": "0:36:18", "remaining_time": "1:01:21", "throughput": 4249.95, "total_tokens": 9258096} {"current_steps": 14190, "total_steps": 38160, "loss": 0.4667, "lr": 0.0007913039049462203, "epoch": 7.437106918238994, "percentage": 37.19, "elapsed_time": "0:36:19", "remaining_time": "1:01:20", "throughput": 4249.9, "total_tokens": 9260816} {"current_steps": 14195, "total_steps": 38160, "loss": 0.417, "lr": 0.0007911180093977511, "epoch": 7.439727463312369, "percentage": 37.2, "elapsed_time": "0:36:19", "remaining_time": "1:01:19", "throughput": 4249.86, "total_tokens": 9263472} {"current_steps": 14200, "total_steps": 38160, "loss": 0.4111, "lr": 0.0007909320529507154, "epoch": 7.4423480083857445, "percentage": 37.21, "elapsed_time": "0:36:20", "remaining_time": "1:01:19", "throughput": 4249.95, "total_tokens": 9266832} {"current_steps": 14205, "total_steps": 38160, "loss": 0.4715, "lr": 0.0007907460356440134, "epoch": 7.44496855345912, "percentage": 37.22, "elapsed_time": "0:36:21", "remaining_time": "1:01:18", "throughput": 4250.11, "total_tokens": 9270512} {"current_steps": 14210, "total_steps": 38160, "loss": 0.5031, "lr": 0.0007905599575165577, "epoch": 7.447589098532495, "percentage": 37.24, "elapsed_time": "0:36:21", "remaining_time": "1:01:17", "throughput": 4250.25, "total_tokens": 9274032} {"current_steps": 14215, "total_steps": 38160, "loss": 0.4235, "lr": 0.0007903738186072739, "epoch": 7.45020964360587, "percentage": 37.25, "elapsed_time": "0:36:22", "remaining_time": "1:01:16", "throughput": 4250.21, "total_tokens": 9276720} {"current_steps": 14220, "total_steps": 38160, "loss": 0.3976, "lr": 0.0007901876189550999, "epoch": 7.452830188679245, "percentage": 37.26, "elapsed_time": "0:36:23", "remaining_time": "1:01:15", "throughput": 4250.19, "total_tokens": 9279504} {"current_steps": 14225, "total_steps": 38160, "loss": 0.4048, "lr": 0.0007900013585989867, "epoch": 7.45545073375262, "percentage": 37.28, "elapsed_time": "0:36:24", "remaining_time": "1:01:14", "throughput": 4250.32, "total_tokens": 9282864} {"current_steps": 14230, "total_steps": 38160, "loss": 0.5498, "lr": 0.0007898150375778979, "epoch": 7.4580712788259955, "percentage": 37.29, "elapsed_time": "0:36:24", "remaining_time": "1:01:13", "throughput": 4250.26, "total_tokens": 9285520} {"current_steps": 14235, "total_steps": 38160, "loss": 0.4932, "lr": 0.0007896286559308095, "epoch": 7.460691823899371, "percentage": 37.3, "elapsed_time": "0:36:25", "remaining_time": "1:01:13", "throughput": 4250.53, "total_tokens": 9289840} {"current_steps": 14240, "total_steps": 38160, "loss": 0.3892, "lr": 0.0007894422136967105, "epoch": 7.463312368972747, "percentage": 37.32, "elapsed_time": "0:36:26", "remaining_time": "1:01:12", "throughput": 4250.37, "total_tokens": 9292016} {"current_steps": 14245, "total_steps": 38160, "loss": 0.4387, "lr": 0.0007892557109146026, "epoch": 7.465932914046122, "percentage": 37.33, "elapsed_time": "0:36:26", "remaining_time": "1:01:11", "throughput": 4250.46, "total_tokens": 9295312} {"current_steps": 14250, "total_steps": 38160, "loss": 0.5697, "lr": 0.0007890691476234999, "epoch": 7.468553459119497, "percentage": 37.34, "elapsed_time": "0:36:27", "remaining_time": "1:01:10", "throughput": 4250.41, "total_tokens": 9298032} {"current_steps": 14255, "total_steps": 38160, "loss": 0.5247, "lr": 0.0007888825238624294, "epoch": 7.471174004192872, "percentage": 37.36, "elapsed_time": "0:36:28", "remaining_time": "1:01:09", "throughput": 4250.55, "total_tokens": 9301552} {"current_steps": 14260, "total_steps": 38160, "loss": 0.3697, "lr": 0.0007886958396704307, "epoch": 7.473794549266247, "percentage": 37.37, "elapsed_time": "0:36:29", "remaining_time": "1:01:08", "throughput": 4250.59, "total_tokens": 9304688} {"current_steps": 14265, "total_steps": 38160, "loss": 0.5378, "lr": 0.0007885090950865559, "epoch": 7.476415094339623, "percentage": 37.38, "elapsed_time": "0:36:29", "remaining_time": "1:01:07", "throughput": 4250.6, "total_tokens": 9307664} {"current_steps": 14270, "total_steps": 38160, "loss": 0.4533, "lr": 0.0007883222901498701, "epoch": 7.479035639412998, "percentage": 37.4, "elapsed_time": "0:36:30", "remaining_time": "1:01:07", "throughput": 4250.62, "total_tokens": 9310736} {"current_steps": 14275, "total_steps": 38160, "loss": 0.4625, "lr": 0.0007881354248994503, "epoch": 7.481656184486373, "percentage": 37.41, "elapsed_time": "0:36:31", "remaining_time": "1:01:06", "throughput": 4250.92, "total_tokens": 9315056} {"current_steps": 14280, "total_steps": 38160, "loss": 0.4263, "lr": 0.0007879484993743869, "epoch": 7.484276729559748, "percentage": 37.42, "elapsed_time": "0:36:32", "remaining_time": "1:01:05", "throughput": 4251.07, "total_tokens": 9318672} {"current_steps": 14285, "total_steps": 38160, "loss": 0.5667, "lr": 0.0007877615136137827, "epoch": 7.486897274633124, "percentage": 37.43, "elapsed_time": "0:36:33", "remaining_time": "1:01:05", "throughput": 4251.69, "total_tokens": 9325040} {"current_steps": 14290, "total_steps": 38160, "loss": 0.3758, "lr": 0.0007875744676567527, "epoch": 7.489517819706499, "percentage": 37.45, "elapsed_time": "0:36:34", "remaining_time": "1:01:04", "throughput": 4251.79, "total_tokens": 9328496} {"current_steps": 14295, "total_steps": 38160, "loss": 0.4862, "lr": 0.0007873873615424248, "epoch": 7.4921383647798745, "percentage": 37.46, "elapsed_time": "0:36:34", "remaining_time": "1:01:04", "throughput": 4251.89, "total_tokens": 9331824} {"current_steps": 14300, "total_steps": 38160, "loss": 0.3472, "lr": 0.0007872001953099396, "epoch": 7.49475890985325, "percentage": 37.47, "elapsed_time": "0:36:35", "remaining_time": "1:01:03", "throughput": 4251.89, "total_tokens": 9334768} {"current_steps": 14305, "total_steps": 38160, "loss": 0.5203, "lr": 0.0007870129689984501, "epoch": 7.497379454926625, "percentage": 37.49, "elapsed_time": "0:36:36", "remaining_time": "1:01:02", "throughput": 4251.88, "total_tokens": 9337616} {"current_steps": 14310, "total_steps": 38160, "loss": 0.523, "lr": 0.000786825682647122, "epoch": 7.5, "percentage": 37.5, "elapsed_time": "0:36:36", "remaining_time": "1:01:01", "throughput": 4251.85, "total_tokens": 9340304} {"current_steps": 14315, "total_steps": 38160, "loss": 0.5174, "lr": 0.0007866383362951332, "epoch": 7.502620545073375, "percentage": 37.51, "elapsed_time": "0:36:37", "remaining_time": "1:01:00", "throughput": 4251.9, "total_tokens": 9343440} {"current_steps": 14320, "total_steps": 38160, "loss": 0.5171, "lr": 0.0007864509299816746, "epoch": 7.50524109014675, "percentage": 37.53, "elapsed_time": "0:36:38", "remaining_time": "1:00:59", "throughput": 4252.0, "total_tokens": 9346864} {"current_steps": 14325, "total_steps": 38160, "loss": 0.5289, "lr": 0.0007862634637459496, "epoch": 7.5078616352201255, "percentage": 37.54, "elapsed_time": "0:36:38", "remaining_time": "1:00:58", "throughput": 4252.14, "total_tokens": 9350384} {"current_steps": 14330, "total_steps": 38160, "loss": 0.4157, "lr": 0.0007860759376271737, "epoch": 7.510482180293501, "percentage": 37.55, "elapsed_time": "0:36:39", "remaining_time": "1:00:58", "throughput": 4252.33, "total_tokens": 9354256} {"current_steps": 14335, "total_steps": 38160, "loss": 0.411, "lr": 0.0007858883516645755, "epoch": 7.513102725366876, "percentage": 37.57, "elapsed_time": "0:36:40", "remaining_time": "1:00:57", "throughput": 4252.4, "total_tokens": 9357456} {"current_steps": 14340, "total_steps": 38160, "loss": 0.4099, "lr": 0.0007857007058973957, "epoch": 7.515723270440252, "percentage": 37.58, "elapsed_time": "0:36:41", "remaining_time": "1:00:56", "throughput": 4252.43, "total_tokens": 9360560} {"current_steps": 14345, "total_steps": 38160, "loss": 0.4908, "lr": 0.0007855130003648876, "epoch": 7.518343815513627, "percentage": 37.59, "elapsed_time": "0:36:41", "remaining_time": "1:00:55", "throughput": 4252.37, "total_tokens": 9363248} {"current_steps": 14350, "total_steps": 38160, "loss": 0.39, "lr": 0.0007853252351063171, "epoch": 7.520964360587002, "percentage": 37.6, "elapsed_time": "0:36:42", "remaining_time": "1:00:54", "throughput": 4252.54, "total_tokens": 9367088} {"current_steps": 14355, "total_steps": 38160, "loss": 0.4103, "lr": 0.0007851374101609627, "epoch": 7.523584905660377, "percentage": 37.62, "elapsed_time": "0:36:43", "remaining_time": "1:00:54", "throughput": 4252.75, "total_tokens": 9370960} {"current_steps": 14360, "total_steps": 38160, "loss": 0.4452, "lr": 0.000784949525568115, "epoch": 7.526205450733753, "percentage": 37.63, "elapsed_time": "0:36:44", "remaining_time": "1:00:53", "throughput": 4252.77, "total_tokens": 9373936} {"current_steps": 14365, "total_steps": 38160, "loss": 0.3592, "lr": 0.0007847615813670776, "epoch": 7.528825995807128, "percentage": 37.64, "elapsed_time": "0:36:44", "remaining_time": "1:00:52", "throughput": 4252.86, "total_tokens": 9377264} {"current_steps": 14370, "total_steps": 38160, "loss": 0.5298, "lr": 0.000784573577597166, "epoch": 7.531446540880503, "percentage": 37.66, "elapsed_time": "0:36:45", "remaining_time": "1:00:51", "throughput": 4252.87, "total_tokens": 9380240} {"current_steps": 14375, "total_steps": 38160, "loss": 0.3196, "lr": 0.0007843855142977086, "epoch": 7.534067085953878, "percentage": 37.67, "elapsed_time": "0:36:46", "remaining_time": "1:00:51", "throughput": 4253.26, "total_tokens": 9385136} {"current_steps": 14380, "total_steps": 38160, "loss": 0.5362, "lr": 0.000784197391508046, "epoch": 7.536687631027254, "percentage": 37.68, "elapsed_time": "0:36:47", "remaining_time": "1:00:50", "throughput": 4253.2, "total_tokens": 9387760} {"current_steps": 14385, "total_steps": 38160, "loss": 0.5478, "lr": 0.0007840092092675313, "epoch": 7.539308176100629, "percentage": 37.7, "elapsed_time": "0:36:47", "remaining_time": "1:00:49", "throughput": 4253.32, "total_tokens": 9391184} {"current_steps": 14390, "total_steps": 38160, "loss": 0.4375, "lr": 0.0007838209676155302, "epoch": 7.5419287211740045, "percentage": 37.71, "elapsed_time": "0:36:48", "remaining_time": "1:00:48", "throughput": 4253.26, "total_tokens": 9393776} {"current_steps": 14395, "total_steps": 38160, "loss": 0.5174, "lr": 0.0007836326665914209, "epoch": 7.54454926624738, "percentage": 37.72, "elapsed_time": "0:36:49", "remaining_time": "1:00:47", "throughput": 4253.32, "total_tokens": 9397008} {"current_steps": 14400, "total_steps": 38160, "loss": 0.5739, "lr": 0.0007834443062345932, "epoch": 7.547169811320755, "percentage": 37.74, "elapsed_time": "0:36:50", "remaining_time": "1:00:46", "throughput": 4253.37, "total_tokens": 9400144} {"current_steps": 14405, "total_steps": 38160, "loss": 0.3379, "lr": 0.0007832558865844507, "epoch": 7.54979035639413, "percentage": 37.75, "elapsed_time": "0:36:50", "remaining_time": "1:00:45", "throughput": 4253.51, "total_tokens": 9403728} {"current_steps": 14410, "total_steps": 38160, "loss": 0.5834, "lr": 0.0007830674076804083, "epoch": 7.552410901467505, "percentage": 37.76, "elapsed_time": "0:36:51", "remaining_time": "1:00:45", "throughput": 4253.83, "total_tokens": 9408112} {"current_steps": 14415, "total_steps": 38160, "loss": 0.5586, "lr": 0.0007828788695618934, "epoch": 7.55503144654088, "percentage": 37.78, "elapsed_time": "0:36:52", "remaining_time": "1:00:44", "throughput": 4253.86, "total_tokens": 9411152} {"current_steps": 14420, "total_steps": 38160, "loss": 0.3373, "lr": 0.0007826902722683462, "epoch": 7.5576519916142555, "percentage": 37.79, "elapsed_time": "0:36:53", "remaining_time": "1:00:43", "throughput": 4253.96, "total_tokens": 9414416} {"current_steps": 14425, "total_steps": 38160, "loss": 0.4263, "lr": 0.0007825016158392193, "epoch": 7.560272536687631, "percentage": 37.8, "elapsed_time": "0:36:53", "remaining_time": "1:00:42", "throughput": 4253.92, "total_tokens": 9417168} {"current_steps": 14430, "total_steps": 38160, "loss": 0.3947, "lr": 0.0007823129003139773, "epoch": 7.562893081761006, "percentage": 37.81, "elapsed_time": "0:36:54", "remaining_time": "1:00:41", "throughput": 4254.1, "total_tokens": 9420880} {"current_steps": 14435, "total_steps": 38160, "loss": 0.4368, "lr": 0.0007821241257320972, "epoch": 7.565513626834382, "percentage": 37.83, "elapsed_time": "0:36:55", "remaining_time": "1:00:40", "throughput": 4254.18, "total_tokens": 9424144} {"current_steps": 14440, "total_steps": 38160, "loss": 0.4703, "lr": 0.0007819352921330689, "epoch": 7.568134171907757, "percentage": 37.84, "elapsed_time": "0:36:55", "remaining_time": "1:00:39", "throughput": 4254.04, "total_tokens": 9426448} {"current_steps": 14445, "total_steps": 38160, "loss": 0.5075, "lr": 0.0007817463995563938, "epoch": 7.570754716981132, "percentage": 37.85, "elapsed_time": "0:36:56", "remaining_time": "1:00:39", "throughput": 4254.08, "total_tokens": 9429456} {"current_steps": 14450, "total_steps": 38160, "loss": 0.5214, "lr": 0.0007815574480415864, "epoch": 7.573375262054507, "percentage": 37.87, "elapsed_time": "0:36:57", "remaining_time": "1:00:38", "throughput": 4254.17, "total_tokens": 9432720} {"current_steps": 14455, "total_steps": 38160, "loss": 0.5838, "lr": 0.0007813684376281729, "epoch": 7.575995807127883, "percentage": 37.88, "elapsed_time": "0:36:57", "remaining_time": "1:00:37", "throughput": 4254.12, "total_tokens": 9435344} {"current_steps": 14460, "total_steps": 38160, "loss": 0.5739, "lr": 0.0007811793683556922, "epoch": 7.578616352201258, "percentage": 37.89, "elapsed_time": "0:36:58", "remaining_time": "1:00:36", "throughput": 4254.14, "total_tokens": 9438416} {"current_steps": 14465, "total_steps": 38160, "loss": 0.4325, "lr": 0.0007809902402636957, "epoch": 7.581236897274633, "percentage": 37.91, "elapsed_time": "0:36:59", "remaining_time": "1:00:35", "throughput": 4254.06, "total_tokens": 9440912} {"current_steps": 14470, "total_steps": 38160, "loss": 0.2744, "lr": 0.0007808010533917464, "epoch": 7.583857442348008, "percentage": 37.92, "elapsed_time": "0:37:00", "remaining_time": "1:00:34", "throughput": 4254.14, "total_tokens": 9444272} {"current_steps": 14475, "total_steps": 38160, "loss": 0.5842, "lr": 0.0007806118077794205, "epoch": 7.586477987421384, "percentage": 37.93, "elapsed_time": "0:37:00", "remaining_time": "1:00:33", "throughput": 4254.05, "total_tokens": 9446704} {"current_steps": 14480, "total_steps": 38160, "loss": 0.4543, "lr": 0.0007804225034663058, "epoch": 7.589098532494759, "percentage": 37.95, "elapsed_time": "0:37:01", "remaining_time": "1:00:32", "throughput": 4254.15, "total_tokens": 9450128} {"current_steps": 14485, "total_steps": 38160, "loss": 0.5578, "lr": 0.0007802331404920024, "epoch": 7.5917190775681345, "percentage": 37.96, "elapsed_time": "0:37:02", "remaining_time": "1:00:31", "throughput": 4254.15, "total_tokens": 9453072} {"current_steps": 14490, "total_steps": 38160, "loss": 0.3653, "lr": 0.0007800437188961232, "epoch": 7.59433962264151, "percentage": 37.97, "elapsed_time": "0:37:02", "remaining_time": "1:00:30", "throughput": 4254.13, "total_tokens": 9455856} {"current_steps": 14495, "total_steps": 38160, "loss": 0.5641, "lr": 0.0007798542387182929, "epoch": 7.596960167714885, "percentage": 37.98, "elapsed_time": "0:37:03", "remaining_time": "1:00:30", "throughput": 4254.14, "total_tokens": 9458736} {"current_steps": 14500, "total_steps": 38160, "loss": 0.3246, "lr": 0.0007796646999981488, "epoch": 7.59958071278826, "percentage": 38.0, "elapsed_time": "0:37:04", "remaining_time": "1:00:29", "throughput": 4254.2, "total_tokens": 9461840} {"current_steps": 14505, "total_steps": 38160, "loss": 0.4102, "lr": 0.0007794751027753397, "epoch": 7.602201257861635, "percentage": 38.01, "elapsed_time": "0:37:05", "remaining_time": "1:00:29", "throughput": 4254.86, "total_tokens": 9468368} {"current_steps": 14510, "total_steps": 38160, "loss": 0.607, "lr": 0.0007792854470895278, "epoch": 7.60482180293501, "percentage": 38.02, "elapsed_time": "0:37:05", "remaining_time": "1:00:28", "throughput": 4254.79, "total_tokens": 9470928} {"current_steps": 14515, "total_steps": 38160, "loss": 0.7042, "lr": 0.0007790957329803865, "epoch": 7.6074423480083855, "percentage": 38.04, "elapsed_time": "0:37:06", "remaining_time": "1:00:27", "throughput": 4255.04, "total_tokens": 9475024} {"current_steps": 14520, "total_steps": 38160, "loss": 0.522, "lr": 0.0007789059604876019, "epoch": 7.610062893081761, "percentage": 38.05, "elapsed_time": "0:37:07", "remaining_time": "1:00:26", "throughput": 4255.36, "total_tokens": 9479408} {"current_steps": 14525, "total_steps": 38160, "loss": 0.3987, "lr": 0.0007787161296508724, "epoch": 7.612683438155136, "percentage": 38.06, "elapsed_time": "0:37:08", "remaining_time": "1:00:25", "throughput": 4255.4, "total_tokens": 9482480} {"current_steps": 14530, "total_steps": 38160, "loss": 0.3798, "lr": 0.0007785262405099083, "epoch": 7.615303983228512, "percentage": 38.08, "elapsed_time": "0:37:08", "remaining_time": "1:00:24", "throughput": 4255.29, "total_tokens": 9484816} {"current_steps": 14535, "total_steps": 38160, "loss": 0.5205, "lr": 0.0007783362931044322, "epoch": 7.617924528301887, "percentage": 38.09, "elapsed_time": "0:37:09", "remaining_time": "1:00:24", "throughput": 4255.3, "total_tokens": 9487728} {"current_steps": 14540, "total_steps": 38160, "loss": 0.6397, "lr": 0.0007781462874741793, "epoch": 7.620545073375262, "percentage": 38.1, "elapsed_time": "0:37:10", "remaining_time": "1:00:23", "throughput": 4255.26, "total_tokens": 9490448} {"current_steps": 14545, "total_steps": 38160, "loss": 0.497, "lr": 0.000777956223658896, "epoch": 7.623165618448637, "percentage": 38.12, "elapsed_time": "0:37:10", "remaining_time": "1:00:22", "throughput": 4255.26, "total_tokens": 9493360} {"current_steps": 14550, "total_steps": 38160, "loss": 0.3769, "lr": 0.000777766101698342, "epoch": 7.6257861635220126, "percentage": 38.13, "elapsed_time": "0:37:11", "remaining_time": "1:00:21", "throughput": 4255.34, "total_tokens": 9496560} {"current_steps": 14555, "total_steps": 38160, "loss": 0.3481, "lr": 0.0007775759216322882, "epoch": 7.628406708595388, "percentage": 38.14, "elapsed_time": "0:37:12", "remaining_time": "1:00:20", "throughput": 4255.38, "total_tokens": 9499632} {"current_steps": 14560, "total_steps": 38160, "loss": 0.4815, "lr": 0.0007773856835005187, "epoch": 7.631027253668763, "percentage": 38.16, "elapsed_time": "0:37:13", "remaining_time": "1:00:19", "throughput": 4255.62, "total_tokens": 9503696} {"current_steps": 14565, "total_steps": 38160, "loss": 0.547, "lr": 0.0007771953873428285, "epoch": 7.633647798742138, "percentage": 38.17, "elapsed_time": "0:37:13", "remaining_time": "1:00:18", "throughput": 4255.66, "total_tokens": 9506768} {"current_steps": 14570, "total_steps": 38160, "loss": 0.4116, "lr": 0.0007770050331990259, "epoch": 7.636268343815514, "percentage": 38.18, "elapsed_time": "0:37:14", "remaining_time": "1:00:17", "throughput": 4255.64, "total_tokens": 9509488} {"current_steps": 14575, "total_steps": 38160, "loss": 0.409, "lr": 0.0007768146211089304, "epoch": 7.638888888888889, "percentage": 38.19, "elapsed_time": "0:37:15", "remaining_time": "1:00:17", "throughput": 4255.64, "total_tokens": 9512336} {"current_steps": 14580, "total_steps": 38160, "loss": 0.5688, "lr": 0.0007766241511123744, "epoch": 7.6415094339622645, "percentage": 38.21, "elapsed_time": "0:37:15", "remaining_time": "1:00:16", "throughput": 4255.66, "total_tokens": 9515376} {"current_steps": 14585, "total_steps": 38160, "loss": 0.3843, "lr": 0.0007764336232492018, "epoch": 7.64412997903564, "percentage": 38.22, "elapsed_time": "0:37:16", "remaining_time": "1:00:15", "throughput": 4255.64, "total_tokens": 9518160} {"current_steps": 14590, "total_steps": 38160, "loss": 0.4344, "lr": 0.0007762430375592689, "epoch": 7.646750524109015, "percentage": 38.23, "elapsed_time": "0:37:17", "remaining_time": "1:00:14", "throughput": 4255.62, "total_tokens": 9520912} {"current_steps": 14595, "total_steps": 38160, "loss": 0.4269, "lr": 0.0007760523940824441, "epoch": 7.64937106918239, "percentage": 38.25, "elapsed_time": "0:37:17", "remaining_time": "1:00:13", "throughput": 4255.59, "total_tokens": 9523728} {"current_steps": 14600, "total_steps": 38160, "loss": 0.6168, "lr": 0.0007758616928586077, "epoch": 7.651991614255765, "percentage": 38.26, "elapsed_time": "0:37:18", "remaining_time": "1:00:12", "throughput": 4255.56, "total_tokens": 9526416} {"current_steps": 14605, "total_steps": 38160, "loss": 0.4775, "lr": 0.0007756709339276527, "epoch": 7.65461215932914, "percentage": 38.27, "elapsed_time": "0:37:19", "remaining_time": "1:00:11", "throughput": 4255.69, "total_tokens": 9529936} {"current_steps": 14610, "total_steps": 38160, "loss": 0.4746, "lr": 0.0007754801173294831, "epoch": 7.6572327044025155, "percentage": 38.29, "elapsed_time": "0:37:20", "remaining_time": "1:00:10", "throughput": 4255.79, "total_tokens": 9533232} {"current_steps": 14615, "total_steps": 38160, "loss": 0.4101, "lr": 0.0007752892431040158, "epoch": 7.659853249475891, "percentage": 38.3, "elapsed_time": "0:37:20", "remaining_time": "1:00:09", "throughput": 4255.91, "total_tokens": 9536656} {"current_steps": 14620, "total_steps": 38160, "loss": 0.5077, "lr": 0.0007750983112911796, "epoch": 7.662473794549266, "percentage": 38.31, "elapsed_time": "0:37:21", "remaining_time": "1:00:09", "throughput": 4255.87, "total_tokens": 9539344} {"current_steps": 14625, "total_steps": 38160, "loss": 0.5181, "lr": 0.0007749073219309151, "epoch": 7.665094339622642, "percentage": 38.33, "elapsed_time": "0:37:22", "remaining_time": "1:00:08", "throughput": 4255.99, "total_tokens": 9542832} {"current_steps": 14630, "total_steps": 38160, "loss": 0.5023, "lr": 0.0007747162750631751, "epoch": 7.667714884696017, "percentage": 38.34, "elapsed_time": "0:37:23", "remaining_time": "1:00:07", "throughput": 4256.16, "total_tokens": 9546640} {"current_steps": 14635, "total_steps": 38160, "loss": 0.3644, "lr": 0.0007745251707279246, "epoch": 7.670335429769392, "percentage": 38.35, "elapsed_time": "0:37:23", "remaining_time": "1:00:06", "throughput": 4256.26, "total_tokens": 9550000} {"current_steps": 14640, "total_steps": 38160, "loss": 0.4755, "lr": 0.0007743340089651403, "epoch": 7.672955974842767, "percentage": 38.36, "elapsed_time": "0:37:24", "remaining_time": "1:00:05", "throughput": 4256.37, "total_tokens": 9553424} {"current_steps": 14645, "total_steps": 38160, "loss": 0.4975, "lr": 0.0007741427898148111, "epoch": 7.6755765199161425, "percentage": 38.38, "elapsed_time": "0:37:25", "remaining_time": "1:00:04", "throughput": 4256.34, "total_tokens": 9556144} {"current_steps": 14650, "total_steps": 38160, "loss": 0.4264, "lr": 0.0007739515133169379, "epoch": 7.678197064989518, "percentage": 38.39, "elapsed_time": "0:37:25", "remaining_time": "1:00:04", "throughput": 4256.34, "total_tokens": 9559024} {"current_steps": 14655, "total_steps": 38160, "loss": 0.5298, "lr": 0.0007737601795115334, "epoch": 7.680817610062893, "percentage": 38.4, "elapsed_time": "0:37:26", "remaining_time": "1:00:03", "throughput": 4256.47, "total_tokens": 9562640} {"current_steps": 14660, "total_steps": 38160, "loss": 0.4243, "lr": 0.0007735687884386226, "epoch": 7.683438155136268, "percentage": 38.42, "elapsed_time": "0:37:27", "remaining_time": "1:00:02", "throughput": 4256.41, "total_tokens": 9565360} {"current_steps": 14665, "total_steps": 38160, "loss": 0.4878, "lr": 0.0007733773401382424, "epoch": 7.686058700209644, "percentage": 38.43, "elapsed_time": "0:37:28", "remaining_time": "1:00:01", "throughput": 4256.5, "total_tokens": 9568688} {"current_steps": 14670, "total_steps": 38160, "loss": 0.3909, "lr": 0.0007731858346504414, "epoch": 7.688679245283019, "percentage": 38.44, "elapsed_time": "0:37:28", "remaining_time": "1:00:00", "throughput": 4256.49, "total_tokens": 9571568} {"current_steps": 14675, "total_steps": 38160, "loss": 0.4515, "lr": 0.0007729942720152805, "epoch": 7.691299790356394, "percentage": 38.46, "elapsed_time": "0:37:29", "remaining_time": "0:59:59", "throughput": 4256.43, "total_tokens": 9574128} {"current_steps": 14680, "total_steps": 38160, "loss": 0.4586, "lr": 0.0007728026522728324, "epoch": 7.69392033542977, "percentage": 38.47, "elapsed_time": "0:37:30", "remaining_time": "0:59:58", "throughput": 4256.59, "total_tokens": 9577680} {"current_steps": 14685, "total_steps": 38160, "loss": 0.4292, "lr": 0.0007726109754631817, "epoch": 7.696540880503145, "percentage": 38.48, "elapsed_time": "0:37:30", "remaining_time": "0:59:58", "throughput": 4256.61, "total_tokens": 9580656} {"current_steps": 14690, "total_steps": 38160, "loss": 0.481, "lr": 0.000772419241626425, "epoch": 7.69916142557652, "percentage": 38.5, "elapsed_time": "0:37:31", "remaining_time": "0:59:57", "throughput": 4256.83, "total_tokens": 9584496} {"current_steps": 14695, "total_steps": 38160, "loss": 0.5081, "lr": 0.000772227450802671, "epoch": 7.701781970649895, "percentage": 38.51, "elapsed_time": "0:37:32", "remaining_time": "0:59:57", "throughput": 4257.52, "total_tokens": 9591056} {"current_steps": 14700, "total_steps": 38160, "loss": 0.4314, "lr": 0.0007720356030320399, "epoch": 7.70440251572327, "percentage": 38.52, "elapsed_time": "0:37:33", "remaining_time": "0:59:56", "throughput": 4257.6, "total_tokens": 9594320} {"current_steps": 14705, "total_steps": 38160, "loss": 0.4557, "lr": 0.0007718436983546642, "epoch": 7.7070230607966455, "percentage": 38.54, "elapsed_time": "0:37:34", "remaining_time": "0:59:55", "throughput": 4257.69, "total_tokens": 9597616} {"current_steps": 14710, "total_steps": 38160, "loss": 0.5053, "lr": 0.0007716517368106882, "epoch": 7.709643605870021, "percentage": 38.55, "elapsed_time": "0:37:34", "remaining_time": "0:59:54", "throughput": 4257.81, "total_tokens": 9601072} {"current_steps": 14715, "total_steps": 38160, "loss": 0.4347, "lr": 0.000771459718440268, "epoch": 7.712264150943396, "percentage": 38.56, "elapsed_time": "0:37:35", "remaining_time": "0:59:53", "throughput": 4257.96, "total_tokens": 9604752} {"current_steps": 14720, "total_steps": 38160, "loss": 0.4397, "lr": 0.0007712676432835717, "epoch": 7.714884696016772, "percentage": 38.57, "elapsed_time": "0:37:36", "remaining_time": "0:59:53", "throughput": 4257.95, "total_tokens": 9607600} {"current_steps": 14725, "total_steps": 38160, "loss": 0.4708, "lr": 0.0007710755113807794, "epoch": 7.717505241090147, "percentage": 38.59, "elapsed_time": "0:37:37", "remaining_time": "0:59:52", "throughput": 4258.1, "total_tokens": 9611184} {"current_steps": 14730, "total_steps": 38160, "loss": 0.4491, "lr": 0.0007708833227720824, "epoch": 7.720125786163522, "percentage": 38.6, "elapsed_time": "0:37:37", "remaining_time": "0:59:51", "throughput": 4258.15, "total_tokens": 9614288} {"current_steps": 14735, "total_steps": 38160, "loss": 0.4689, "lr": 0.0007706910774976848, "epoch": 7.722746331236897, "percentage": 38.61, "elapsed_time": "0:37:38", "remaining_time": "0:59:50", "throughput": 4258.26, "total_tokens": 9617680} {"current_steps": 14740, "total_steps": 38160, "loss": 0.3888, "lr": 0.0007704987755978021, "epoch": 7.7253668763102725, "percentage": 38.63, "elapsed_time": "0:37:39", "remaining_time": "0:59:49", "throughput": 4258.33, "total_tokens": 9620944} {"current_steps": 14745, "total_steps": 38160, "loss": 0.4512, "lr": 0.0007703064171126615, "epoch": 7.727987421383648, "percentage": 38.64, "elapsed_time": "0:37:40", "remaining_time": "0:59:49", "throughput": 4258.96, "total_tokens": 9627536} {"current_steps": 14750, "total_steps": 38160, "loss": 0.5572, "lr": 0.0007701140020825022, "epoch": 7.730607966457023, "percentage": 38.65, "elapsed_time": "0:37:41", "remaining_time": "0:59:48", "throughput": 4259.13, "total_tokens": 9631216} {"current_steps": 14755, "total_steps": 38160, "loss": 0.3761, "lr": 0.0007699215305475753, "epoch": 7.733228511530398, "percentage": 38.67, "elapsed_time": "0:37:42", "remaining_time": "0:59:48", "throughput": 4259.13, "total_tokens": 9634160} {"current_steps": 14760, "total_steps": 38160, "loss": 0.4039, "lr": 0.0007697290025481436, "epoch": 7.735849056603773, "percentage": 38.68, "elapsed_time": "0:37:42", "remaining_time": "0:59:47", "throughput": 4259.21, "total_tokens": 9637456} {"current_steps": 14765, "total_steps": 38160, "loss": 0.4641, "lr": 0.0007695364181244819, "epoch": 7.738469601677149, "percentage": 38.69, "elapsed_time": "0:37:43", "remaining_time": "0:59:46", "throughput": 4259.43, "total_tokens": 9641520} {"current_steps": 14770, "total_steps": 38160, "loss": 0.4498, "lr": 0.0007693437773168764, "epoch": 7.741090146750524, "percentage": 38.71, "elapsed_time": "0:37:44", "remaining_time": "0:59:45", "throughput": 4259.52, "total_tokens": 9644912} {"current_steps": 14775, "total_steps": 38160, "loss": 0.403, "lr": 0.0007691510801656256, "epoch": 7.7437106918239, "percentage": 38.72, "elapsed_time": "0:37:44", "remaining_time": "0:59:44", "throughput": 4259.48, "total_tokens": 9647568} {"current_steps": 14780, "total_steps": 38160, "loss": 0.4109, "lr": 0.0007689583267110395, "epoch": 7.746331236897275, "percentage": 38.73, "elapsed_time": "0:37:45", "remaining_time": "0:59:44", "throughput": 4259.7, "total_tokens": 9651600} {"current_steps": 14785, "total_steps": 38160, "loss": 0.3317, "lr": 0.0007687655169934398, "epoch": 7.74895178197065, "percentage": 38.74, "elapsed_time": "0:37:46", "remaining_time": "0:59:43", "throughput": 4259.73, "total_tokens": 9654576} {"current_steps": 14790, "total_steps": 38160, "loss": 0.45, "lr": 0.0007685726510531603, "epoch": 7.751572327044025, "percentage": 38.76, "elapsed_time": "0:37:47", "remaining_time": "0:59:42", "throughput": 4259.83, "total_tokens": 9658000} {"current_steps": 14795, "total_steps": 38160, "loss": 0.4817, "lr": 0.0007683797289305463, "epoch": 7.7541928721174, "percentage": 38.77, "elapsed_time": "0:37:47", "remaining_time": "0:59:41", "throughput": 4259.82, "total_tokens": 9660880} {"current_steps": 14800, "total_steps": 38160, "loss": 0.3686, "lr": 0.0007681867506659548, "epoch": 7.756813417190775, "percentage": 38.78, "elapsed_time": "0:37:48", "remaining_time": "0:59:40", "throughput": 4259.85, "total_tokens": 9663920} {"current_steps": 14805, "total_steps": 38160, "loss": 0.4319, "lr": 0.0007679937162997546, "epoch": 7.759433962264151, "percentage": 38.8, "elapsed_time": "0:37:49", "remaining_time": "0:59:40", "throughput": 4260.06, "total_tokens": 9667792} {"current_steps": 14810, "total_steps": 38160, "loss": 0.4156, "lr": 0.0007678006258723264, "epoch": 7.762054507337526, "percentage": 38.81, "elapsed_time": "0:37:50", "remaining_time": "0:59:39", "throughput": 4260.14, "total_tokens": 9671120} {"current_steps": 14815, "total_steps": 38160, "loss": 0.383, "lr": 0.0007676074794240626, "epoch": 7.764675052410902, "percentage": 38.82, "elapsed_time": "0:37:50", "remaining_time": "0:59:38", "throughput": 4260.27, "total_tokens": 9674608} {"current_steps": 14820, "total_steps": 38160, "loss": 0.429, "lr": 0.000767414276995367, "epoch": 7.767295597484277, "percentage": 38.84, "elapsed_time": "0:37:51", "remaining_time": "0:59:37", "throughput": 4260.31, "total_tokens": 9677904} {"current_steps": 14825, "total_steps": 38160, "loss": 0.4427, "lr": 0.0007672210186266555, "epoch": 7.769916142557652, "percentage": 38.85, "elapsed_time": "0:37:52", "remaining_time": "0:59:36", "throughput": 4260.46, "total_tokens": 9681648} {"current_steps": 14830, "total_steps": 38160, "loss": 0.5371, "lr": 0.0007670277043583556, "epoch": 7.772536687631027, "percentage": 38.86, "elapsed_time": "0:37:53", "remaining_time": "0:59:35", "throughput": 4260.38, "total_tokens": 9684208} {"current_steps": 14835, "total_steps": 38160, "loss": 0.5189, "lr": 0.0007668343342309063, "epoch": 7.7751572327044025, "percentage": 38.88, "elapsed_time": "0:37:53", "remaining_time": "0:59:34", "throughput": 4260.31, "total_tokens": 9686800} {"current_steps": 14840, "total_steps": 38160, "loss": 0.4272, "lr": 0.0007666409082847586, "epoch": 7.777777777777778, "percentage": 38.89, "elapsed_time": "0:37:54", "remaining_time": "0:59:34", "throughput": 4260.26, "total_tokens": 9689424} {"current_steps": 14845, "total_steps": 38160, "loss": 0.4142, "lr": 0.0007664474265603747, "epoch": 7.780398322851153, "percentage": 38.9, "elapsed_time": "0:37:55", "remaining_time": "0:59:33", "throughput": 4260.26, "total_tokens": 9692368} {"current_steps": 14850, "total_steps": 38160, "loss": 0.3748, "lr": 0.0007662538890982291, "epoch": 7.783018867924528, "percentage": 38.92, "elapsed_time": "0:37:55", "remaining_time": "0:59:32", "throughput": 4260.36, "total_tokens": 9695856} {"current_steps": 14855, "total_steps": 38160, "loss": 0.3737, "lr": 0.0007660602959388075, "epoch": 7.785639412997903, "percentage": 38.93, "elapsed_time": "0:37:56", "remaining_time": "0:59:31", "throughput": 4260.45, "total_tokens": 9699280} {"current_steps": 14860, "total_steps": 38160, "loss": 0.5622, "lr": 0.0007658666471226073, "epoch": 7.788259958071279, "percentage": 38.94, "elapsed_time": "0:37:57", "remaining_time": "0:59:30", "throughput": 4260.36, "total_tokens": 9701840} {"current_steps": 14865, "total_steps": 38160, "loss": 0.4659, "lr": 0.0007656729426901377, "epoch": 7.790880503144654, "percentage": 38.95, "elapsed_time": "0:37:57", "remaining_time": "0:59:29", "throughput": 4260.3, "total_tokens": 9704400} {"current_steps": 14870, "total_steps": 38160, "loss": 0.4112, "lr": 0.0007654791826819194, "epoch": 7.79350104821803, "percentage": 38.97, "elapsed_time": "0:37:58", "remaining_time": "0:59:28", "throughput": 4260.35, "total_tokens": 9707664} {"current_steps": 14875, "total_steps": 38160, "loss": 0.5004, "lr": 0.0007652853671384847, "epoch": 7.796121593291405, "percentage": 38.98, "elapsed_time": "0:37:59", "remaining_time": "0:59:27", "throughput": 4260.37, "total_tokens": 9710672} {"current_steps": 14880, "total_steps": 38160, "loss": 0.5313, "lr": 0.0007650914961003781, "epoch": 7.79874213836478, "percentage": 38.99, "elapsed_time": "0:38:00", "remaining_time": "0:59:27", "throughput": 4260.44, "total_tokens": 9713872} {"current_steps": 14885, "total_steps": 38160, "loss": 0.3952, "lr": 0.0007648975696081546, "epoch": 7.801362683438155, "percentage": 39.01, "elapsed_time": "0:38:00", "remaining_time": "0:59:26", "throughput": 4260.49, "total_tokens": 9717008} {"current_steps": 14890, "total_steps": 38160, "loss": 0.5802, "lr": 0.0007647035877023816, "epoch": 7.80398322851153, "percentage": 39.02, "elapsed_time": "0:38:01", "remaining_time": "0:59:25", "throughput": 4260.63, "total_tokens": 9720560} {"current_steps": 14895, "total_steps": 38160, "loss": 0.3912, "lr": 0.0007645095504236381, "epoch": 7.806603773584905, "percentage": 39.03, "elapsed_time": "0:38:02", "remaining_time": "0:59:24", "throughput": 4260.68, "total_tokens": 9723792} {"current_steps": 14900, "total_steps": 38160, "loss": 0.4077, "lr": 0.0007643154578125142, "epoch": 7.809224318658281, "percentage": 39.05, "elapsed_time": "0:38:02", "remaining_time": "0:59:23", "throughput": 4260.78, "total_tokens": 9727184} {"current_steps": 14905, "total_steps": 38160, "loss": 0.4479, "lr": 0.0007641213099096121, "epoch": 7.811844863731656, "percentage": 39.06, "elapsed_time": "0:38:03", "remaining_time": "0:59:23", "throughput": 4260.93, "total_tokens": 9730832} {"current_steps": 14910, "total_steps": 38160, "loss": 0.459, "lr": 0.0007639271067555452, "epoch": 7.814465408805032, "percentage": 39.07, "elapsed_time": "0:38:04", "remaining_time": "0:59:22", "throughput": 4261.11, "total_tokens": 9734640} {"current_steps": 14915, "total_steps": 38160, "loss": 0.3176, "lr": 0.0007637328483909385, "epoch": 7.817085953878407, "percentage": 39.09, "elapsed_time": "0:38:05", "remaining_time": "0:59:21", "throughput": 4261.1, "total_tokens": 9737520} {"current_steps": 14920, "total_steps": 38160, "loss": 0.4551, "lr": 0.000763538534856429, "epoch": 7.819706498951782, "percentage": 39.1, "elapsed_time": "0:38:05", "remaining_time": "0:59:20", "throughput": 4261.2, "total_tokens": 9740880} {"current_steps": 14925, "total_steps": 38160, "loss": 0.3479, "lr": 0.0007633441661926643, "epoch": 7.822327044025157, "percentage": 39.11, "elapsed_time": "0:38:06", "remaining_time": "0:59:19", "throughput": 4261.26, "total_tokens": 9744080} {"current_steps": 14930, "total_steps": 38160, "loss": 0.4505, "lr": 0.0007631497424403046, "epoch": 7.8249475890985325, "percentage": 39.12, "elapsed_time": "0:38:07", "remaining_time": "0:59:18", "throughput": 4261.31, "total_tokens": 9747184} {"current_steps": 14935, "total_steps": 38160, "loss": 0.562, "lr": 0.000762955263640021, "epoch": 7.827568134171908, "percentage": 39.14, "elapsed_time": "0:38:08", "remaining_time": "0:59:18", "throughput": 4261.2, "total_tokens": 9749648} {"current_steps": 14940, "total_steps": 38160, "loss": 0.5122, "lr": 0.0007627607298324961, "epoch": 7.830188679245283, "percentage": 39.15, "elapsed_time": "0:38:08", "remaining_time": "0:59:17", "throughput": 4261.08, "total_tokens": 9751984} {"current_steps": 14945, "total_steps": 38160, "loss": 0.4311, "lr": 0.0007625661410584244, "epoch": 7.832809224318658, "percentage": 39.16, "elapsed_time": "0:38:09", "remaining_time": "0:59:16", "throughput": 4261.12, "total_tokens": 9755152} {"current_steps": 14950, "total_steps": 38160, "loss": 0.4978, "lr": 0.0007623714973585113, "epoch": 7.835429769392033, "percentage": 39.18, "elapsed_time": "0:38:10", "remaining_time": "0:59:15", "throughput": 4261.2, "total_tokens": 9758448} {"current_steps": 14955, "total_steps": 38160, "loss": 0.443, "lr": 0.0007621767987734743, "epoch": 7.838050314465409, "percentage": 39.19, "elapsed_time": "0:38:10", "remaining_time": "0:59:14", "throughput": 4261.18, "total_tokens": 9761264} {"current_steps": 14960, "total_steps": 38160, "loss": 0.5748, "lr": 0.000761982045344042, "epoch": 7.840670859538784, "percentage": 39.2, "elapsed_time": "0:38:11", "remaining_time": "0:59:13", "throughput": 4261.34, "total_tokens": 9764976} {"current_steps": 14965, "total_steps": 38160, "loss": 0.5588, "lr": 0.0007617872371109549, "epoch": 7.84329140461216, "percentage": 39.22, "elapsed_time": "0:38:12", "remaining_time": "0:59:12", "throughput": 4261.4, "total_tokens": 9768208} {"current_steps": 14970, "total_steps": 38160, "loss": 0.4193, "lr": 0.0007615923741149643, "epoch": 7.845911949685535, "percentage": 39.23, "elapsed_time": "0:38:12", "remaining_time": "0:59:11", "throughput": 4261.44, "total_tokens": 9771248} {"current_steps": 14975, "total_steps": 38160, "loss": 0.4563, "lr": 0.0007613974563968333, "epoch": 7.84853249475891, "percentage": 39.24, "elapsed_time": "0:38:13", "remaining_time": "0:59:11", "throughput": 4261.36, "total_tokens": 9773776} {"current_steps": 14980, "total_steps": 38160, "loss": 0.5283, "lr": 0.0007612024839973368, "epoch": 7.851153039832285, "percentage": 39.26, "elapsed_time": "0:38:14", "remaining_time": "0:59:10", "throughput": 4261.51, "total_tokens": 9777360} {"current_steps": 14985, "total_steps": 38160, "loss": 0.428, "lr": 0.0007610074569572605, "epoch": 7.85377358490566, "percentage": 39.27, "elapsed_time": "0:38:15", "remaining_time": "0:59:09", "throughput": 4261.43, "total_tokens": 9779984} {"current_steps": 14990, "total_steps": 38160, "loss": 0.4526, "lr": 0.0007608123753174019, "epoch": 7.856394129979035, "percentage": 39.28, "elapsed_time": "0:38:15", "remaining_time": "0:59:08", "throughput": 4261.34, "total_tokens": 9782480} {"current_steps": 14995, "total_steps": 38160, "loss": 0.5589, "lr": 0.00076061723911857, "epoch": 7.859014675052411, "percentage": 39.3, "elapsed_time": "0:38:16", "remaining_time": "0:59:07", "throughput": 4261.56, "total_tokens": 9786608} {"current_steps": 15000, "total_steps": 38160, "loss": 0.517, "lr": 0.0007604220484015849, "epoch": 7.861635220125786, "percentage": 39.31, "elapsed_time": "0:38:17", "remaining_time": "0:59:06", "throughput": 4261.67, "total_tokens": 9790096} {"current_steps": 15005, "total_steps": 38160, "loss": 0.5425, "lr": 0.0007602268032072784, "epoch": 7.864255765199162, "percentage": 39.32, "elapsed_time": "0:38:17", "remaining_time": "0:59:06", "throughput": 4261.69, "total_tokens": 9793072} {"current_steps": 15010, "total_steps": 38160, "loss": 0.4501, "lr": 0.0007600315035764933, "epoch": 7.866876310272537, "percentage": 39.33, "elapsed_time": "0:38:18", "remaining_time": "0:59:05", "throughput": 4261.82, "total_tokens": 9796528} {"current_steps": 15015, "total_steps": 38160, "loss": 0.4606, "lr": 0.0007598361495500844, "epoch": 7.869496855345912, "percentage": 39.35, "elapsed_time": "0:38:19", "remaining_time": "0:59:04", "throughput": 4261.96, "total_tokens": 9800048} {"current_steps": 15020, "total_steps": 38160, "loss": 0.4187, "lr": 0.0007596407411689173, "epoch": 7.872117400419287, "percentage": 39.36, "elapsed_time": "0:38:20", "remaining_time": "0:59:03", "throughput": 4261.9, "total_tokens": 9802672} {"current_steps": 15025, "total_steps": 38160, "loss": 0.5589, "lr": 0.0007594452784738695, "epoch": 7.8747379454926625, "percentage": 39.37, "elapsed_time": "0:38:20", "remaining_time": "0:59:02", "throughput": 4262.04, "total_tokens": 9806352} {"current_steps": 15030, "total_steps": 38160, "loss": 0.3869, "lr": 0.000759249761505829, "epoch": 7.877358490566038, "percentage": 39.39, "elapsed_time": "0:38:21", "remaining_time": "0:59:01", "throughput": 4262.02, "total_tokens": 9809200} {"current_steps": 15035, "total_steps": 38160, "loss": 0.5659, "lr": 0.0007590541903056963, "epoch": 7.879979035639413, "percentage": 39.4, "elapsed_time": "0:38:22", "remaining_time": "0:59:00", "throughput": 4261.91, "total_tokens": 9811568} {"current_steps": 15040, "total_steps": 38160, "loss": 0.5339, "lr": 0.0007588585649143825, "epoch": 7.882599580712788, "percentage": 39.41, "elapsed_time": "0:38:22", "remaining_time": "0:58:59", "throughput": 4261.91, "total_tokens": 9814480} {"current_steps": 15045, "total_steps": 38160, "loss": 0.4519, "lr": 0.0007586628853728099, "epoch": 7.885220125786163, "percentage": 39.43, "elapsed_time": "0:38:23", "remaining_time": "0:58:59", "throughput": 4261.87, "total_tokens": 9817200} {"current_steps": 15050, "total_steps": 38160, "loss": 0.3437, "lr": 0.0007584671517219128, "epoch": 7.887840670859539, "percentage": 39.44, "elapsed_time": "0:38:24", "remaining_time": "0:58:58", "throughput": 4261.92, "total_tokens": 9820336} {"current_steps": 15055, "total_steps": 38160, "loss": 0.5144, "lr": 0.0007582713640026364, "epoch": 7.890461215932914, "percentage": 39.45, "elapsed_time": "0:38:24", "remaining_time": "0:58:57", "throughput": 4261.97, "total_tokens": 9823664} {"current_steps": 15060, "total_steps": 38160, "loss": 0.463, "lr": 0.000758075522255937, "epoch": 7.8930817610062896, "percentage": 39.47, "elapsed_time": "0:38:25", "remaining_time": "0:58:56", "throughput": 4262.11, "total_tokens": 9827280} {"current_steps": 15065, "total_steps": 38160, "loss": 0.5143, "lr": 0.0007578796265227828, "epoch": 7.895702306079665, "percentage": 39.48, "elapsed_time": "0:38:26", "remaining_time": "0:58:55", "throughput": 4262.12, "total_tokens": 9830192} {"current_steps": 15070, "total_steps": 38160, "loss": 0.4751, "lr": 0.0007576836768441525, "epoch": 7.89832285115304, "percentage": 39.49, "elapsed_time": "0:38:27", "remaining_time": "0:58:54", "throughput": 4262.06, "total_tokens": 9832816} {"current_steps": 15075, "total_steps": 38160, "loss": 0.3917, "lr": 0.0007574876732610369, "epoch": 7.900943396226415, "percentage": 39.5, "elapsed_time": "0:38:27", "remaining_time": "0:58:54", "throughput": 4262.12, "total_tokens": 9836080} {"current_steps": 15080, "total_steps": 38160, "loss": 0.3957, "lr": 0.0007572916158144379, "epoch": 7.90356394129979, "percentage": 39.52, "elapsed_time": "0:38:28", "remaining_time": "0:58:53", "throughput": 4262.14, "total_tokens": 9839152} {"current_steps": 15085, "total_steps": 38160, "loss": 0.3615, "lr": 0.0007570955045453679, "epoch": 7.906184486373165, "percentage": 39.53, "elapsed_time": "0:38:29", "remaining_time": "0:58:52", "throughput": 4262.38, "total_tokens": 9843120} {"current_steps": 15090, "total_steps": 38160, "loss": 0.4707, "lr": 0.0007568993394948516, "epoch": 7.908805031446541, "percentage": 39.54, "elapsed_time": "0:38:30", "remaining_time": "0:58:51", "throughput": 4262.51, "total_tokens": 9846608} {"current_steps": 15095, "total_steps": 38160, "loss": 0.4721, "lr": 0.0007567031207039243, "epoch": 7.911425576519916, "percentage": 39.56, "elapsed_time": "0:38:30", "remaining_time": "0:58:50", "throughput": 4262.49, "total_tokens": 9849552} {"current_steps": 15100, "total_steps": 38160, "loss": 0.4673, "lr": 0.0007565068482136328, "epoch": 7.914046121593291, "percentage": 39.57, "elapsed_time": "0:38:31", "remaining_time": "0:58:49", "throughput": 4262.47, "total_tokens": 9852336} {"current_steps": 15105, "total_steps": 38160, "loss": 0.4546, "lr": 0.000756310522065035, "epoch": 7.916666666666667, "percentage": 39.58, "elapsed_time": "0:38:32", "remaining_time": "0:58:49", "throughput": 4262.5, "total_tokens": 9855376} {"current_steps": 15110, "total_steps": 38160, "loss": 0.5025, "lr": 0.0007561141422992002, "epoch": 7.919287211740042, "percentage": 39.6, "elapsed_time": "0:38:32", "remaining_time": "0:58:48", "throughput": 4262.55, "total_tokens": 9858608} {"current_steps": 15115, "total_steps": 38160, "loss": 0.4434, "lr": 0.0007559177089572086, "epoch": 7.921907756813417, "percentage": 39.61, "elapsed_time": "0:38:33", "remaining_time": "0:58:47", "throughput": 4262.59, "total_tokens": 9861776} {"current_steps": 15120, "total_steps": 38160, "loss": 0.4829, "lr": 0.0007557212220801521, "epoch": 7.9245283018867925, "percentage": 39.62, "elapsed_time": "0:38:34", "remaining_time": "0:58:46", "throughput": 4262.48, "total_tokens": 9864144} {"current_steps": 15125, "total_steps": 38160, "loss": 0.472, "lr": 0.0007555246817091332, "epoch": 7.927148846960168, "percentage": 39.64, "elapsed_time": "0:38:34", "remaining_time": "0:58:45", "throughput": 4262.36, "total_tokens": 9866512} {"current_steps": 15130, "total_steps": 38160, "loss": 0.5297, "lr": 0.0007553280878852663, "epoch": 7.929769392033543, "percentage": 39.65, "elapsed_time": "0:38:35", "remaining_time": "0:58:44", "throughput": 4262.46, "total_tokens": 9869936} {"current_steps": 15135, "total_steps": 38160, "loss": 0.3653, "lr": 0.0007551314406496762, "epoch": 7.932389937106918, "percentage": 39.66, "elapsed_time": "0:38:36", "remaining_time": "0:58:43", "throughput": 4262.53, "total_tokens": 9873168} {"current_steps": 15140, "total_steps": 38160, "loss": 0.5807, "lr": 0.0007549347400434994, "epoch": 7.935010482180293, "percentage": 39.68, "elapsed_time": "0:38:36", "remaining_time": "0:58:42", "throughput": 4262.49, "total_tokens": 9875888} {"current_steps": 15145, "total_steps": 38160, "loss": 0.556, "lr": 0.0007547379861078835, "epoch": 7.937631027253669, "percentage": 39.69, "elapsed_time": "0:38:37", "remaining_time": "0:58:42", "throughput": 4262.79, "total_tokens": 9880432} {"current_steps": 15150, "total_steps": 38160, "loss": 0.4317, "lr": 0.0007545411788839871, "epoch": 7.940251572327044, "percentage": 39.7, "elapsed_time": "0:38:38", "remaining_time": "0:58:41", "throughput": 4263.14, "total_tokens": 9885136} {"current_steps": 15155, "total_steps": 38160, "loss": 0.5031, "lr": 0.0007543443184129799, "epoch": 7.9428721174004195, "percentage": 39.71, "elapsed_time": "0:38:39", "remaining_time": "0:58:40", "throughput": 4263.13, "total_tokens": 9887920} {"current_steps": 15160, "total_steps": 38160, "loss": 0.4141, "lr": 0.000754147404736043, "epoch": 7.945492662473795, "percentage": 39.73, "elapsed_time": "0:38:40", "remaining_time": "0:58:40", "throughput": 4263.42, "total_tokens": 9892464} {"current_steps": 15165, "total_steps": 38160, "loss": 0.4724, "lr": 0.0007539504378943686, "epoch": 7.94811320754717, "percentage": 39.74, "elapsed_time": "0:38:40", "remaining_time": "0:58:39", "throughput": 4263.42, "total_tokens": 9895344} {"current_steps": 15170, "total_steps": 38160, "loss": 0.4777, "lr": 0.0007537534179291599, "epoch": 7.950733752620545, "percentage": 39.75, "elapsed_time": "0:38:41", "remaining_time": "0:58:38", "throughput": 4263.39, "total_tokens": 9898032} {"current_steps": 15175, "total_steps": 38160, "loss": 0.3327, "lr": 0.000753556344881631, "epoch": 7.95335429769392, "percentage": 39.77, "elapsed_time": "0:38:42", "remaining_time": "0:58:37", "throughput": 4263.6, "total_tokens": 9902160} {"current_steps": 15180, "total_steps": 38160, "loss": 0.4158, "lr": 0.0007533592187930076, "epoch": 7.955974842767295, "percentage": 39.78, "elapsed_time": "0:38:43", "remaining_time": "0:58:37", "throughput": 4263.83, "total_tokens": 9906160} {"current_steps": 15185, "total_steps": 38160, "loss": 0.4292, "lr": 0.000753162039704526, "epoch": 7.9585953878406706, "percentage": 39.79, "elapsed_time": "0:38:44", "remaining_time": "0:58:36", "throughput": 4263.88, "total_tokens": 9909296} {"current_steps": 15190, "total_steps": 38160, "loss": 0.475, "lr": 0.000752964807657434, "epoch": 7.961215932914046, "percentage": 39.81, "elapsed_time": "0:38:44", "remaining_time": "0:58:35", "throughput": 4263.83, "total_tokens": 9911952} {"current_steps": 15195, "total_steps": 38160, "loss": 0.5491, "lr": 0.0007527675226929902, "epoch": 7.963836477987421, "percentage": 39.82, "elapsed_time": "0:38:45", "remaining_time": "0:58:34", "throughput": 4263.86, "total_tokens": 9914992} {"current_steps": 15200, "total_steps": 38160, "loss": 0.3313, "lr": 0.0007525701848524643, "epoch": 7.966457023060797, "percentage": 39.83, "elapsed_time": "0:38:46", "remaining_time": "0:58:33", "throughput": 4264.12, "total_tokens": 9919184} {"current_steps": 15205, "total_steps": 38160, "loss": 0.5871, "lr": 0.0007523727941771372, "epoch": 7.969077568134172, "percentage": 39.85, "elapsed_time": "0:38:46", "remaining_time": "0:58:32", "throughput": 4264.05, "total_tokens": 9921744} {"current_steps": 15210, "total_steps": 38160, "loss": 0.4679, "lr": 0.0007521753507083009, "epoch": 7.971698113207547, "percentage": 39.86, "elapsed_time": "0:38:47", "remaining_time": "0:58:31", "throughput": 4264.12, "total_tokens": 9924912} {"current_steps": 15215, "total_steps": 38160, "loss": 0.3884, "lr": 0.0007519778544872581, "epoch": 7.9743186582809225, "percentage": 39.87, "elapsed_time": "0:38:48", "remaining_time": "0:58:31", "throughput": 4264.12, "total_tokens": 9927728} {"current_steps": 15220, "total_steps": 38160, "loss": 0.4286, "lr": 0.000751780305555323, "epoch": 7.976939203354298, "percentage": 39.88, "elapsed_time": "0:38:48", "remaining_time": "0:58:30", "throughput": 4264.08, "total_tokens": 9930448} {"current_steps": 15225, "total_steps": 38160, "loss": 0.4813, "lr": 0.0007515827039538202, "epoch": 7.979559748427673, "percentage": 39.9, "elapsed_time": "0:38:49", "remaining_time": "0:58:29", "throughput": 4264.33, "total_tokens": 9934608} {"current_steps": 15230, "total_steps": 38160, "loss": 0.4153, "lr": 0.0007513850497240861, "epoch": 7.982180293501048, "percentage": 39.91, "elapsed_time": "0:38:50", "remaining_time": "0:58:28", "throughput": 4264.32, "total_tokens": 9937456} {"current_steps": 15235, "total_steps": 38160, "loss": 0.5064, "lr": 0.0007511873429074676, "epoch": 7.984800838574423, "percentage": 39.92, "elapsed_time": "0:38:51", "remaining_time": "0:58:27", "throughput": 4264.41, "total_tokens": 9940816} {"current_steps": 15240, "total_steps": 38160, "loss": 0.3927, "lr": 0.0007509895835453224, "epoch": 7.987421383647799, "percentage": 39.94, "elapsed_time": "0:38:51", "remaining_time": "0:58:26", "throughput": 4264.49, "total_tokens": 9944080} {"current_steps": 15245, "total_steps": 38160, "loss": 0.4209, "lr": 0.0007507917716790201, "epoch": 7.990041928721174, "percentage": 39.95, "elapsed_time": "0:38:52", "remaining_time": "0:58:25", "throughput": 4264.4, "total_tokens": 9946480} {"current_steps": 15250, "total_steps": 38160, "loss": 0.4688, "lr": 0.0007505939073499401, "epoch": 7.9926624737945495, "percentage": 39.96, "elapsed_time": "0:38:53", "remaining_time": "0:58:25", "throughput": 4264.5, "total_tokens": 9949872} {"current_steps": 15255, "total_steps": 38160, "loss": 0.4237, "lr": 0.0007503959905994737, "epoch": 7.995283018867925, "percentage": 39.98, "elapsed_time": "0:38:53", "remaining_time": "0:58:24", "throughput": 4264.67, "total_tokens": 9953520} {"current_steps": 15260, "total_steps": 38160, "loss": 0.4793, "lr": 0.0007501980214690227, "epoch": 7.9979035639413, "percentage": 39.99, "elapsed_time": "0:38:54", "remaining_time": "0:58:23", "throughput": 4264.73, "total_tokens": 9956624} {"current_steps": 15264, "total_steps": 38160, "eval_loss": 0.4539332985877991, "epoch": 8.0, "percentage": 40.0, "elapsed_time": "0:39:08", "remaining_time": "0:58:43", "throughput": 4239.62, "total_tokens": 9958360} {"current_steps": 15265, "total_steps": 38160, "loss": 0.448, "lr": 0.00075, "epoch": 8.000524109014675, "percentage": 40.0, "elapsed_time": "0:39:10", "remaining_time": "0:58:45", "throughput": 4236.4, "total_tokens": 9958968} {"current_steps": 15270, "total_steps": 38160, "loss": 0.388, "lr": 0.0007498019262338295, "epoch": 8.00314465408805, "percentage": 40.02, "elapsed_time": "0:39:11", "remaining_time": "0:58:44", "throughput": 4236.36, "total_tokens": 9961624} {"current_steps": 15275, "total_steps": 38160, "loss": 0.5294, "lr": 0.0007496038002119459, "epoch": 8.005765199161425, "percentage": 40.03, "elapsed_time": "0:39:12", "remaining_time": "0:58:43", "throughput": 4236.38, "total_tokens": 9964600} {"current_steps": 15280, "total_steps": 38160, "loss": 0.4519, "lr": 0.000749405621975795, "epoch": 8.0083857442348, "percentage": 40.04, "elapsed_time": "0:39:12", "remaining_time": "0:58:43", "throughput": 4236.31, "total_tokens": 9967096} {"current_steps": 15285, "total_steps": 38160, "loss": 0.4108, "lr": 0.0007492073915668334, "epoch": 8.011006289308176, "percentage": 40.06, "elapsed_time": "0:39:13", "remaining_time": "0:58:42", "throughput": 4236.3, "total_tokens": 9969848} {"current_steps": 15290, "total_steps": 38160, "loss": 0.4293, "lr": 0.0007490091090265283, "epoch": 8.01362683438155, "percentage": 40.07, "elapsed_time": "0:39:14", "remaining_time": "0:58:41", "throughput": 4236.39, "total_tokens": 9973272} {"current_steps": 15295, "total_steps": 38160, "loss": 0.4019, "lr": 0.0007488107743963587, "epoch": 8.016247379454926, "percentage": 40.08, "elapsed_time": "0:39:14", "remaining_time": "0:58:40", "throughput": 4236.38, "total_tokens": 9975992} {"current_steps": 15300, "total_steps": 38160, "loss": 0.5395, "lr": 0.0007486123877178136, "epoch": 8.018867924528301, "percentage": 40.09, "elapsed_time": "0:39:15", "remaining_time": "0:58:39", "throughput": 4236.53, "total_tokens": 9979704} {"current_steps": 15305, "total_steps": 38160, "loss": 0.4772, "lr": 0.0007484139490323932, "epoch": 8.021488469601676, "percentage": 40.11, "elapsed_time": "0:39:16", "remaining_time": "0:58:38", "throughput": 4236.54, "total_tokens": 9982712} {"current_steps": 15310, "total_steps": 38160, "loss": 0.3334, "lr": 0.000748215458381609, "epoch": 8.024109014675052, "percentage": 40.12, "elapsed_time": "0:39:17", "remaining_time": "0:58:37", "throughput": 4236.53, "total_tokens": 9985560} {"current_steps": 15315, "total_steps": 38160, "loss": 0.3968, "lr": 0.0007480169158069826, "epoch": 8.026729559748428, "percentage": 40.13, "elapsed_time": "0:39:17", "remaining_time": "0:58:37", "throughput": 4236.7, "total_tokens": 9989272} {"current_steps": 15320, "total_steps": 38160, "loss": 0.3889, "lr": 0.0007478183213500468, "epoch": 8.029350104821804, "percentage": 40.15, "elapsed_time": "0:39:18", "remaining_time": "0:58:36", "throughput": 4236.68, "total_tokens": 9992088} {"current_steps": 15325, "total_steps": 38160, "loss": 0.4608, "lr": 0.0007476196750523456, "epoch": 8.031970649895179, "percentage": 40.16, "elapsed_time": "0:39:19", "remaining_time": "0:58:35", "throughput": 4236.68, "total_tokens": 9995032} {"current_steps": 15330, "total_steps": 38160, "loss": 0.338, "lr": 0.000747420976955433, "epoch": 8.034591194968554, "percentage": 40.17, "elapsed_time": "0:39:19", "remaining_time": "0:58:34", "throughput": 4236.7, "total_tokens": 9998008} {"current_steps": 15335, "total_steps": 38160, "loss": 0.5982, "lr": 0.0007472222271008752, "epoch": 8.03721174004193, "percentage": 40.19, "elapsed_time": "0:39:20", "remaining_time": "0:58:33", "throughput": 4236.81, "total_tokens": 10001464} {"current_steps": 15340, "total_steps": 38160, "loss": 0.427, "lr": 0.0007470234255302478, "epoch": 8.039832285115304, "percentage": 40.2, "elapsed_time": "0:39:21", "remaining_time": "0:58:32", "throughput": 4236.83, "total_tokens": 10004472} {"current_steps": 15345, "total_steps": 38160, "loss": 0.4309, "lr": 0.0007468245722851379, "epoch": 8.04245283018868, "percentage": 40.21, "elapsed_time": "0:39:21", "remaining_time": "0:58:31", "throughput": 4236.79, "total_tokens": 10007160} {"current_steps": 15350, "total_steps": 38160, "loss": 0.5246, "lr": 0.0007466256674071434, "epoch": 8.045073375262055, "percentage": 40.23, "elapsed_time": "0:39:22", "remaining_time": "0:58:30", "throughput": 4236.81, "total_tokens": 10010136} {"current_steps": 15355, "total_steps": 38160, "loss": 0.4998, "lr": 0.000746426710937873, "epoch": 8.04769392033543, "percentage": 40.24, "elapsed_time": "0:39:23", "remaining_time": "0:58:30", "throughput": 4236.91, "total_tokens": 10013560} {"current_steps": 15360, "total_steps": 38160, "loss": 0.4469, "lr": 0.0007462277029189461, "epoch": 8.050314465408805, "percentage": 40.25, "elapsed_time": "0:39:24", "remaining_time": "0:58:29", "throughput": 4236.86, "total_tokens": 10016280} {"current_steps": 15365, "total_steps": 38160, "loss": 0.6, "lr": 0.0007460286433919928, "epoch": 8.05293501048218, "percentage": 40.26, "elapsed_time": "0:39:24", "remaining_time": "0:58:28", "throughput": 4236.86, "total_tokens": 10019096} {"current_steps": 15370, "total_steps": 38160, "loss": 0.511, "lr": 0.0007458295323986542, "epoch": 8.055555555555555, "percentage": 40.28, "elapsed_time": "0:39:25", "remaining_time": "0:58:27", "throughput": 4236.91, "total_tokens": 10022200} {"current_steps": 15375, "total_steps": 38160, "loss": 0.4542, "lr": 0.0007456303699805817, "epoch": 8.05817610062893, "percentage": 40.29, "elapsed_time": "0:39:26", "remaining_time": "0:58:26", "throughput": 4237.0, "total_tokens": 10025528} {"current_steps": 15380, "total_steps": 38160, "loss": 0.5148, "lr": 0.0007454311561794386, "epoch": 8.060796645702306, "percentage": 40.3, "elapsed_time": "0:39:27", "remaining_time": "0:58:25", "throughput": 4237.34, "total_tokens": 10030104} {"current_steps": 15385, "total_steps": 38160, "loss": 0.5267, "lr": 0.0007452318910368972, "epoch": 8.06341719077568, "percentage": 40.32, "elapsed_time": "0:39:27", "remaining_time": "0:58:25", "throughput": 4237.37, "total_tokens": 10033112} {"current_steps": 15390, "total_steps": 38160, "loss": 0.4152, "lr": 0.0007450325745946422, "epoch": 8.066037735849056, "percentage": 40.33, "elapsed_time": "0:39:28", "remaining_time": "0:58:24", "throughput": 4237.42, "total_tokens": 10036280} {"current_steps": 15395, "total_steps": 38160, "loss": 0.3682, "lr": 0.0007448332068943681, "epoch": 8.068658280922431, "percentage": 40.34, "elapsed_time": "0:39:29", "remaining_time": "0:58:23", "throughput": 4237.43, "total_tokens": 10039160} {"current_steps": 15400, "total_steps": 38160, "loss": 0.4283, "lr": 0.0007446337879777802, "epoch": 8.071278825995806, "percentage": 40.36, "elapsed_time": "0:39:29", "remaining_time": "0:58:22", "throughput": 4237.66, "total_tokens": 10043224} {"current_steps": 15405, "total_steps": 38160, "loss": 0.4139, "lr": 0.0007444343178865948, "epoch": 8.073899371069182, "percentage": 40.37, "elapsed_time": "0:39:30", "remaining_time": "0:58:21", "throughput": 4237.64, "total_tokens": 10045976} {"current_steps": 15410, "total_steps": 38160, "loss": 0.387, "lr": 0.0007442347966625389, "epoch": 8.076519916142558, "percentage": 40.38, "elapsed_time": "0:39:31", "remaining_time": "0:58:20", "throughput": 4237.62, "total_tokens": 10048824} {"current_steps": 15415, "total_steps": 38160, "loss": 0.4482, "lr": 0.0007440352243473496, "epoch": 8.079140461215934, "percentage": 40.4, "elapsed_time": "0:39:31", "remaining_time": "0:58:19", "throughput": 4237.6, "total_tokens": 10051512} {"current_steps": 15420, "total_steps": 38160, "loss": 0.5499, "lr": 0.0007438356009827758, "epoch": 8.081761006289309, "percentage": 40.41, "elapsed_time": "0:39:32", "remaining_time": "0:58:19", "throughput": 4237.65, "total_tokens": 10054712} {"current_steps": 15425, "total_steps": 38160, "loss": 0.5347, "lr": 0.0007436359266105759, "epoch": 8.084381551362684, "percentage": 40.42, "elapsed_time": "0:39:33", "remaining_time": "0:58:18", "throughput": 4237.77, "total_tokens": 10058232} {"current_steps": 15430, "total_steps": 38160, "loss": 0.4843, "lr": 0.0007434362012725198, "epoch": 8.08700209643606, "percentage": 40.44, "elapsed_time": "0:39:34", "remaining_time": "0:58:17", "throughput": 4237.92, "total_tokens": 10061880} {"current_steps": 15435, "total_steps": 38160, "loss": 0.4756, "lr": 0.0007432364250103877, "epoch": 8.089622641509434, "percentage": 40.45, "elapsed_time": "0:39:34", "remaining_time": "0:58:16", "throughput": 4237.96, "total_tokens": 10064984} {"current_steps": 15440, "total_steps": 38160, "loss": 0.4515, "lr": 0.0007430365978659704, "epoch": 8.09224318658281, "percentage": 40.46, "elapsed_time": "0:39:35", "remaining_time": "0:58:15", "throughput": 4237.86, "total_tokens": 10067384} {"current_steps": 15445, "total_steps": 38160, "loss": 0.4576, "lr": 0.0007428367198810694, "epoch": 8.094863731656185, "percentage": 40.47, "elapsed_time": "0:39:36", "remaining_time": "0:58:14", "throughput": 4237.98, "total_tokens": 10070776} {"current_steps": 15450, "total_steps": 38160, "loss": 0.3642, "lr": 0.0007426367910974973, "epoch": 8.09748427672956, "percentage": 40.49, "elapsed_time": "0:39:37", "remaining_time": "0:58:14", "throughput": 4238.09, "total_tokens": 10074104} {"current_steps": 15455, "total_steps": 38160, "loss": 0.3941, "lr": 0.0007424368115570763, "epoch": 8.100104821802935, "percentage": 40.5, "elapsed_time": "0:39:37", "remaining_time": "0:58:13", "throughput": 4238.24, "total_tokens": 10077784} {"current_steps": 15460, "total_steps": 38160, "loss": 0.5034, "lr": 0.0007422367813016405, "epoch": 8.10272536687631, "percentage": 40.51, "elapsed_time": "0:39:38", "remaining_time": "0:58:12", "throughput": 4238.55, "total_tokens": 10082392} {"current_steps": 15465, "total_steps": 38160, "loss": 0.398, "lr": 0.0007420367003730335, "epoch": 8.105345911949685, "percentage": 40.53, "elapsed_time": "0:39:39", "remaining_time": "0:58:11", "throughput": 4238.64, "total_tokens": 10085656} {"current_steps": 15470, "total_steps": 38160, "loss": 0.4781, "lr": 0.0007418365688131103, "epoch": 8.10796645702306, "percentage": 40.54, "elapsed_time": "0:39:40", "remaining_time": "0:58:11", "throughput": 4238.83, "total_tokens": 10089688} {"current_steps": 15475, "total_steps": 38160, "loss": 0.5415, "lr": 0.0007416363866637356, "epoch": 8.110587002096436, "percentage": 40.55, "elapsed_time": "0:39:40", "remaining_time": "0:58:10", "throughput": 4238.84, "total_tokens": 10092632} {"current_steps": 15480, "total_steps": 38160, "loss": 0.4565, "lr": 0.0007414361539667857, "epoch": 8.11320754716981, "percentage": 40.57, "elapsed_time": "0:39:41", "remaining_time": "0:58:09", "throughput": 4238.8, "total_tokens": 10095384} {"current_steps": 15485, "total_steps": 38160, "loss": 0.5165, "lr": 0.0007412358707641468, "epoch": 8.115828092243186, "percentage": 40.58, "elapsed_time": "0:39:42", "remaining_time": "0:58:09", "throughput": 4239.28, "total_tokens": 10101272} {"current_steps": 15490, "total_steps": 38160, "loss": 0.5086, "lr": 0.0007410355370977158, "epoch": 8.118448637316561, "percentage": 40.59, "elapsed_time": "0:39:43", "remaining_time": "0:58:08", "throughput": 4239.43, "total_tokens": 10104920} {"current_steps": 15495, "total_steps": 38160, "loss": 0.4807, "lr": 0.0007408351530094005, "epoch": 8.121069182389936, "percentage": 40.61, "elapsed_time": "0:39:44", "remaining_time": "0:58:07", "throughput": 4239.56, "total_tokens": 10108440} {"current_steps": 15500, "total_steps": 38160, "loss": 0.4061, "lr": 0.0007406347185411187, "epoch": 8.123689727463312, "percentage": 40.62, "elapsed_time": "0:39:45", "remaining_time": "0:58:06", "throughput": 4239.63, "total_tokens": 10111672} {"current_steps": 15505, "total_steps": 38160, "loss": 0.5184, "lr": 0.0007404342337347992, "epoch": 8.126310272536688, "percentage": 40.63, "elapsed_time": "0:39:45", "remaining_time": "0:58:06", "throughput": 4239.8, "total_tokens": 10115448} {"current_steps": 15510, "total_steps": 38160, "loss": 0.3763, "lr": 0.000740233698632381, "epoch": 8.128930817610064, "percentage": 40.64, "elapsed_time": "0:39:46", "remaining_time": "0:58:05", "throughput": 4239.79, "total_tokens": 10118328} {"current_steps": 15515, "total_steps": 38160, "loss": 0.4825, "lr": 0.0007400331132758136, "epoch": 8.131551362683439, "percentage": 40.66, "elapsed_time": "0:39:47", "remaining_time": "0:58:04", "throughput": 4240.02, "total_tokens": 10122328} {"current_steps": 15520, "total_steps": 38160, "loss": 0.4991, "lr": 0.0007398324777070576, "epoch": 8.134171907756814, "percentage": 40.67, "elapsed_time": "0:39:47", "remaining_time": "0:58:03", "throughput": 4240.01, "total_tokens": 10125112} {"current_steps": 15525, "total_steps": 38160, "loss": 0.3635, "lr": 0.0007396317919680832, "epoch": 8.13679245283019, "percentage": 40.68, "elapsed_time": "0:39:48", "remaining_time": "0:58:02", "throughput": 4240.07, "total_tokens": 10128280} {"current_steps": 15530, "total_steps": 38160, "loss": 0.3623, "lr": 0.0007394310561008717, "epoch": 8.139412997903564, "percentage": 40.7, "elapsed_time": "0:39:49", "remaining_time": "0:58:01", "throughput": 4240.11, "total_tokens": 10131320} {"current_steps": 15535, "total_steps": 38160, "loss": 0.4633, "lr": 0.0007392302701474151, "epoch": 8.14203354297694, "percentage": 40.71, "elapsed_time": "0:39:50", "remaining_time": "0:58:01", "throughput": 4240.33, "total_tokens": 10135384} {"current_steps": 15540, "total_steps": 38160, "loss": 0.5788, "lr": 0.0007390294341497151, "epoch": 8.144654088050315, "percentage": 40.72, "elapsed_time": "0:39:50", "remaining_time": "0:58:00", "throughput": 4240.39, "total_tokens": 10138520} {"current_steps": 15545, "total_steps": 38160, "loss": 0.4522, "lr": 0.0007388285481497845, "epoch": 8.14727463312369, "percentage": 40.74, "elapsed_time": "0:39:51", "remaining_time": "0:57:59", "throughput": 4240.42, "total_tokens": 10141528} {"current_steps": 15550, "total_steps": 38160, "loss": 0.5004, "lr": 0.0007386276121896465, "epoch": 8.149895178197065, "percentage": 40.75, "elapsed_time": "0:39:52", "remaining_time": "0:57:58", "throughput": 4240.44, "total_tokens": 10144568} {"current_steps": 15555, "total_steps": 38160, "loss": 0.4567, "lr": 0.0007384266263113342, "epoch": 8.15251572327044, "percentage": 40.76, "elapsed_time": "0:39:53", "remaining_time": "0:57:57", "throughput": 4240.67, "total_tokens": 10148504} {"current_steps": 15560, "total_steps": 38160, "loss": 0.4814, "lr": 0.0007382255905568919, "epoch": 8.155136268343815, "percentage": 40.78, "elapsed_time": "0:39:53", "remaining_time": "0:57:56", "throughput": 4240.65, "total_tokens": 10151288} {"current_steps": 15565, "total_steps": 38160, "loss": 0.4558, "lr": 0.000738024504968374, "epoch": 8.15775681341719, "percentage": 40.79, "elapsed_time": "0:39:54", "remaining_time": "0:57:56", "throughput": 4240.77, "total_tokens": 10154744} {"current_steps": 15570, "total_steps": 38160, "loss": 0.358, "lr": 0.0007378233695878449, "epoch": 8.160377358490566, "percentage": 40.8, "elapsed_time": "0:39:55", "remaining_time": "0:57:55", "throughput": 4240.87, "total_tokens": 10158136} {"current_steps": 15575, "total_steps": 38160, "loss": 0.4109, "lr": 0.0007376221844573803, "epoch": 8.16299790356394, "percentage": 40.81, "elapsed_time": "0:39:56", "remaining_time": "0:57:54", "throughput": 4240.97, "total_tokens": 10161560} {"current_steps": 15580, "total_steps": 38160, "loss": 0.495, "lr": 0.0007374209496190656, "epoch": 8.165618448637316, "percentage": 40.83, "elapsed_time": "0:39:56", "remaining_time": "0:57:53", "throughput": 4240.88, "total_tokens": 10163960} {"current_steps": 15585, "total_steps": 38160, "loss": 0.3452, "lr": 0.0007372196651149968, "epoch": 8.168238993710691, "percentage": 40.84, "elapsed_time": "0:39:57", "remaining_time": "0:57:52", "throughput": 4240.88, "total_tokens": 10166776} {"current_steps": 15590, "total_steps": 38160, "loss": 0.3459, "lr": 0.0007370183309872805, "epoch": 8.170859538784066, "percentage": 40.85, "elapsed_time": "0:39:57", "remaining_time": "0:57:51", "throughput": 4240.87, "total_tokens": 10169592} {"current_steps": 15595, "total_steps": 38160, "loss": 0.4298, "lr": 0.0007368169472780335, "epoch": 8.173480083857442, "percentage": 40.87, "elapsed_time": "0:39:58", "remaining_time": "0:57:50", "throughput": 4240.94, "total_tokens": 10172760} {"current_steps": 15600, "total_steps": 38160, "loss": 0.4605, "lr": 0.0007366155140293828, "epoch": 8.176100628930818, "percentage": 40.88, "elapsed_time": "0:39:59", "remaining_time": "0:57:50", "throughput": 4241.28, "total_tokens": 10177496} {"current_steps": 15605, "total_steps": 38160, "loss": 0.4404, "lr": 0.000736414031283466, "epoch": 8.178721174004194, "percentage": 40.89, "elapsed_time": "0:40:00", "remaining_time": "0:57:49", "throughput": 4241.44, "total_tokens": 10181112} {"current_steps": 15610, "total_steps": 38160, "loss": 0.4784, "lr": 0.000736212499082431, "epoch": 8.181341719077569, "percentage": 40.91, "elapsed_time": "0:40:01", "remaining_time": "0:57:48", "throughput": 4241.56, "total_tokens": 10184632} {"current_steps": 15615, "total_steps": 38160, "loss": 0.4417, "lr": 0.0007360109174684359, "epoch": 8.183962264150944, "percentage": 40.92, "elapsed_time": "0:40:01", "remaining_time": "0:57:47", "throughput": 4241.58, "total_tokens": 10187576} {"current_steps": 15620, "total_steps": 38160, "loss": 0.5626, "lr": 0.0007358092864836497, "epoch": 8.18658280922432, "percentage": 40.93, "elapsed_time": "0:40:02", "remaining_time": "0:57:46", "throughput": 4241.62, "total_tokens": 10190648} {"current_steps": 15625, "total_steps": 38160, "loss": 0.3287, "lr": 0.0007356076061702508, "epoch": 8.189203354297694, "percentage": 40.95, "elapsed_time": "0:40:03", "remaining_time": "0:57:46", "throughput": 4241.7, "total_tokens": 10193944} {"current_steps": 15630, "total_steps": 38160, "loss": 0.4079, "lr": 0.0007354058765704288, "epoch": 8.19182389937107, "percentage": 40.96, "elapsed_time": "0:40:03", "remaining_time": "0:57:45", "throughput": 4241.66, "total_tokens": 10196824} {"current_steps": 15635, "total_steps": 38160, "loss": 0.5183, "lr": 0.000735204097726383, "epoch": 8.194444444444445, "percentage": 40.97, "elapsed_time": "0:40:04", "remaining_time": "0:57:44", "throughput": 4241.79, "total_tokens": 10200312} {"current_steps": 15640, "total_steps": 38160, "loss": 0.5734, "lr": 0.0007350022696803233, "epoch": 8.19706498951782, "percentage": 40.99, "elapsed_time": "0:40:05", "remaining_time": "0:57:43", "throughput": 4241.95, "total_tokens": 10203992} {"current_steps": 15645, "total_steps": 38160, "loss": 0.416, "lr": 0.0007348003924744699, "epoch": 8.199685534591195, "percentage": 41.0, "elapsed_time": "0:40:06", "remaining_time": "0:57:42", "throughput": 4241.95, "total_tokens": 10206904} {"current_steps": 15650, "total_steps": 38160, "loss": 0.4541, "lr": 0.000734598466151053, "epoch": 8.20230607966457, "percentage": 41.01, "elapsed_time": "0:40:06", "remaining_time": "0:57:41", "throughput": 4241.97, "total_tokens": 10209880} {"current_steps": 15655, "total_steps": 38160, "loss": 0.5031, "lr": 0.0007343964907523135, "epoch": 8.204926624737945, "percentage": 41.02, "elapsed_time": "0:40:07", "remaining_time": "0:57:41", "throughput": 4242.47, "total_tokens": 10215864} {"current_steps": 15660, "total_steps": 38160, "loss": 0.4471, "lr": 0.0007341944663205023, "epoch": 8.20754716981132, "percentage": 41.04, "elapsed_time": "0:40:08", "remaining_time": "0:57:40", "throughput": 4242.51, "total_tokens": 10218904} {"current_steps": 15665, "total_steps": 38160, "loss": 0.4026, "lr": 0.0007339923928978805, "epoch": 8.210167714884696, "percentage": 41.05, "elapsed_time": "0:40:09", "remaining_time": "0:57:40", "throughput": 4243.06, "total_tokens": 10225048} {"current_steps": 15670, "total_steps": 38160, "loss": 0.4522, "lr": 0.0007337902705267197, "epoch": 8.21278825995807, "percentage": 41.06, "elapsed_time": "0:40:10", "remaining_time": "0:57:39", "throughput": 4243.0, "total_tokens": 10227576} {"current_steps": 15675, "total_steps": 38160, "loss": 0.6135, "lr": 0.0007335880992493016, "epoch": 8.215408805031446, "percentage": 41.08, "elapsed_time": "0:40:11", "remaining_time": "0:57:38", "throughput": 4243.05, "total_tokens": 10230712} {"current_steps": 15680, "total_steps": 38160, "loss": 0.544, "lr": 0.000733385879107918, "epoch": 8.218029350104821, "percentage": 41.09, "elapsed_time": "0:40:11", "remaining_time": "0:57:37", "throughput": 4243.1, "total_tokens": 10233848} {"current_steps": 15685, "total_steps": 38160, "loss": 0.4757, "lr": 0.000733183610144871, "epoch": 8.220649895178196, "percentage": 41.1, "elapsed_time": "0:40:12", "remaining_time": "0:57:37", "throughput": 4243.31, "total_tokens": 10237816} {"current_steps": 15690, "total_steps": 38160, "loss": 0.4344, "lr": 0.0007329812924024732, "epoch": 8.223270440251572, "percentage": 41.12, "elapsed_time": "0:40:13", "remaining_time": "0:57:36", "throughput": 4243.41, "total_tokens": 10241272} {"current_steps": 15695, "total_steps": 38160, "loss": 0.4673, "lr": 0.0007327789259230468, "epoch": 8.225890985324948, "percentage": 41.13, "elapsed_time": "0:40:14", "remaining_time": "0:57:35", "throughput": 4243.36, "total_tokens": 10243864} {"current_steps": 15700, "total_steps": 38160, "loss": 0.3279, "lr": 0.0007325765107489249, "epoch": 8.228511530398324, "percentage": 41.14, "elapsed_time": "0:40:14", "remaining_time": "0:57:34", "throughput": 4243.36, "total_tokens": 10246712} {"current_steps": 15705, "total_steps": 38160, "loss": 0.5034, "lr": 0.0007323740469224505, "epoch": 8.231132075471699, "percentage": 41.16, "elapsed_time": "0:40:15", "remaining_time": "0:57:33", "throughput": 4243.56, "total_tokens": 10250648} {"current_steps": 15710, "total_steps": 38160, "loss": 0.4929, "lr": 0.0007321715344859763, "epoch": 8.233752620545074, "percentage": 41.17, "elapsed_time": "0:40:16", "remaining_time": "0:57:32", "throughput": 4243.59, "total_tokens": 10253624} {"current_steps": 15715, "total_steps": 38160, "loss": 0.426, "lr": 0.000731968973481866, "epoch": 8.23637316561845, "percentage": 41.18, "elapsed_time": "0:40:16", "remaining_time": "0:57:32", "throughput": 4243.59, "total_tokens": 10256536} {"current_steps": 15720, "total_steps": 38160, "loss": 0.4262, "lr": 0.0007317663639524928, "epoch": 8.238993710691824, "percentage": 41.19, "elapsed_time": "0:40:17", "remaining_time": "0:57:31", "throughput": 4243.59, "total_tokens": 10259448} {"current_steps": 15725, "total_steps": 38160, "loss": 0.4584, "lr": 0.0007315637059402404, "epoch": 8.2416142557652, "percentage": 41.21, "elapsed_time": "0:40:18", "remaining_time": "0:57:30", "throughput": 4243.89, "total_tokens": 10263768} {"current_steps": 15730, "total_steps": 38160, "loss": 0.4811, "lr": 0.0007313609994875024, "epoch": 8.244234800838575, "percentage": 41.22, "elapsed_time": "0:40:19", "remaining_time": "0:57:29", "throughput": 4243.89, "total_tokens": 10266712} {"current_steps": 15735, "total_steps": 38160, "loss": 0.6723, "lr": 0.0007311582446366831, "epoch": 8.24685534591195, "percentage": 41.23, "elapsed_time": "0:40:19", "remaining_time": "0:57:28", "throughput": 4244.12, "total_tokens": 10270712} {"current_steps": 15740, "total_steps": 38160, "loss": 0.5871, "lr": 0.000730955441430196, "epoch": 8.249475890985325, "percentage": 41.25, "elapsed_time": "0:40:20", "remaining_time": "0:57:28", "throughput": 4244.3, "total_tokens": 10274456} {"current_steps": 15745, "total_steps": 38160, "loss": 0.4464, "lr": 0.0007307525899104655, "epoch": 8.2520964360587, "percentage": 41.26, "elapsed_time": "0:40:21", "remaining_time": "0:57:27", "throughput": 4244.6, "total_tokens": 10278840} {"current_steps": 15750, "total_steps": 38160, "loss": 0.3343, "lr": 0.0007305496901199259, "epoch": 8.254716981132075, "percentage": 41.27, "elapsed_time": "0:40:22", "remaining_time": "0:57:26", "throughput": 4244.7, "total_tokens": 10282104} {"current_steps": 15755, "total_steps": 38160, "loss": 0.5292, "lr": 0.0007303467421010211, "epoch": 8.25733752620545, "percentage": 41.29, "elapsed_time": "0:40:23", "remaining_time": "0:57:25", "throughput": 4244.77, "total_tokens": 10285272} {"current_steps": 15760, "total_steps": 38160, "loss": 0.4461, "lr": 0.0007301437458962061, "epoch": 8.259958071278826, "percentage": 41.3, "elapsed_time": "0:40:23", "remaining_time": "0:57:24", "throughput": 4244.84, "total_tokens": 10288472} {"current_steps": 15765, "total_steps": 38160, "loss": 0.5011, "lr": 0.0007299407015479448, "epoch": 8.2625786163522, "percentage": 41.31, "elapsed_time": "0:40:24", "remaining_time": "0:57:23", "throughput": 4244.8, "total_tokens": 10291128} {"current_steps": 15770, "total_steps": 38160, "loss": 0.4603, "lr": 0.0007297376090987122, "epoch": 8.265199161425576, "percentage": 41.33, "elapsed_time": "0:40:25", "remaining_time": "0:57:23", "throughput": 4245.03, "total_tokens": 10295288} {"current_steps": 15775, "total_steps": 38160, "loss": 0.4338, "lr": 0.0007295344685909926, "epoch": 8.267819706498951, "percentage": 41.34, "elapsed_time": "0:40:25", "remaining_time": "0:57:22", "throughput": 4245.13, "total_tokens": 10298680} {"current_steps": 15780, "total_steps": 38160, "loss": 0.4846, "lr": 0.000729331280067281, "epoch": 8.270440251572326, "percentage": 41.35, "elapsed_time": "0:40:26", "remaining_time": "0:57:21", "throughput": 4245.12, "total_tokens": 10301496} {"current_steps": 15785, "total_steps": 38160, "loss": 0.3779, "lr": 0.0007291280435700819, "epoch": 8.273060796645701, "percentage": 41.37, "elapsed_time": "0:40:27", "remaining_time": "0:57:20", "throughput": 4245.05, "total_tokens": 10303992} {"current_steps": 15790, "total_steps": 38160, "loss": 0.4063, "lr": 0.0007289247591419102, "epoch": 8.275681341719078, "percentage": 41.38, "elapsed_time": "0:40:27", "remaining_time": "0:57:19", "throughput": 4245.04, "total_tokens": 10306808} {"current_steps": 15795, "total_steps": 38160, "loss": 0.4089, "lr": 0.0007287214268252904, "epoch": 8.278301886792454, "percentage": 41.39, "elapsed_time": "0:40:28", "remaining_time": "0:57:19", "throughput": 4245.21, "total_tokens": 10310584} {"current_steps": 15800, "total_steps": 38160, "loss": 0.3499, "lr": 0.0007285180466627577, "epoch": 8.280922431865829, "percentage": 41.4, "elapsed_time": "0:40:29", "remaining_time": "0:57:18", "throughput": 4245.5, "total_tokens": 10314872} {"current_steps": 15805, "total_steps": 38160, "loss": 0.3708, "lr": 0.0007283146186968565, "epoch": 8.283542976939204, "percentage": 41.42, "elapsed_time": "0:40:30", "remaining_time": "0:57:17", "throughput": 4245.5, "total_tokens": 10317624} {"current_steps": 15810, "total_steps": 38160, "loss": 0.3894, "lr": 0.000728111142970142, "epoch": 8.286163522012579, "percentage": 41.43, "elapsed_time": "0:40:30", "remaining_time": "0:57:16", "throughput": 4245.47, "total_tokens": 10320408} {"current_steps": 15815, "total_steps": 38160, "loss": 0.498, "lr": 0.0007279076195251788, "epoch": 8.288784067085954, "percentage": 41.44, "elapsed_time": "0:40:31", "remaining_time": "0:57:15", "throughput": 4245.49, "total_tokens": 10323320} {"current_steps": 15820, "total_steps": 38160, "loss": 0.3803, "lr": 0.0007277040484045416, "epoch": 8.29140461215933, "percentage": 41.46, "elapsed_time": "0:40:32", "remaining_time": "0:57:14", "throughput": 4245.61, "total_tokens": 10326776} {"current_steps": 15825, "total_steps": 38160, "loss": 0.2886, "lr": 0.0007275004296508154, "epoch": 8.294025157232705, "percentage": 41.47, "elapsed_time": "0:40:33", "remaining_time": "0:57:14", "throughput": 4245.81, "total_tokens": 10330584} {"current_steps": 15830, "total_steps": 38160, "loss": 0.4489, "lr": 0.0007272967633065947, "epoch": 8.29664570230608, "percentage": 41.48, "elapsed_time": "0:40:33", "remaining_time": "0:57:13", "throughput": 4245.69, "total_tokens": 10332824} {"current_steps": 15835, "total_steps": 38160, "loss": 0.5632, "lr": 0.0007270930494144843, "epoch": 8.299266247379455, "percentage": 41.5, "elapsed_time": "0:40:34", "remaining_time": "0:57:12", "throughput": 4245.66, "total_tokens": 10335480} {"current_steps": 15840, "total_steps": 38160, "loss": 0.4803, "lr": 0.0007268892880170988, "epoch": 8.30188679245283, "percentage": 41.51, "elapsed_time": "0:40:35", "remaining_time": "0:57:11", "throughput": 4245.68, "total_tokens": 10338424} {"current_steps": 15845, "total_steps": 38160, "loss": 0.464, "lr": 0.0007266854791570625, "epoch": 8.304507337526205, "percentage": 41.52, "elapsed_time": "0:40:35", "remaining_time": "0:57:10", "throughput": 4245.78, "total_tokens": 10341784} {"current_steps": 15850, "total_steps": 38160, "loss": 0.4462, "lr": 0.0007264816228770103, "epoch": 8.30712788259958, "percentage": 41.54, "elapsed_time": "0:40:36", "remaining_time": "0:57:09", "throughput": 4245.86, "total_tokens": 10345144} {"current_steps": 15855, "total_steps": 38160, "loss": 0.4094, "lr": 0.0007262777192195866, "epoch": 8.309748427672956, "percentage": 41.55, "elapsed_time": "0:40:37", "remaining_time": "0:57:08", "throughput": 4246.06, "total_tokens": 10348984} {"current_steps": 15860, "total_steps": 38160, "loss": 0.4641, "lr": 0.0007260737682274452, "epoch": 8.31236897274633, "percentage": 41.56, "elapsed_time": "0:40:38", "remaining_time": "0:57:07", "throughput": 4246.12, "total_tokens": 10352152} {"current_steps": 15865, "total_steps": 38160, "loss": 0.5134, "lr": 0.0007258697699432511, "epoch": 8.314989517819706, "percentage": 41.57, "elapsed_time": "0:40:38", "remaining_time": "0:57:06", "throughput": 4245.99, "total_tokens": 10354392} {"current_steps": 15870, "total_steps": 38160, "loss": 0.7279, "lr": 0.0007256657244096775, "epoch": 8.317610062893081, "percentage": 41.59, "elapsed_time": "0:40:39", "remaining_time": "0:57:06", "throughput": 4246.01, "total_tokens": 10357368} {"current_steps": 15875, "total_steps": 38160, "loss": 0.4135, "lr": 0.0007254616316694091, "epoch": 8.320230607966456, "percentage": 41.6, "elapsed_time": "0:40:39", "remaining_time": "0:57:05", "throughput": 4245.95, "total_tokens": 10359864} {"current_steps": 15880, "total_steps": 38160, "loss": 0.5901, "lr": 0.0007252574917651398, "epoch": 8.322851153039831, "percentage": 41.61, "elapsed_time": "0:40:40", "remaining_time": "0:57:04", "throughput": 4246.26, "total_tokens": 10364536} {"current_steps": 15885, "total_steps": 38160, "loss": 0.4941, "lr": 0.0007250533047395728, "epoch": 8.325471698113208, "percentage": 41.63, "elapsed_time": "0:40:41", "remaining_time": "0:57:03", "throughput": 4246.34, "total_tokens": 10367864} {"current_steps": 15890, "total_steps": 38160, "loss": 0.5218, "lr": 0.0007248490706354221, "epoch": 8.328092243186584, "percentage": 41.64, "elapsed_time": "0:40:42", "remaining_time": "0:57:03", "throughput": 4246.52, "total_tokens": 10371736} {"current_steps": 15895, "total_steps": 38160, "loss": 0.3332, "lr": 0.0007246447894954109, "epoch": 8.330712788259959, "percentage": 41.65, "elapsed_time": "0:40:43", "remaining_time": "0:57:02", "throughput": 4246.64, "total_tokens": 10375192} {"current_steps": 15900, "total_steps": 38160, "loss": 0.4251, "lr": 0.0007244404613622727, "epoch": 8.333333333333334, "percentage": 41.67, "elapsed_time": "0:40:44", "remaining_time": "0:57:02", "throughput": 4247.5, "total_tokens": 10383288} {"current_steps": 15905, "total_steps": 38160, "loss": 0.5489, "lr": 0.0007242360862787507, "epoch": 8.335953878406709, "percentage": 41.68, "elapsed_time": "0:40:45", "remaining_time": "0:57:01", "throughput": 4247.7, "total_tokens": 10387192} {"current_steps": 15910, "total_steps": 38160, "loss": 0.4212, "lr": 0.0007240316642875975, "epoch": 8.338574423480084, "percentage": 41.69, "elapsed_time": "0:40:45", "remaining_time": "0:57:00", "throughput": 4247.57, "total_tokens": 10389400} {"current_steps": 15915, "total_steps": 38160, "loss": 0.5033, "lr": 0.0007238271954315759, "epoch": 8.34119496855346, "percentage": 41.71, "elapsed_time": "0:40:46", "remaining_time": "0:56:59", "throughput": 4247.69, "total_tokens": 10392920} {"current_steps": 15920, "total_steps": 38160, "loss": 0.4463, "lr": 0.0007236226797534589, "epoch": 8.343815513626835, "percentage": 41.72, "elapsed_time": "0:40:47", "remaining_time": "0:56:59", "throughput": 4247.77, "total_tokens": 10396280} {"current_steps": 15925, "total_steps": 38160, "loss": 0.5118, "lr": 0.0007234181172960283, "epoch": 8.34643605870021, "percentage": 41.73, "elapsed_time": "0:40:48", "remaining_time": "0:56:58", "throughput": 4247.92, "total_tokens": 10399960} {"current_steps": 15930, "total_steps": 38160, "loss": 0.4551, "lr": 0.0007232135081020766, "epoch": 8.349056603773585, "percentage": 41.75, "elapsed_time": "0:40:48", "remaining_time": "0:56:57", "throughput": 4247.96, "total_tokens": 10403128} {"current_steps": 15935, "total_steps": 38160, "loss": 0.4246, "lr": 0.0007230088522144054, "epoch": 8.35167714884696, "percentage": 41.76, "elapsed_time": "0:40:49", "remaining_time": "0:56:56", "throughput": 4247.95, "total_tokens": 10405976} {"current_steps": 15940, "total_steps": 38160, "loss": 0.4433, "lr": 0.0007228041496758265, "epoch": 8.354297693920335, "percentage": 41.77, "elapsed_time": "0:40:50", "remaining_time": "0:56:55", "throughput": 4247.91, "total_tokens": 10408632} {"current_steps": 15945, "total_steps": 38160, "loss": 0.5252, "lr": 0.0007225994005291615, "epoch": 8.35691823899371, "percentage": 41.78, "elapsed_time": "0:40:51", "remaining_time": "0:56:54", "throughput": 4248.05, "total_tokens": 10412216} {"current_steps": 15950, "total_steps": 38160, "loss": 0.444, "lr": 0.0007223946048172414, "epoch": 8.359538784067086, "percentage": 41.8, "elapsed_time": "0:40:51", "remaining_time": "0:56:53", "throughput": 4247.97, "total_tokens": 10414680} {"current_steps": 15955, "total_steps": 38160, "loss": 0.5205, "lr": 0.0007221897625829072, "epoch": 8.36215932914046, "percentage": 41.81, "elapsed_time": "0:40:52", "remaining_time": "0:56:53", "throughput": 4247.98, "total_tokens": 10417560} {"current_steps": 15960, "total_steps": 38160, "loss": 0.3483, "lr": 0.0007219848738690095, "epoch": 8.364779874213836, "percentage": 41.82, "elapsed_time": "0:40:52", "remaining_time": "0:56:52", "throughput": 4247.9, "total_tokens": 10420056} {"current_steps": 15965, "total_steps": 38160, "loss": 0.3547, "lr": 0.0007217799387184089, "epoch": 8.367400419287211, "percentage": 41.84, "elapsed_time": "0:40:53", "remaining_time": "0:56:51", "throughput": 4247.97, "total_tokens": 10423288} {"current_steps": 15970, "total_steps": 38160, "loss": 0.5003, "lr": 0.0007215749571739752, "epoch": 8.370020964360586, "percentage": 41.85, "elapsed_time": "0:40:54", "remaining_time": "0:56:50", "throughput": 4247.88, "total_tokens": 10425752} {"current_steps": 15975, "total_steps": 38160, "loss": 0.3969, "lr": 0.0007213699292785883, "epoch": 8.372641509433961, "percentage": 41.86, "elapsed_time": "0:40:55", "remaining_time": "0:56:49", "throughput": 4248.04, "total_tokens": 10429432} {"current_steps": 15980, "total_steps": 38160, "loss": 0.448, "lr": 0.0007211648550751377, "epoch": 8.375262054507338, "percentage": 41.88, "elapsed_time": "0:40:55", "remaining_time": "0:56:48", "throughput": 4248.17, "total_tokens": 10432856} {"current_steps": 15985, "total_steps": 38160, "loss": 0.5244, "lr": 0.0007209597346065226, "epoch": 8.377882599580714, "percentage": 41.89, "elapsed_time": "0:40:56", "remaining_time": "0:56:47", "throughput": 4248.33, "total_tokens": 10436600} {"current_steps": 15990, "total_steps": 38160, "loss": 0.4207, "lr": 0.000720754567915652, "epoch": 8.380503144654089, "percentage": 41.9, "elapsed_time": "0:40:57", "remaining_time": "0:56:47", "throughput": 4248.32, "total_tokens": 10439352} {"current_steps": 15995, "total_steps": 38160, "loss": 0.4712, "lr": 0.000720549355045444, "epoch": 8.383123689727464, "percentage": 41.92, "elapsed_time": "0:40:57", "remaining_time": "0:56:46", "throughput": 4248.28, "total_tokens": 10441976} {"current_steps": 16000, "total_steps": 38160, "loss": 0.4836, "lr": 0.0007203440960388273, "epoch": 8.385744234800839, "percentage": 41.93, "elapsed_time": "0:40:58", "remaining_time": "0:56:45", "throughput": 4248.35, "total_tokens": 10445272} {"current_steps": 16005, "total_steps": 38160, "loss": 0.5374, "lr": 0.0007201387909387396, "epoch": 8.388364779874214, "percentage": 41.94, "elapsed_time": "0:40:59", "remaining_time": "0:56:44", "throughput": 4248.29, "total_tokens": 10447864} {"current_steps": 16010, "total_steps": 38160, "loss": 0.3996, "lr": 0.0007199334397881282, "epoch": 8.39098532494759, "percentage": 41.95, "elapsed_time": "0:41:00", "remaining_time": "0:56:43", "throughput": 4248.52, "total_tokens": 10451992} {"current_steps": 16015, "total_steps": 38160, "loss": 0.524, "lr": 0.0007197280426299502, "epoch": 8.393605870020965, "percentage": 41.97, "elapsed_time": "0:41:00", "remaining_time": "0:56:42", "throughput": 4248.55, "total_tokens": 10454968} {"current_steps": 16020, "total_steps": 38160, "loss": 0.4876, "lr": 0.0007195225995071727, "epoch": 8.39622641509434, "percentage": 41.98, "elapsed_time": "0:41:01", "remaining_time": "0:56:41", "throughput": 4248.67, "total_tokens": 10458392} {"current_steps": 16025, "total_steps": 38160, "loss": 0.5741, "lr": 0.0007193171104627718, "epoch": 8.398846960167715, "percentage": 41.99, "elapsed_time": "0:41:02", "remaining_time": "0:56:41", "throughput": 4248.64, "total_tokens": 10461144} {"current_steps": 16030, "total_steps": 38160, "loss": 0.4064, "lr": 0.0007191115755397333, "epoch": 8.40146750524109, "percentage": 42.01, "elapsed_time": "0:41:02", "remaining_time": "0:56:40", "throughput": 4248.59, "total_tokens": 10463768} {"current_steps": 16035, "total_steps": 38160, "loss": 0.422, "lr": 0.0007189059947810531, "epoch": 8.404088050314465, "percentage": 42.02, "elapsed_time": "0:41:03", "remaining_time": "0:56:39", "throughput": 4248.68, "total_tokens": 10467128} {"current_steps": 16040, "total_steps": 38160, "loss": 0.442, "lr": 0.0007187003682297363, "epoch": 8.40670859538784, "percentage": 42.03, "elapsed_time": "0:41:04", "remaining_time": "0:56:38", "throughput": 4248.53, "total_tokens": 10469240} {"current_steps": 16045, "total_steps": 38160, "loss": 0.4523, "lr": 0.0007184946959287972, "epoch": 8.409329140461216, "percentage": 42.05, "elapsed_time": "0:41:04", "remaining_time": "0:56:37", "throughput": 4248.65, "total_tokens": 10472728} {"current_steps": 16050, "total_steps": 38160, "loss": 0.3999, "lr": 0.0007182889779212609, "epoch": 8.41194968553459, "percentage": 42.06, "elapsed_time": "0:41:05", "remaining_time": "0:56:36", "throughput": 4248.52, "total_tokens": 10474936} {"current_steps": 16055, "total_steps": 38160, "loss": 0.4685, "lr": 0.0007180832142501605, "epoch": 8.414570230607966, "percentage": 42.07, "elapsed_time": "0:41:06", "remaining_time": "0:56:35", "throughput": 4248.6, "total_tokens": 10478264} {"current_steps": 16060, "total_steps": 38160, "loss": 0.5175, "lr": 0.0007178774049585397, "epoch": 8.417190775681341, "percentage": 42.09, "elapsed_time": "0:41:07", "remaining_time": "0:56:34", "throughput": 4248.64, "total_tokens": 10481432} {"current_steps": 16065, "total_steps": 38160, "loss": 0.4244, "lr": 0.0007176715500894515, "epoch": 8.419811320754716, "percentage": 42.1, "elapsed_time": "0:41:07", "remaining_time": "0:56:33", "throughput": 4248.56, "total_tokens": 10483864} {"current_steps": 16070, "total_steps": 38160, "loss": 0.5176, "lr": 0.0007174656496859584, "epoch": 8.422431865828091, "percentage": 42.11, "elapsed_time": "0:41:08", "remaining_time": "0:56:33", "throughput": 4248.7, "total_tokens": 10487480} {"current_steps": 16075, "total_steps": 38160, "loss": 0.3553, "lr": 0.0007172597037911323, "epoch": 8.425052410901468, "percentage": 42.13, "elapsed_time": "0:41:09", "remaining_time": "0:56:32", "throughput": 4248.76, "total_tokens": 10490616} {"current_steps": 16080, "total_steps": 38160, "loss": 0.3708, "lr": 0.0007170537124480548, "epoch": 8.427672955974844, "percentage": 42.14, "elapsed_time": "0:41:09", "remaining_time": "0:56:31", "throughput": 4248.77, "total_tokens": 10493528} {"current_steps": 16085, "total_steps": 38160, "loss": 0.5056, "lr": 0.0007168476756998169, "epoch": 8.430293501048219, "percentage": 42.15, "elapsed_time": "0:41:10", "remaining_time": "0:56:30", "throughput": 4248.8, "total_tokens": 10496568} {"current_steps": 16090, "total_steps": 38160, "loss": 0.4647, "lr": 0.0007166415935895194, "epoch": 8.432914046121594, "percentage": 42.16, "elapsed_time": "0:41:11", "remaining_time": "0:56:29", "throughput": 4248.89, "total_tokens": 10499992} {"current_steps": 16095, "total_steps": 38160, "loss": 0.5007, "lr": 0.0007164354661602718, "epoch": 8.435534591194969, "percentage": 42.18, "elapsed_time": "0:41:11", "remaining_time": "0:56:28", "throughput": 4248.88, "total_tokens": 10502840} {"current_steps": 16100, "total_steps": 38160, "loss": 0.4488, "lr": 0.000716229293455194, "epoch": 8.438155136268344, "percentage": 42.19, "elapsed_time": "0:41:12", "remaining_time": "0:56:27", "throughput": 4248.89, "total_tokens": 10505752} {"current_steps": 16105, "total_steps": 38160, "loss": 0.4627, "lr": 0.000716023075517415, "epoch": 8.44077568134172, "percentage": 42.2, "elapsed_time": "0:41:13", "remaining_time": "0:56:27", "throughput": 4248.9, "total_tokens": 10508664} {"current_steps": 16110, "total_steps": 38160, "loss": 0.506, "lr": 0.000715816812390073, "epoch": 8.443396226415095, "percentage": 42.22, "elapsed_time": "0:41:13", "remaining_time": "0:56:26", "throughput": 4248.88, "total_tokens": 10511416} {"current_steps": 16115, "total_steps": 38160, "loss": 0.4333, "lr": 0.0007156105041163161, "epoch": 8.44601677148847, "percentage": 42.23, "elapsed_time": "0:41:14", "remaining_time": "0:56:25", "throughput": 4248.82, "total_tokens": 10513944} {"current_steps": 16120, "total_steps": 38160, "loss": 0.4324, "lr": 0.0007154041507393015, "epoch": 8.448637316561845, "percentage": 42.24, "elapsed_time": "0:41:15", "remaining_time": "0:56:24", "throughput": 4248.9, "total_tokens": 10517208} {"current_steps": 16125, "total_steps": 38160, "loss": 0.4423, "lr": 0.000715197752302196, "epoch": 8.45125786163522, "percentage": 42.26, "elapsed_time": "0:41:15", "remaining_time": "0:56:23", "throughput": 4248.84, "total_tokens": 10519704} {"current_steps": 16130, "total_steps": 38160, "loss": 0.5851, "lr": 0.0007149913088481759, "epoch": 8.453878406708595, "percentage": 42.27, "elapsed_time": "0:41:16", "remaining_time": "0:56:22", "throughput": 4248.92, "total_tokens": 10523160} {"current_steps": 16135, "total_steps": 38160, "loss": 0.4291, "lr": 0.0007147848204204266, "epoch": 8.45649895178197, "percentage": 42.28, "elapsed_time": "0:41:17", "remaining_time": "0:56:21", "throughput": 4248.94, "total_tokens": 10526168} {"current_steps": 16140, "total_steps": 38160, "loss": 0.3886, "lr": 0.0007145782870621435, "epoch": 8.459119496855346, "percentage": 42.3, "elapsed_time": "0:41:18", "remaining_time": "0:56:20", "throughput": 4248.89, "total_tokens": 10528824} {"current_steps": 16145, "total_steps": 38160, "loss": 0.4094, "lr": 0.0007143717088165304, "epoch": 8.46174004192872, "percentage": 42.31, "elapsed_time": "0:41:18", "remaining_time": "0:56:19", "throughput": 4248.87, "total_tokens": 10531640} {"current_steps": 16150, "total_steps": 38160, "loss": 0.3739, "lr": 0.0007141650857268019, "epoch": 8.464360587002096, "percentage": 42.32, "elapsed_time": "0:41:19", "remaining_time": "0:56:19", "throughput": 4248.93, "total_tokens": 10534808} {"current_steps": 16155, "total_steps": 38160, "loss": 0.4562, "lr": 0.0007139584178361807, "epoch": 8.466981132075471, "percentage": 42.33, "elapsed_time": "0:41:20", "remaining_time": "0:56:18", "throughput": 4248.96, "total_tokens": 10537784} {"current_steps": 16160, "total_steps": 38160, "loss": 0.5133, "lr": 0.0007137517051878994, "epoch": 8.469601677148846, "percentage": 42.35, "elapsed_time": "0:41:20", "remaining_time": "0:56:17", "throughput": 4248.96, "total_tokens": 10540760} {"current_steps": 16165, "total_steps": 38160, "loss": 0.4194, "lr": 0.0007135449478251998, "epoch": 8.472222222222221, "percentage": 42.36, "elapsed_time": "0:41:21", "remaining_time": "0:56:16", "throughput": 4248.99, "total_tokens": 10543928} {"current_steps": 16170, "total_steps": 38160, "loss": 0.5887, "lr": 0.0007133381457913336, "epoch": 8.474842767295598, "percentage": 42.37, "elapsed_time": "0:41:22", "remaining_time": "0:56:15", "throughput": 4248.92, "total_tokens": 10546456} {"current_steps": 16175, "total_steps": 38160, "loss": 0.4573, "lr": 0.0007131312991295611, "epoch": 8.477463312368974, "percentage": 42.39, "elapsed_time": "0:41:22", "remaining_time": "0:56:14", "throughput": 4249.0, "total_tokens": 10549752} {"current_steps": 16180, "total_steps": 38160, "loss": 0.5054, "lr": 0.0007129244078831525, "epoch": 8.480083857442349, "percentage": 42.4, "elapsed_time": "0:41:23", "remaining_time": "0:56:13", "throughput": 4249.08, "total_tokens": 10553048} {"current_steps": 16185, "total_steps": 38160, "loss": 0.484, "lr": 0.0007127174720953866, "epoch": 8.482704402515724, "percentage": 42.41, "elapsed_time": "0:41:24", "remaining_time": "0:56:12", "throughput": 4249.05, "total_tokens": 10555768} {"current_steps": 16190, "total_steps": 38160, "loss": 0.5293, "lr": 0.0007125104918095526, "epoch": 8.485324947589099, "percentage": 42.43, "elapsed_time": "0:41:25", "remaining_time": "0:56:12", "throughput": 4249.22, "total_tokens": 10559448} {"current_steps": 16195, "total_steps": 38160, "loss": 0.6494, "lr": 0.0007123034670689483, "epoch": 8.487945492662474, "percentage": 42.44, "elapsed_time": "0:41:25", "remaining_time": "0:56:11", "throughput": 4249.17, "total_tokens": 10562008} {"current_steps": 16200, "total_steps": 38160, "loss": 0.5054, "lr": 0.0007120963979168804, "epoch": 8.49056603773585, "percentage": 42.45, "elapsed_time": "0:41:26", "remaining_time": "0:56:10", "throughput": 4249.14, "total_tokens": 10564760} {"current_steps": 16205, "total_steps": 38160, "loss": 0.5668, "lr": 0.000711889284396666, "epoch": 8.493186582809225, "percentage": 42.47, "elapsed_time": "0:41:26", "remaining_time": "0:56:09", "throughput": 4249.12, "total_tokens": 10567512} {"current_steps": 16210, "total_steps": 38160, "loss": 0.3541, "lr": 0.0007116821265516307, "epoch": 8.4958071278826, "percentage": 42.48, "elapsed_time": "0:41:27", "remaining_time": "0:56:08", "throughput": 4249.06, "total_tokens": 10570104} {"current_steps": 16215, "total_steps": 38160, "loss": 0.5462, "lr": 0.0007114749244251094, "epoch": 8.498427672955975, "percentage": 42.49, "elapsed_time": "0:41:28", "remaining_time": "0:56:07", "throughput": 4249.13, "total_tokens": 10573304} {"current_steps": 16220, "total_steps": 38160, "loss": 0.3805, "lr": 0.0007112676780604468, "epoch": 8.50104821802935, "percentage": 42.51, "elapsed_time": "0:41:29", "remaining_time": "0:56:06", "throughput": 4249.16, "total_tokens": 10576408} {"current_steps": 16225, "total_steps": 38160, "loss": 0.2928, "lr": 0.000711060387500996, "epoch": 8.503668763102725, "percentage": 42.52, "elapsed_time": "0:41:29", "remaining_time": "0:56:06", "throughput": 4249.27, "total_tokens": 10579864} {"current_steps": 16230, "total_steps": 38160, "loss": 0.5064, "lr": 0.0007108530527901199, "epoch": 8.5062893081761, "percentage": 42.53, "elapsed_time": "0:41:30", "remaining_time": "0:56:05", "throughput": 4249.28, "total_tokens": 10582840} {"current_steps": 16235, "total_steps": 38160, "loss": 0.4859, "lr": 0.000710645673971191, "epoch": 8.508909853249476, "percentage": 42.54, "elapsed_time": "0:41:31", "remaining_time": "0:56:04", "throughput": 4249.39, "total_tokens": 10586392} {"current_steps": 16240, "total_steps": 38160, "loss": 0.3797, "lr": 0.00071043825108759, "epoch": 8.51153039832285, "percentage": 42.56, "elapsed_time": "0:41:32", "remaining_time": "0:56:03", "throughput": 4249.74, "total_tokens": 10591224} {"current_steps": 16245, "total_steps": 38160, "loss": 0.4673, "lr": 0.0007102307841827079, "epoch": 8.514150943396226, "percentage": 42.57, "elapsed_time": "0:41:32", "remaining_time": "0:56:03", "throughput": 4249.77, "total_tokens": 10594296} {"current_steps": 16250, "total_steps": 38160, "loss": 0.3882, "lr": 0.0007100232732999443, "epoch": 8.516771488469601, "percentage": 42.58, "elapsed_time": "0:41:33", "remaining_time": "0:56:02", "throughput": 4249.91, "total_tokens": 10597912} {"current_steps": 16255, "total_steps": 38160, "loss": 0.4688, "lr": 0.0007098157184827076, "epoch": 8.519392033542976, "percentage": 42.6, "elapsed_time": "0:41:34", "remaining_time": "0:56:01", "throughput": 4249.87, "total_tokens": 10600632} {"current_steps": 16260, "total_steps": 38160, "loss": 0.4736, "lr": 0.0007096081197744166, "epoch": 8.522012578616351, "percentage": 42.61, "elapsed_time": "0:41:35", "remaining_time": "0:56:00", "throughput": 4249.9, "total_tokens": 10603672} {"current_steps": 16265, "total_steps": 38160, "loss": 0.3791, "lr": 0.0007094004772184981, "epoch": 8.524633123689728, "percentage": 42.62, "elapsed_time": "0:41:35", "remaining_time": "0:55:59", "throughput": 4249.92, "total_tokens": 10606648} {"current_steps": 16270, "total_steps": 38160, "loss": 0.4168, "lr": 0.0007091927908583889, "epoch": 8.527253668763104, "percentage": 42.64, "elapsed_time": "0:41:36", "remaining_time": "0:55:58", "throughput": 4249.91, "total_tokens": 10609432} {"current_steps": 16275, "total_steps": 38160, "loss": 0.4061, "lr": 0.0007089850607375343, "epoch": 8.529874213836479, "percentage": 42.65, "elapsed_time": "0:41:37", "remaining_time": "0:55:58", "throughput": 4250.26, "total_tokens": 10614424} {"current_steps": 16280, "total_steps": 38160, "loss": 0.5804, "lr": 0.0007087772868993894, "epoch": 8.532494758909854, "percentage": 42.66, "elapsed_time": "0:41:38", "remaining_time": "0:55:57", "throughput": 4250.34, "total_tokens": 10617784} {"current_steps": 16285, "total_steps": 38160, "loss": 0.4874, "lr": 0.0007085694693874178, "epoch": 8.535115303983229, "percentage": 42.68, "elapsed_time": "0:41:38", "remaining_time": "0:55:56", "throughput": 4250.25, "total_tokens": 10620216} {"current_steps": 16290, "total_steps": 38160, "loss": 0.4954, "lr": 0.0007083616082450928, "epoch": 8.537735849056604, "percentage": 42.69, "elapsed_time": "0:41:39", "remaining_time": "0:55:55", "throughput": 4250.19, "total_tokens": 10622808} {"current_steps": 16295, "total_steps": 38160, "loss": 0.4766, "lr": 0.0007081537035158962, "epoch": 8.54035639412998, "percentage": 42.7, "elapsed_time": "0:41:40", "remaining_time": "0:55:54", "throughput": 4250.23, "total_tokens": 10625912} {"current_steps": 16300, "total_steps": 38160, "loss": 0.4183, "lr": 0.0007079457552433198, "epoch": 8.542976939203355, "percentage": 42.71, "elapsed_time": "0:41:40", "remaining_time": "0:55:53", "throughput": 4250.27, "total_tokens": 10629016} {"current_steps": 16305, "total_steps": 38160, "loss": 0.594, "lr": 0.0007077377634708637, "epoch": 8.54559748427673, "percentage": 42.73, "elapsed_time": "0:41:41", "remaining_time": "0:55:53", "throughput": 4250.47, "total_tokens": 10632920} {"current_steps": 16310, "total_steps": 38160, "loss": 0.3736, "lr": 0.0007075297282420375, "epoch": 8.548218029350105, "percentage": 42.74, "elapsed_time": "0:41:42", "remaining_time": "0:55:52", "throughput": 4250.46, "total_tokens": 10635800} {"current_steps": 16315, "total_steps": 38160, "loss": 0.4201, "lr": 0.0007073216496003598, "epoch": 8.55083857442348, "percentage": 42.75, "elapsed_time": "0:41:42", "remaining_time": "0:55:51", "throughput": 4250.48, "total_tokens": 10638712} {"current_steps": 16320, "total_steps": 38160, "loss": 0.3644, "lr": 0.0007071135275893584, "epoch": 8.553459119496855, "percentage": 42.77, "elapsed_time": "0:41:43", "remaining_time": "0:55:50", "throughput": 4250.45, "total_tokens": 10641528} {"current_steps": 16325, "total_steps": 38160, "loss": 0.4117, "lr": 0.0007069053622525696, "epoch": 8.55607966457023, "percentage": 42.78, "elapsed_time": "0:41:44", "remaining_time": "0:55:49", "throughput": 4250.4, "total_tokens": 10644152} {"current_steps": 16330, "total_steps": 38160, "loss": 0.4439, "lr": 0.0007066971536335395, "epoch": 8.558700209643606, "percentage": 42.79, "elapsed_time": "0:41:44", "remaining_time": "0:55:48", "throughput": 4250.43, "total_tokens": 10647288} {"current_steps": 16335, "total_steps": 38160, "loss": 0.3941, "lr": 0.0007064889017758234, "epoch": 8.56132075471698, "percentage": 42.81, "elapsed_time": "0:41:45", "remaining_time": "0:55:47", "throughput": 4250.55, "total_tokens": 10650840} {"current_steps": 16340, "total_steps": 38160, "loss": 0.4103, "lr": 0.0007062806067229845, "epoch": 8.563941299790356, "percentage": 42.82, "elapsed_time": "0:41:46", "remaining_time": "0:55:47", "throughput": 4250.68, "total_tokens": 10654360} {"current_steps": 16345, "total_steps": 38160, "loss": 0.4901, "lr": 0.0007060722685185961, "epoch": 8.566561844863731, "percentage": 42.83, "elapsed_time": "0:41:47", "remaining_time": "0:55:46", "throughput": 4251.06, "total_tokens": 10659448} {"current_steps": 16350, "total_steps": 38160, "loss": 0.4498, "lr": 0.00070586388720624, "epoch": 8.569182389937106, "percentage": 42.85, "elapsed_time": "0:41:48", "remaining_time": "0:55:45", "throughput": 4251.08, "total_tokens": 10662520} {"current_steps": 16355, "total_steps": 38160, "loss": 0.4592, "lr": 0.0007056554628295076, "epoch": 8.571802935010481, "percentage": 42.86, "elapsed_time": "0:41:48", "remaining_time": "0:55:44", "throughput": 4251.03, "total_tokens": 10665176} {"current_steps": 16360, "total_steps": 38160, "loss": 0.4154, "lr": 0.0007054469954319984, "epoch": 8.574423480083858, "percentage": 42.87, "elapsed_time": "0:41:49", "remaining_time": "0:55:44", "throughput": 4251.2, "total_tokens": 10668984} {"current_steps": 16365, "total_steps": 38160, "loss": 0.3582, "lr": 0.0007052384850573217, "epoch": 8.577044025157234, "percentage": 42.89, "elapsed_time": "0:41:50", "remaining_time": "0:55:43", "throughput": 4251.42, "total_tokens": 10673112} {"current_steps": 16370, "total_steps": 38160, "loss": 0.3734, "lr": 0.0007050299317490952, "epoch": 8.579664570230609, "percentage": 42.9, "elapsed_time": "0:41:51", "remaining_time": "0:55:42", "throughput": 4251.52, "total_tokens": 10676504} {"current_steps": 16375, "total_steps": 38160, "loss": 0.2968, "lr": 0.0007048213355509463, "epoch": 8.582285115303984, "percentage": 42.91, "elapsed_time": "0:41:51", "remaining_time": "0:55:41", "throughput": 4251.53, "total_tokens": 10679480} {"current_steps": 16380, "total_steps": 38160, "loss": 0.4412, "lr": 0.0007046126965065107, "epoch": 8.584905660377359, "percentage": 42.92, "elapsed_time": "0:41:52", "remaining_time": "0:55:40", "throughput": 4251.52, "total_tokens": 10682360} {"current_steps": 16385, "total_steps": 38160, "loss": 0.4742, "lr": 0.0007044040146594332, "epoch": 8.587526205450734, "percentage": 42.94, "elapsed_time": "0:41:53", "remaining_time": "0:55:40", "throughput": 4251.69, "total_tokens": 10686232} {"current_steps": 16390, "total_steps": 38160, "loss": 0.3974, "lr": 0.0007041952900533681, "epoch": 8.59014675052411, "percentage": 42.95, "elapsed_time": "0:41:54", "remaining_time": "0:55:39", "throughput": 4251.79, "total_tokens": 10689592} {"current_steps": 16395, "total_steps": 38160, "loss": 0.4307, "lr": 0.0007039865227319777, "epoch": 8.592767295597485, "percentage": 42.96, "elapsed_time": "0:41:54", "remaining_time": "0:55:38", "throughput": 4251.92, "total_tokens": 10693272} {"current_steps": 16400, "total_steps": 38160, "loss": 0.3505, "lr": 0.0007037777127389339, "epoch": 8.59538784067086, "percentage": 42.98, "elapsed_time": "0:41:55", "remaining_time": "0:55:38", "throughput": 4252.16, "total_tokens": 10697560} {"current_steps": 16405, "total_steps": 38160, "loss": 0.6545, "lr": 0.0007035688601179177, "epoch": 8.598008385744235, "percentage": 42.99, "elapsed_time": "0:41:56", "remaining_time": "0:55:37", "throughput": 4252.19, "total_tokens": 10700664} {"current_steps": 16410, "total_steps": 38160, "loss": 0.4669, "lr": 0.000703359964912618, "epoch": 8.60062893081761, "percentage": 43.0, "elapsed_time": "0:41:57", "remaining_time": "0:55:36", "throughput": 4252.4, "total_tokens": 10704696} {"current_steps": 16415, "total_steps": 38160, "loss": 0.527, "lr": 0.000703151027166734, "epoch": 8.603249475890985, "percentage": 43.02, "elapsed_time": "0:41:58", "remaining_time": "0:55:35", "throughput": 4252.38, "total_tokens": 10707512} {"current_steps": 16420, "total_steps": 38160, "loss": 0.3472, "lr": 0.0007029420469239726, "epoch": 8.60587002096436, "percentage": 43.03, "elapsed_time": "0:41:58", "remaining_time": "0:55:34", "throughput": 4252.51, "total_tokens": 10711128} {"current_steps": 16425, "total_steps": 38160, "loss": 0.4928, "lr": 0.0007027330242280503, "epoch": 8.608490566037736, "percentage": 43.04, "elapsed_time": "0:41:59", "remaining_time": "0:55:34", "throughput": 4252.57, "total_tokens": 10714392} {"current_steps": 16430, "total_steps": 38160, "loss": 0.5235, "lr": 0.0007025239591226923, "epoch": 8.61111111111111, "percentage": 43.06, "elapsed_time": "0:42:00", "remaining_time": "0:55:33", "throughput": 4252.71, "total_tokens": 10718008} {"current_steps": 16435, "total_steps": 38160, "loss": 0.4576, "lr": 0.0007023148516516326, "epoch": 8.613731656184486, "percentage": 43.07, "elapsed_time": "0:42:01", "remaining_time": "0:55:32", "throughput": 4252.75, "total_tokens": 10721240} {"current_steps": 16440, "total_steps": 38160, "loss": 0.5087, "lr": 0.0007021057018586139, "epoch": 8.616352201257861, "percentage": 43.08, "elapsed_time": "0:42:01", "remaining_time": "0:55:31", "throughput": 4252.77, "total_tokens": 10724312} {"current_steps": 16445, "total_steps": 38160, "loss": 0.4026, "lr": 0.0007018965097873883, "epoch": 8.618972746331236, "percentage": 43.09, "elapsed_time": "0:42:02", "remaining_time": "0:55:30", "throughput": 4252.69, "total_tokens": 10726872} {"current_steps": 16450, "total_steps": 38160, "loss": 0.4907, "lr": 0.0007016872754817161, "epoch": 8.621593291404611, "percentage": 43.11, "elapsed_time": "0:42:03", "remaining_time": "0:55:30", "throughput": 4252.87, "total_tokens": 10730808} {"current_steps": 16455, "total_steps": 38160, "loss": 0.4058, "lr": 0.0007014779989853668, "epoch": 8.624213836477988, "percentage": 43.12, "elapsed_time": "0:42:03", "remaining_time": "0:55:29", "throughput": 4252.89, "total_tokens": 10733848} {"current_steps": 16460, "total_steps": 38160, "loss": 0.3779, "lr": 0.0007012686803421189, "epoch": 8.626834381551364, "percentage": 43.13, "elapsed_time": "0:42:04", "remaining_time": "0:55:28", "throughput": 4252.93, "total_tokens": 10736952} {"current_steps": 16465, "total_steps": 38160, "loss": 0.3781, "lr": 0.000701059319595759, "epoch": 8.629454926624739, "percentage": 43.15, "elapsed_time": "0:42:05", "remaining_time": "0:55:27", "throughput": 4252.97, "total_tokens": 10740024} {"current_steps": 16470, "total_steps": 38160, "loss": 0.4825, "lr": 0.0007008499167900833, "epoch": 8.632075471698114, "percentage": 43.16, "elapsed_time": "0:42:05", "remaining_time": "0:55:26", "throughput": 4252.92, "total_tokens": 10742680} {"current_steps": 16475, "total_steps": 38160, "loss": 0.4356, "lr": 0.0007006404719688966, "epoch": 8.634696016771489, "percentage": 43.17, "elapsed_time": "0:42:06", "remaining_time": "0:55:25", "throughput": 4253.15, "total_tokens": 10746904} {"current_steps": 16480, "total_steps": 38160, "loss": 0.4933, "lr": 0.000700430985176012, "epoch": 8.637316561844864, "percentage": 43.19, "elapsed_time": "0:42:07", "remaining_time": "0:55:24", "throughput": 4253.13, "total_tokens": 10749656} {"current_steps": 16485, "total_steps": 38160, "loss": 0.6252, "lr": 0.0007002214564552521, "epoch": 8.63993710691824, "percentage": 43.2, "elapsed_time": "0:42:08", "remaining_time": "0:55:24", "throughput": 4253.08, "total_tokens": 10752280} {"current_steps": 16490, "total_steps": 38160, "loss": 0.4284, "lr": 0.0007000118858504476, "epoch": 8.642557651991615, "percentage": 43.21, "elapsed_time": "0:42:08", "remaining_time": "0:55:23", "throughput": 4253.17, "total_tokens": 10755672} {"current_steps": 16495, "total_steps": 38160, "loss": 0.4198, "lr": 0.0006998022734054386, "epoch": 8.64517819706499, "percentage": 43.23, "elapsed_time": "0:42:09", "remaining_time": "0:55:22", "throughput": 4253.29, "total_tokens": 10759256} {"current_steps": 16500, "total_steps": 38160, "loss": 0.5376, "lr": 0.0006995926191640734, "epoch": 8.647798742138365, "percentage": 43.24, "elapsed_time": "0:42:10", "remaining_time": "0:55:21", "throughput": 4253.4, "total_tokens": 10762840} {"current_steps": 16505, "total_steps": 38160, "loss": 0.5098, "lr": 0.0006993829231702092, "epoch": 8.65041928721174, "percentage": 43.25, "elapsed_time": "0:42:11", "remaining_time": "0:55:20", "throughput": 4253.37, "total_tokens": 10765592} {"current_steps": 16510, "total_steps": 38160, "loss": 0.3855, "lr": 0.0006991731854677124, "epoch": 8.653039832285115, "percentage": 43.27, "elapsed_time": "0:42:11", "remaining_time": "0:55:19", "throughput": 4253.25, "total_tokens": 10767800} {"current_steps": 16515, "total_steps": 38160, "loss": 0.477, "lr": 0.0006989634061004572, "epoch": 8.65566037735849, "percentage": 43.28, "elapsed_time": "0:42:13", "remaining_time": "0:55:19", "throughput": 4253.99, "total_tokens": 10775384} {"current_steps": 16520, "total_steps": 38160, "loss": 0.514, "lr": 0.0006987535851123276, "epoch": 8.658280922431866, "percentage": 43.29, "elapsed_time": "0:42:13", "remaining_time": "0:55:18", "throughput": 4253.88, "total_tokens": 10777752} {"current_steps": 16525, "total_steps": 38160, "loss": 0.2948, "lr": 0.0006985437225472155, "epoch": 8.66090146750524, "percentage": 43.3, "elapsed_time": "0:42:14", "remaining_time": "0:55:17", "throughput": 4253.8, "total_tokens": 10780376} {"current_steps": 16530, "total_steps": 38160, "loss": 0.442, "lr": 0.0006983338184490215, "epoch": 8.663522012578616, "percentage": 43.32, "elapsed_time": "0:42:15", "remaining_time": "0:55:17", "throughput": 4254.0, "total_tokens": 10784344} {"current_steps": 16535, "total_steps": 38160, "loss": 0.5352, "lr": 0.0006981238728616557, "epoch": 8.666142557651991, "percentage": 43.33, "elapsed_time": "0:42:15", "remaining_time": "0:55:16", "throughput": 4254.0, "total_tokens": 10787128} {"current_steps": 16540, "total_steps": 38160, "loss": 0.4184, "lr": 0.0006979138858290358, "epoch": 8.668763102725366, "percentage": 43.34, "elapsed_time": "0:42:16", "remaining_time": "0:55:15", "throughput": 4254.04, "total_tokens": 10790296} {"current_steps": 16545, "total_steps": 38160, "loss": 0.5034, "lr": 0.0006977038573950889, "epoch": 8.671383647798741, "percentage": 43.36, "elapsed_time": "0:42:17", "remaining_time": "0:55:14", "throughput": 4254.04, "total_tokens": 10793144} {"current_steps": 16550, "total_steps": 38160, "loss": 0.4708, "lr": 0.0006974937876037508, "epoch": 8.674004192872118, "percentage": 43.37, "elapsed_time": "0:42:17", "remaining_time": "0:55:13", "throughput": 4254.09, "total_tokens": 10796280} {"current_steps": 16555, "total_steps": 38160, "loss": 0.437, "lr": 0.0006972836764989652, "epoch": 8.676624737945493, "percentage": 43.38, "elapsed_time": "0:42:18", "remaining_time": "0:55:12", "throughput": 4254.06, "total_tokens": 10799000} {"current_steps": 16560, "total_steps": 38160, "loss": 0.5282, "lr": 0.0006970735241246853, "epoch": 8.679245283018869, "percentage": 43.4, "elapsed_time": "0:42:19", "remaining_time": "0:55:12", "throughput": 4254.14, "total_tokens": 10802264} {"current_steps": 16565, "total_steps": 38160, "loss": 0.4274, "lr": 0.0006968633305248724, "epoch": 8.681865828092244, "percentage": 43.41, "elapsed_time": "0:42:19", "remaining_time": "0:55:11", "throughput": 4254.23, "total_tokens": 10805656} {"current_steps": 16570, "total_steps": 38160, "loss": 0.4322, "lr": 0.0006966530957434968, "epoch": 8.684486373165619, "percentage": 43.42, "elapsed_time": "0:42:20", "remaining_time": "0:55:10", "throughput": 4254.4, "total_tokens": 10809496} {"current_steps": 16575, "total_steps": 38160, "loss": 0.4919, "lr": 0.0006964428198245372, "epoch": 8.687106918238994, "percentage": 43.44, "elapsed_time": "0:42:21", "remaining_time": "0:55:09", "throughput": 4254.49, "total_tokens": 10812856} {"current_steps": 16580, "total_steps": 38160, "loss": 0.4442, "lr": 0.0006962325028119806, "epoch": 8.68972746331237, "percentage": 43.45, "elapsed_time": "0:42:22", "remaining_time": "0:55:08", "throughput": 4254.47, "total_tokens": 10815544} {"current_steps": 16585, "total_steps": 38160, "loss": 0.5021, "lr": 0.0006960221447498232, "epoch": 8.692348008385745, "percentage": 43.46, "elapsed_time": "0:42:22", "remaining_time": "0:55:07", "throughput": 4254.4, "total_tokens": 10818072} {"current_steps": 16590, "total_steps": 38160, "loss": 0.4146, "lr": 0.0006958117456820696, "epoch": 8.69496855345912, "percentage": 43.47, "elapsed_time": "0:42:23", "remaining_time": "0:55:07", "throughput": 4254.45, "total_tokens": 10821304} {"current_steps": 16595, "total_steps": 38160, "loss": 0.3609, "lr": 0.0006956013056527326, "epoch": 8.697589098532495, "percentage": 43.49, "elapsed_time": "0:42:24", "remaining_time": "0:55:06", "throughput": 4254.6, "total_tokens": 10824984} {"current_steps": 16600, "total_steps": 38160, "loss": 0.5898, "lr": 0.0006953908247058341, "epoch": 8.70020964360587, "percentage": 43.5, "elapsed_time": "0:42:24", "remaining_time": "0:55:05", "throughput": 4254.63, "total_tokens": 10828024} {"current_steps": 16605, "total_steps": 38160, "loss": 0.477, "lr": 0.0006951803028854041, "epoch": 8.702830188679245, "percentage": 43.51, "elapsed_time": "0:42:25", "remaining_time": "0:55:04", "throughput": 4254.77, "total_tokens": 10831640} {"current_steps": 16610, "total_steps": 38160, "loss": 0.5095, "lr": 0.0006949697402354816, "epoch": 8.70545073375262, "percentage": 43.53, "elapsed_time": "0:42:26", "remaining_time": "0:55:03", "throughput": 4254.88, "total_tokens": 10835160} {"current_steps": 16615, "total_steps": 38160, "loss": 0.3709, "lr": 0.0006947591368001138, "epoch": 8.708071278825996, "percentage": 43.54, "elapsed_time": "0:42:27", "remaining_time": "0:55:03", "throughput": 4254.92, "total_tokens": 10838232} {"current_steps": 16620, "total_steps": 38160, "loss": 0.3412, "lr": 0.0006945484926233563, "epoch": 8.71069182389937, "percentage": 43.55, "elapsed_time": "0:42:27", "remaining_time": "0:55:02", "throughput": 4254.94, "total_tokens": 10841240} {"current_steps": 16625, "total_steps": 38160, "loss": 0.4114, "lr": 0.0006943378077492737, "epoch": 8.713312368972746, "percentage": 43.57, "elapsed_time": "0:42:28", "remaining_time": "0:55:01", "throughput": 4254.99, "total_tokens": 10844312} {"current_steps": 16630, "total_steps": 38160, "loss": 0.4007, "lr": 0.000694127082221939, "epoch": 8.715932914046121, "percentage": 43.58, "elapsed_time": "0:42:29", "remaining_time": "0:55:00", "throughput": 4255.0, "total_tokens": 10847320} {"current_steps": 16635, "total_steps": 38160, "loss": 0.397, "lr": 0.0006939163160854334, "epoch": 8.718553459119496, "percentage": 43.59, "elapsed_time": "0:42:30", "remaining_time": "0:54:59", "throughput": 4255.1, "total_tokens": 10850648} {"current_steps": 16640, "total_steps": 38160, "loss": 0.465, "lr": 0.0006937055093838467, "epoch": 8.721174004192871, "percentage": 43.61, "elapsed_time": "0:42:30", "remaining_time": "0:54:58", "throughput": 4255.16, "total_tokens": 10853912} {"current_steps": 16645, "total_steps": 38160, "loss": 0.4048, "lr": 0.0006934946621612774, "epoch": 8.723794549266248, "percentage": 43.62, "elapsed_time": "0:42:31", "remaining_time": "0:54:57", "throughput": 4255.18, "total_tokens": 10856824} {"current_steps": 16650, "total_steps": 38160, "loss": 0.3943, "lr": 0.0006932837744618322, "epoch": 8.726415094339622, "percentage": 43.63, "elapsed_time": "0:42:32", "remaining_time": "0:54:57", "throughput": 4255.29, "total_tokens": 10860280} {"current_steps": 16655, "total_steps": 38160, "loss": 0.5311, "lr": 0.0006930728463296265, "epoch": 8.729035639412999, "percentage": 43.65, "elapsed_time": "0:42:32", "remaining_time": "0:54:56", "throughput": 4255.4, "total_tokens": 10863832} {"current_steps": 16660, "total_steps": 38160, "loss": 0.436, "lr": 0.0006928618778087842, "epoch": 8.731656184486374, "percentage": 43.66, "elapsed_time": "0:42:33", "remaining_time": "0:54:55", "throughput": 4255.55, "total_tokens": 10867576} {"current_steps": 16665, "total_steps": 38160, "loss": 0.4637, "lr": 0.0006926508689434371, "epoch": 8.734276729559749, "percentage": 43.67, "elapsed_time": "0:42:34", "remaining_time": "0:54:54", "throughput": 4255.73, "total_tokens": 10871384} {"current_steps": 16670, "total_steps": 38160, "loss": 0.5845, "lr": 0.0006924398197777263, "epoch": 8.736897274633124, "percentage": 43.68, "elapsed_time": "0:42:35", "remaining_time": "0:54:54", "throughput": 4255.79, "total_tokens": 10874584} {"current_steps": 16675, "total_steps": 38160, "loss": 0.411, "lr": 0.0006922287303558006, "epoch": 8.7395178197065, "percentage": 43.7, "elapsed_time": "0:42:36", "remaining_time": "0:54:53", "throughput": 4255.98, "total_tokens": 10878584} {"current_steps": 16680, "total_steps": 38160, "loss": 0.6605, "lr": 0.0006920176007218175, "epoch": 8.742138364779874, "percentage": 43.71, "elapsed_time": "0:42:36", "remaining_time": "0:54:52", "throughput": 4256.01, "total_tokens": 10881560} {"current_steps": 16685, "total_steps": 38160, "loss": 0.5556, "lr": 0.000691806430919943, "epoch": 8.74475890985325, "percentage": 43.72, "elapsed_time": "0:42:37", "remaining_time": "0:54:51", "throughput": 4256.04, "total_tokens": 10884600} {"current_steps": 16690, "total_steps": 38160, "loss": 0.355, "lr": 0.0006915952209943514, "epoch": 8.747379454926625, "percentage": 43.74, "elapsed_time": "0:42:38", "remaining_time": "0:54:50", "throughput": 4256.2, "total_tokens": 10888408} {"current_steps": 16695, "total_steps": 38160, "loss": 0.5026, "lr": 0.0006913839709892256, "epoch": 8.75, "percentage": 43.75, "elapsed_time": "0:42:39", "remaining_time": "0:54:50", "throughput": 4256.25, "total_tokens": 10891736} {"current_steps": 16700, "total_steps": 38160, "loss": 0.3623, "lr": 0.0006911726809487561, "epoch": 8.752620545073375, "percentage": 43.76, "elapsed_time": "0:42:39", "remaining_time": "0:54:49", "throughput": 4256.2, "total_tokens": 10894648} {"current_steps": 16705, "total_steps": 38160, "loss": 0.3669, "lr": 0.0006909613509171431, "epoch": 8.75524109014675, "percentage": 43.78, "elapsed_time": "0:42:40", "remaining_time": "0:54:48", "throughput": 4256.21, "total_tokens": 10897624} {"current_steps": 16710, "total_steps": 38160, "loss": 0.4929, "lr": 0.0006907499809385941, "epoch": 8.757861635220126, "percentage": 43.79, "elapsed_time": "0:42:41", "remaining_time": "0:54:47", "throughput": 4256.25, "total_tokens": 10900696} {"current_steps": 16715, "total_steps": 38160, "loss": 0.5584, "lr": 0.0006905385710573252, "epoch": 8.7604821802935, "percentage": 43.8, "elapsed_time": "0:42:41", "remaining_time": "0:54:46", "throughput": 4256.35, "total_tokens": 10904280} {"current_steps": 16720, "total_steps": 38160, "loss": 0.4943, "lr": 0.000690327121317561, "epoch": 8.763102725366876, "percentage": 43.82, "elapsed_time": "0:42:42", "remaining_time": "0:54:46", "throughput": 4256.48, "total_tokens": 10907896} {"current_steps": 16725, "total_steps": 38160, "loss": 0.4179, "lr": 0.0006901156317635342, "epoch": 8.765723270440251, "percentage": 43.83, "elapsed_time": "0:42:43", "remaining_time": "0:54:45", "throughput": 4256.56, "total_tokens": 10911192} {"current_steps": 16730, "total_steps": 38160, "loss": 0.5898, "lr": 0.0006899041024394864, "epoch": 8.768343815513626, "percentage": 43.84, "elapsed_time": "0:42:44", "remaining_time": "0:54:44", "throughput": 4256.62, "total_tokens": 10914488} {"current_steps": 16735, "total_steps": 38160, "loss": 0.4063, "lr": 0.000689692533389667, "epoch": 8.770964360587001, "percentage": 43.85, "elapsed_time": "0:42:44", "remaining_time": "0:54:43", "throughput": 4256.82, "total_tokens": 10918456} {"current_steps": 16740, "total_steps": 38160, "loss": 0.4993, "lr": 0.0006894809246583334, "epoch": 8.773584905660378, "percentage": 43.87, "elapsed_time": "0:42:45", "remaining_time": "0:54:43", "throughput": 4256.98, "total_tokens": 10922296} {"current_steps": 16745, "total_steps": 38160, "loss": 0.5057, "lr": 0.0006892692762897523, "epoch": 8.776205450733752, "percentage": 43.88, "elapsed_time": "0:42:46", "remaining_time": "0:54:42", "throughput": 4257.03, "total_tokens": 10925400} {"current_steps": 16750, "total_steps": 38160, "loss": 0.4409, "lr": 0.000689057588328198, "epoch": 8.778825995807129, "percentage": 43.89, "elapsed_time": "0:42:47", "remaining_time": "0:54:41", "throughput": 4256.99, "total_tokens": 10928120} {"current_steps": 16755, "total_steps": 38160, "loss": 0.4844, "lr": 0.0006888458608179528, "epoch": 8.781446540880504, "percentage": 43.91, "elapsed_time": "0:42:47", "remaining_time": "0:54:40", "throughput": 4257.15, "total_tokens": 10932088} {"current_steps": 16760, "total_steps": 38160, "loss": 0.4878, "lr": 0.0006886340938033085, "epoch": 8.784067085953879, "percentage": 43.92, "elapsed_time": "0:42:48", "remaining_time": "0:54:39", "throughput": 4257.3, "total_tokens": 10935832} {"current_steps": 16765, "total_steps": 38160, "loss": 0.5775, "lr": 0.0006884222873285632, "epoch": 8.786687631027254, "percentage": 43.93, "elapsed_time": "0:42:49", "remaining_time": "0:54:38", "throughput": 4257.28, "total_tokens": 10938552} {"current_steps": 16770, "total_steps": 38160, "loss": 0.4456, "lr": 0.0006882104414380254, "epoch": 8.78930817610063, "percentage": 43.95, "elapsed_time": "0:42:50", "remaining_time": "0:54:38", "throughput": 4257.46, "total_tokens": 10942520} {"current_steps": 16775, "total_steps": 38160, "loss": 0.4608, "lr": 0.0006879985561760105, "epoch": 8.791928721174004, "percentage": 43.96, "elapsed_time": "0:42:50", "remaining_time": "0:54:37", "throughput": 4257.57, "total_tokens": 10946008} {"current_steps": 16780, "total_steps": 38160, "loss": 0.4634, "lr": 0.0006877866315868422, "epoch": 8.79454926624738, "percentage": 43.97, "elapsed_time": "0:42:51", "remaining_time": "0:54:36", "throughput": 4257.61, "total_tokens": 10949144} {"current_steps": 16785, "total_steps": 38160, "loss": 0.441, "lr": 0.0006875746677148531, "epoch": 8.797169811320755, "percentage": 43.99, "elapsed_time": "0:42:52", "remaining_time": "0:54:35", "throughput": 4257.87, "total_tokens": 10953400} {"current_steps": 16790, "total_steps": 38160, "loss": 0.4391, "lr": 0.0006873626646043835, "epoch": 8.79979035639413, "percentage": 44.0, "elapsed_time": "0:42:53", "remaining_time": "0:54:35", "throughput": 4257.92, "total_tokens": 10956472} {"current_steps": 16795, "total_steps": 38160, "loss": 0.4621, "lr": 0.000687150622299782, "epoch": 8.802410901467505, "percentage": 44.01, "elapsed_time": "0:42:54", "remaining_time": "0:54:34", "throughput": 4258.08, "total_tokens": 10960312} {"current_steps": 16800, "total_steps": 38160, "loss": 0.4399, "lr": 0.0006869385408454056, "epoch": 8.80503144654088, "percentage": 44.03, "elapsed_time": "0:42:54", "remaining_time": "0:54:33", "throughput": 4257.98, "total_tokens": 10962616} {"current_steps": 16805, "total_steps": 38160, "loss": 0.4287, "lr": 0.0006867264202856188, "epoch": 8.807651991614255, "percentage": 44.04, "elapsed_time": "0:42:55", "remaining_time": "0:54:32", "throughput": 4258.07, "total_tokens": 10966008} {"current_steps": 16810, "total_steps": 38160, "loss": 0.5532, "lr": 0.0006865142606647954, "epoch": 8.81027253668763, "percentage": 44.05, "elapsed_time": "0:42:56", "remaining_time": "0:54:31", "throughput": 4258.27, "total_tokens": 10970040} {"current_steps": 16815, "total_steps": 38160, "loss": 0.4824, "lr": 0.0006863020620273166, "epoch": 8.812893081761006, "percentage": 44.06, "elapsed_time": "0:42:56", "remaining_time": "0:54:30", "throughput": 4258.19, "total_tokens": 10972472} {"current_steps": 16820, "total_steps": 38160, "loss": 0.4036, "lr": 0.0006860898244175716, "epoch": 8.815513626834381, "percentage": 44.08, "elapsed_time": "0:42:57", "remaining_time": "0:54:30", "throughput": 4258.41, "total_tokens": 10976664} {"current_steps": 16825, "total_steps": 38160, "loss": 0.4299, "lr": 0.0006858775478799586, "epoch": 8.818134171907756, "percentage": 44.09, "elapsed_time": "0:42:58", "remaining_time": "0:54:29", "throughput": 4258.33, "total_tokens": 10979192} {"current_steps": 16830, "total_steps": 38160, "loss": 0.4022, "lr": 0.0006856652324588831, "epoch": 8.820754716981131, "percentage": 44.1, "elapsed_time": "0:42:58", "remaining_time": "0:54:28", "throughput": 4258.26, "total_tokens": 10981688} {"current_steps": 16835, "total_steps": 38160, "loss": 0.4679, "lr": 0.000685452878198759, "epoch": 8.823375262054507, "percentage": 44.12, "elapsed_time": "0:42:59", "remaining_time": "0:54:27", "throughput": 4258.37, "total_tokens": 10985176} {"current_steps": 16840, "total_steps": 38160, "loss": 0.4575, "lr": 0.0006852404851440088, "epoch": 8.825995807127882, "percentage": 44.13, "elapsed_time": "0:43:00", "remaining_time": "0:54:26", "throughput": 4258.46, "total_tokens": 10988536} {"current_steps": 16845, "total_steps": 38160, "loss": 0.3547, "lr": 0.0006850280533390624, "epoch": 8.828616352201259, "percentage": 44.14, "elapsed_time": "0:43:01", "remaining_time": "0:54:25", "throughput": 4258.38, "total_tokens": 10990936} {"current_steps": 16850, "total_steps": 38160, "loss": 0.4231, "lr": 0.0006848155828283581, "epoch": 8.831236897274634, "percentage": 44.16, "elapsed_time": "0:43:01", "remaining_time": "0:54:25", "throughput": 4258.46, "total_tokens": 10994200} {"current_steps": 16855, "total_steps": 38160, "loss": 0.4773, "lr": 0.0006846030736563422, "epoch": 8.833857442348009, "percentage": 44.17, "elapsed_time": "0:43:02", "remaining_time": "0:54:24", "throughput": 4258.48, "total_tokens": 10997240} {"current_steps": 16860, "total_steps": 38160, "loss": 0.3915, "lr": 0.0006843905258674696, "epoch": 8.836477987421384, "percentage": 44.18, "elapsed_time": "0:43:03", "remaining_time": "0:54:23", "throughput": 4258.56, "total_tokens": 11000568} {"current_steps": 16865, "total_steps": 38160, "loss": 0.351, "lr": 0.0006841779395062026, "epoch": 8.83909853249476, "percentage": 44.2, "elapsed_time": "0:43:04", "remaining_time": "0:54:22", "throughput": 4258.93, "total_tokens": 11005528} {"current_steps": 16870, "total_steps": 38160, "loss": 0.4933, "lr": 0.0006839653146170116, "epoch": 8.841719077568134, "percentage": 44.21, "elapsed_time": "0:43:04", "remaining_time": "0:54:22", "throughput": 4259.06, "total_tokens": 11009176} {"current_steps": 16875, "total_steps": 38160, "loss": 0.3892, "lr": 0.0006837526512443758, "epoch": 8.84433962264151, "percentage": 44.22, "elapsed_time": "0:43:05", "remaining_time": "0:54:21", "throughput": 4259.13, "total_tokens": 11012504} {"current_steps": 16880, "total_steps": 38160, "loss": 0.4692, "lr": 0.0006835399494327818, "epoch": 8.846960167714885, "percentage": 44.23, "elapsed_time": "0:43:06", "remaining_time": "0:54:20", "throughput": 4259.25, "total_tokens": 11015992} {"current_steps": 16885, "total_steps": 38160, "loss": 0.351, "lr": 0.0006833272092267241, "epoch": 8.84958071278826, "percentage": 44.25, "elapsed_time": "0:43:07", "remaining_time": "0:54:19", "throughput": 4259.43, "total_tokens": 11019928} {"current_steps": 16890, "total_steps": 38160, "loss": 0.5283, "lr": 0.000683114430670706, "epoch": 8.852201257861635, "percentage": 44.26, "elapsed_time": "0:43:07", "remaining_time": "0:54:19", "throughput": 4259.47, "total_tokens": 11023096} {"current_steps": 16895, "total_steps": 38160, "loss": 0.4906, "lr": 0.0006829016138092378, "epoch": 8.85482180293501, "percentage": 44.27, "elapsed_time": "0:43:08", "remaining_time": "0:54:18", "throughput": 4259.51, "total_tokens": 11026232} {"current_steps": 16900, "total_steps": 38160, "loss": 0.6377, "lr": 0.0006826887586868388, "epoch": 8.857442348008385, "percentage": 44.29, "elapsed_time": "0:43:09", "remaining_time": "0:54:17", "throughput": 4259.58, "total_tokens": 11029560} {"current_steps": 16905, "total_steps": 38160, "loss": 0.3963, "lr": 0.0006824758653480356, "epoch": 8.86006289308176, "percentage": 44.3, "elapsed_time": "0:43:09", "remaining_time": "0:54:16", "throughput": 4259.53, "total_tokens": 11032120} {"current_steps": 16910, "total_steps": 38160, "loss": 0.4663, "lr": 0.0006822629338373632, "epoch": 8.862683438155136, "percentage": 44.31, "elapsed_time": "0:43:10", "remaining_time": "0:54:15", "throughput": 4259.52, "total_tokens": 11034968} {"current_steps": 16915, "total_steps": 38160, "loss": 0.3137, "lr": 0.0006820499641993644, "epoch": 8.865303983228511, "percentage": 44.33, "elapsed_time": "0:43:11", "remaining_time": "0:54:14", "throughput": 4259.63, "total_tokens": 11038456} {"current_steps": 16920, "total_steps": 38160, "loss": 0.4119, "lr": 0.0006818369564785902, "epoch": 8.867924528301886, "percentage": 44.34, "elapsed_time": "0:43:12", "remaining_time": "0:54:14", "throughput": 4259.88, "total_tokens": 11042712} {"current_steps": 16925, "total_steps": 38160, "loss": 0.5329, "lr": 0.0006816239107195989, "epoch": 8.870545073375261, "percentage": 44.35, "elapsed_time": "0:43:12", "remaining_time": "0:54:13", "throughput": 4259.95, "total_tokens": 11046008} {"current_steps": 16930, "total_steps": 38160, "loss": 0.561, "lr": 0.000681410826966958, "epoch": 8.873165618448636, "percentage": 44.37, "elapsed_time": "0:43:13", "remaining_time": "0:54:12", "throughput": 4260.02, "total_tokens": 11049336} {"current_steps": 16935, "total_steps": 38160, "loss": 0.4014, "lr": 0.0006811977052652414, "epoch": 8.875786163522012, "percentage": 44.38, "elapsed_time": "0:43:14", "remaining_time": "0:54:11", "throughput": 4260.18, "total_tokens": 11053272} {"current_steps": 16940, "total_steps": 38160, "loss": 0.5075, "lr": 0.000680984545659032, "epoch": 8.878406708595389, "percentage": 44.39, "elapsed_time": "0:43:15", "remaining_time": "0:54:11", "throughput": 4260.47, "total_tokens": 11057848} {"current_steps": 16945, "total_steps": 38160, "loss": 0.4637, "lr": 0.0006807713481929207, "epoch": 8.881027253668764, "percentage": 44.41, "elapsed_time": "0:43:16", "remaining_time": "0:54:10", "throughput": 4260.38, "total_tokens": 11060216} {"current_steps": 16950, "total_steps": 38160, "loss": 0.4613, "lr": 0.0006805581129115055, "epoch": 8.883647798742139, "percentage": 44.42, "elapsed_time": "0:43:16", "remaining_time": "0:54:09", "throughput": 4260.49, "total_tokens": 11063640} {"current_steps": 16955, "total_steps": 38160, "loss": 0.3782, "lr": 0.0006803448398593931, "epoch": 8.886268343815514, "percentage": 44.43, "elapsed_time": "0:43:17", "remaining_time": "0:54:08", "throughput": 4260.54, "total_tokens": 11066872} {"current_steps": 16960, "total_steps": 38160, "loss": 0.4781, "lr": 0.0006801315290811976, "epoch": 8.88888888888889, "percentage": 44.44, "elapsed_time": "0:43:18", "remaining_time": "0:54:07", "throughput": 4260.53, "total_tokens": 11069624} {"current_steps": 16965, "total_steps": 38160, "loss": 0.4362, "lr": 0.0006799181806215413, "epoch": 8.891509433962264, "percentage": 44.46, "elapsed_time": "0:43:18", "remaining_time": "0:54:06", "throughput": 4260.62, "total_tokens": 11073048} {"current_steps": 16970, "total_steps": 38160, "loss": 0.3909, "lr": 0.0006797047945250543, "epoch": 8.89412997903564, "percentage": 44.47, "elapsed_time": "0:43:19", "remaining_time": "0:54:06", "throughput": 4260.68, "total_tokens": 11076312} {"current_steps": 16975, "total_steps": 38160, "loss": 0.531, "lr": 0.0006794913708363745, "epoch": 8.896750524109015, "percentage": 44.48, "elapsed_time": "0:43:20", "remaining_time": "0:54:05", "throughput": 4260.71, "total_tokens": 11079416} {"current_steps": 16980, "total_steps": 38160, "loss": 0.4879, "lr": 0.0006792779096001475, "epoch": 8.89937106918239, "percentage": 44.5, "elapsed_time": "0:43:21", "remaining_time": "0:54:04", "throughput": 4260.7, "total_tokens": 11082168} {"current_steps": 16985, "total_steps": 38160, "loss": 0.3524, "lr": 0.0006790644108610273, "epoch": 8.901991614255765, "percentage": 44.51, "elapsed_time": "0:43:21", "remaining_time": "0:54:03", "throughput": 4260.6, "total_tokens": 11084568} {"current_steps": 16990, "total_steps": 38160, "loss": 0.4118, "lr": 0.0006788508746636751, "epoch": 8.90461215932914, "percentage": 44.52, "elapsed_time": "0:43:22", "remaining_time": "0:54:02", "throughput": 4260.65, "total_tokens": 11087736} {"current_steps": 16995, "total_steps": 38160, "loss": 0.4507, "lr": 0.0006786373010527605, "epoch": 8.907232704402515, "percentage": 44.54, "elapsed_time": "0:43:23", "remaining_time": "0:54:01", "throughput": 4260.65, "total_tokens": 11090648} {"current_steps": 17000, "total_steps": 38160, "loss": 0.6216, "lr": 0.0006784236900729603, "epoch": 8.90985324947589, "percentage": 44.55, "elapsed_time": "0:43:23", "remaining_time": "0:54:00", "throughput": 4260.59, "total_tokens": 11093240} {"current_steps": 17005, "total_steps": 38160, "loss": 0.5673, "lr": 0.0006782100417689599, "epoch": 8.912473794549266, "percentage": 44.56, "elapsed_time": "0:43:24", "remaining_time": "0:54:00", "throughput": 4260.68, "total_tokens": 11096568} {"current_steps": 17010, "total_steps": 38160, "loss": 0.4246, "lr": 0.0006779963561854517, "epoch": 8.915094339622641, "percentage": 44.58, "elapsed_time": "0:43:25", "remaining_time": "0:53:59", "throughput": 4260.67, "total_tokens": 11099384} {"current_steps": 17015, "total_steps": 38160, "loss": 0.2988, "lr": 0.0006777826333671367, "epoch": 8.917714884696016, "percentage": 44.59, "elapsed_time": "0:43:25", "remaining_time": "0:53:58", "throughput": 4260.59, "total_tokens": 11101944} {"current_steps": 17020, "total_steps": 38160, "loss": 0.6237, "lr": 0.0006775688733587227, "epoch": 8.920335429769391, "percentage": 44.6, "elapsed_time": "0:43:26", "remaining_time": "0:53:57", "throughput": 4260.58, "total_tokens": 11104856} {"current_steps": 17025, "total_steps": 38160, "loss": 0.4562, "lr": 0.0006773550762049265, "epoch": 8.922955974842766, "percentage": 44.61, "elapsed_time": "0:43:27", "remaining_time": "0:53:56", "throughput": 4260.69, "total_tokens": 11108440} {"current_steps": 17030, "total_steps": 38160, "loss": 0.4157, "lr": 0.0006771412419504716, "epoch": 8.925576519916142, "percentage": 44.63, "elapsed_time": "0:43:28", "remaining_time": "0:53:55", "throughput": 4260.9, "total_tokens": 11112504} {"current_steps": 17035, "total_steps": 38160, "loss": 0.5252, "lr": 0.00067692737064009, "epoch": 8.928197064989519, "percentage": 44.64, "elapsed_time": "0:43:28", "remaining_time": "0:53:55", "throughput": 4261.01, "total_tokens": 11116024} {"current_steps": 17040, "total_steps": 38160, "loss": 0.4398, "lr": 0.0006767134623185208, "epoch": 8.930817610062894, "percentage": 44.65, "elapsed_time": "0:43:29", "remaining_time": "0:53:54", "throughput": 4261.06, "total_tokens": 11119128} {"current_steps": 17045, "total_steps": 38160, "loss": 0.547, "lr": 0.0006764995170305114, "epoch": 8.933438155136269, "percentage": 44.67, "elapsed_time": "0:43:30", "remaining_time": "0:53:53", "throughput": 4261.16, "total_tokens": 11122584} {"current_steps": 17050, "total_steps": 38160, "loss": 0.4577, "lr": 0.0006762855348208166, "epoch": 8.936058700209644, "percentage": 44.68, "elapsed_time": "0:43:30", "remaining_time": "0:53:52", "throughput": 4261.17, "total_tokens": 11125592} {"current_steps": 17055, "total_steps": 38160, "loss": 0.4626, "lr": 0.0006760715157341991, "epoch": 8.93867924528302, "percentage": 44.69, "elapsed_time": "0:43:31", "remaining_time": "0:53:51", "throughput": 4261.13, "total_tokens": 11128312} {"current_steps": 17060, "total_steps": 38160, "loss": 0.3858, "lr": 0.0006758574598154292, "epoch": 8.941299790356394, "percentage": 44.71, "elapsed_time": "0:43:32", "remaining_time": "0:53:51", "throughput": 4261.29, "total_tokens": 11132120} {"current_steps": 17065, "total_steps": 38160, "loss": 0.3501, "lr": 0.0006756433671092852, "epoch": 8.94392033542977, "percentage": 44.72, "elapsed_time": "0:43:33", "remaining_time": "0:53:50", "throughput": 4261.39, "total_tokens": 11135768} {"current_steps": 17070, "total_steps": 38160, "loss": 0.4352, "lr": 0.0006754292376605524, "epoch": 8.946540880503145, "percentage": 44.73, "elapsed_time": "0:43:33", "remaining_time": "0:53:49", "throughput": 4261.47, "total_tokens": 11139128} {"current_steps": 17075, "total_steps": 38160, "loss": 0.6466, "lr": 0.0006752150715140247, "epoch": 8.94916142557652, "percentage": 44.75, "elapsed_time": "0:43:34", "remaining_time": "0:53:48", "throughput": 4261.53, "total_tokens": 11142360} {"current_steps": 17080, "total_steps": 38160, "loss": 0.3752, "lr": 0.0006750008687145028, "epoch": 8.951781970649895, "percentage": 44.76, "elapsed_time": "0:43:35", "remaining_time": "0:53:47", "throughput": 4261.48, "total_tokens": 11144984} {"current_steps": 17085, "total_steps": 38160, "loss": 0.5026, "lr": 0.0006747866293067958, "epoch": 8.95440251572327, "percentage": 44.77, "elapsed_time": "0:43:35", "remaining_time": "0:53:46", "throughput": 4261.45, "total_tokens": 11147672} {"current_steps": 17090, "total_steps": 38160, "loss": 0.5141, "lr": 0.00067457235333572, "epoch": 8.957023060796645, "percentage": 44.79, "elapsed_time": "0:43:36", "remaining_time": "0:53:46", "throughput": 4261.51, "total_tokens": 11150872} {"current_steps": 17095, "total_steps": 38160, "loss": 0.4732, "lr": 0.0006743580408460994, "epoch": 8.95964360587002, "percentage": 44.8, "elapsed_time": "0:43:37", "remaining_time": "0:53:45", "throughput": 4261.6, "total_tokens": 11154360} {"current_steps": 17100, "total_steps": 38160, "loss": 0.5063, "lr": 0.0006741436918827659, "epoch": 8.962264150943396, "percentage": 44.81, "elapsed_time": "0:43:38", "remaining_time": "0:53:44", "throughput": 4261.56, "total_tokens": 11156984} {"current_steps": 17105, "total_steps": 38160, "loss": 0.6986, "lr": 0.0006739293064905589, "epoch": 8.964884696016771, "percentage": 44.82, "elapsed_time": "0:43:38", "remaining_time": "0:53:43", "throughput": 4261.7, "total_tokens": 11160696} {"current_steps": 17110, "total_steps": 38160, "loss": 0.5157, "lr": 0.0006737148847143251, "epoch": 8.967505241090146, "percentage": 44.84, "elapsed_time": "0:43:39", "remaining_time": "0:53:42", "throughput": 4261.73, "total_tokens": 11163800} {"current_steps": 17115, "total_steps": 38160, "loss": 0.5476, "lr": 0.0006735004265989195, "epoch": 8.970125786163521, "percentage": 44.85, "elapsed_time": "0:43:40", "remaining_time": "0:53:42", "throughput": 4261.88, "total_tokens": 11167480} {"current_steps": 17120, "total_steps": 38160, "loss": 0.4827, "lr": 0.0006732859321892038, "epoch": 8.972746331236896, "percentage": 44.86, "elapsed_time": "0:43:40", "remaining_time": "0:53:41", "throughput": 4261.86, "total_tokens": 11170232} {"current_steps": 17125, "total_steps": 38160, "loss": 0.6774, "lr": 0.0006730714015300481, "epoch": 8.975366876310272, "percentage": 44.88, "elapsed_time": "0:43:41", "remaining_time": "0:53:40", "throughput": 4261.9, "total_tokens": 11173400} {"current_steps": 17130, "total_steps": 38160, "loss": 0.45, "lr": 0.0006728568346663299, "epoch": 8.977987421383649, "percentage": 44.89, "elapsed_time": "0:43:42", "remaining_time": "0:53:39", "throughput": 4261.92, "total_tokens": 11176472} {"current_steps": 17135, "total_steps": 38160, "loss": 0.382, "lr": 0.0006726422316429337, "epoch": 8.980607966457024, "percentage": 44.9, "elapsed_time": "0:43:43", "remaining_time": "0:53:38", "throughput": 4261.9, "total_tokens": 11179288} {"current_steps": 17140, "total_steps": 38160, "loss": 0.4734, "lr": 0.0006724275925047523, "epoch": 8.983228511530399, "percentage": 44.92, "elapsed_time": "0:43:43", "remaining_time": "0:53:37", "throughput": 4261.88, "total_tokens": 11182136} {"current_steps": 17145, "total_steps": 38160, "loss": 0.4005, "lr": 0.0006722129172966858, "epoch": 8.985849056603774, "percentage": 44.93, "elapsed_time": "0:43:44", "remaining_time": "0:53:37", "throughput": 4262.11, "total_tokens": 11186296} {"current_steps": 17150, "total_steps": 38160, "loss": 0.3462, "lr": 0.0006719982060636416, "epoch": 8.98846960167715, "percentage": 44.94, "elapsed_time": "0:43:45", "remaining_time": "0:53:36", "throughput": 4262.14, "total_tokens": 11189304} {"current_steps": 17155, "total_steps": 38160, "loss": 0.5255, "lr": 0.000671783458850535, "epoch": 8.991090146750524, "percentage": 44.96, "elapsed_time": "0:43:45", "remaining_time": "0:53:35", "throughput": 4262.12, "total_tokens": 11192024} {"current_steps": 17160, "total_steps": 38160, "loss": 0.525, "lr": 0.0006715686757022886, "epoch": 8.9937106918239, "percentage": 44.97, "elapsed_time": "0:43:46", "remaining_time": "0:53:34", "throughput": 4262.17, "total_tokens": 11195160} {"current_steps": 17165, "total_steps": 38160, "loss": 0.5113, "lr": 0.0006713538566638326, "epoch": 8.996331236897275, "percentage": 44.98, "elapsed_time": "0:43:47", "remaining_time": "0:53:33", "throughput": 4262.21, "total_tokens": 11198264} {"current_steps": 17170, "total_steps": 38160, "loss": 0.4566, "lr": 0.0006711390017801049, "epoch": 8.99895178197065, "percentage": 44.99, "elapsed_time": "0:43:48", "remaining_time": "0:53:32", "throughput": 4262.54, "total_tokens": 11202840} {"current_steps": 17172, "total_steps": 38160, "eval_loss": 0.45358505845069885, "epoch": 9.0, "percentage": 45.0, "elapsed_time": "0:44:02", "remaining_time": "0:53:49", "throughput": 4240.57, "total_tokens": 11204000} {"current_steps": 17175, "total_steps": 38160, "loss": 0.4921, "lr": 0.0006709241110960502, "epoch": 9.001572327044025, "percentage": 45.01, "elapsed_time": "0:44:03", "remaining_time": "0:53:50", "throughput": 4238.32, "total_tokens": 11206048} {"current_steps": 17180, "total_steps": 38160, "loss": 0.5509, "lr": 0.0006707091846566216, "epoch": 9.0041928721174, "percentage": 45.02, "elapsed_time": "0:44:04", "remaining_time": "0:53:49", "throughput": 4238.57, "total_tokens": 11210464} {"current_steps": 17185, "total_steps": 38160, "loss": 0.4248, "lr": 0.0006704942225067791, "epoch": 9.006813417190775, "percentage": 45.03, "elapsed_time": "0:44:05", "remaining_time": "0:53:49", "throughput": 4238.55, "total_tokens": 11213312} {"current_steps": 17190, "total_steps": 38160, "loss": 0.403, "lr": 0.0006702792246914902, "epoch": 9.00943396226415, "percentage": 45.05, "elapsed_time": "0:44:06", "remaining_time": "0:53:48", "throughput": 4238.63, "total_tokens": 11216704} {"current_steps": 17195, "total_steps": 38160, "loss": 0.4283, "lr": 0.0006700641912557304, "epoch": 9.012054507337526, "percentage": 45.06, "elapsed_time": "0:44:07", "remaining_time": "0:53:47", "throughput": 4238.9, "total_tokens": 11221248} {"current_steps": 17200, "total_steps": 38160, "loss": 0.434, "lr": 0.0006698491222444818, "epoch": 9.014675052410901, "percentage": 45.07, "elapsed_time": "0:44:07", "remaining_time": "0:53:46", "throughput": 4238.87, "total_tokens": 11223904} {"current_steps": 17205, "total_steps": 38160, "loss": 0.4039, "lr": 0.0006696340177027346, "epoch": 9.017295597484276, "percentage": 45.09, "elapsed_time": "0:44:08", "remaining_time": "0:53:45", "throughput": 4239.01, "total_tokens": 11227648} {"current_steps": 17210, "total_steps": 38160, "loss": 0.4214, "lr": 0.0006694188776754863, "epoch": 9.019916142557651, "percentage": 45.1, "elapsed_time": "0:44:09", "remaining_time": "0:53:45", "throughput": 4238.99, "total_tokens": 11230432} {"current_steps": 17215, "total_steps": 38160, "loss": 0.4424, "lr": 0.0006692037022077415, "epoch": 9.022536687631026, "percentage": 45.11, "elapsed_time": "0:44:10", "remaining_time": "0:53:44", "throughput": 4239.02, "total_tokens": 11233536} {"current_steps": 17220, "total_steps": 38160, "loss": 0.4811, "lr": 0.0006689884913445126, "epoch": 9.025157232704403, "percentage": 45.13, "elapsed_time": "0:44:10", "remaining_time": "0:53:43", "throughput": 4239.04, "total_tokens": 11236512} {"current_steps": 17225, "total_steps": 38160, "loss": 0.4125, "lr": 0.0006687732451308193, "epoch": 9.027777777777779, "percentage": 45.14, "elapsed_time": "0:44:11", "remaining_time": "0:53:42", "throughput": 4238.9, "total_tokens": 11238656} {"current_steps": 17230, "total_steps": 38160, "loss": 0.5283, "lr": 0.0006685579636116886, "epoch": 9.030398322851154, "percentage": 45.15, "elapsed_time": "0:44:12", "remaining_time": "0:53:41", "throughput": 4239.04, "total_tokens": 11242400} {"current_steps": 17235, "total_steps": 38160, "loss": 0.4596, "lr": 0.0006683426468321547, "epoch": 9.033018867924529, "percentage": 45.17, "elapsed_time": "0:44:12", "remaining_time": "0:53:40", "throughput": 4239.13, "total_tokens": 11245824} {"current_steps": 17240, "total_steps": 38160, "loss": 0.3665, "lr": 0.0006681272948372598, "epoch": 9.035639412997904, "percentage": 45.18, "elapsed_time": "0:44:13", "remaining_time": "0:53:39", "throughput": 4239.13, "total_tokens": 11248736} {"current_steps": 17245, "total_steps": 38160, "loss": 0.5402, "lr": 0.000667911907672053, "epoch": 9.03825995807128, "percentage": 45.19, "elapsed_time": "0:44:14", "remaining_time": "0:53:39", "throughput": 4239.23, "total_tokens": 11252096} {"current_steps": 17250, "total_steps": 38160, "loss": 0.434, "lr": 0.0006676964853815906, "epoch": 9.040880503144654, "percentage": 45.2, "elapsed_time": "0:44:15", "remaining_time": "0:53:38", "throughput": 4239.75, "total_tokens": 11258496} {"current_steps": 17255, "total_steps": 38160, "loss": 0.4036, "lr": 0.0006674810280109367, "epoch": 9.04350104821803, "percentage": 45.22, "elapsed_time": "0:44:16", "remaining_time": "0:53:37", "throughput": 4239.68, "total_tokens": 11260960} {"current_steps": 17260, "total_steps": 38160, "loss": 0.4207, "lr": 0.0006672655356051625, "epoch": 9.046121593291405, "percentage": 45.23, "elapsed_time": "0:44:16", "remaining_time": "0:53:37", "throughput": 4239.8, "total_tokens": 11264512} {"current_steps": 17265, "total_steps": 38160, "loss": 0.4955, "lr": 0.0006670500082093465, "epoch": 9.04874213836478, "percentage": 45.24, "elapsed_time": "0:44:17", "remaining_time": "0:53:36", "throughput": 4239.94, "total_tokens": 11268256} {"current_steps": 17270, "total_steps": 38160, "loss": 0.5992, "lr": 0.0006668344458685745, "epoch": 9.051362683438155, "percentage": 45.26, "elapsed_time": "0:44:18", "remaining_time": "0:53:35", "throughput": 4239.97, "total_tokens": 11271328} {"current_steps": 17275, "total_steps": 38160, "loss": 0.3778, "lr": 0.00066661884862794, "epoch": 9.05398322851153, "percentage": 45.27, "elapsed_time": "0:44:19", "remaining_time": "0:53:34", "throughput": 4239.95, "total_tokens": 11274048} {"current_steps": 17280, "total_steps": 38160, "loss": 0.5216, "lr": 0.000666403216532543, "epoch": 9.056603773584905, "percentage": 45.28, "elapsed_time": "0:44:19", "remaining_time": "0:53:33", "throughput": 4240.05, "total_tokens": 11277440} {"current_steps": 17285, "total_steps": 38160, "loss": 0.4623, "lr": 0.0006661875496274916, "epoch": 9.05922431865828, "percentage": 45.3, "elapsed_time": "0:44:20", "remaining_time": "0:53:33", "throughput": 4240.17, "total_tokens": 11281120} {"current_steps": 17290, "total_steps": 38160, "loss": 0.4526, "lr": 0.0006659718479579008, "epoch": 9.061844863731656, "percentage": 45.31, "elapsed_time": "0:44:21", "remaining_time": "0:53:32", "throughput": 4240.19, "total_tokens": 11284064} {"current_steps": 17295, "total_steps": 38160, "loss": 0.3997, "lr": 0.0006657561115688929, "epoch": 9.064465408805031, "percentage": 45.32, "elapsed_time": "0:44:22", "remaining_time": "0:53:31", "throughput": 4240.37, "total_tokens": 11288096} {"current_steps": 17300, "total_steps": 38160, "loss": 0.3312, "lr": 0.0006655403405055977, "epoch": 9.067085953878406, "percentage": 45.34, "elapsed_time": "0:44:22", "remaining_time": "0:53:30", "throughput": 4240.55, "total_tokens": 11292032} {"current_steps": 17305, "total_steps": 38160, "loss": 0.3861, "lr": 0.0006653245348131517, "epoch": 9.069706498951781, "percentage": 45.35, "elapsed_time": "0:44:23", "remaining_time": "0:53:29", "throughput": 4240.51, "total_tokens": 11294720} {"current_steps": 17310, "total_steps": 38160, "loss": 0.4658, "lr": 0.0006651086945366991, "epoch": 9.072327044025156, "percentage": 45.36, "elapsed_time": "0:44:24", "remaining_time": "0:53:29", "throughput": 4240.71, "total_tokens": 11298880} {"current_steps": 17315, "total_steps": 38160, "loss": 0.626, "lr": 0.0006648928197213914, "epoch": 9.074947589098532, "percentage": 45.37, "elapsed_time": "0:44:25", "remaining_time": "0:53:28", "throughput": 4240.8, "total_tokens": 11302336} {"current_steps": 17320, "total_steps": 38160, "loss": 0.3639, "lr": 0.0006646769104123868, "epoch": 9.077568134171909, "percentage": 45.39, "elapsed_time": "0:44:25", "remaining_time": "0:53:27", "throughput": 4240.79, "total_tokens": 11305216} {"current_steps": 17325, "total_steps": 38160, "loss": 0.5793, "lr": 0.0006644609666548513, "epoch": 9.080188679245284, "percentage": 45.4, "elapsed_time": "0:44:26", "remaining_time": "0:53:26", "throughput": 4240.86, "total_tokens": 11308512} {"current_steps": 17330, "total_steps": 38160, "loss": 0.534, "lr": 0.000664244988493958, "epoch": 9.082809224318659, "percentage": 45.41, "elapsed_time": "0:44:27", "remaining_time": "0:53:26", "throughput": 4241.04, "total_tokens": 11312416} {"current_steps": 17335, "total_steps": 38160, "loss": 0.3657, "lr": 0.0006640289759748867, "epoch": 9.085429769392034, "percentage": 45.43, "elapsed_time": "0:44:28", "remaining_time": "0:53:25", "throughput": 4241.15, "total_tokens": 11315904} {"current_steps": 17340, "total_steps": 38160, "loss": 0.3068, "lr": 0.0006638129291428252, "epoch": 9.08805031446541, "percentage": 45.44, "elapsed_time": "0:44:29", "remaining_time": "0:53:24", "throughput": 4241.63, "total_tokens": 11321664} {"current_steps": 17345, "total_steps": 38160, "loss": 0.3932, "lr": 0.0006635968480429677, "epoch": 9.090670859538784, "percentage": 45.45, "elapsed_time": "0:44:30", "remaining_time": "0:53:24", "throughput": 4241.84, "total_tokens": 11325728} {"current_steps": 17350, "total_steps": 38160, "loss": 0.4248, "lr": 0.0006633807327205162, "epoch": 9.09329140461216, "percentage": 45.47, "elapsed_time": "0:44:30", "remaining_time": "0:53:23", "throughput": 4241.98, "total_tokens": 11329344} {"current_steps": 17355, "total_steps": 38160, "loss": 0.4221, "lr": 0.0006631645832206789, "epoch": 9.095911949685535, "percentage": 45.48, "elapsed_time": "0:44:31", "remaining_time": "0:53:22", "throughput": 4241.91, "total_tokens": 11331840} {"current_steps": 17360, "total_steps": 38160, "loss": 0.5001, "lr": 0.0006629483995886727, "epoch": 9.09853249475891, "percentage": 45.49, "elapsed_time": "0:44:32", "remaining_time": "0:53:21", "throughput": 4241.93, "total_tokens": 11334912} {"current_steps": 17365, "total_steps": 38160, "loss": 0.4519, "lr": 0.0006627321818697202, "epoch": 9.101153039832285, "percentage": 45.51, "elapsed_time": "0:44:32", "remaining_time": "0:53:20", "throughput": 4241.85, "total_tokens": 11337344} {"current_steps": 17370, "total_steps": 38160, "loss": 0.5895, "lr": 0.0006625159301090518, "epoch": 9.10377358490566, "percentage": 45.52, "elapsed_time": "0:44:33", "remaining_time": "0:53:19", "throughput": 4241.89, "total_tokens": 11340384} {"current_steps": 17375, "total_steps": 38160, "loss": 0.4491, "lr": 0.0006622996443519047, "epoch": 9.106394129979035, "percentage": 45.53, "elapsed_time": "0:44:34", "remaining_time": "0:53:18", "throughput": 4241.84, "total_tokens": 11342976} {"current_steps": 17380, "total_steps": 38160, "loss": 0.4204, "lr": 0.0006620833246435238, "epoch": 9.10901467505241, "percentage": 45.55, "elapsed_time": "0:44:34", "remaining_time": "0:53:17", "throughput": 4241.76, "total_tokens": 11345504} {"current_steps": 17385, "total_steps": 38160, "loss": 0.4378, "lr": 0.0006618669710291606, "epoch": 9.111635220125786, "percentage": 45.56, "elapsed_time": "0:44:35", "remaining_time": "0:53:17", "throughput": 4241.92, "total_tokens": 11349216} {"current_steps": 17390, "total_steps": 38160, "loss": 0.4492, "lr": 0.0006616505835540736, "epoch": 9.114255765199161, "percentage": 45.57, "elapsed_time": "0:44:36", "remaining_time": "0:53:16", "throughput": 4242.0, "total_tokens": 11352576} {"current_steps": 17395, "total_steps": 38160, "loss": 0.3812, "lr": 0.0006614341622635287, "epoch": 9.116876310272536, "percentage": 45.58, "elapsed_time": "0:44:36", "remaining_time": "0:53:15", "throughput": 4241.96, "total_tokens": 11355104} {"current_steps": 17400, "total_steps": 38160, "loss": 0.5131, "lr": 0.0006612177072027989, "epoch": 9.119496855345911, "percentage": 45.6, "elapsed_time": "0:44:38", "remaining_time": "0:53:15", "throughput": 4242.49, "total_tokens": 11361504} {"current_steps": 17405, "total_steps": 38160, "loss": 0.4321, "lr": 0.0006610012184171641, "epoch": 9.122117400419286, "percentage": 45.61, "elapsed_time": "0:44:38", "remaining_time": "0:53:14", "throughput": 4242.62, "total_tokens": 11365120} {"current_steps": 17410, "total_steps": 38160, "loss": 0.5137, "lr": 0.0006607846959519109, "epoch": 9.124737945492662, "percentage": 45.62, "elapsed_time": "0:44:39", "remaining_time": "0:53:13", "throughput": 4242.77, "total_tokens": 11368800} {"current_steps": 17415, "total_steps": 38160, "loss": 0.678, "lr": 0.0006605681398523339, "epoch": 9.127358490566039, "percentage": 45.64, "elapsed_time": "0:44:40", "remaining_time": "0:53:12", "throughput": 4242.76, "total_tokens": 11371616} {"current_steps": 17420, "total_steps": 38160, "loss": 0.5186, "lr": 0.0006603515501637338, "epoch": 9.129979035639414, "percentage": 45.65, "elapsed_time": "0:44:40", "remaining_time": "0:53:11", "throughput": 4242.75, "total_tokens": 11374496} {"current_steps": 17425, "total_steps": 38160, "loss": 0.4227, "lr": 0.0006601349269314187, "epoch": 9.132599580712789, "percentage": 45.66, "elapsed_time": "0:44:41", "remaining_time": "0:53:11", "throughput": 4242.96, "total_tokens": 11378624} {"current_steps": 17430, "total_steps": 38160, "loss": 0.5231, "lr": 0.0006599182702007042, "epoch": 9.135220125786164, "percentage": 45.68, "elapsed_time": "0:44:42", "remaining_time": "0:53:10", "throughput": 4242.93, "total_tokens": 11381312} {"current_steps": 17435, "total_steps": 38160, "loss": 0.3695, "lr": 0.0006597015800169116, "epoch": 9.13784067085954, "percentage": 45.69, "elapsed_time": "0:44:43", "remaining_time": "0:53:09", "throughput": 4242.86, "total_tokens": 11383808} {"current_steps": 17440, "total_steps": 38160, "loss": 0.4707, "lr": 0.0006594848564253705, "epoch": 9.140461215932914, "percentage": 45.7, "elapsed_time": "0:44:43", "remaining_time": "0:53:08", "throughput": 4243.05, "total_tokens": 11387840} {"current_steps": 17445, "total_steps": 38160, "loss": 0.3706, "lr": 0.0006592680994714171, "epoch": 9.14308176100629, "percentage": 45.72, "elapsed_time": "0:44:44", "remaining_time": "0:53:08", "throughput": 4243.42, "total_tokens": 11392800} {"current_steps": 17450, "total_steps": 38160, "loss": 0.3254, "lr": 0.0006590513092003943, "epoch": 9.145702306079665, "percentage": 45.73, "elapsed_time": "0:44:45", "remaining_time": "0:53:07", "throughput": 4243.52, "total_tokens": 11396224} {"current_steps": 17455, "total_steps": 38160, "loss": 0.4835, "lr": 0.0006588344856576521, "epoch": 9.14832285115304, "percentage": 45.74, "elapsed_time": "0:44:46", "remaining_time": "0:53:06", "throughput": 4243.57, "total_tokens": 11399456} {"current_steps": 17460, "total_steps": 38160, "loss": 0.4102, "lr": 0.0006586176288885475, "epoch": 9.150943396226415, "percentage": 45.75, "elapsed_time": "0:44:46", "remaining_time": "0:53:05", "throughput": 4243.57, "total_tokens": 11402304} {"current_steps": 17465, "total_steps": 38160, "loss": 0.4877, "lr": 0.0006584007389384446, "epoch": 9.15356394129979, "percentage": 45.77, "elapsed_time": "0:44:47", "remaining_time": "0:53:04", "throughput": 4243.6, "total_tokens": 11405440} {"current_steps": 17470, "total_steps": 38160, "loss": 0.4804, "lr": 0.0006581838158527144, "epoch": 9.156184486373165, "percentage": 45.78, "elapsed_time": "0:44:48", "remaining_time": "0:53:03", "throughput": 4243.59, "total_tokens": 11408256} {"current_steps": 17475, "total_steps": 38160, "loss": 0.3514, "lr": 0.0006579668596767343, "epoch": 9.15880503144654, "percentage": 45.79, "elapsed_time": "0:44:49", "remaining_time": "0:53:03", "throughput": 4243.78, "total_tokens": 11412288} {"current_steps": 17480, "total_steps": 38160, "loss": 0.4181, "lr": 0.0006577498704558894, "epoch": 9.161425576519916, "percentage": 45.81, "elapsed_time": "0:44:49", "remaining_time": "0:53:02", "throughput": 4243.72, "total_tokens": 11414816} {"current_steps": 17485, "total_steps": 38160, "loss": 0.4632, "lr": 0.0006575328482355715, "epoch": 9.164046121593291, "percentage": 45.82, "elapsed_time": "0:44:50", "remaining_time": "0:53:01", "throughput": 4243.7, "total_tokens": 11417632} {"current_steps": 17490, "total_steps": 38160, "loss": 0.5855, "lr": 0.0006573157930611788, "epoch": 9.166666666666666, "percentage": 45.83, "elapsed_time": "0:44:51", "remaining_time": "0:53:00", "throughput": 4243.68, "total_tokens": 11420384} {"current_steps": 17495, "total_steps": 38160, "loss": 0.5091, "lr": 0.000657098704978117, "epoch": 9.169287211740041, "percentage": 45.85, "elapsed_time": "0:44:51", "remaining_time": "0:52:59", "throughput": 4243.75, "total_tokens": 11423648} {"current_steps": 17500, "total_steps": 38160, "loss": 0.3944, "lr": 0.0006568815840317984, "epoch": 9.171907756813416, "percentage": 45.86, "elapsed_time": "0:44:52", "remaining_time": "0:52:58", "throughput": 4243.82, "total_tokens": 11426976} {"current_steps": 17505, "total_steps": 38160, "loss": 0.3877, "lr": 0.0006566644302676422, "epoch": 9.174528301886792, "percentage": 45.87, "elapsed_time": "0:44:53", "remaining_time": "0:52:58", "throughput": 4243.89, "total_tokens": 11430304} {"current_steps": 17510, "total_steps": 38160, "loss": 0.4351, "lr": 0.0006564472437310746, "epoch": 9.177148846960169, "percentage": 45.89, "elapsed_time": "0:44:53", "remaining_time": "0:52:57", "throughput": 4243.8, "total_tokens": 11432704} {"current_steps": 17515, "total_steps": 38160, "loss": 0.3962, "lr": 0.0006562300244675283, "epoch": 9.179769392033544, "percentage": 45.9, "elapsed_time": "0:44:54", "remaining_time": "0:52:56", "throughput": 4243.94, "total_tokens": 11436448} {"current_steps": 17520, "total_steps": 38160, "loss": 0.4112, "lr": 0.0006560127725224432, "epoch": 9.182389937106919, "percentage": 45.91, "elapsed_time": "0:44:55", "remaining_time": "0:52:55", "throughput": 4244.03, "total_tokens": 11439872} {"current_steps": 17525, "total_steps": 38160, "loss": 0.5758, "lr": 0.0006557954879412662, "epoch": 9.185010482180294, "percentage": 45.93, "elapsed_time": "0:44:56", "remaining_time": "0:52:54", "throughput": 4243.94, "total_tokens": 11442304} {"current_steps": 17530, "total_steps": 38160, "loss": 0.6112, "lr": 0.0006555781707694506, "epoch": 9.18763102725367, "percentage": 45.94, "elapsed_time": "0:44:56", "remaining_time": "0:52:53", "throughput": 4244.06, "total_tokens": 11445856} {"current_steps": 17535, "total_steps": 38160, "loss": 0.4364, "lr": 0.0006553608210524564, "epoch": 9.190251572327044, "percentage": 45.95, "elapsed_time": "0:44:58", "remaining_time": "0:52:53", "throughput": 4244.58, "total_tokens": 11452288} {"current_steps": 17540, "total_steps": 38160, "loss": 0.5563, "lr": 0.0006551434388357509, "epoch": 9.19287211740042, "percentage": 45.96, "elapsed_time": "0:44:58", "remaining_time": "0:52:52", "throughput": 4244.72, "total_tokens": 11456032} {"current_steps": 17545, "total_steps": 38160, "loss": 0.3992, "lr": 0.000654926024164808, "epoch": 9.195492662473795, "percentage": 45.98, "elapsed_time": "0:44:59", "remaining_time": "0:52:51", "throughput": 4244.82, "total_tokens": 11459392} {"current_steps": 17550, "total_steps": 38160, "loss": 0.4816, "lr": 0.0006547085770851084, "epoch": 9.19811320754717, "percentage": 45.99, "elapsed_time": "0:45:00", "remaining_time": "0:52:51", "throughput": 4244.82, "total_tokens": 11462336} {"current_steps": 17555, "total_steps": 38160, "loss": 0.4476, "lr": 0.0006544910976421395, "epoch": 9.200733752620545, "percentage": 46.0, "elapsed_time": "0:45:00", "remaining_time": "0:52:50", "throughput": 4244.76, "total_tokens": 11464896} {"current_steps": 17560, "total_steps": 38160, "loss": 0.4232, "lr": 0.0006542735858813953, "epoch": 9.20335429769392, "percentage": 46.02, "elapsed_time": "0:45:02", "remaining_time": "0:52:50", "throughput": 4245.42, "total_tokens": 11472224} {"current_steps": 17565, "total_steps": 38160, "loss": 0.4926, "lr": 0.0006540560418483771, "epoch": 9.205974842767295, "percentage": 46.03, "elapsed_time": "0:45:02", "remaining_time": "0:52:49", "throughput": 4245.39, "total_tokens": 11474912} {"current_steps": 17570, "total_steps": 38160, "loss": 0.6496, "lr": 0.0006538384655885925, "epoch": 9.20859538784067, "percentage": 46.04, "elapsed_time": "0:45:03", "remaining_time": "0:52:48", "throughput": 4245.48, "total_tokens": 11478240} {"current_steps": 17575, "total_steps": 38160, "loss": 0.3852, "lr": 0.000653620857147556, "epoch": 9.211215932914046, "percentage": 46.06, "elapsed_time": "0:45:04", "remaining_time": "0:52:47", "throughput": 4245.49, "total_tokens": 11481216} {"current_steps": 17580, "total_steps": 38160, "loss": 0.4432, "lr": 0.0006534032165707887, "epoch": 9.213836477987421, "percentage": 46.07, "elapsed_time": "0:45:05", "remaining_time": "0:52:46", "throughput": 4245.54, "total_tokens": 11484384} {"current_steps": 17585, "total_steps": 38160, "loss": 0.5199, "lr": 0.0006531855439038187, "epoch": 9.216457023060796, "percentage": 46.08, "elapsed_time": "0:45:05", "remaining_time": "0:52:45", "throughput": 4245.51, "total_tokens": 11487104} {"current_steps": 17590, "total_steps": 38160, "loss": 0.377, "lr": 0.0006529678391921805, "epoch": 9.219077568134171, "percentage": 46.1, "elapsed_time": "0:45:06", "remaining_time": "0:52:44", "throughput": 4245.46, "total_tokens": 11489696} {"current_steps": 17595, "total_steps": 38160, "loss": 0.5347, "lr": 0.0006527501024814155, "epoch": 9.221698113207546, "percentage": 46.11, "elapsed_time": "0:45:07", "remaining_time": "0:52:43", "throughput": 4245.44, "total_tokens": 11492512} {"current_steps": 17600, "total_steps": 38160, "loss": 0.4237, "lr": 0.0006525323338170718, "epoch": 9.224318658280922, "percentage": 46.12, "elapsed_time": "0:45:07", "remaining_time": "0:52:43", "throughput": 4245.49, "total_tokens": 11495648} {"current_steps": 17605, "total_steps": 38160, "loss": 0.4926, "lr": 0.000652314533244704, "epoch": 9.226939203354299, "percentage": 46.13, "elapsed_time": "0:45:08", "remaining_time": "0:52:42", "throughput": 4245.58, "total_tokens": 11498976} {"current_steps": 17610, "total_steps": 38160, "loss": 0.403, "lr": 0.0006520967008098735, "epoch": 9.229559748427674, "percentage": 46.15, "elapsed_time": "0:45:09", "remaining_time": "0:52:41", "throughput": 4245.58, "total_tokens": 11501888} {"current_steps": 17615, "total_steps": 38160, "loss": 0.532, "lr": 0.0006518788365581485, "epoch": 9.232180293501049, "percentage": 46.16, "elapsed_time": "0:45:09", "remaining_time": "0:52:40", "throughput": 4245.53, "total_tokens": 11504544} {"current_steps": 17620, "total_steps": 38160, "loss": 0.391, "lr": 0.0006516609405351034, "epoch": 9.234800838574424, "percentage": 46.17, "elapsed_time": "0:45:10", "remaining_time": "0:52:39", "throughput": 4245.48, "total_tokens": 11507168} {"current_steps": 17625, "total_steps": 38160, "loss": 0.385, "lr": 0.00065144301278632, "epoch": 9.2374213836478, "percentage": 46.19, "elapsed_time": "0:45:11", "remaining_time": "0:52:38", "throughput": 4245.51, "total_tokens": 11510272} {"current_steps": 17630, "total_steps": 38160, "loss": 0.4587, "lr": 0.0006512250533573862, "epoch": 9.240041928721174, "percentage": 46.2, "elapsed_time": "0:45:11", "remaining_time": "0:52:37", "throughput": 4245.54, "total_tokens": 11513280} {"current_steps": 17635, "total_steps": 38160, "loss": 0.3657, "lr": 0.0006510070622938962, "epoch": 9.24266247379455, "percentage": 46.21, "elapsed_time": "0:45:12", "remaining_time": "0:52:37", "throughput": 4245.57, "total_tokens": 11516384} {"current_steps": 17640, "total_steps": 38160, "loss": 0.5291, "lr": 0.0006507890396414516, "epoch": 9.245283018867925, "percentage": 46.23, "elapsed_time": "0:45:13", "remaining_time": "0:52:36", "throughput": 4245.81, "total_tokens": 11520672} {"current_steps": 17645, "total_steps": 38160, "loss": 0.4949, "lr": 0.0006505709854456602, "epoch": 9.2479035639413, "percentage": 46.24, "elapsed_time": "0:45:14", "remaining_time": "0:52:35", "throughput": 4245.8, "total_tokens": 11523456} {"current_steps": 17650, "total_steps": 38160, "loss": 0.3615, "lr": 0.0006503528997521365, "epoch": 9.250524109014675, "percentage": 46.25, "elapsed_time": "0:45:14", "remaining_time": "0:52:34", "throughput": 4245.77, "total_tokens": 11526240} {"current_steps": 17655, "total_steps": 38160, "loss": 0.4596, "lr": 0.0006501347826065017, "epoch": 9.25314465408805, "percentage": 46.27, "elapsed_time": "0:45:15", "remaining_time": "0:52:34", "throughput": 4246.08, "total_tokens": 11531040} {"current_steps": 17660, "total_steps": 38160, "loss": 0.4566, "lr": 0.000649916634054383, "epoch": 9.255765199161425, "percentage": 46.28, "elapsed_time": "0:45:16", "remaining_time": "0:52:33", "throughput": 4246.1, "total_tokens": 11533984} {"current_steps": 17665, "total_steps": 38160, "loss": 0.4464, "lr": 0.0006496984541414147, "epoch": 9.2583857442348, "percentage": 46.29, "elapsed_time": "0:45:17", "remaining_time": "0:52:32", "throughput": 4246.15, "total_tokens": 11537248} {"current_steps": 17670, "total_steps": 38160, "loss": 0.4544, "lr": 0.0006494802429132378, "epoch": 9.261006289308176, "percentage": 46.31, "elapsed_time": "0:45:17", "remaining_time": "0:52:31", "throughput": 4246.19, "total_tokens": 11540384} {"current_steps": 17675, "total_steps": 38160, "loss": 0.537, "lr": 0.0006492620004154993, "epoch": 9.26362683438155, "percentage": 46.32, "elapsed_time": "0:45:18", "remaining_time": "0:52:30", "throughput": 4246.23, "total_tokens": 11543424} {"current_steps": 17680, "total_steps": 38160, "loss": 0.4478, "lr": 0.0006490437266938534, "epoch": 9.266247379454926, "percentage": 46.33, "elapsed_time": "0:45:19", "remaining_time": "0:52:29", "throughput": 4246.37, "total_tokens": 11547136} {"current_steps": 17685, "total_steps": 38160, "loss": 0.5558, "lr": 0.0006488254217939601, "epoch": 9.268867924528301, "percentage": 46.34, "elapsed_time": "0:45:20", "remaining_time": "0:52:29", "throughput": 4246.46, "total_tokens": 11550528} {"current_steps": 17690, "total_steps": 38160, "loss": 0.3497, "lr": 0.0006486070857614863, "epoch": 9.271488469601676, "percentage": 46.36, "elapsed_time": "0:45:20", "remaining_time": "0:52:28", "throughput": 4246.45, "total_tokens": 11553440} {"current_steps": 17695, "total_steps": 38160, "loss": 0.3508, "lr": 0.0006483887186421059, "epoch": 9.274109014675052, "percentage": 46.37, "elapsed_time": "0:45:21", "remaining_time": "0:52:27", "throughput": 4246.59, "total_tokens": 11557184} {"current_steps": 17700, "total_steps": 38160, "loss": 0.4037, "lr": 0.0006481703204814982, "epoch": 9.276729559748428, "percentage": 46.38, "elapsed_time": "0:45:22", "remaining_time": "0:52:26", "throughput": 4246.65, "total_tokens": 11560416} {"current_steps": 17705, "total_steps": 38160, "loss": 0.4584, "lr": 0.00064795189132535, "epoch": 9.279350104821804, "percentage": 46.4, "elapsed_time": "0:45:22", "remaining_time": "0:52:25", "throughput": 4246.72, "total_tokens": 11563712} {"current_steps": 17710, "total_steps": 38160, "loss": 0.5034, "lr": 0.000647733431219354, "epoch": 9.281970649895179, "percentage": 46.41, "elapsed_time": "0:45:23", "remaining_time": "0:52:25", "throughput": 4246.92, "total_tokens": 11567776} {"current_steps": 17715, "total_steps": 38160, "loss": 0.4866, "lr": 0.0006475149402092097, "epoch": 9.284591194968554, "percentage": 46.42, "elapsed_time": "0:45:24", "remaining_time": "0:52:24", "throughput": 4247.05, "total_tokens": 11571456} {"current_steps": 17720, "total_steps": 38160, "loss": 0.453, "lr": 0.0006472964183406229, "epoch": 9.28721174004193, "percentage": 46.44, "elapsed_time": "0:45:25", "remaining_time": "0:52:23", "throughput": 4247.2, "total_tokens": 11575136} {"current_steps": 17725, "total_steps": 38160, "loss": 0.4626, "lr": 0.0006470778656593055, "epoch": 9.289832285115304, "percentage": 46.45, "elapsed_time": "0:45:26", "remaining_time": "0:52:22", "throughput": 4247.34, "total_tokens": 11578880} {"current_steps": 17730, "total_steps": 38160, "loss": 0.3178, "lr": 0.0006468592822109769, "epoch": 9.29245283018868, "percentage": 46.46, "elapsed_time": "0:45:26", "remaining_time": "0:52:22", "throughput": 4247.35, "total_tokens": 11581792} {"current_steps": 17735, "total_steps": 38160, "loss": 0.5677, "lr": 0.0006466406680413619, "epoch": 9.295073375262055, "percentage": 46.48, "elapsed_time": "0:45:27", "remaining_time": "0:52:21", "throughput": 4247.35, "total_tokens": 11584704} {"current_steps": 17740, "total_steps": 38160, "loss": 0.5597, "lr": 0.000646422023196192, "epoch": 9.29769392033543, "percentage": 46.49, "elapsed_time": "0:45:28", "remaining_time": "0:52:20", "throughput": 4247.42, "total_tokens": 11587936} {"current_steps": 17745, "total_steps": 38160, "loss": 0.5186, "lr": 0.0006462033477212054, "epoch": 9.300314465408805, "percentage": 46.5, "elapsed_time": "0:45:28", "remaining_time": "0:52:19", "throughput": 4247.48, "total_tokens": 11591232} {"current_steps": 17750, "total_steps": 38160, "loss": 0.6321, "lr": 0.0006459846416621462, "epoch": 9.30293501048218, "percentage": 46.51, "elapsed_time": "0:45:29", "remaining_time": "0:52:18", "throughput": 4247.58, "total_tokens": 11594656} {"current_steps": 17755, "total_steps": 38160, "loss": 0.3889, "lr": 0.0006457659050647657, "epoch": 9.305555555555555, "percentage": 46.53, "elapsed_time": "0:45:30", "remaining_time": "0:52:17", "throughput": 4247.66, "total_tokens": 11598016} {"current_steps": 17760, "total_steps": 38160, "loss": 0.3637, "lr": 0.0006455471379748208, "epoch": 9.30817610062893, "percentage": 46.54, "elapsed_time": "0:45:31", "remaining_time": "0:52:17", "throughput": 4247.73, "total_tokens": 11601312} {"current_steps": 17765, "total_steps": 38160, "loss": 0.5366, "lr": 0.000645328340438075, "epoch": 9.310796645702306, "percentage": 46.55, "elapsed_time": "0:45:31", "remaining_time": "0:52:16", "throughput": 4247.86, "total_tokens": 11604896} {"current_steps": 17770, "total_steps": 38160, "loss": 0.4307, "lr": 0.0006451095125002985, "epoch": 9.31341719077568, "percentage": 46.57, "elapsed_time": "0:45:32", "remaining_time": "0:52:15", "throughput": 4247.87, "total_tokens": 11607840} {"current_steps": 17775, "total_steps": 38160, "loss": 0.4101, "lr": 0.0006448906542072674, "epoch": 9.316037735849056, "percentage": 46.58, "elapsed_time": "0:45:33", "remaining_time": "0:52:14", "throughput": 4247.98, "total_tokens": 11611392} {"current_steps": 17780, "total_steps": 38160, "loss": 0.4007, "lr": 0.0006446717656047645, "epoch": 9.318658280922431, "percentage": 46.59, "elapsed_time": "0:45:34", "remaining_time": "0:52:13", "throughput": 4248.06, "total_tokens": 11614752} {"current_steps": 17785, "total_steps": 38160, "loss": 0.4292, "lr": 0.0006444528467385789, "epoch": 9.321278825995806, "percentage": 46.61, "elapsed_time": "0:45:34", "remaining_time": "0:52:13", "throughput": 4248.08, "total_tokens": 11617728} {"current_steps": 17790, "total_steps": 38160, "loss": 0.4202, "lr": 0.0006442338976545054, "epoch": 9.323899371069182, "percentage": 46.62, "elapsed_time": "0:45:35", "remaining_time": "0:52:12", "throughput": 4248.11, "total_tokens": 11620736} {"current_steps": 17795, "total_steps": 38160, "loss": 0.5432, "lr": 0.0006440149183983461, "epoch": 9.326519916142558, "percentage": 46.63, "elapsed_time": "0:45:36", "remaining_time": "0:52:11", "throughput": 4248.13, "total_tokens": 11623744} {"current_steps": 17800, "total_steps": 38160, "loss": 0.4937, "lr": 0.0006437959090159093, "epoch": 9.329140461215934, "percentage": 46.65, "elapsed_time": "0:45:36", "remaining_time": "0:52:10", "throughput": 4248.11, "total_tokens": 11626496} {"current_steps": 17805, "total_steps": 38160, "loss": 0.3954, "lr": 0.0006435768695530085, "epoch": 9.331761006289309, "percentage": 46.66, "elapsed_time": "0:45:37", "remaining_time": "0:52:09", "throughput": 4248.13, "total_tokens": 11629504} {"current_steps": 17810, "total_steps": 38160, "loss": 0.4905, "lr": 0.0006433578000554645, "epoch": 9.334381551362684, "percentage": 46.67, "elapsed_time": "0:45:38", "remaining_time": "0:52:08", "throughput": 4248.13, "total_tokens": 11632384} {"current_steps": 17815, "total_steps": 38160, "loss": 0.3967, "lr": 0.0006431387005691045, "epoch": 9.33700209643606, "percentage": 46.69, "elapsed_time": "0:45:38", "remaining_time": "0:52:07", "throughput": 4248.19, "total_tokens": 11635616} {"current_steps": 17820, "total_steps": 38160, "loss": 0.4282, "lr": 0.0006429195711397611, "epoch": 9.339622641509434, "percentage": 46.7, "elapsed_time": "0:45:39", "remaining_time": "0:52:07", "throughput": 4248.26, "total_tokens": 11638912} {"current_steps": 17825, "total_steps": 38160, "loss": 0.4906, "lr": 0.0006427004118132742, "epoch": 9.34224318658281, "percentage": 46.71, "elapsed_time": "0:45:40", "remaining_time": "0:52:06", "throughput": 4248.36, "total_tokens": 11642432} {"current_steps": 17830, "total_steps": 38160, "loss": 0.4082, "lr": 0.0006424812226354889, "epoch": 9.344863731656185, "percentage": 46.72, "elapsed_time": "0:45:41", "remaining_time": "0:52:05", "throughput": 4248.32, "total_tokens": 11645120} {"current_steps": 17835, "total_steps": 38160, "loss": 0.4082, "lr": 0.0006422620036522574, "epoch": 9.34748427672956, "percentage": 46.74, "elapsed_time": "0:45:41", "remaining_time": "0:52:04", "throughput": 4248.23, "total_tokens": 11647456} {"current_steps": 17840, "total_steps": 38160, "loss": 0.472, "lr": 0.000642042754909438, "epoch": 9.350104821802935, "percentage": 46.75, "elapsed_time": "0:45:42", "remaining_time": "0:52:03", "throughput": 4248.34, "total_tokens": 11650976} {"current_steps": 17845, "total_steps": 38160, "loss": 0.4425, "lr": 0.0006418234764528945, "epoch": 9.35272536687631, "percentage": 46.76, "elapsed_time": "0:45:43", "remaining_time": "0:52:02", "throughput": 4248.42, "total_tokens": 11654304} {"current_steps": 17850, "total_steps": 38160, "loss": 0.5073, "lr": 0.0006416041683284978, "epoch": 9.355345911949685, "percentage": 46.78, "elapsed_time": "0:45:44", "remaining_time": "0:52:02", "throughput": 4248.65, "total_tokens": 11658592} {"current_steps": 17855, "total_steps": 38160, "loss": 0.5415, "lr": 0.0006413848305821246, "epoch": 9.35796645702306, "percentage": 46.79, "elapsed_time": "0:45:44", "remaining_time": "0:52:01", "throughput": 4248.81, "total_tokens": 11662464} {"current_steps": 17860, "total_steps": 38160, "loss": 0.3913, "lr": 0.0006411654632596578, "epoch": 9.360587002096436, "percentage": 46.8, "elapsed_time": "0:45:45", "remaining_time": "0:52:00", "throughput": 4248.79, "total_tokens": 11665248} {"current_steps": 17865, "total_steps": 38160, "loss": 0.5148, "lr": 0.0006409460664069867, "epoch": 9.36320754716981, "percentage": 46.82, "elapsed_time": "0:45:46", "remaining_time": "0:51:59", "throughput": 4248.79, "total_tokens": 11668256} {"current_steps": 17870, "total_steps": 38160, "loss": 0.49, "lr": 0.0006407266400700064, "epoch": 9.365828092243186, "percentage": 46.83, "elapsed_time": "0:45:46", "remaining_time": "0:51:58", "throughput": 4248.8, "total_tokens": 11671264} {"current_steps": 17875, "total_steps": 38160, "loss": 0.6437, "lr": 0.0006405071842946185, "epoch": 9.368448637316561, "percentage": 46.84, "elapsed_time": "0:45:47", "remaining_time": "0:51:58", "throughput": 4248.74, "total_tokens": 11673728} {"current_steps": 17880, "total_steps": 38160, "loss": 0.3963, "lr": 0.0006402876991267308, "epoch": 9.371069182389936, "percentage": 46.86, "elapsed_time": "0:45:48", "remaining_time": "0:51:57", "throughput": 4248.79, "total_tokens": 11676960} {"current_steps": 17885, "total_steps": 38160, "loss": 0.5067, "lr": 0.0006400681846122568, "epoch": 9.373689727463312, "percentage": 46.87, "elapsed_time": "0:45:49", "remaining_time": "0:51:56", "throughput": 4249.04, "total_tokens": 11681440} {"current_steps": 17890, "total_steps": 38160, "loss": 0.4297, "lr": 0.0006398486407971166, "epoch": 9.376310272536688, "percentage": 46.88, "elapsed_time": "0:45:49", "remaining_time": "0:51:55", "throughput": 4249.06, "total_tokens": 11684544} {"current_steps": 17895, "total_steps": 38160, "loss": 0.4524, "lr": 0.0006396290677272361, "epoch": 9.378930817610064, "percentage": 46.89, "elapsed_time": "0:45:50", "remaining_time": "0:51:54", "throughput": 4249.08, "total_tokens": 11687584} {"current_steps": 17900, "total_steps": 38160, "loss": 0.3579, "lr": 0.0006394094654485477, "epoch": 9.381551362683439, "percentage": 46.91, "elapsed_time": "0:45:51", "remaining_time": "0:51:54", "throughput": 4249.15, "total_tokens": 11690944} {"current_steps": 17905, "total_steps": 38160, "loss": 0.4297, "lr": 0.0006391898340069896, "epoch": 9.384171907756814, "percentage": 46.92, "elapsed_time": "0:45:52", "remaining_time": "0:51:53", "throughput": 4249.2, "total_tokens": 11694112} {"current_steps": 17910, "total_steps": 38160, "loss": 0.4811, "lr": 0.0006389701734485061, "epoch": 9.38679245283019, "percentage": 46.93, "elapsed_time": "0:45:52", "remaining_time": "0:51:52", "throughput": 4249.25, "total_tokens": 11697376} {"current_steps": 17915, "total_steps": 38160, "loss": 0.3756, "lr": 0.0006387504838190479, "epoch": 9.389412997903564, "percentage": 46.95, "elapsed_time": "0:45:53", "remaining_time": "0:51:51", "throughput": 4249.34, "total_tokens": 11700832} {"current_steps": 17920, "total_steps": 38160, "loss": 0.4153, "lr": 0.0006385307651645715, "epoch": 9.39203354297694, "percentage": 46.96, "elapsed_time": "0:45:54", "remaining_time": "0:51:50", "throughput": 4249.31, "total_tokens": 11703520} {"current_steps": 17925, "total_steps": 38160, "loss": 0.4333, "lr": 0.0006383110175310393, "epoch": 9.394654088050315, "percentage": 46.97, "elapsed_time": "0:45:54", "remaining_time": "0:51:49", "throughput": 4249.43, "total_tokens": 11707008} {"current_steps": 17930, "total_steps": 38160, "loss": 0.3417, "lr": 0.0006380912409644202, "epoch": 9.39727463312369, "percentage": 46.99, "elapsed_time": "0:45:55", "remaining_time": "0:51:49", "throughput": 4249.35, "total_tokens": 11709408} {"current_steps": 17935, "total_steps": 38160, "loss": 0.4003, "lr": 0.000637871435510689, "epoch": 9.399895178197065, "percentage": 47.0, "elapsed_time": "0:45:56", "remaining_time": "0:51:48", "throughput": 4249.31, "total_tokens": 11712000} {"current_steps": 17940, "total_steps": 38160, "loss": 0.5248, "lr": 0.0006376516012158262, "epoch": 9.40251572327044, "percentage": 47.01, "elapsed_time": "0:45:57", "remaining_time": "0:51:47", "throughput": 4249.54, "total_tokens": 11716064} {"current_steps": 17945, "total_steps": 38160, "loss": 0.3821, "lr": 0.000637431738125819, "epoch": 9.405136268343815, "percentage": 47.03, "elapsed_time": "0:45:57", "remaining_time": "0:51:46", "throughput": 4249.69, "total_tokens": 11719776} {"current_steps": 17950, "total_steps": 38160, "loss": 0.3775, "lr": 0.00063721184628666, "epoch": 9.40775681341719, "percentage": 47.04, "elapsed_time": "0:45:58", "remaining_time": "0:51:45", "throughput": 4249.73, "total_tokens": 11722880} {"current_steps": 17955, "total_steps": 38160, "loss": 0.6267, "lr": 0.0006369919257443484, "epoch": 9.410377358490566, "percentage": 47.05, "elapsed_time": "0:45:59", "remaining_time": "0:51:44", "throughput": 4249.73, "total_tokens": 11725824} {"current_steps": 17960, "total_steps": 38160, "loss": 0.5323, "lr": 0.0006367719765448886, "epoch": 9.41299790356394, "percentage": 47.06, "elapsed_time": "0:45:59", "remaining_time": "0:51:44", "throughput": 4249.69, "total_tokens": 11728480} {"current_steps": 17965, "total_steps": 38160, "loss": 0.4175, "lr": 0.0006365519987342916, "epoch": 9.415618448637316, "percentage": 47.08, "elapsed_time": "0:46:00", "remaining_time": "0:51:43", "throughput": 4249.63, "total_tokens": 11731040} {"current_steps": 17970, "total_steps": 38160, "loss": 0.3584, "lr": 0.0006363319923585746, "epoch": 9.418238993710691, "percentage": 47.09, "elapsed_time": "0:46:01", "remaining_time": "0:51:42", "throughput": 4249.58, "total_tokens": 11733664} {"current_steps": 17975, "total_steps": 38160, "loss": 0.3899, "lr": 0.0006361119574637599, "epoch": 9.420859538784066, "percentage": 47.1, "elapsed_time": "0:46:01", "remaining_time": "0:51:41", "throughput": 4249.68, "total_tokens": 11737216} {"current_steps": 17980, "total_steps": 38160, "loss": 0.4147, "lr": 0.0006358918940958767, "epoch": 9.423480083857442, "percentage": 47.12, "elapsed_time": "0:46:02", "remaining_time": "0:51:40", "throughput": 4249.82, "total_tokens": 11740864} {"current_steps": 17985, "total_steps": 38160, "loss": 0.4078, "lr": 0.0006356718023009597, "epoch": 9.426100628930818, "percentage": 47.13, "elapsed_time": "0:46:03", "remaining_time": "0:51:39", "throughput": 4249.84, "total_tokens": 11743776} {"current_steps": 17990, "total_steps": 38160, "loss": 0.4311, "lr": 0.0006354516821250492, "epoch": 9.428721174004194, "percentage": 47.14, "elapsed_time": "0:46:04", "remaining_time": "0:51:39", "throughput": 4249.99, "total_tokens": 11747552} {"current_steps": 17995, "total_steps": 38160, "loss": 0.4625, "lr": 0.0006352315336141923, "epoch": 9.431341719077569, "percentage": 47.16, "elapsed_time": "0:46:04", "remaining_time": "0:51:38", "throughput": 4250.05, "total_tokens": 11750656} {"current_steps": 18000, "total_steps": 38160, "loss": 0.3756, "lr": 0.0006350113568144414, "epoch": 9.433962264150944, "percentage": 47.17, "elapsed_time": "0:46:05", "remaining_time": "0:51:37", "throughput": 4250.09, "total_tokens": 11753888} {"current_steps": 18005, "total_steps": 38160, "loss": 0.4388, "lr": 0.0006347911517718547, "epoch": 9.43658280922432, "percentage": 47.18, "elapsed_time": "0:46:06", "remaining_time": "0:51:36", "throughput": 4250.13, "total_tokens": 11757184} {"current_steps": 18010, "total_steps": 38160, "loss": 0.3986, "lr": 0.0006345709185324972, "epoch": 9.439203354297694, "percentage": 47.2, "elapsed_time": "0:46:06", "remaining_time": "0:51:35", "throughput": 4250.11, "total_tokens": 11759936} {"current_steps": 18015, "total_steps": 38160, "loss": 0.4426, "lr": 0.0006343506571424386, "epoch": 9.44182389937107, "percentage": 47.21, "elapsed_time": "0:46:07", "remaining_time": "0:51:34", "throughput": 4250.11, "total_tokens": 11762816} {"current_steps": 18020, "total_steps": 38160, "loss": 0.3908, "lr": 0.0006341303676477552, "epoch": 9.444444444444445, "percentage": 47.22, "elapsed_time": "0:46:08", "remaining_time": "0:51:34", "throughput": 4250.13, "total_tokens": 11765824} {"current_steps": 18025, "total_steps": 38160, "loss": 0.405, "lr": 0.0006339100500945293, "epoch": 9.44706498951782, "percentage": 47.24, "elapsed_time": "0:46:09", "remaining_time": "0:51:33", "throughput": 4250.2, "total_tokens": 11769056} {"current_steps": 18030, "total_steps": 38160, "loss": 0.3687, "lr": 0.0006336897045288486, "epoch": 9.449685534591195, "percentage": 47.25, "elapsed_time": "0:46:09", "remaining_time": "0:51:32", "throughput": 4250.18, "total_tokens": 11771808} {"current_steps": 18035, "total_steps": 38160, "loss": 0.3336, "lr": 0.0006334693309968068, "epoch": 9.45230607966457, "percentage": 47.26, "elapsed_time": "0:46:10", "remaining_time": "0:51:31", "throughput": 4250.19, "total_tokens": 11774720} {"current_steps": 18040, "total_steps": 38160, "loss": 0.4087, "lr": 0.0006332489295445038, "epoch": 9.454926624737945, "percentage": 47.27, "elapsed_time": "0:46:11", "remaining_time": "0:51:30", "throughput": 4250.18, "total_tokens": 11777664} {"current_steps": 18045, "total_steps": 38160, "loss": 0.3513, "lr": 0.0006330285002180448, "epoch": 9.45754716981132, "percentage": 47.29, "elapsed_time": "0:46:11", "remaining_time": "0:51:29", "throughput": 4250.37, "total_tokens": 11781696} {"current_steps": 18050, "total_steps": 38160, "loss": 0.4148, "lr": 0.0006328080430635412, "epoch": 9.460167714884696, "percentage": 47.3, "elapsed_time": "0:46:12", "remaining_time": "0:51:29", "throughput": 4250.38, "total_tokens": 11784672} {"current_steps": 18055, "total_steps": 38160, "loss": 0.4629, "lr": 0.0006325875581271103, "epoch": 9.46278825995807, "percentage": 47.31, "elapsed_time": "0:46:13", "remaining_time": "0:51:28", "throughput": 4250.35, "total_tokens": 11787424} {"current_steps": 18060, "total_steps": 38160, "loss": 0.4993, "lr": 0.0006323670454548749, "epoch": 9.465408805031446, "percentage": 47.33, "elapsed_time": "0:46:13", "remaining_time": "0:51:27", "throughput": 4250.27, "total_tokens": 11789824} {"current_steps": 18065, "total_steps": 38160, "loss": 0.2664, "lr": 0.0006321465050929635, "epoch": 9.468029350104821, "percentage": 47.34, "elapsed_time": "0:46:14", "remaining_time": "0:51:26", "throughput": 4250.36, "total_tokens": 11793120} {"current_steps": 18070, "total_steps": 38160, "loss": 0.4125, "lr": 0.000631925937087511, "epoch": 9.470649895178196, "percentage": 47.35, "elapsed_time": "0:46:15", "remaining_time": "0:51:25", "throughput": 4250.76, "total_tokens": 11798720} {"current_steps": 18075, "total_steps": 38160, "loss": 0.4333, "lr": 0.0006317053414846576, "epoch": 9.473270440251572, "percentage": 47.37, "elapsed_time": "0:46:16", "remaining_time": "0:51:25", "throughput": 4250.76, "total_tokens": 11801600} {"current_steps": 18080, "total_steps": 38160, "loss": 0.3446, "lr": 0.0006314847183305492, "epoch": 9.475890985324948, "percentage": 47.38, "elapsed_time": "0:46:17", "remaining_time": "0:51:24", "throughput": 4250.77, "total_tokens": 11804640} {"current_steps": 18085, "total_steps": 38160, "loss": 0.4281, "lr": 0.0006312640676713378, "epoch": 9.478511530398324, "percentage": 47.39, "elapsed_time": "0:46:17", "remaining_time": "0:51:23", "throughput": 4250.72, "total_tokens": 11807296} {"current_steps": 18090, "total_steps": 38160, "loss": 0.3211, "lr": 0.0006310433895531811, "epoch": 9.481132075471699, "percentage": 47.41, "elapsed_time": "0:46:18", "remaining_time": "0:51:22", "throughput": 4250.67, "total_tokens": 11809920} {"current_steps": 18095, "total_steps": 38160, "loss": 0.393, "lr": 0.0006308226840222422, "epoch": 9.483752620545074, "percentage": 47.42, "elapsed_time": "0:46:19", "remaining_time": "0:51:21", "throughput": 4250.79, "total_tokens": 11813440} {"current_steps": 18100, "total_steps": 38160, "loss": 0.4736, "lr": 0.0006306019511246905, "epoch": 9.48637316561845, "percentage": 47.43, "elapsed_time": "0:46:19", "remaining_time": "0:51:20", "throughput": 4250.97, "total_tokens": 11817440} {"current_steps": 18105, "total_steps": 38160, "loss": 0.508, "lr": 0.0006303811909067003, "epoch": 9.488993710691824, "percentage": 47.44, "elapsed_time": "0:46:20", "remaining_time": "0:51:20", "throughput": 4250.96, "total_tokens": 11820192} {"current_steps": 18110, "total_steps": 38160, "loss": 0.5523, "lr": 0.0006301604034144527, "epoch": 9.4916142557652, "percentage": 47.46, "elapsed_time": "0:46:21", "remaining_time": "0:51:19", "throughput": 4251.15, "total_tokens": 11824192} {"current_steps": 18115, "total_steps": 38160, "loss": 0.6074, "lr": 0.0006299395886941336, "epoch": 9.494234800838575, "percentage": 47.47, "elapsed_time": "0:46:22", "remaining_time": "0:51:18", "throughput": 4251.13, "total_tokens": 11826944} {"current_steps": 18120, "total_steps": 38160, "loss": 0.3949, "lr": 0.0006297187467919347, "epoch": 9.49685534591195, "percentage": 47.48, "elapsed_time": "0:46:22", "remaining_time": "0:51:17", "throughput": 4251.29, "total_tokens": 11830784} {"current_steps": 18125, "total_steps": 38160, "loss": 0.5939, "lr": 0.0006294978777540542, "epoch": 9.499475890985325, "percentage": 47.5, "elapsed_time": "0:46:23", "remaining_time": "0:51:16", "throughput": 4251.25, "total_tokens": 11833632} {"current_steps": 18130, "total_steps": 38160, "loss": 0.5765, "lr": 0.000629276981626695, "epoch": 9.5020964360587, "percentage": 47.51, "elapsed_time": "0:46:24", "remaining_time": "0:51:16", "throughput": 4251.33, "total_tokens": 11837056} {"current_steps": 18135, "total_steps": 38160, "loss": 0.3688, "lr": 0.0006290560584560661, "epoch": 9.504716981132075, "percentage": 47.52, "elapsed_time": "0:46:25", "remaining_time": "0:51:15", "throughput": 4251.47, "total_tokens": 11840736} {"current_steps": 18140, "total_steps": 38160, "loss": 0.6368, "lr": 0.0006288351082883822, "epoch": 9.50733752620545, "percentage": 47.54, "elapsed_time": "0:46:25", "remaining_time": "0:51:14", "throughput": 4251.42, "total_tokens": 11843328} {"current_steps": 18145, "total_steps": 38160, "loss": 0.5202, "lr": 0.0006286141311698633, "epoch": 9.509958071278826, "percentage": 47.55, "elapsed_time": "0:46:26", "remaining_time": "0:51:13", "throughput": 4251.52, "total_tokens": 11846784} {"current_steps": 18150, "total_steps": 38160, "loss": 0.4909, "lr": 0.0006283931271467355, "epoch": 9.5125786163522, "percentage": 47.56, "elapsed_time": "0:46:27", "remaining_time": "0:51:12", "throughput": 4251.56, "total_tokens": 11849984} {"current_steps": 18155, "total_steps": 38160, "loss": 0.4899, "lr": 0.0006281720962652305, "epoch": 9.515199161425576, "percentage": 47.58, "elapsed_time": "0:46:27", "remaining_time": "0:51:11", "throughput": 4251.59, "total_tokens": 11852992} {"current_steps": 18160, "total_steps": 38160, "loss": 0.4324, "lr": 0.0006279510385715849, "epoch": 9.517819706498951, "percentage": 47.59, "elapsed_time": "0:46:28", "remaining_time": "0:51:11", "throughput": 4251.58, "total_tokens": 11855776} {"current_steps": 18165, "total_steps": 38160, "loss": 0.3441, "lr": 0.0006277299541120419, "epoch": 9.520440251572326, "percentage": 47.6, "elapsed_time": "0:46:29", "remaining_time": "0:51:10", "throughput": 4251.64, "total_tokens": 11859008} {"current_steps": 18170, "total_steps": 38160, "loss": 0.3677, "lr": 0.0006275088429328499, "epoch": 9.523060796645701, "percentage": 47.62, "elapsed_time": "0:46:29", "remaining_time": "0:51:09", "throughput": 4251.59, "total_tokens": 11861632} {"current_steps": 18175, "total_steps": 38160, "loss": 0.3724, "lr": 0.0006272877050802623, "epoch": 9.525681341719078, "percentage": 47.63, "elapsed_time": "0:46:30", "remaining_time": "0:51:08", "throughput": 4251.65, "total_tokens": 11864864} {"current_steps": 18180, "total_steps": 38160, "loss": 0.5091, "lr": 0.0006270665406005393, "epoch": 9.528301886792454, "percentage": 47.64, "elapsed_time": "0:46:31", "remaining_time": "0:51:07", "throughput": 4251.72, "total_tokens": 11868224} {"current_steps": 18185, "total_steps": 38160, "loss": 0.4933, "lr": 0.0006268453495399455, "epoch": 9.530922431865829, "percentage": 47.65, "elapsed_time": "0:46:32", "remaining_time": "0:51:06", "throughput": 4251.71, "total_tokens": 11871072} {"current_steps": 18190, "total_steps": 38160, "loss": 0.4153, "lr": 0.0006266241319447517, "epoch": 9.533542976939204, "percentage": 47.67, "elapsed_time": "0:46:32", "remaining_time": "0:51:06", "throughput": 4251.7, "total_tokens": 11873888} {"current_steps": 18195, "total_steps": 38160, "loss": 0.3935, "lr": 0.0006264028878612343, "epoch": 9.536163522012579, "percentage": 47.68, "elapsed_time": "0:46:33", "remaining_time": "0:51:05", "throughput": 4251.66, "total_tokens": 11876608} {"current_steps": 18200, "total_steps": 38160, "loss": 0.4113, "lr": 0.0006261816173356746, "epoch": 9.538784067085954, "percentage": 47.69, "elapsed_time": "0:46:34", "remaining_time": "0:51:04", "throughput": 4251.9, "total_tokens": 11880864} {"current_steps": 18205, "total_steps": 38160, "loss": 0.4316, "lr": 0.0006259603204143602, "epoch": 9.54140461215933, "percentage": 47.71, "elapsed_time": "0:46:34", "remaining_time": "0:51:03", "throughput": 4251.86, "total_tokens": 11883520} {"current_steps": 18210, "total_steps": 38160, "loss": 0.3629, "lr": 0.0006257389971435839, "epoch": 9.544025157232705, "percentage": 47.72, "elapsed_time": "0:46:35", "remaining_time": "0:51:02", "throughput": 4251.98, "total_tokens": 11887168} {"current_steps": 18215, "total_steps": 38160, "loss": 0.6092, "lr": 0.0006255176475696437, "epoch": 9.54664570230608, "percentage": 47.73, "elapsed_time": "0:46:36", "remaining_time": "0:51:02", "throughput": 4252.13, "total_tokens": 11890976} {"current_steps": 18220, "total_steps": 38160, "loss": 0.4574, "lr": 0.0006252962717388438, "epoch": 9.549266247379455, "percentage": 47.75, "elapsed_time": "0:46:37", "remaining_time": "0:51:01", "throughput": 4252.12, "total_tokens": 11893888} {"current_steps": 18225, "total_steps": 38160, "loss": 0.437, "lr": 0.0006250748696974932, "epoch": 9.55188679245283, "percentage": 47.76, "elapsed_time": "0:46:37", "remaining_time": "0:51:00", "throughput": 4252.09, "total_tokens": 11896704} {"current_steps": 18230, "total_steps": 38160, "loss": 0.5422, "lr": 0.0006248534414919067, "epoch": 9.554507337526205, "percentage": 47.77, "elapsed_time": "0:46:38", "remaining_time": "0:50:59", "throughput": 4252.27, "total_tokens": 11900736} {"current_steps": 18235, "total_steps": 38160, "loss": 0.5102, "lr": 0.0006246319871684047, "epoch": 9.55712788259958, "percentage": 47.79, "elapsed_time": "0:46:39", "remaining_time": "0:50:58", "throughput": 4252.35, "total_tokens": 11904160} {"current_steps": 18240, "total_steps": 38160, "loss": 0.3785, "lr": 0.000624410506773313, "epoch": 9.559748427672956, "percentage": 47.8, "elapsed_time": "0:46:40", "remaining_time": "0:50:58", "throughput": 4252.38, "total_tokens": 11907200} {"current_steps": 18245, "total_steps": 38160, "loss": 0.3849, "lr": 0.0006241890003529626, "epoch": 9.56236897274633, "percentage": 47.81, "elapsed_time": "0:46:40", "remaining_time": "0:50:57", "throughput": 4252.43, "total_tokens": 11910368} {"current_steps": 18250, "total_steps": 38160, "loss": 0.4808, "lr": 0.00062396746795369, "epoch": 9.564989517819706, "percentage": 47.82, "elapsed_time": "0:46:41", "remaining_time": "0:50:56", "throughput": 4252.47, "total_tokens": 11913472} {"current_steps": 18255, "total_steps": 38160, "loss": 0.3612, "lr": 0.0006237459096218375, "epoch": 9.567610062893081, "percentage": 47.84, "elapsed_time": "0:46:42", "remaining_time": "0:50:55", "throughput": 4252.64, "total_tokens": 11917280} {"current_steps": 18260, "total_steps": 38160, "loss": 0.3867, "lr": 0.0006235243254037525, "epoch": 9.570230607966456, "percentage": 47.85, "elapsed_time": "0:46:42", "remaining_time": "0:50:54", "throughput": 4252.58, "total_tokens": 11919744} {"current_steps": 18265, "total_steps": 38160, "loss": 0.5394, "lr": 0.0006233027153457878, "epoch": 9.572851153039831, "percentage": 47.86, "elapsed_time": "0:46:43", "remaining_time": "0:50:54", "throughput": 4252.82, "total_tokens": 11924096} {"current_steps": 18270, "total_steps": 38160, "loss": 0.3567, "lr": 0.0006230810794943017, "epoch": 9.575471698113208, "percentage": 47.88, "elapsed_time": "0:46:44", "remaining_time": "0:50:53", "throughput": 4252.95, "total_tokens": 11927744} {"current_steps": 18275, "total_steps": 38160, "loss": 0.4368, "lr": 0.0006228594178956581, "epoch": 9.578092243186584, "percentage": 47.89, "elapsed_time": "0:46:45", "remaining_time": "0:50:52", "throughput": 4252.9, "total_tokens": 11930368} {"current_steps": 18280, "total_steps": 38160, "loss": 0.4779, "lr": 0.0006226377305962259, "epoch": 9.580712788259959, "percentage": 47.9, "elapsed_time": "0:46:45", "remaining_time": "0:50:51", "throughput": 4252.91, "total_tokens": 11933344} {"current_steps": 18285, "total_steps": 38160, "loss": 0.3595, "lr": 0.0006224160176423796, "epoch": 9.583333333333334, "percentage": 47.92, "elapsed_time": "0:46:46", "remaining_time": "0:50:50", "throughput": 4253.03, "total_tokens": 11936992} {"current_steps": 18290, "total_steps": 38160, "loss": 0.4649, "lr": 0.0006221942790804989, "epoch": 9.585953878406709, "percentage": 47.93, "elapsed_time": "0:46:47", "remaining_time": "0:50:49", "throughput": 4253.09, "total_tokens": 11940288} {"current_steps": 18295, "total_steps": 38160, "loss": 0.3841, "lr": 0.0006219725149569691, "epoch": 9.588574423480084, "percentage": 47.94, "elapsed_time": "0:46:48", "remaining_time": "0:50:49", "throughput": 4253.06, "total_tokens": 11943072} {"current_steps": 18300, "total_steps": 38160, "loss": 0.364, "lr": 0.0006217507253181809, "epoch": 9.59119496855346, "percentage": 47.96, "elapsed_time": "0:46:48", "remaining_time": "0:50:48", "throughput": 4253.08, "total_tokens": 11946016} {"current_steps": 18305, "total_steps": 38160, "loss": 0.4827, "lr": 0.0006215289102105297, "epoch": 9.593815513626835, "percentage": 47.97, "elapsed_time": "0:46:49", "remaining_time": "0:50:47", "throughput": 4253.14, "total_tokens": 11949280} {"current_steps": 18310, "total_steps": 38160, "loss": 0.4042, "lr": 0.0006213070696804171, "epoch": 9.59643605870021, "percentage": 47.98, "elapsed_time": "0:46:50", "remaining_time": "0:50:46", "throughput": 4253.32, "total_tokens": 11953216} {"current_steps": 18315, "total_steps": 38160, "loss": 0.432, "lr": 0.0006210852037742495, "epoch": 9.599056603773585, "percentage": 48.0, "elapsed_time": "0:46:51", "remaining_time": "0:50:45", "throughput": 4253.36, "total_tokens": 11956320} {"current_steps": 18320, "total_steps": 38160, "loss": 0.4475, "lr": 0.0006208633125384385, "epoch": 9.60167714884696, "percentage": 48.01, "elapsed_time": "0:46:51", "remaining_time": "0:50:44", "throughput": 4253.36, "total_tokens": 11959104} {"current_steps": 18325, "total_steps": 38160, "loss": 0.4096, "lr": 0.0006206413960194017, "epoch": 9.604297693920335, "percentage": 48.02, "elapsed_time": "0:46:52", "remaining_time": "0:50:44", "throughput": 4253.4, "total_tokens": 11962208} {"current_steps": 18330, "total_steps": 38160, "loss": 0.5802, "lr": 0.000620419454263561, "epoch": 9.60691823899371, "percentage": 48.03, "elapsed_time": "0:46:53", "remaining_time": "0:50:43", "throughput": 4253.37, "total_tokens": 11964832} {"current_steps": 18335, "total_steps": 38160, "loss": 0.6494, "lr": 0.0006201974873173443, "epoch": 9.609538784067086, "percentage": 48.05, "elapsed_time": "0:46:53", "remaining_time": "0:50:42", "throughput": 4253.41, "total_tokens": 11968000} {"current_steps": 18340, "total_steps": 38160, "loss": 0.5862, "lr": 0.0006199754952271847, "epoch": 9.61215932914046, "percentage": 48.06, "elapsed_time": "0:46:54", "remaining_time": "0:50:41", "throughput": 4253.42, "total_tokens": 11970912} {"current_steps": 18345, "total_steps": 38160, "loss": 0.3364, "lr": 0.00061975347803952, "epoch": 9.614779874213836, "percentage": 48.07, "elapsed_time": "0:46:55", "remaining_time": "0:50:40", "throughput": 4253.36, "total_tokens": 11973472} {"current_steps": 18350, "total_steps": 38160, "loss": 0.4695, "lr": 0.000619531435800794, "epoch": 9.617400419287211, "percentage": 48.09, "elapsed_time": "0:46:55", "remaining_time": "0:50:39", "throughput": 4253.45, "total_tokens": 11976864} {"current_steps": 18355, "total_steps": 38160, "loss": 0.5272, "lr": 0.0006193093685574553, "epoch": 9.620020964360586, "percentage": 48.1, "elapsed_time": "0:46:56", "remaining_time": "0:50:38", "throughput": 4253.47, "total_tokens": 11979872} {"current_steps": 18360, "total_steps": 38160, "loss": 0.4272, "lr": 0.0006190872763559578, "epoch": 9.622641509433961, "percentage": 48.11, "elapsed_time": "0:46:57", "remaining_time": "0:50:38", "throughput": 4253.54, "total_tokens": 11983168} {"current_steps": 18365, "total_steps": 38160, "loss": 0.4552, "lr": 0.0006188651592427609, "epoch": 9.625262054507338, "percentage": 48.13, "elapsed_time": "0:46:57", "remaining_time": "0:50:37", "throughput": 4253.61, "total_tokens": 11986432} {"current_steps": 18370, "total_steps": 38160, "loss": 0.2722, "lr": 0.0006186430172643287, "epoch": 9.627882599580714, "percentage": 48.14, "elapsed_time": "0:46:58", "remaining_time": "0:50:36", "throughput": 4253.46, "total_tokens": 11988512} {"current_steps": 18375, "total_steps": 38160, "loss": 0.6735, "lr": 0.0006184208504671307, "epoch": 9.630503144654089, "percentage": 48.15, "elapsed_time": "0:46:59", "remaining_time": "0:50:35", "throughput": 4253.47, "total_tokens": 11991424} {"current_steps": 18380, "total_steps": 38160, "loss": 0.4499, "lr": 0.000618198658897642, "epoch": 9.633123689727464, "percentage": 48.17, "elapsed_time": "0:46:59", "remaining_time": "0:50:34", "throughput": 4253.46, "total_tokens": 11994208} {"current_steps": 18385, "total_steps": 38160, "loss": 0.3819, "lr": 0.0006179764426023422, "epoch": 9.635744234800839, "percentage": 48.18, "elapsed_time": "0:47:00", "remaining_time": "0:50:33", "throughput": 4253.5, "total_tokens": 11997312} {"current_steps": 18390, "total_steps": 38160, "loss": 0.5764, "lr": 0.0006177542016277167, "epoch": 9.638364779874214, "percentage": 48.19, "elapsed_time": "0:47:01", "remaining_time": "0:50:32", "throughput": 4253.51, "total_tokens": 12000288} {"current_steps": 18395, "total_steps": 38160, "loss": 0.5718, "lr": 0.0006175319360202556, "epoch": 9.64098532494759, "percentage": 48.2, "elapsed_time": "0:47:01", "remaining_time": "0:50:32", "throughput": 4253.53, "total_tokens": 12003328} {"current_steps": 18400, "total_steps": 38160, "loss": 0.4819, "lr": 0.0006173096458264542, "epoch": 9.643605870020965, "percentage": 48.22, "elapsed_time": "0:47:02", "remaining_time": "0:50:31", "throughput": 4253.51, "total_tokens": 12006176} {"current_steps": 18405, "total_steps": 38160, "loss": 0.5552, "lr": 0.0006170873310928133, "epoch": 9.64622641509434, "percentage": 48.23, "elapsed_time": "0:47:03", "remaining_time": "0:50:30", "throughput": 4253.63, "total_tokens": 12009856} {"current_steps": 18410, "total_steps": 38160, "loss": 0.3497, "lr": 0.0006168649918658387, "epoch": 9.648846960167715, "percentage": 48.24, "elapsed_time": "0:47:04", "remaining_time": "0:50:29", "throughput": 4253.74, "total_tokens": 12013376} {"current_steps": 18415, "total_steps": 38160, "loss": 0.6078, "lr": 0.0006166426281920407, "epoch": 9.65146750524109, "percentage": 48.26, "elapsed_time": "0:47:04", "remaining_time": "0:50:28", "throughput": 4253.74, "total_tokens": 12016192} {"current_steps": 18420, "total_steps": 38160, "loss": 0.5751, "lr": 0.000616420240117936, "epoch": 9.654088050314465, "percentage": 48.27, "elapsed_time": "0:47:05", "remaining_time": "0:50:28", "throughput": 4253.84, "total_tokens": 12019680} {"current_steps": 18425, "total_steps": 38160, "loss": 0.4015, "lr": 0.000616197827690045, "epoch": 9.65670859538784, "percentage": 48.28, "elapsed_time": "0:47:06", "remaining_time": "0:50:27", "throughput": 4253.95, "total_tokens": 12023200} {"current_steps": 18430, "total_steps": 38160, "loss": 0.5367, "lr": 0.0006159753909548943, "epoch": 9.659329140461216, "percentage": 48.3, "elapsed_time": "0:47:07", "remaining_time": "0:50:26", "throughput": 4254.08, "total_tokens": 12026880} {"current_steps": 18435, "total_steps": 38160, "loss": 0.418, "lr": 0.0006157529299590148, "epoch": 9.66194968553459, "percentage": 48.31, "elapsed_time": "0:47:07", "remaining_time": "0:50:25", "throughput": 4254.03, "total_tokens": 12029472} {"current_steps": 18440, "total_steps": 38160, "loss": 0.4814, "lr": 0.000615530444748943, "epoch": 9.664570230607966, "percentage": 48.32, "elapsed_time": "0:47:08", "remaining_time": "0:50:24", "throughput": 4253.99, "total_tokens": 12032128} {"current_steps": 18445, "total_steps": 38160, "loss": 0.3827, "lr": 0.0006153079353712201, "epoch": 9.667190775681341, "percentage": 48.34, "elapsed_time": "0:47:09", "remaining_time": "0:50:23", "throughput": 4253.96, "total_tokens": 12034912} {"current_steps": 18450, "total_steps": 38160, "loss": 0.4152, "lr": 0.0006150854018723926, "epoch": 9.669811320754716, "percentage": 48.35, "elapsed_time": "0:47:09", "remaining_time": "0:50:23", "throughput": 4253.98, "total_tokens": 12037888} {"current_steps": 18455, "total_steps": 38160, "loss": 0.3922, "lr": 0.0006148628442990122, "epoch": 9.672431865828091, "percentage": 48.36, "elapsed_time": "0:47:10", "remaining_time": "0:50:22", "throughput": 4253.94, "total_tokens": 12040576} {"current_steps": 18460, "total_steps": 38160, "loss": 0.5451, "lr": 0.0006146402626976351, "epoch": 9.675052410901468, "percentage": 48.38, "elapsed_time": "0:47:11", "remaining_time": "0:50:21", "throughput": 4254.05, "total_tokens": 12044096} {"current_steps": 18465, "total_steps": 38160, "loss": 0.3695, "lr": 0.0006144176571148228, "epoch": 9.677672955974844, "percentage": 48.39, "elapsed_time": "0:47:11", "remaining_time": "0:50:20", "throughput": 4254.12, "total_tokens": 12047424} {"current_steps": 18470, "total_steps": 38160, "loss": 0.3486, "lr": 0.0006141950275971422, "epoch": 9.680293501048219, "percentage": 48.4, "elapsed_time": "0:47:12", "remaining_time": "0:50:19", "throughput": 4254.16, "total_tokens": 12050560} {"current_steps": 18475, "total_steps": 38160, "loss": 0.3983, "lr": 0.0006139723741911644, "epoch": 9.682914046121594, "percentage": 48.41, "elapsed_time": "0:47:13", "remaining_time": "0:50:18", "throughput": 4254.25, "total_tokens": 12053952} {"current_steps": 18480, "total_steps": 38160, "loss": 0.4093, "lr": 0.0006137496969434664, "epoch": 9.685534591194969, "percentage": 48.43, "elapsed_time": "0:47:14", "remaining_time": "0:50:18", "throughput": 4254.18, "total_tokens": 12056416} {"current_steps": 18485, "total_steps": 38160, "loss": 0.4725, "lr": 0.0006135269959006294, "epoch": 9.688155136268344, "percentage": 48.44, "elapsed_time": "0:47:14", "remaining_time": "0:50:17", "throughput": 4254.39, "total_tokens": 12060448} {"current_steps": 18490, "total_steps": 38160, "loss": 0.5203, "lr": 0.00061330427110924, "epoch": 9.69077568134172, "percentage": 48.45, "elapsed_time": "0:47:15", "remaining_time": "0:50:16", "throughput": 4254.65, "total_tokens": 12064960} {"current_steps": 18495, "total_steps": 38160, "loss": 0.3429, "lr": 0.0006130815226158899, "epoch": 9.693396226415095, "percentage": 48.47, "elapsed_time": "0:47:16", "remaining_time": "0:50:15", "throughput": 4254.69, "total_tokens": 12068192} {"current_steps": 18500, "total_steps": 38160, "loss": 0.3714, "lr": 0.0006128587504671753, "epoch": 9.69601677148847, "percentage": 48.48, "elapsed_time": "0:47:17", "remaining_time": "0:50:15", "throughput": 4254.7, "total_tokens": 12071200} {"current_steps": 18505, "total_steps": 38160, "loss": 0.4723, "lr": 0.0006126359547096974, "epoch": 9.698637316561845, "percentage": 48.49, "elapsed_time": "0:47:17", "remaining_time": "0:50:14", "throughput": 4254.7, "total_tokens": 12074112} {"current_steps": 18510, "total_steps": 38160, "loss": 0.5165, "lr": 0.0006124131353900632, "epoch": 9.70125786163522, "percentage": 48.51, "elapsed_time": "0:47:18", "remaining_time": "0:50:13", "throughput": 4254.88, "total_tokens": 12078048} {"current_steps": 18515, "total_steps": 38160, "loss": 0.5558, "lr": 0.0006121902925548833, "epoch": 9.703878406708595, "percentage": 48.52, "elapsed_time": "0:47:19", "remaining_time": "0:50:12", "throughput": 4254.89, "total_tokens": 12080896} {"current_steps": 18520, "total_steps": 38160, "loss": 0.3515, "lr": 0.0006119674262507743, "epoch": 9.70649895178197, "percentage": 48.53, "elapsed_time": "0:47:19", "remaining_time": "0:50:11", "throughput": 4254.89, "total_tokens": 12083744} {"current_steps": 18525, "total_steps": 38160, "loss": 0.4229, "lr": 0.0006117445365243571, "epoch": 9.709119496855346, "percentage": 48.55, "elapsed_time": "0:47:20", "remaining_time": "0:50:10", "throughput": 4254.85, "total_tokens": 12086496} {"current_steps": 18530, "total_steps": 38160, "loss": 0.3784, "lr": 0.0006115216234222575, "epoch": 9.71174004192872, "percentage": 48.56, "elapsed_time": "0:47:21", "remaining_time": "0:50:10", "throughput": 4254.9, "total_tokens": 12089728} {"current_steps": 18535, "total_steps": 38160, "loss": 0.588, "lr": 0.0006112986869911068, "epoch": 9.714360587002096, "percentage": 48.57, "elapsed_time": "0:47:22", "remaining_time": "0:50:09", "throughput": 4254.98, "total_tokens": 12093120} {"current_steps": 18540, "total_steps": 38160, "loss": 0.5321, "lr": 0.0006110757272775405, "epoch": 9.716981132075471, "percentage": 48.58, "elapsed_time": "0:47:22", "remaining_time": "0:50:08", "throughput": 4254.91, "total_tokens": 12095680} {"current_steps": 18545, "total_steps": 38160, "loss": 0.4555, "lr": 0.0006108527443281992, "epoch": 9.719601677148846, "percentage": 48.6, "elapsed_time": "0:47:23", "remaining_time": "0:50:07", "throughput": 4254.98, "total_tokens": 12099040} {"current_steps": 18550, "total_steps": 38160, "loss": 0.3461, "lr": 0.0006106297381897284, "epoch": 9.722222222222221, "percentage": 48.61, "elapsed_time": "0:47:24", "remaining_time": "0:50:06", "throughput": 4255.01, "total_tokens": 12102112} {"current_steps": 18555, "total_steps": 38160, "loss": 0.4207, "lr": 0.0006104067089087787, "epoch": 9.724842767295598, "percentage": 48.62, "elapsed_time": "0:47:24", "remaining_time": "0:50:05", "throughput": 4254.94, "total_tokens": 12104544} {"current_steps": 18560, "total_steps": 38160, "loss": 0.4046, "lr": 0.0006101836565320049, "epoch": 9.727463312368974, "percentage": 48.64, "elapsed_time": "0:47:25", "remaining_time": "0:50:04", "throughput": 4254.98, "total_tokens": 12107712} {"current_steps": 18565, "total_steps": 38160, "loss": 0.3937, "lr": 0.0006099605811060673, "epoch": 9.730083857442349, "percentage": 48.65, "elapsed_time": "0:47:26", "remaining_time": "0:50:04", "throughput": 4254.96, "total_tokens": 12110528} {"current_steps": 18570, "total_steps": 38160, "loss": 0.4136, "lr": 0.0006097374826776307, "epoch": 9.732704402515724, "percentage": 48.66, "elapsed_time": "0:47:26", "remaining_time": "0:50:03", "throughput": 4254.99, "total_tokens": 12113600} {"current_steps": 18575, "total_steps": 38160, "loss": 0.4735, "lr": 0.0006095143612933646, "epoch": 9.735324947589099, "percentage": 48.68, "elapsed_time": "0:47:27", "remaining_time": "0:50:02", "throughput": 4255.07, "total_tokens": 12116896} {"current_steps": 18580, "total_steps": 38160, "loss": 0.3625, "lr": 0.0006092912169999435, "epoch": 9.737945492662474, "percentage": 48.69, "elapsed_time": "0:47:28", "remaining_time": "0:50:01", "throughput": 4255.23, "total_tokens": 12120832} {"current_steps": 18585, "total_steps": 38160, "loss": 0.3092, "lr": 0.0006090680498440465, "epoch": 9.74056603773585, "percentage": 48.7, "elapsed_time": "0:47:29", "remaining_time": "0:50:01", "throughput": 4255.39, "total_tokens": 12124704} {"current_steps": 18590, "total_steps": 38160, "loss": 0.3728, "lr": 0.0006088448598723581, "epoch": 9.743186582809225, "percentage": 48.72, "elapsed_time": "0:47:30", "remaining_time": "0:50:00", "throughput": 4255.73, "total_tokens": 12129760} {"current_steps": 18595, "total_steps": 38160, "loss": 0.4338, "lr": 0.0006086216471315666, "epoch": 9.7458071278826, "percentage": 48.73, "elapsed_time": "0:47:30", "remaining_time": "0:49:59", "throughput": 4255.64, "total_tokens": 12132096} {"current_steps": 18600, "total_steps": 38160, "loss": 0.5666, "lr": 0.0006083984116683659, "epoch": 9.748427672955975, "percentage": 48.74, "elapsed_time": "0:47:31", "remaining_time": "0:49:58", "throughput": 4255.63, "total_tokens": 12135008} {"current_steps": 18605, "total_steps": 38160, "loss": 0.4746, "lr": 0.0006081751535294539, "epoch": 9.75104821802935, "percentage": 48.76, "elapsed_time": "0:47:32", "remaining_time": "0:49:57", "throughput": 4255.66, "total_tokens": 12138144} {"current_steps": 18610, "total_steps": 38160, "loss": 0.5664, "lr": 0.0006079518727615341, "epoch": 9.753668763102725, "percentage": 48.77, "elapsed_time": "0:47:32", "remaining_time": "0:49:57", "throughput": 4255.73, "total_tokens": 12141568} {"current_steps": 18615, "total_steps": 38160, "loss": 0.5533, "lr": 0.0006077285694113141, "epoch": 9.7562893081761, "percentage": 48.78, "elapsed_time": "0:47:33", "remaining_time": "0:49:56", "throughput": 4255.86, "total_tokens": 12145248} {"current_steps": 18620, "total_steps": 38160, "loss": 0.4043, "lr": 0.0006075052435255062, "epoch": 9.758909853249476, "percentage": 48.79, "elapsed_time": "0:47:34", "remaining_time": "0:49:55", "throughput": 4256.07, "total_tokens": 12149472} {"current_steps": 18625, "total_steps": 38160, "loss": 0.5295, "lr": 0.000607281895150828, "epoch": 9.76153039832285, "percentage": 48.81, "elapsed_time": "0:47:35", "remaining_time": "0:49:54", "throughput": 4256.17, "total_tokens": 12152992} {"current_steps": 18630, "total_steps": 38160, "loss": 0.4199, "lr": 0.0006070585243340013, "epoch": 9.764150943396226, "percentage": 48.82, "elapsed_time": "0:47:36", "remaining_time": "0:49:54", "throughput": 4256.14, "total_tokens": 12155712} {"current_steps": 18635, "total_steps": 38160, "loss": 0.509, "lr": 0.0006068351311217526, "epoch": 9.766771488469601, "percentage": 48.83, "elapsed_time": "0:47:36", "remaining_time": "0:49:53", "throughput": 4256.14, "total_tokens": 12158688} {"current_steps": 18640, "total_steps": 38160, "loss": 0.7768, "lr": 0.0006066117155608135, "epoch": 9.769392033542976, "percentage": 48.85, "elapsed_time": "0:47:37", "remaining_time": "0:49:52", "throughput": 4256.19, "total_tokens": 12161824} {"current_steps": 18645, "total_steps": 38160, "loss": 0.3761, "lr": 0.0006063882776979196, "epoch": 9.772012578616351, "percentage": 48.86, "elapsed_time": "0:47:38", "remaining_time": "0:49:51", "throughput": 4256.23, "total_tokens": 12164992} {"current_steps": 18650, "total_steps": 38160, "loss": 0.4157, "lr": 0.0006061648175798117, "epoch": 9.774633123689728, "percentage": 48.87, "elapsed_time": "0:47:38", "remaining_time": "0:49:50", "throughput": 4256.22, "total_tokens": 12167808} {"current_steps": 18655, "total_steps": 38160, "loss": 0.2947, "lr": 0.0006059413352532355, "epoch": 9.777253668763104, "percentage": 48.89, "elapsed_time": "0:47:39", "remaining_time": "0:49:49", "throughput": 4256.23, "total_tokens": 12170752} {"current_steps": 18660, "total_steps": 38160, "loss": 0.3659, "lr": 0.0006057178307649402, "epoch": 9.779874213836479, "percentage": 48.9, "elapsed_time": "0:47:40", "remaining_time": "0:49:48", "throughput": 4256.23, "total_tokens": 12173664} {"current_steps": 18665, "total_steps": 38160, "loss": 0.4209, "lr": 0.000605494304161681, "epoch": 9.782494758909854, "percentage": 48.91, "elapsed_time": "0:47:40", "remaining_time": "0:49:48", "throughput": 4256.3, "total_tokens": 12176960} {"current_steps": 18670, "total_steps": 38160, "loss": 0.6249, "lr": 0.0006052707554902169, "epoch": 9.785115303983229, "percentage": 48.93, "elapsed_time": "0:47:41", "remaining_time": "0:49:47", "throughput": 4256.32, "total_tokens": 12180096} {"current_steps": 18675, "total_steps": 38160, "loss": 0.3821, "lr": 0.0006050471847973117, "epoch": 9.787735849056604, "percentage": 48.94, "elapsed_time": "0:47:42", "remaining_time": "0:49:46", "throughput": 4256.38, "total_tokens": 12183424} {"current_steps": 18680, "total_steps": 38160, "loss": 0.3832, "lr": 0.000604823592129734, "epoch": 9.79035639412998, "percentage": 48.95, "elapsed_time": "0:47:43", "remaining_time": "0:49:45", "throughput": 4256.42, "total_tokens": 12186592} {"current_steps": 18685, "total_steps": 38160, "loss": 0.5218, "lr": 0.0006045999775342566, "epoch": 9.792976939203355, "percentage": 48.96, "elapsed_time": "0:47:43", "remaining_time": "0:49:44", "throughput": 4256.54, "total_tokens": 12190240} {"current_steps": 18690, "total_steps": 38160, "loss": 0.4451, "lr": 0.0006043763410576572, "epoch": 9.79559748427673, "percentage": 48.98, "elapsed_time": "0:47:44", "remaining_time": "0:49:44", "throughput": 4256.52, "total_tokens": 12193024} {"current_steps": 18695, "total_steps": 38160, "loss": 0.4681, "lr": 0.0006041526827467182, "epoch": 9.798218029350105, "percentage": 48.99, "elapsed_time": "0:47:45", "remaining_time": "0:49:43", "throughput": 4256.55, "total_tokens": 12196128} {"current_steps": 18700, "total_steps": 38160, "loss": 0.4223, "lr": 0.000603929002648226, "epoch": 9.80083857442348, "percentage": 49.0, "elapsed_time": "0:47:45", "remaining_time": "0:49:42", "throughput": 4256.53, "total_tokens": 12198880} {"current_steps": 18705, "total_steps": 38160, "loss": 0.4131, "lr": 0.0006037053008089723, "epoch": 9.803459119496855, "percentage": 49.02, "elapsed_time": "0:47:46", "remaining_time": "0:49:41", "throughput": 4256.52, "total_tokens": 12201760} {"current_steps": 18710, "total_steps": 38160, "loss": 0.6875, "lr": 0.0006034815772757528, "epoch": 9.80607966457023, "percentage": 49.03, "elapsed_time": "0:47:47", "remaining_time": "0:49:40", "throughput": 4256.76, "total_tokens": 12206272} {"current_steps": 18715, "total_steps": 38160, "loss": 0.4297, "lr": 0.0006032578320953678, "epoch": 9.808700209643606, "percentage": 49.04, "elapsed_time": "0:47:48", "remaining_time": "0:49:40", "throughput": 4256.8, "total_tokens": 12209472} {"current_steps": 18720, "total_steps": 38160, "loss": 0.4917, "lr": 0.0006030340653146224, "epoch": 9.81132075471698, "percentage": 49.06, "elapsed_time": "0:47:48", "remaining_time": "0:49:39", "throughput": 4256.77, "total_tokens": 12212256} {"current_steps": 18725, "total_steps": 38160, "loss": 0.5005, "lr": 0.0006028102769803261, "epoch": 9.813941299790356, "percentage": 49.07, "elapsed_time": "0:47:49", "remaining_time": "0:49:38", "throughput": 4256.82, "total_tokens": 12215456} {"current_steps": 18730, "total_steps": 38160, "loss": 0.4398, "lr": 0.0006025864671392925, "epoch": 9.816561844863731, "percentage": 49.08, "elapsed_time": "0:47:50", "remaining_time": "0:49:37", "throughput": 4257.08, "total_tokens": 12219936} {"current_steps": 18735, "total_steps": 38160, "loss": 0.4216, "lr": 0.0006023626358383406, "epoch": 9.819182389937106, "percentage": 49.1, "elapsed_time": "0:47:51", "remaining_time": "0:49:36", "throughput": 4257.12, "total_tokens": 12223200} {"current_steps": 18740, "total_steps": 38160, "loss": 0.4316, "lr": 0.0006021387831242932, "epoch": 9.821802935010481, "percentage": 49.11, "elapsed_time": "0:47:51", "remaining_time": "0:49:36", "throughput": 4257.17, "total_tokens": 12226432} {"current_steps": 18745, "total_steps": 38160, "loss": 0.4066, "lr": 0.0006019149090439774, "epoch": 9.824423480083858, "percentage": 49.12, "elapsed_time": "0:47:52", "remaining_time": "0:49:35", "throughput": 4257.13, "total_tokens": 12229120} {"current_steps": 18750, "total_steps": 38160, "loss": 0.3649, "lr": 0.0006016910136442254, "epoch": 9.827044025157234, "percentage": 49.14, "elapsed_time": "0:47:53", "remaining_time": "0:49:34", "throughput": 4257.33, "total_tokens": 12233248} {"current_steps": 18755, "total_steps": 38160, "loss": 0.5277, "lr": 0.0006014670969718735, "epoch": 9.829664570230609, "percentage": 49.15, "elapsed_time": "0:47:54", "remaining_time": "0:49:33", "throughput": 4257.57, "total_tokens": 12237696} {"current_steps": 18760, "total_steps": 38160, "loss": 0.3133, "lr": 0.0006012431590737625, "epoch": 9.832285115303984, "percentage": 49.16, "elapsed_time": "0:47:55", "remaining_time": "0:49:33", "throughput": 4257.72, "total_tokens": 12241504} {"current_steps": 18765, "total_steps": 38160, "loss": 0.4546, "lr": 0.0006010191999967378, "epoch": 9.834905660377359, "percentage": 49.17, "elapsed_time": "0:47:55", "remaining_time": "0:49:32", "throughput": 4257.8, "total_tokens": 12244832} {"current_steps": 18770, "total_steps": 38160, "loss": 0.425, "lr": 0.0006007952197876487, "epoch": 9.837526205450734, "percentage": 49.19, "elapsed_time": "0:47:56", "remaining_time": "0:49:31", "throughput": 4257.81, "total_tokens": 12247776} {"current_steps": 18775, "total_steps": 38160, "loss": 0.4224, "lr": 0.0006005712184933498, "epoch": 9.84014675052411, "percentage": 49.2, "elapsed_time": "0:47:57", "remaining_time": "0:49:30", "throughput": 4257.78, "total_tokens": 12250560} {"current_steps": 18780, "total_steps": 38160, "loss": 0.5179, "lr": 0.0006003471961606992, "epoch": 9.842767295597485, "percentage": 49.21, "elapsed_time": "0:47:57", "remaining_time": "0:49:29", "throughput": 4257.79, "total_tokens": 12253504} {"current_steps": 18785, "total_steps": 38160, "loss": 0.4299, "lr": 0.0006001231528365601, "epoch": 9.84538784067086, "percentage": 49.23, "elapsed_time": "0:47:58", "remaining_time": "0:49:28", "throughput": 4257.76, "total_tokens": 12256128} {"current_steps": 18790, "total_steps": 38160, "loss": 0.5638, "lr": 0.0005998990885677996, "epoch": 9.848008385744235, "percentage": 49.24, "elapsed_time": "0:47:59", "remaining_time": "0:49:28", "throughput": 4257.89, "total_tokens": 12260032} {"current_steps": 18795, "total_steps": 38160, "loss": 0.3921, "lr": 0.0005996750034012895, "epoch": 9.85062893081761, "percentage": 49.25, "elapsed_time": "0:48:00", "remaining_time": "0:49:27", "throughput": 4257.92, "total_tokens": 12263136} {"current_steps": 18800, "total_steps": 38160, "loss": 0.4975, "lr": 0.0005994508973839058, "epoch": 9.853249475890985, "percentage": 49.27, "elapsed_time": "0:48:00", "remaining_time": "0:49:26", "throughput": 4258.0, "total_tokens": 12266496} {"current_steps": 18805, "total_steps": 38160, "loss": 0.3803, "lr": 0.0005992267705625289, "epoch": 9.85587002096436, "percentage": 49.28, "elapsed_time": "0:48:01", "remaining_time": "0:49:25", "throughput": 4257.91, "total_tokens": 12268768} {"current_steps": 18810, "total_steps": 38160, "loss": 0.4624, "lr": 0.0005990026229840439, "epoch": 9.858490566037736, "percentage": 49.29, "elapsed_time": "0:48:02", "remaining_time": "0:49:24", "throughput": 4257.99, "total_tokens": 12272160} {"current_steps": 18815, "total_steps": 38160, "loss": 0.5475, "lr": 0.0005987784546953394, "epoch": 9.86111111111111, "percentage": 49.31, "elapsed_time": "0:48:02", "remaining_time": "0:49:24", "throughput": 4258.11, "total_tokens": 12275776} {"current_steps": 18820, "total_steps": 38160, "loss": 0.4295, "lr": 0.0005985542657433091, "epoch": 9.863731656184486, "percentage": 49.32, "elapsed_time": "0:48:03", "remaining_time": "0:49:23", "throughput": 4258.13, "total_tokens": 12278880} {"current_steps": 18825, "total_steps": 38160, "loss": 0.4333, "lr": 0.000598330056174851, "epoch": 9.866352201257861, "percentage": 49.33, "elapsed_time": "0:48:04", "remaining_time": "0:49:22", "throughput": 4258.09, "total_tokens": 12281536} {"current_steps": 18830, "total_steps": 38160, "loss": 0.5535, "lr": 0.0005981058260368668, "epoch": 9.868972746331236, "percentage": 49.34, "elapsed_time": "0:48:04", "remaining_time": "0:49:21", "throughput": 4258.07, "total_tokens": 12284416} {"current_steps": 18835, "total_steps": 38160, "loss": 0.4251, "lr": 0.0005978815753762632, "epoch": 9.871593291404611, "percentage": 49.36, "elapsed_time": "0:48:05", "remaining_time": "0:49:20", "throughput": 4258.21, "total_tokens": 12288224} {"current_steps": 18840, "total_steps": 38160, "loss": 0.38, "lr": 0.0005976573042399505, "epoch": 9.874213836477988, "percentage": 49.37, "elapsed_time": "0:48:06", "remaining_time": "0:49:20", "throughput": 4258.28, "total_tokens": 12291520} {"current_steps": 18845, "total_steps": 38160, "loss": 0.5355, "lr": 0.000597433012674844, "epoch": 9.876834381551364, "percentage": 49.38, "elapsed_time": "0:48:07", "remaining_time": "0:49:19", "throughput": 4258.41, "total_tokens": 12295264} {"current_steps": 18850, "total_steps": 38160, "loss": 0.4725, "lr": 0.0005972087007278628, "epoch": 9.879454926624739, "percentage": 49.4, "elapsed_time": "0:48:07", "remaining_time": "0:49:18", "throughput": 4258.39, "total_tokens": 12297984} {"current_steps": 18855, "total_steps": 38160, "loss": 0.4364, "lr": 0.0005969843684459305, "epoch": 9.882075471698114, "percentage": 49.41, "elapsed_time": "0:48:08", "remaining_time": "0:49:17", "throughput": 4258.43, "total_tokens": 12301184} {"current_steps": 18860, "total_steps": 38160, "loss": 0.4844, "lr": 0.0005967600158759746, "epoch": 9.884696016771489, "percentage": 49.42, "elapsed_time": "0:48:09", "remaining_time": "0:49:16", "throughput": 4258.41, "total_tokens": 12303968} {"current_steps": 18865, "total_steps": 38160, "loss": 0.3864, "lr": 0.0005965356430649276, "epoch": 9.887316561844864, "percentage": 49.44, "elapsed_time": "0:48:10", "remaining_time": "0:49:16", "throughput": 4258.63, "total_tokens": 12308256} {"current_steps": 18870, "total_steps": 38160, "loss": 0.5426, "lr": 0.0005963112500597251, "epoch": 9.88993710691824, "percentage": 49.45, "elapsed_time": "0:48:10", "remaining_time": "0:49:15", "throughput": 4258.59, "total_tokens": 12310816} {"current_steps": 18875, "total_steps": 38160, "loss": 0.4646, "lr": 0.0005960868369073079, "epoch": 9.892557651991615, "percentage": 49.46, "elapsed_time": "0:48:11", "remaining_time": "0:49:14", "throughput": 4258.74, "total_tokens": 12314752} {"current_steps": 18880, "total_steps": 38160, "loss": 0.4344, "lr": 0.0005958624036546208, "epoch": 9.89517819706499, "percentage": 49.48, "elapsed_time": "0:48:12", "remaining_time": "0:49:13", "throughput": 4258.84, "total_tokens": 12318272} {"current_steps": 18885, "total_steps": 38160, "loss": 0.5129, "lr": 0.0005956379503486123, "epoch": 9.897798742138365, "percentage": 49.49, "elapsed_time": "0:48:13", "remaining_time": "0:49:12", "throughput": 4259.03, "total_tokens": 12322336} {"current_steps": 18890, "total_steps": 38160, "loss": 0.4271, "lr": 0.0005954134770362359, "epoch": 9.90041928721174, "percentage": 49.5, "elapsed_time": "0:48:13", "remaining_time": "0:49:12", "throughput": 4259.13, "total_tokens": 12325760} {"current_steps": 18895, "total_steps": 38160, "loss": 0.5712, "lr": 0.0005951889837644486, "epoch": 9.903039832285115, "percentage": 49.52, "elapsed_time": "0:48:14", "remaining_time": "0:49:11", "throughput": 4259.39, "total_tokens": 12330304} {"current_steps": 18900, "total_steps": 38160, "loss": 0.4956, "lr": 0.0005949644705802116, "epoch": 9.90566037735849, "percentage": 49.53, "elapsed_time": "0:48:15", "remaining_time": "0:49:10", "throughput": 4259.35, "total_tokens": 12332960} {"current_steps": 18905, "total_steps": 38160, "loss": 0.5079, "lr": 0.0005947399375304909, "epoch": 9.908280922431866, "percentage": 49.54, "elapsed_time": "0:48:16", "remaining_time": "0:49:10", "throughput": 4259.6, "total_tokens": 12337536} {"current_steps": 18910, "total_steps": 38160, "loss": 0.4888, "lr": 0.0005945153846622563, "epoch": 9.91090146750524, "percentage": 49.55, "elapsed_time": "0:48:17", "remaining_time": "0:49:09", "throughput": 4259.73, "total_tokens": 12341120} {"current_steps": 18915, "total_steps": 38160, "loss": 0.4361, "lr": 0.0005942908120224815, "epoch": 9.913522012578616, "percentage": 49.57, "elapsed_time": "0:48:17", "remaining_time": "0:49:08", "throughput": 4259.71, "total_tokens": 12343904} {"current_steps": 18920, "total_steps": 38160, "loss": 0.5573, "lr": 0.0005940662196581443, "epoch": 9.916142557651991, "percentage": 49.58, "elapsed_time": "0:48:18", "remaining_time": "0:49:07", "throughput": 4259.74, "total_tokens": 12346912} {"current_steps": 18925, "total_steps": 38160, "loss": 0.3607, "lr": 0.0005938416076162273, "epoch": 9.918763102725366, "percentage": 49.59, "elapsed_time": "0:48:19", "remaining_time": "0:49:06", "throughput": 4259.81, "total_tokens": 12350272} {"current_steps": 18930, "total_steps": 38160, "loss": 0.536, "lr": 0.0005936169759437165, "epoch": 9.921383647798741, "percentage": 49.61, "elapsed_time": "0:48:19", "remaining_time": "0:49:05", "throughput": 4259.73, "total_tokens": 12352800} {"current_steps": 18935, "total_steps": 38160, "loss": 0.3854, "lr": 0.0005933923246876024, "epoch": 9.924004192872118, "percentage": 49.62, "elapsed_time": "0:48:20", "remaining_time": "0:49:04", "throughput": 4259.73, "total_tokens": 12355616} {"current_steps": 18940, "total_steps": 38160, "loss": 0.4273, "lr": 0.0005931676538948795, "epoch": 9.926624737945493, "percentage": 49.63, "elapsed_time": "0:48:21", "remaining_time": "0:49:04", "throughput": 4259.77, "total_tokens": 12358784} {"current_steps": 18945, "total_steps": 38160, "loss": 0.5075, "lr": 0.0005929429636125463, "epoch": 9.929245283018869, "percentage": 49.65, "elapsed_time": "0:48:21", "remaining_time": "0:49:03", "throughput": 4259.8, "total_tokens": 12361920} {"current_steps": 18950, "total_steps": 38160, "loss": 0.4482, "lr": 0.0005927182538876055, "epoch": 9.931865828092244, "percentage": 49.66, "elapsed_time": "0:48:22", "remaining_time": "0:49:02", "throughput": 4259.93, "total_tokens": 12365600} {"current_steps": 18955, "total_steps": 38160, "loss": 0.487, "lr": 0.0005924935247670637, "epoch": 9.934486373165619, "percentage": 49.67, "elapsed_time": "0:48:23", "remaining_time": "0:49:01", "throughput": 4259.85, "total_tokens": 12368000} {"current_steps": 18960, "total_steps": 38160, "loss": 0.4604, "lr": 0.0005922687762979317, "epoch": 9.937106918238994, "percentage": 49.69, "elapsed_time": "0:48:24", "remaining_time": "0:49:00", "throughput": 4259.81, "total_tokens": 12370592} {"current_steps": 18965, "total_steps": 38160, "loss": 0.4969, "lr": 0.0005920440085272245, "epoch": 9.93972746331237, "percentage": 49.7, "elapsed_time": "0:48:24", "remaining_time": "0:48:59", "throughput": 4259.86, "total_tokens": 12373760} {"current_steps": 18970, "total_steps": 38160, "loss": 0.4631, "lr": 0.0005918192215019608, "epoch": 9.942348008385745, "percentage": 49.71, "elapsed_time": "0:48:25", "remaining_time": "0:48:59", "throughput": 4260.02, "total_tokens": 12377600} {"current_steps": 18975, "total_steps": 38160, "loss": 0.387, "lr": 0.0005915944152691633, "epoch": 9.94496855345912, "percentage": 49.72, "elapsed_time": "0:48:26", "remaining_time": "0:48:58", "throughput": 4260.11, "total_tokens": 12381152} {"current_steps": 18980, "total_steps": 38160, "loss": 0.4809, "lr": 0.0005913695898758593, "epoch": 9.947589098532495, "percentage": 49.74, "elapsed_time": "0:48:26", "remaining_time": "0:48:57", "throughput": 4260.12, "total_tokens": 12384096} {"current_steps": 18985, "total_steps": 38160, "loss": 0.4295, "lr": 0.0005911447453690793, "epoch": 9.95020964360587, "percentage": 49.75, "elapsed_time": "0:48:27", "remaining_time": "0:48:56", "throughput": 4260.09, "total_tokens": 12386848} {"current_steps": 18990, "total_steps": 38160, "loss": 0.4192, "lr": 0.0005909198817958585, "epoch": 9.952830188679245, "percentage": 49.76, "elapsed_time": "0:48:28", "remaining_time": "0:48:55", "throughput": 4260.02, "total_tokens": 12389344} {"current_steps": 18995, "total_steps": 38160, "loss": 0.4808, "lr": 0.0005906949992032359, "epoch": 9.95545073375262, "percentage": 49.78, "elapsed_time": "0:48:29", "remaining_time": "0:48:55", "throughput": 4260.08, "total_tokens": 12392640} {"current_steps": 19000, "total_steps": 38160, "loss": 0.4897, "lr": 0.0005904700976382539, "epoch": 9.958071278825996, "percentage": 49.79, "elapsed_time": "0:48:29", "remaining_time": "0:48:54", "throughput": 4260.33, "total_tokens": 12397248} {"current_steps": 19005, "total_steps": 38160, "loss": 0.4997, "lr": 0.0005902451771479596, "epoch": 9.96069182389937, "percentage": 49.8, "elapsed_time": "0:48:30", "remaining_time": "0:48:53", "throughput": 4260.35, "total_tokens": 12400352} {"current_steps": 19010, "total_steps": 38160, "loss": 0.3841, "lr": 0.000590020237779404, "epoch": 9.963312368972746, "percentage": 49.82, "elapsed_time": "0:48:31", "remaining_time": "0:48:52", "throughput": 4260.3, "total_tokens": 12402944} {"current_steps": 19015, "total_steps": 38160, "loss": 0.4477, "lr": 0.0005897952795796415, "epoch": 9.965932914046121, "percentage": 49.83, "elapsed_time": "0:48:31", "remaining_time": "0:48:51", "throughput": 4260.31, "total_tokens": 12405952} {"current_steps": 19020, "total_steps": 38160, "loss": 0.6097, "lr": 0.0005895703025957311, "epoch": 9.968553459119496, "percentage": 49.84, "elapsed_time": "0:48:32", "remaining_time": "0:48:51", "throughput": 4260.39, "total_tokens": 12409376} {"current_steps": 19025, "total_steps": 38160, "loss": 0.4862, "lr": 0.0005893453068747352, "epoch": 9.971174004192871, "percentage": 49.86, "elapsed_time": "0:48:33", "remaining_time": "0:48:50", "throughput": 4260.54, "total_tokens": 12413216} {"current_steps": 19030, "total_steps": 38160, "loss": 0.3868, "lr": 0.0005891202924637202, "epoch": 9.973794549266248, "percentage": 49.87, "elapsed_time": "0:48:34", "remaining_time": "0:48:49", "throughput": 4260.61, "total_tokens": 12416512} {"current_steps": 19035, "total_steps": 38160, "loss": 0.4529, "lr": 0.0005888952594097572, "epoch": 9.976415094339622, "percentage": 49.88, "elapsed_time": "0:48:35", "remaining_time": "0:48:48", "throughput": 4260.73, "total_tokens": 12420192} {"current_steps": 19040, "total_steps": 38160, "loss": 0.5173, "lr": 0.0005886702077599197, "epoch": 9.979035639412999, "percentage": 49.9, "elapsed_time": "0:48:35", "remaining_time": "0:48:47", "throughput": 4260.62, "total_tokens": 12422464} {"current_steps": 19045, "total_steps": 38160, "loss": 0.5932, "lr": 0.0005884451375612865, "epoch": 9.981656184486374, "percentage": 49.91, "elapsed_time": "0:48:36", "remaining_time": "0:48:47", "throughput": 4260.6, "total_tokens": 12425248} {"current_steps": 19050, "total_steps": 38160, "loss": 0.4408, "lr": 0.0005882200488609396, "epoch": 9.984276729559749, "percentage": 49.92, "elapsed_time": "0:48:37", "remaining_time": "0:48:46", "throughput": 4260.7, "total_tokens": 12428704} {"current_steps": 19055, "total_steps": 38160, "loss": 0.5296, "lr": 0.0005879949417059649, "epoch": 9.986897274633124, "percentage": 49.93, "elapsed_time": "0:48:37", "remaining_time": "0:48:45", "throughput": 4260.84, "total_tokens": 12432480} {"current_steps": 19060, "total_steps": 38160, "loss": 0.3891, "lr": 0.0005877698161434522, "epoch": 9.9895178197065, "percentage": 49.95, "elapsed_time": "0:48:38", "remaining_time": "0:48:44", "throughput": 4260.76, "total_tokens": 12434912} {"current_steps": 19065, "total_steps": 38160, "loss": 0.405, "lr": 0.0005875446722204955, "epoch": 9.992138364779874, "percentage": 49.96, "elapsed_time": "0:48:39", "remaining_time": "0:48:43", "throughput": 4260.79, "total_tokens": 12438016} {"current_steps": 19070, "total_steps": 38160, "loss": 0.5152, "lr": 0.0005873195099841919, "epoch": 9.99475890985325, "percentage": 49.97, "elapsed_time": "0:48:39", "remaining_time": "0:48:42", "throughput": 4260.75, "total_tokens": 12440672} {"current_steps": 19075, "total_steps": 38160, "loss": 0.4651, "lr": 0.0005870943294816431, "epoch": 9.997379454926625, "percentage": 49.99, "elapsed_time": "0:48:40", "remaining_time": "0:48:42", "throughput": 4260.79, "total_tokens": 12443840} {"current_steps": 19080, "total_steps": 38160, "loss": 0.4859, "lr": 0.0005868691307599543, "epoch": 10.0, "percentage": 50.0, "elapsed_time": "0:48:41", "remaining_time": "0:48:41", "throughput": 4260.55, "total_tokens": 12446408} {"current_steps": 19080, "total_steps": 38160, "eval_loss": 0.4540214240550995, "epoch": 10.0, "percentage": 50.0, "elapsed_time": "0:48:54", "remaining_time": "0:48:54", "throughput": 4240.84, "total_tokens": 12446408} {"current_steps": 19085, "total_steps": 38160, "loss": 0.4087, "lr": 0.0005866439138662343, "epoch": 10.002620545073375, "percentage": 50.01, "elapsed_time": "0:48:57", "remaining_time": "0:48:55", "throughput": 4238.53, "total_tokens": 12450472} {"current_steps": 19090, "total_steps": 38160, "loss": 0.3767, "lr": 0.000586418678847596, "epoch": 10.00524109014675, "percentage": 50.03, "elapsed_time": "0:48:58", "remaining_time": "0:48:55", "throughput": 4238.65, "total_tokens": 12454056} {"current_steps": 19095, "total_steps": 38160, "loss": 0.4916, "lr": 0.000586193425751156, "epoch": 10.007861635220126, "percentage": 50.04, "elapsed_time": "0:48:58", "remaining_time": "0:48:54", "throughput": 4238.75, "total_tokens": 12457576} {"current_steps": 19100, "total_steps": 38160, "loss": 0.4718, "lr": 0.0005859681546240348, "epoch": 10.0104821802935, "percentage": 50.05, "elapsed_time": "0:48:59", "remaining_time": "0:48:53", "throughput": 4238.94, "total_tokens": 12461608} {"current_steps": 19105, "total_steps": 38160, "loss": 0.3696, "lr": 0.0005857428655133562, "epoch": 10.013102725366876, "percentage": 50.07, "elapsed_time": "0:49:00", "remaining_time": "0:48:52", "throughput": 4238.99, "total_tokens": 12464968} {"current_steps": 19110, "total_steps": 38160, "loss": 0.5033, "lr": 0.0005855175584662485, "epoch": 10.015723270440251, "percentage": 50.08, "elapsed_time": "0:49:01", "remaining_time": "0:48:52", "throughput": 4239.14, "total_tokens": 12468648} {"current_steps": 19115, "total_steps": 38160, "loss": 0.4887, "lr": 0.0005852922335298433, "epoch": 10.018343815513626, "percentage": 50.09, "elapsed_time": "0:49:02", "remaining_time": "0:48:51", "throughput": 4239.17, "total_tokens": 12471784} {"current_steps": 19120, "total_steps": 38160, "loss": 0.5805, "lr": 0.0005850668907512757, "epoch": 10.020964360587001, "percentage": 50.1, "elapsed_time": "0:49:02", "remaining_time": "0:48:50", "throughput": 4239.17, "total_tokens": 12474632} {"current_steps": 19125, "total_steps": 38160, "loss": 0.5325, "lr": 0.0005848415301776852, "epoch": 10.023584905660377, "percentage": 50.12, "elapsed_time": "0:49:03", "remaining_time": "0:48:49", "throughput": 4239.23, "total_tokens": 12477832} {"current_steps": 19130, "total_steps": 38160, "loss": 0.4696, "lr": 0.0005846161518562144, "epoch": 10.026205450733753, "percentage": 50.13, "elapsed_time": "0:49:04", "remaining_time": "0:48:48", "throughput": 4239.49, "total_tokens": 12482312} {"current_steps": 19135, "total_steps": 38160, "loss": 0.4191, "lr": 0.00058439075583401, "epoch": 10.028825995807129, "percentage": 50.14, "elapsed_time": "0:49:05", "remaining_time": "0:48:48", "throughput": 4239.59, "total_tokens": 12485768} {"current_steps": 19140, "total_steps": 38160, "loss": 0.3554, "lr": 0.0005841653421582223, "epoch": 10.031446540880504, "percentage": 50.16, "elapsed_time": "0:49:05", "remaining_time": "0:48:47", "throughput": 4239.61, "total_tokens": 12488776} {"current_steps": 19145, "total_steps": 38160, "loss": 0.4598, "lr": 0.0005839399108760052, "epoch": 10.034067085953879, "percentage": 50.17, "elapsed_time": "0:49:06", "remaining_time": "0:48:46", "throughput": 4239.58, "total_tokens": 12491464} {"current_steps": 19150, "total_steps": 38160, "loss": 0.4704, "lr": 0.0005837144620345165, "epoch": 10.036687631027254, "percentage": 50.18, "elapsed_time": "0:49:07", "remaining_time": "0:48:45", "throughput": 4239.63, "total_tokens": 12494600} {"current_steps": 19155, "total_steps": 38160, "loss": 0.6288, "lr": 0.0005834889956809173, "epoch": 10.03930817610063, "percentage": 50.2, "elapsed_time": "0:49:07", "remaining_time": "0:48:44", "throughput": 4239.81, "total_tokens": 12498696} {"current_steps": 19160, "total_steps": 38160, "loss": 0.4602, "lr": 0.0005832635118623726, "epoch": 10.041928721174004, "percentage": 50.21, "elapsed_time": "0:49:08", "remaining_time": "0:48:44", "throughput": 4239.89, "total_tokens": 12501960} {"current_steps": 19165, "total_steps": 38160, "loss": 0.599, "lr": 0.0005830380106260513, "epoch": 10.04454926624738, "percentage": 50.22, "elapsed_time": "0:49:09", "remaining_time": "0:48:43", "throughput": 4239.96, "total_tokens": 12505224} {"current_steps": 19170, "total_steps": 38160, "loss": 0.4869, "lr": 0.0005828124920191255, "epoch": 10.047169811320755, "percentage": 50.24, "elapsed_time": "0:49:10", "remaining_time": "0:48:42", "throughput": 4240.06, "total_tokens": 12508744} {"current_steps": 19175, "total_steps": 38160, "loss": 0.5589, "lr": 0.000582586956088771, "epoch": 10.04979035639413, "percentage": 50.25, "elapsed_time": "0:49:10", "remaining_time": "0:48:41", "throughput": 4240.03, "total_tokens": 12511464} {"current_steps": 19180, "total_steps": 38160, "loss": 0.4835, "lr": 0.0005823614028821677, "epoch": 10.052410901467505, "percentage": 50.26, "elapsed_time": "0:49:11", "remaining_time": "0:48:40", "throughput": 4239.93, "total_tokens": 12513736} {"current_steps": 19185, "total_steps": 38160, "loss": 0.4955, "lr": 0.0005821358324464985, "epoch": 10.05503144654088, "percentage": 50.28, "elapsed_time": "0:49:12", "remaining_time": "0:48:39", "throughput": 4239.92, "total_tokens": 12516584} {"current_steps": 19190, "total_steps": 38160, "loss": 0.368, "lr": 0.0005819102448289501, "epoch": 10.057651991614255, "percentage": 50.29, "elapsed_time": "0:49:12", "remaining_time": "0:48:39", "throughput": 4240.11, "total_tokens": 12520680} {"current_steps": 19195, "total_steps": 38160, "loss": 0.4923, "lr": 0.000581684640076713, "epoch": 10.06027253668763, "percentage": 50.3, "elapsed_time": "0:49:13", "remaining_time": "0:48:38", "throughput": 4240.14, "total_tokens": 12523624} {"current_steps": 19200, "total_steps": 38160, "loss": 0.416, "lr": 0.0005814590182369811, "epoch": 10.062893081761006, "percentage": 50.31, "elapsed_time": "0:49:14", "remaining_time": "0:48:37", "throughput": 4240.14, "total_tokens": 12526472} {"current_steps": 19205, "total_steps": 38160, "loss": 0.5109, "lr": 0.000581233379356952, "epoch": 10.065513626834381, "percentage": 50.33, "elapsed_time": "0:49:14", "remaining_time": "0:48:36", "throughput": 4240.21, "total_tokens": 12529768} {"current_steps": 19210, "total_steps": 38160, "loss": 0.4464, "lr": 0.0005810077234838267, "epoch": 10.068134171907756, "percentage": 50.34, "elapsed_time": "0:49:15", "remaining_time": "0:48:35", "throughput": 4240.21, "total_tokens": 12532680} {"current_steps": 19215, "total_steps": 38160, "loss": 0.4204, "lr": 0.0005807820506648097, "epoch": 10.070754716981131, "percentage": 50.35, "elapsed_time": "0:49:16", "remaining_time": "0:48:34", "throughput": 4240.27, "total_tokens": 12535944} {"current_steps": 19220, "total_steps": 38160, "loss": 0.5609, "lr": 0.0005805563609471095, "epoch": 10.073375262054507, "percentage": 50.37, "elapsed_time": "0:49:17", "remaining_time": "0:48:34", "throughput": 4240.44, "total_tokens": 12540008} {"current_steps": 19225, "total_steps": 38160, "loss": 0.3555, "lr": 0.0005803306543779375, "epoch": 10.075995807127883, "percentage": 50.38, "elapsed_time": "0:49:17", "remaining_time": "0:48:33", "throughput": 4240.45, "total_tokens": 12542952} {"current_steps": 19230, "total_steps": 38160, "loss": 0.406, "lr": 0.000580104931004509, "epoch": 10.078616352201259, "percentage": 50.39, "elapsed_time": "0:49:18", "remaining_time": "0:48:32", "throughput": 4240.42, "total_tokens": 12545672} {"current_steps": 19235, "total_steps": 38160, "loss": 0.4189, "lr": 0.000579879190874043, "epoch": 10.081236897274634, "percentage": 50.41, "elapsed_time": "0:49:19", "remaining_time": "0:48:31", "throughput": 4240.47, "total_tokens": 12548808} {"current_steps": 19240, "total_steps": 38160, "loss": 0.4869, "lr": 0.0005796534340337614, "epoch": 10.083857442348009, "percentage": 50.42, "elapsed_time": "0:49:20", "remaining_time": "0:48:30", "throughput": 4240.51, "total_tokens": 12551944} {"current_steps": 19245, "total_steps": 38160, "loss": 0.4789, "lr": 0.0005794276605308902, "epoch": 10.086477987421384, "percentage": 50.43, "elapsed_time": "0:49:20", "remaining_time": "0:48:29", "throughput": 4240.55, "total_tokens": 12555048} {"current_steps": 19250, "total_steps": 38160, "loss": 0.376, "lr": 0.0005792018704126586, "epoch": 10.08909853249476, "percentage": 50.45, "elapsed_time": "0:49:21", "remaining_time": "0:48:29", "throughput": 4240.61, "total_tokens": 12558312} {"current_steps": 19255, "total_steps": 38160, "loss": 0.4625, "lr": 0.0005789760637262992, "epoch": 10.091719077568134, "percentage": 50.46, "elapsed_time": "0:49:22", "remaining_time": "0:48:28", "throughput": 4240.75, "total_tokens": 12561992} {"current_steps": 19260, "total_steps": 38160, "loss": 0.4762, "lr": 0.0005787502405190483, "epoch": 10.09433962264151, "percentage": 50.47, "elapsed_time": "0:49:22", "remaining_time": "0:48:27", "throughput": 4240.86, "total_tokens": 12565544} {"current_steps": 19265, "total_steps": 38160, "loss": 0.5176, "lr": 0.0005785244008381456, "epoch": 10.096960167714885, "percentage": 50.48, "elapsed_time": "0:49:23", "remaining_time": "0:48:26", "throughput": 4240.83, "total_tokens": 12568232} {"current_steps": 19270, "total_steps": 38160, "loss": 0.4323, "lr": 0.0005782985447308341, "epoch": 10.09958071278826, "percentage": 50.5, "elapsed_time": "0:49:24", "remaining_time": "0:48:25", "throughput": 4240.74, "total_tokens": 12570568} {"current_steps": 19275, "total_steps": 38160, "loss": 0.4278, "lr": 0.0005780726722443602, "epoch": 10.102201257861635, "percentage": 50.51, "elapsed_time": "0:49:24", "remaining_time": "0:48:24", "throughput": 4240.74, "total_tokens": 12573448} {"current_steps": 19280, "total_steps": 38160, "loss": 0.3918, "lr": 0.0005778467834259741, "epoch": 10.10482180293501, "percentage": 50.52, "elapsed_time": "0:49:25", "remaining_time": "0:48:24", "throughput": 4240.9, "total_tokens": 12577256} {"current_steps": 19285, "total_steps": 38160, "loss": 0.422, "lr": 0.000577620878322929, "epoch": 10.107442348008385, "percentage": 50.54, "elapsed_time": "0:49:26", "remaining_time": "0:48:23", "throughput": 4241.02, "total_tokens": 12580808} {"current_steps": 19290, "total_steps": 38160, "loss": 0.4448, "lr": 0.0005773949569824816, "epoch": 10.11006289308176, "percentage": 50.55, "elapsed_time": "0:49:27", "remaining_time": "0:48:22", "throughput": 4241.34, "total_tokens": 12585896} {"current_steps": 19295, "total_steps": 38160, "loss": 0.4093, "lr": 0.0005771690194518922, "epoch": 10.112683438155136, "percentage": 50.56, "elapsed_time": "0:49:28", "remaining_time": "0:48:21", "throughput": 4241.39, "total_tokens": 12589000} {"current_steps": 19300, "total_steps": 38160, "loss": 0.4578, "lr": 0.0005769430657784245, "epoch": 10.115303983228511, "percentage": 50.58, "elapsed_time": "0:49:28", "remaining_time": "0:48:21", "throughput": 4241.4, "total_tokens": 12592104} {"current_steps": 19305, "total_steps": 38160, "loss": 0.3765, "lr": 0.0005767170960093449, "epoch": 10.117924528301886, "percentage": 50.59, "elapsed_time": "0:49:29", "remaining_time": "0:48:20", "throughput": 4241.45, "total_tokens": 12595240} {"current_steps": 19310, "total_steps": 38160, "loss": 0.3321, "lr": 0.0005764911101919244, "epoch": 10.120545073375261, "percentage": 50.6, "elapsed_time": "0:49:30", "remaining_time": "0:48:19", "throughput": 4241.34, "total_tokens": 12597480} {"current_steps": 19315, "total_steps": 38160, "loss": 0.5464, "lr": 0.0005762651083734363, "epoch": 10.123165618448636, "percentage": 50.62, "elapsed_time": "0:49:30", "remaining_time": "0:48:18", "throughput": 4241.33, "total_tokens": 12600328} {"current_steps": 19320, "total_steps": 38160, "loss": 0.4362, "lr": 0.0005760390906011574, "epoch": 10.125786163522013, "percentage": 50.63, "elapsed_time": "0:49:31", "remaining_time": "0:48:17", "throughput": 4241.15, "total_tokens": 12602152} {"current_steps": 19325, "total_steps": 38160, "loss": 0.502, "lr": 0.0005758130569223684, "epoch": 10.128406708595389, "percentage": 50.64, "elapsed_time": "0:49:32", "remaining_time": "0:48:16", "throughput": 4241.21, "total_tokens": 12605352} {"current_steps": 19330, "total_steps": 38160, "loss": 0.3764, "lr": 0.0005755870073843527, "epoch": 10.131027253668764, "percentage": 50.66, "elapsed_time": "0:49:32", "remaining_time": "0:48:15", "throughput": 4241.15, "total_tokens": 12607784} {"current_steps": 19335, "total_steps": 38160, "loss": 0.6105, "lr": 0.0005753609420343973, "epoch": 10.133647798742139, "percentage": 50.67, "elapsed_time": "0:49:33", "remaining_time": "0:48:15", "throughput": 4241.62, "total_tokens": 12614056} {"current_steps": 19340, "total_steps": 38160, "loss": 0.5055, "lr": 0.0005751348609197929, "epoch": 10.136268343815514, "percentage": 50.68, "elapsed_time": "0:49:34", "remaining_time": "0:48:14", "throughput": 4241.55, "total_tokens": 12616552} {"current_steps": 19345, "total_steps": 38160, "loss": 0.484, "lr": 0.0005749087640878325, "epoch": 10.13888888888889, "percentage": 50.69, "elapsed_time": "0:49:35", "remaining_time": "0:48:13", "throughput": 4241.63, "total_tokens": 12619976} {"current_steps": 19350, "total_steps": 38160, "loss": 0.4316, "lr": 0.0005746826515858135, "epoch": 10.141509433962264, "percentage": 50.71, "elapsed_time": "0:49:35", "remaining_time": "0:48:12", "throughput": 4241.7, "total_tokens": 12623272} {"current_steps": 19355, "total_steps": 38160, "loss": 0.5098, "lr": 0.0005744565234610356, "epoch": 10.14412997903564, "percentage": 50.72, "elapsed_time": "0:49:36", "remaining_time": "0:48:12", "throughput": 4241.67, "total_tokens": 12625960} {"current_steps": 19360, "total_steps": 38160, "loss": 0.4213, "lr": 0.0005742303797608023, "epoch": 10.146750524109015, "percentage": 50.73, "elapsed_time": "0:49:37", "remaining_time": "0:48:11", "throughput": 4241.88, "total_tokens": 12630184} {"current_steps": 19365, "total_steps": 38160, "loss": 0.4466, "lr": 0.0005740042205324208, "epoch": 10.14937106918239, "percentage": 50.75, "elapsed_time": "0:49:38", "remaining_time": "0:48:10", "throughput": 4241.9, "total_tokens": 12633224} {"current_steps": 19370, "total_steps": 38160, "loss": 0.4566, "lr": 0.0005737780458232004, "epoch": 10.151991614255765, "percentage": 50.76, "elapsed_time": "0:49:38", "remaining_time": "0:48:09", "throughput": 4241.97, "total_tokens": 12636584} {"current_steps": 19375, "total_steps": 38160, "loss": 0.52, "lr": 0.0005735518556804546, "epoch": 10.15461215932914, "percentage": 50.77, "elapsed_time": "0:49:39", "remaining_time": "0:48:08", "throughput": 4242.04, "total_tokens": 12639944} {"current_steps": 19380, "total_steps": 38160, "loss": 0.5011, "lr": 0.0005733256501514999, "epoch": 10.157232704402515, "percentage": 50.79, "elapsed_time": "0:49:40", "remaining_time": "0:48:08", "throughput": 4242.17, "total_tokens": 12643624} {"current_steps": 19385, "total_steps": 38160, "loss": 0.3062, "lr": 0.0005730994292836555, "epoch": 10.15985324947589, "percentage": 50.8, "elapsed_time": "0:49:41", "remaining_time": "0:48:07", "throughput": 4242.22, "total_tokens": 12646792} {"current_steps": 19390, "total_steps": 38160, "loss": 0.5125, "lr": 0.0005728731931242445, "epoch": 10.162473794549266, "percentage": 50.81, "elapsed_time": "0:49:41", "remaining_time": "0:48:06", "throughput": 4242.37, "total_tokens": 12650696} {"current_steps": 19395, "total_steps": 38160, "loss": 0.578, "lr": 0.0005726469417205928, "epoch": 10.165094339622641, "percentage": 50.83, "elapsed_time": "0:49:42", "remaining_time": "0:48:05", "throughput": 4242.36, "total_tokens": 12653512} {"current_steps": 19400, "total_steps": 38160, "loss": 0.4164, "lr": 0.0005724206751200297, "epoch": 10.167714884696016, "percentage": 50.84, "elapsed_time": "0:49:43", "remaining_time": "0:48:05", "throughput": 4242.48, "total_tokens": 12657160} {"current_steps": 19405, "total_steps": 38160, "loss": 0.4372, "lr": 0.0005721943933698879, "epoch": 10.170335429769391, "percentage": 50.85, "elapsed_time": "0:49:44", "remaining_time": "0:48:04", "throughput": 4242.65, "total_tokens": 12661096} {"current_steps": 19410, "total_steps": 38160, "loss": 0.3849, "lr": 0.0005719680965175023, "epoch": 10.172955974842766, "percentage": 50.86, "elapsed_time": "0:49:44", "remaining_time": "0:48:03", "throughput": 4242.69, "total_tokens": 12664168} {"current_steps": 19415, "total_steps": 38160, "loss": 0.4152, "lr": 0.000571741784610212, "epoch": 10.175576519916143, "percentage": 50.88, "elapsed_time": "0:49:45", "remaining_time": "0:48:02", "throughput": 4242.74, "total_tokens": 12667304} {"current_steps": 19420, "total_steps": 38160, "loss": 0.3756, "lr": 0.0005715154576953589, "epoch": 10.178197064989519, "percentage": 50.89, "elapsed_time": "0:49:46", "remaining_time": "0:48:01", "throughput": 4242.83, "total_tokens": 12670760} {"current_steps": 19425, "total_steps": 38160, "loss": 0.5103, "lr": 0.0005712891158202879, "epoch": 10.180817610062894, "percentage": 50.9, "elapsed_time": "0:49:47", "remaining_time": "0:48:00", "throughput": 4242.8, "total_tokens": 12673384} {"current_steps": 19430, "total_steps": 38160, "loss": 0.4509, "lr": 0.0005710627590323473, "epoch": 10.183438155136269, "percentage": 50.92, "elapsed_time": "0:49:47", "remaining_time": "0:48:00", "throughput": 4242.78, "total_tokens": 12676168} {"current_steps": 19435, "total_steps": 38160, "loss": 0.3837, "lr": 0.0005708363873788882, "epoch": 10.186058700209644, "percentage": 50.93, "elapsed_time": "0:49:48", "remaining_time": "0:47:59", "throughput": 4242.76, "total_tokens": 12678984} {"current_steps": 19440, "total_steps": 38160, "loss": 0.6023, "lr": 0.0005706100009072649, "epoch": 10.18867924528302, "percentage": 50.94, "elapsed_time": "0:49:49", "remaining_time": "0:47:58", "throughput": 4242.84, "total_tokens": 12682600} {"current_steps": 19445, "total_steps": 38160, "loss": 0.3637, "lr": 0.000570383599664835, "epoch": 10.191299790356394, "percentage": 50.96, "elapsed_time": "0:49:49", "remaining_time": "0:47:57", "throughput": 4242.85, "total_tokens": 12685704} {"current_steps": 19450, "total_steps": 38160, "loss": 0.3686, "lr": 0.0005701571836989591, "epoch": 10.19392033542977, "percentage": 50.97, "elapsed_time": "0:49:50", "remaining_time": "0:47:56", "throughput": 4242.93, "total_tokens": 12689256} {"current_steps": 19455, "total_steps": 38160, "loss": 0.4263, "lr": 0.0005699307530570008, "epoch": 10.196540880503145, "percentage": 50.98, "elapsed_time": "0:49:51", "remaining_time": "0:47:56", "throughput": 4243.06, "total_tokens": 12692968} {"current_steps": 19460, "total_steps": 38160, "loss": 0.3891, "lr": 0.0005697043077863267, "epoch": 10.19916142557652, "percentage": 51.0, "elapsed_time": "0:49:52", "remaining_time": "0:47:55", "throughput": 4243.19, "total_tokens": 12696712} {"current_steps": 19465, "total_steps": 38160, "loss": 0.5065, "lr": 0.0005694778479343065, "epoch": 10.201781970649895, "percentage": 51.01, "elapsed_time": "0:49:52", "remaining_time": "0:47:54", "throughput": 4243.22, "total_tokens": 12699848} {"current_steps": 19470, "total_steps": 38160, "loss": 0.4448, "lr": 0.0005692513735483134, "epoch": 10.20440251572327, "percentage": 51.02, "elapsed_time": "0:49:53", "remaining_time": "0:47:53", "throughput": 4243.29, "total_tokens": 12703176} {"current_steps": 19475, "total_steps": 38160, "loss": 0.5539, "lr": 0.0005690248846757228, "epoch": 10.207023060796645, "percentage": 51.04, "elapsed_time": "0:49:54", "remaining_time": "0:47:52", "throughput": 4243.33, "total_tokens": 12706280} {"current_steps": 19480, "total_steps": 38160, "loss": 0.5613, "lr": 0.0005687983813639139, "epoch": 10.20964360587002, "percentage": 51.05, "elapsed_time": "0:49:55", "remaining_time": "0:47:52", "throughput": 4243.34, "total_tokens": 12709224} {"current_steps": 19485, "total_steps": 38160, "loss": 0.3943, "lr": 0.0005685718636602685, "epoch": 10.212264150943396, "percentage": 51.06, "elapsed_time": "0:49:55", "remaining_time": "0:47:51", "throughput": 4243.48, "total_tokens": 12713064} {"current_steps": 19490, "total_steps": 38160, "loss": 0.4952, "lr": 0.0005683453316121716, "epoch": 10.214884696016771, "percentage": 51.07, "elapsed_time": "0:49:56", "remaining_time": "0:47:50", "throughput": 4243.57, "total_tokens": 12716424} {"current_steps": 19495, "total_steps": 38160, "loss": 0.4432, "lr": 0.0005681187852670111, "epoch": 10.217505241090146, "percentage": 51.09, "elapsed_time": "0:49:57", "remaining_time": "0:47:49", "throughput": 4243.65, "total_tokens": 12719816} {"current_steps": 19500, "total_steps": 38160, "loss": 0.5317, "lr": 0.0005678922246721777, "epoch": 10.220125786163521, "percentage": 51.1, "elapsed_time": "0:49:58", "remaining_time": "0:47:49", "throughput": 4243.8, "total_tokens": 12723624} {"current_steps": 19505, "total_steps": 38160, "loss": 0.4535, "lr": 0.0005676656498750656, "epoch": 10.222746331236896, "percentage": 51.11, "elapsed_time": "0:49:58", "remaining_time": "0:47:48", "throughput": 4243.93, "total_tokens": 12727240} {"current_steps": 19510, "total_steps": 38160, "loss": 0.4376, "lr": 0.0005674390609230715, "epoch": 10.225366876310272, "percentage": 51.13, "elapsed_time": "0:49:59", "remaining_time": "0:47:47", "throughput": 4244.02, "total_tokens": 12730792} {"current_steps": 19515, "total_steps": 38160, "loss": 0.4855, "lr": 0.0005672124578635951, "epoch": 10.227987421383649, "percentage": 51.14, "elapsed_time": "0:50:00", "remaining_time": "0:47:46", "throughput": 4244.04, "total_tokens": 12733928} {"current_steps": 19520, "total_steps": 38160, "loss": 0.389, "lr": 0.0005669858407440394, "epoch": 10.230607966457024, "percentage": 51.15, "elapsed_time": "0:50:01", "remaining_time": "0:47:45", "throughput": 4244.24, "total_tokens": 12737992} {"current_steps": 19525, "total_steps": 38160, "loss": 0.463, "lr": 0.00056675920961181, "epoch": 10.233228511530399, "percentage": 51.17, "elapsed_time": "0:50:01", "remaining_time": "0:47:45", "throughput": 4244.17, "total_tokens": 12740456} {"current_steps": 19530, "total_steps": 38160, "loss": 0.4908, "lr": 0.0005665325645143155, "epoch": 10.235849056603774, "percentage": 51.18, "elapsed_time": "0:50:02", "remaining_time": "0:47:44", "throughput": 4244.2, "total_tokens": 12743496} {"current_steps": 19535, "total_steps": 38160, "loss": 0.4009, "lr": 0.0005663059054989679, "epoch": 10.23846960167715, "percentage": 51.19, "elapsed_time": "0:50:03", "remaining_time": "0:47:43", "throughput": 4244.28, "total_tokens": 12746952} {"current_steps": 19540, "total_steps": 38160, "loss": 0.5417, "lr": 0.0005660792326131809, "epoch": 10.241090146750524, "percentage": 51.21, "elapsed_time": "0:50:03", "remaining_time": "0:47:42", "throughput": 4244.28, "total_tokens": 12749800} {"current_steps": 19545, "total_steps": 38160, "loss": 0.4496, "lr": 0.0005658525459043725, "epoch": 10.2437106918239, "percentage": 51.22, "elapsed_time": "0:50:04", "remaining_time": "0:47:41", "throughput": 4244.31, "total_tokens": 12752872} {"current_steps": 19550, "total_steps": 38160, "loss": 0.539, "lr": 0.000565625845419963, "epoch": 10.246331236897275, "percentage": 51.23, "elapsed_time": "0:50:05", "remaining_time": "0:47:40", "throughput": 4244.35, "total_tokens": 12755944} {"current_steps": 19555, "total_steps": 38160, "loss": 0.4589, "lr": 0.000565399131207375, "epoch": 10.24895178197065, "percentage": 51.24, "elapsed_time": "0:50:06", "remaining_time": "0:47:39", "throughput": 4244.28, "total_tokens": 12758344} {"current_steps": 19560, "total_steps": 38160, "loss": 0.3256, "lr": 0.000565172403314035, "epoch": 10.251572327044025, "percentage": 51.26, "elapsed_time": "0:50:06", "remaining_time": "0:47:39", "throughput": 4244.44, "total_tokens": 12762312} {"current_steps": 19565, "total_steps": 38160, "loss": 0.4321, "lr": 0.0005649456617873717, "epoch": 10.2541928721174, "percentage": 51.27, "elapsed_time": "0:50:07", "remaining_time": "0:47:38", "throughput": 4244.47, "total_tokens": 12765416} {"current_steps": 19570, "total_steps": 38160, "loss": 0.3391, "lr": 0.0005647189066748169, "epoch": 10.256813417190775, "percentage": 51.28, "elapsed_time": "0:50:08", "remaining_time": "0:47:37", "throughput": 4244.52, "total_tokens": 12768552} {"current_steps": 19575, "total_steps": 38160, "loss": 0.4139, "lr": 0.0005644921380238052, "epoch": 10.25943396226415, "percentage": 51.3, "elapsed_time": "0:50:08", "remaining_time": "0:47:36", "throughput": 4244.44, "total_tokens": 12770920} {"current_steps": 19580, "total_steps": 38160, "loss": 0.4199, "lr": 0.000564265355881774, "epoch": 10.262054507337526, "percentage": 51.31, "elapsed_time": "0:50:09", "remaining_time": "0:47:35", "throughput": 4244.52, "total_tokens": 12774184} {"current_steps": 19585, "total_steps": 38160, "loss": 0.4973, "lr": 0.0005640385602961634, "epoch": 10.264675052410901, "percentage": 51.32, "elapsed_time": "0:50:10", "remaining_time": "0:47:35", "throughput": 4244.56, "total_tokens": 12777288} {"current_steps": 19590, "total_steps": 38160, "loss": 0.4151, "lr": 0.0005638117513144168, "epoch": 10.267295597484276, "percentage": 51.34, "elapsed_time": "0:50:10", "remaining_time": "0:47:34", "throughput": 4244.55, "total_tokens": 12780136} {"current_steps": 19595, "total_steps": 38160, "loss": 0.4882, "lr": 0.0005635849289839797, "epoch": 10.269916142557651, "percentage": 51.35, "elapsed_time": "0:50:11", "remaining_time": "0:47:33", "throughput": 4244.57, "total_tokens": 12783144} {"current_steps": 19600, "total_steps": 38160, "loss": 0.3431, "lr": 0.000563358093352301, "epoch": 10.272536687631026, "percentage": 51.36, "elapsed_time": "0:50:12", "remaining_time": "0:47:32", "throughput": 4244.57, "total_tokens": 12785992} {"current_steps": 19605, "total_steps": 38160, "loss": 0.5355, "lr": 0.0005631312444668318, "epoch": 10.275157232704402, "percentage": 51.38, "elapsed_time": "0:50:13", "remaining_time": "0:47:31", "throughput": 4244.6, "total_tokens": 12789000} {"current_steps": 19610, "total_steps": 38160, "loss": 0.4666, "lr": 0.0005629043823750266, "epoch": 10.277777777777779, "percentage": 51.39, "elapsed_time": "0:50:13", "remaining_time": "0:47:30", "throughput": 4244.61, "total_tokens": 12791976} {"current_steps": 19615, "total_steps": 38160, "loss": 0.4672, "lr": 0.0005626775071243423, "epoch": 10.280398322851154, "percentage": 51.4, "elapsed_time": "0:50:14", "remaining_time": "0:47:30", "throughput": 4244.78, "total_tokens": 12795976} {"current_steps": 19620, "total_steps": 38160, "loss": 0.5091, "lr": 0.0005624506187622384, "epoch": 10.283018867924529, "percentage": 51.42, "elapsed_time": "0:50:15", "remaining_time": "0:47:29", "throughput": 4244.8, "total_tokens": 12798984} {"current_steps": 19625, "total_steps": 38160, "loss": 0.4359, "lr": 0.0005622237173361777, "epoch": 10.285639412997904, "percentage": 51.43, "elapsed_time": "0:50:15", "remaining_time": "0:47:28", "throughput": 4244.8, "total_tokens": 12801864} {"current_steps": 19630, "total_steps": 38160, "loss": 0.4989, "lr": 0.0005619968028936252, "epoch": 10.28825995807128, "percentage": 51.44, "elapsed_time": "0:50:16", "remaining_time": "0:47:27", "throughput": 4244.83, "total_tokens": 12804968} {"current_steps": 19635, "total_steps": 38160, "loss": 0.4224, "lr": 0.0005617698754820489, "epoch": 10.290880503144654, "percentage": 51.45, "elapsed_time": "0:50:17", "remaining_time": "0:47:26", "throughput": 4244.84, "total_tokens": 12807848} {"current_steps": 19640, "total_steps": 38160, "loss": 0.3966, "lr": 0.0005615429351489192, "epoch": 10.29350104821803, "percentage": 51.47, "elapsed_time": "0:50:17", "remaining_time": "0:47:25", "throughput": 4244.82, "total_tokens": 12810632} {"current_steps": 19645, "total_steps": 38160, "loss": 0.4731, "lr": 0.0005613159819417095, "epoch": 10.296121593291405, "percentage": 51.48, "elapsed_time": "0:50:18", "remaining_time": "0:47:25", "throughput": 4244.91, "total_tokens": 12814024} {"current_steps": 19650, "total_steps": 38160, "loss": 0.4126, "lr": 0.0005610890159078961, "epoch": 10.29874213836478, "percentage": 51.49, "elapsed_time": "0:50:19", "remaining_time": "0:47:24", "throughput": 4245.04, "total_tokens": 12817800} {"current_steps": 19655, "total_steps": 38160, "loss": 0.4461, "lr": 0.0005608620370949575, "epoch": 10.301362683438155, "percentage": 51.51, "elapsed_time": "0:50:20", "remaining_time": "0:47:23", "throughput": 4245.0, "total_tokens": 12820456} {"current_steps": 19660, "total_steps": 38160, "loss": 0.5345, "lr": 0.000560635045550375, "epoch": 10.30398322851153, "percentage": 51.52, "elapsed_time": "0:50:20", "remaining_time": "0:47:22", "throughput": 4244.91, "total_tokens": 12822792} {"current_steps": 19665, "total_steps": 38160, "loss": 0.6005, "lr": 0.0005604080413216328, "epoch": 10.306603773584905, "percentage": 51.53, "elapsed_time": "0:50:21", "remaining_time": "0:47:21", "throughput": 4245.1, "total_tokens": 12826888} {"current_steps": 19670, "total_steps": 38160, "loss": 0.455, "lr": 0.0005601810244562175, "epoch": 10.30922431865828, "percentage": 51.55, "elapsed_time": "0:50:22", "remaining_time": "0:47:20", "throughput": 4245.12, "total_tokens": 12829896} {"current_steps": 19675, "total_steps": 38160, "loss": 0.5701, "lr": 0.0005599539950016184, "epoch": 10.311844863731656, "percentage": 51.56, "elapsed_time": "0:50:23", "remaining_time": "0:47:20", "throughput": 4245.23, "total_tokens": 12833480} {"current_steps": 19680, "total_steps": 38160, "loss": 0.4427, "lr": 0.0005597269530053277, "epoch": 10.314465408805031, "percentage": 51.57, "elapsed_time": "0:50:23", "remaining_time": "0:47:19", "throughput": 4245.25, "total_tokens": 12836424} {"current_steps": 19685, "total_steps": 38160, "loss": 0.5702, "lr": 0.0005594998985148398, "epoch": 10.317085953878406, "percentage": 51.59, "elapsed_time": "0:50:24", "remaining_time": "0:47:18", "throughput": 4245.28, "total_tokens": 12839464} {"current_steps": 19690, "total_steps": 38160, "loss": 0.3349, "lr": 0.0005592728315776519, "epoch": 10.319706498951781, "percentage": 51.6, "elapsed_time": "0:50:25", "remaining_time": "0:47:17", "throughput": 4245.21, "total_tokens": 12841896} {"current_steps": 19695, "total_steps": 38160, "loss": 0.4215, "lr": 0.0005590457522412638, "epoch": 10.322327044025156, "percentage": 51.61, "elapsed_time": "0:50:25", "remaining_time": "0:47:16", "throughput": 4245.38, "total_tokens": 12845768} {"current_steps": 19700, "total_steps": 38160, "loss": 0.4407, "lr": 0.000558818660553178, "epoch": 10.324947589098532, "percentage": 51.62, "elapsed_time": "0:50:26", "remaining_time": "0:47:16", "throughput": 4245.38, "total_tokens": 12848680} {"current_steps": 19705, "total_steps": 38160, "loss": 0.5227, "lr": 0.0005585915565608995, "epoch": 10.327568134171909, "percentage": 51.64, "elapsed_time": "0:50:27", "remaining_time": "0:47:15", "throughput": 4245.35, "total_tokens": 12851464} {"current_steps": 19710, "total_steps": 38160, "loss": 0.313, "lr": 0.0005583644403119357, "epoch": 10.330188679245284, "percentage": 51.65, "elapsed_time": "0:50:27", "remaining_time": "0:47:14", "throughput": 4245.36, "total_tokens": 12854504} {"current_steps": 19715, "total_steps": 38160, "loss": 0.3531, "lr": 0.0005581373118537969, "epoch": 10.332809224318659, "percentage": 51.66, "elapsed_time": "0:50:28", "remaining_time": "0:47:13", "throughput": 4245.41, "total_tokens": 12857736} {"current_steps": 19720, "total_steps": 38160, "loss": 0.4543, "lr": 0.0005579101712339957, "epoch": 10.335429769392034, "percentage": 51.68, "elapsed_time": "0:50:29", "remaining_time": "0:47:12", "throughput": 4245.36, "total_tokens": 12860360} {"current_steps": 19725, "total_steps": 38160, "loss": 0.4311, "lr": 0.0005576830185000474, "epoch": 10.33805031446541, "percentage": 51.69, "elapsed_time": "0:50:29", "remaining_time": "0:47:11", "throughput": 4245.34, "total_tokens": 12863016} {"current_steps": 19730, "total_steps": 38160, "loss": 0.5543, "lr": 0.0005574558536994698, "epoch": 10.340670859538784, "percentage": 51.7, "elapsed_time": "0:50:30", "remaining_time": "0:47:10", "throughput": 4245.32, "total_tokens": 12865768} {"current_steps": 19735, "total_steps": 38160, "loss": 0.4884, "lr": 0.0005572286768797829, "epoch": 10.34329140461216, "percentage": 51.72, "elapsed_time": "0:50:31", "remaining_time": "0:47:10", "throughput": 4245.43, "total_tokens": 12869256} {"current_steps": 19740, "total_steps": 38160, "loss": 0.5015, "lr": 0.0005570014880885098, "epoch": 10.345911949685535, "percentage": 51.73, "elapsed_time": "0:50:32", "remaining_time": "0:47:09", "throughput": 4245.48, "total_tokens": 12872456} {"current_steps": 19745, "total_steps": 38160, "loss": 0.3754, "lr": 0.0005567742873731757, "epoch": 10.34853249475891, "percentage": 51.74, "elapsed_time": "0:50:32", "remaining_time": "0:47:08", "throughput": 4245.54, "total_tokens": 12875720} {"current_steps": 19750, "total_steps": 38160, "loss": 0.353, "lr": 0.0005565470747813085, "epoch": 10.351153039832285, "percentage": 51.76, "elapsed_time": "0:50:33", "remaining_time": "0:47:07", "throughput": 4245.47, "total_tokens": 12878088} {"current_steps": 19755, "total_steps": 38160, "loss": 0.4216, "lr": 0.0005563198503604382, "epoch": 10.35377358490566, "percentage": 51.77, "elapsed_time": "0:50:34", "remaining_time": "0:47:06", "throughput": 4245.42, "total_tokens": 12880616} {"current_steps": 19760, "total_steps": 38160, "loss": 0.5999, "lr": 0.0005560926141580978, "epoch": 10.356394129979035, "percentage": 51.78, "elapsed_time": "0:50:34", "remaining_time": "0:47:05", "throughput": 4245.37, "total_tokens": 12883144} {"current_steps": 19765, "total_steps": 38160, "loss": 0.3976, "lr": 0.0005558653662218225, "epoch": 10.35901467505241, "percentage": 51.8, "elapsed_time": "0:50:35", "remaining_time": "0:47:04", "throughput": 4245.34, "total_tokens": 12885832} {"current_steps": 19770, "total_steps": 38160, "loss": 0.4544, "lr": 0.00055563810659915, "epoch": 10.361635220125786, "percentage": 51.81, "elapsed_time": "0:50:36", "remaining_time": "0:47:04", "throughput": 4245.38, "total_tokens": 12889000} {"current_steps": 19775, "total_steps": 38160, "loss": 0.4338, "lr": 0.0005554108353376201, "epoch": 10.364255765199161, "percentage": 51.82, "elapsed_time": "0:50:36", "remaining_time": "0:47:03", "throughput": 4245.5, "total_tokens": 12892616} {"current_steps": 19780, "total_steps": 38160, "loss": 0.4801, "lr": 0.0005551835524847757, "epoch": 10.366876310272536, "percentage": 51.83, "elapsed_time": "0:50:37", "remaining_time": "0:47:02", "throughput": 4245.43, "total_tokens": 12895112} {"current_steps": 19785, "total_steps": 38160, "loss": 0.5193, "lr": 0.0005549562580881618, "epoch": 10.369496855345911, "percentage": 51.85, "elapsed_time": "0:50:38", "remaining_time": "0:47:01", "throughput": 4245.61, "total_tokens": 12899176} {"current_steps": 19790, "total_steps": 38160, "loss": 0.4878, "lr": 0.0005547289521953257, "epoch": 10.372117400419286, "percentage": 51.86, "elapsed_time": "0:50:38", "remaining_time": "0:47:00", "throughput": 4245.64, "total_tokens": 12902184} {"current_steps": 19795, "total_steps": 38160, "loss": 0.4061, "lr": 0.000554501634853817, "epoch": 10.374737945492662, "percentage": 51.87, "elapsed_time": "0:50:39", "remaining_time": "0:46:59", "throughput": 4245.6, "total_tokens": 12904712} {"current_steps": 19800, "total_steps": 38160, "loss": 0.5143, "lr": 0.0005542743061111883, "epoch": 10.377358490566039, "percentage": 51.89, "elapsed_time": "0:50:40", "remaining_time": "0:46:59", "throughput": 4245.6, "total_tokens": 12907560} {"current_steps": 19805, "total_steps": 38160, "loss": 0.4869, "lr": 0.0005540469660149938, "epoch": 10.379979035639414, "percentage": 51.9, "elapsed_time": "0:50:40", "remaining_time": "0:46:58", "throughput": 4245.62, "total_tokens": 12910568} {"current_steps": 19810, "total_steps": 38160, "loss": 0.6836, "lr": 0.0005538196146127907, "epoch": 10.382599580712789, "percentage": 51.91, "elapsed_time": "0:50:41", "remaining_time": "0:46:57", "throughput": 4245.64, "total_tokens": 12913608} {"current_steps": 19815, "total_steps": 38160, "loss": 0.3843, "lr": 0.0005535922519521381, "epoch": 10.385220125786164, "percentage": 51.93, "elapsed_time": "0:50:42", "remaining_time": "0:46:56", "throughput": 4245.77, "total_tokens": 12917288} {"current_steps": 19820, "total_steps": 38160, "loss": 0.4155, "lr": 0.0005533648780805979, "epoch": 10.38784067085954, "percentage": 51.94, "elapsed_time": "0:50:43", "remaining_time": "0:46:55", "throughput": 4245.79, "total_tokens": 12920232} {"current_steps": 19825, "total_steps": 38160, "loss": 0.4693, "lr": 0.000553137493045734, "epoch": 10.390461215932914, "percentage": 51.95, "elapsed_time": "0:50:43", "remaining_time": "0:46:55", "throughput": 4245.83, "total_tokens": 12923432} {"current_steps": 19830, "total_steps": 38160, "loss": 0.4587, "lr": 0.0005529100968951127, "epoch": 10.39308176100629, "percentage": 51.97, "elapsed_time": "0:50:44", "remaining_time": "0:46:54", "throughput": 4246.08, "total_tokens": 12927912} {"current_steps": 19835, "total_steps": 38160, "loss": 0.4263, "lr": 0.0005526826896763029, "epoch": 10.395702306079665, "percentage": 51.98, "elapsed_time": "0:50:45", "remaining_time": "0:46:53", "throughput": 4246.16, "total_tokens": 12931304} {"current_steps": 19840, "total_steps": 38160, "loss": 0.4839, "lr": 0.0005524552714368753, "epoch": 10.39832285115304, "percentage": 51.99, "elapsed_time": "0:50:46", "remaining_time": "0:46:52", "throughput": 4246.18, "total_tokens": 12934248} {"current_steps": 19845, "total_steps": 38160, "loss": 0.5065, "lr": 0.0005522278422244035, "epoch": 10.400943396226415, "percentage": 52.0, "elapsed_time": "0:50:46", "remaining_time": "0:46:51", "throughput": 4246.25, "total_tokens": 12937608} {"current_steps": 19850, "total_steps": 38160, "loss": 0.3711, "lr": 0.0005520004020864631, "epoch": 10.40356394129979, "percentage": 52.02, "elapsed_time": "0:50:47", "remaining_time": "0:46:51", "throughput": 4246.22, "total_tokens": 12940360} {"current_steps": 19855, "total_steps": 38160, "loss": 0.3607, "lr": 0.0005517729510706315, "epoch": 10.406184486373165, "percentage": 52.03, "elapsed_time": "0:50:48", "remaining_time": "0:46:50", "throughput": 4246.21, "total_tokens": 12943048} {"current_steps": 19860, "total_steps": 38160, "loss": 0.3144, "lr": 0.0005515454892244892, "epoch": 10.40880503144654, "percentage": 52.04, "elapsed_time": "0:50:48", "remaining_time": "0:46:49", "throughput": 4246.17, "total_tokens": 12945704} {"current_steps": 19865, "total_steps": 38160, "loss": 0.4257, "lr": 0.0005513180165956189, "epoch": 10.411425576519916, "percentage": 52.06, "elapsed_time": "0:50:49", "remaining_time": "0:46:48", "throughput": 4246.18, "total_tokens": 12948616} {"current_steps": 19870, "total_steps": 38160, "loss": 0.3442, "lr": 0.0005510905332316049, "epoch": 10.414046121593291, "percentage": 52.07, "elapsed_time": "0:50:50", "remaining_time": "0:46:47", "throughput": 4246.23, "total_tokens": 12951880} {"current_steps": 19875, "total_steps": 38160, "loss": 0.5075, "lr": 0.0005508630391800341, "epoch": 10.416666666666666, "percentage": 52.08, "elapsed_time": "0:50:50", "remaining_time": "0:46:46", "throughput": 4246.28, "total_tokens": 12954984} {"current_steps": 19880, "total_steps": 38160, "loss": 0.4155, "lr": 0.0005506355344884959, "epoch": 10.419287211740041, "percentage": 52.1, "elapsed_time": "0:50:51", "remaining_time": "0:46:45", "throughput": 4246.25, "total_tokens": 12957640} {"current_steps": 19885, "total_steps": 38160, "loss": 0.345, "lr": 0.0005504080192045813, "epoch": 10.421907756813416, "percentage": 52.11, "elapsed_time": "0:50:52", "remaining_time": "0:46:45", "throughput": 4246.26, "total_tokens": 12960488} {"current_steps": 19890, "total_steps": 38160, "loss": 0.5358, "lr": 0.0005501804933758846, "epoch": 10.424528301886792, "percentage": 52.12, "elapsed_time": "0:50:52", "remaining_time": "0:46:44", "throughput": 4246.29, "total_tokens": 12963560} {"current_steps": 19895, "total_steps": 38160, "loss": 0.4389, "lr": 0.0005499529570500009, "epoch": 10.427148846960169, "percentage": 52.14, "elapsed_time": "0:50:53", "remaining_time": "0:46:43", "throughput": 4246.43, "total_tokens": 12967208} {"current_steps": 19900, "total_steps": 38160, "loss": 0.3312, "lr": 0.0005497254102745285, "epoch": 10.429769392033544, "percentage": 52.15, "elapsed_time": "0:50:54", "remaining_time": "0:46:42", "throughput": 4246.47, "total_tokens": 12970248} {"current_steps": 19905, "total_steps": 38160, "loss": 0.4402, "lr": 0.0005494978530970676, "epoch": 10.432389937106919, "percentage": 52.16, "elapsed_time": "0:50:55", "remaining_time": "0:46:41", "throughput": 4246.52, "total_tokens": 12973480} {"current_steps": 19910, "total_steps": 38160, "loss": 0.4205, "lr": 0.0005492702855652206, "epoch": 10.435010482180294, "percentage": 52.18, "elapsed_time": "0:50:55", "remaining_time": "0:46:41", "throughput": 4246.59, "total_tokens": 12976904} {"current_steps": 19915, "total_steps": 38160, "loss": 0.528, "lr": 0.000549042707726592, "epoch": 10.43763102725367, "percentage": 52.19, "elapsed_time": "0:50:56", "remaining_time": "0:46:40", "throughput": 4246.61, "total_tokens": 12979912} {"current_steps": 19920, "total_steps": 38160, "loss": 0.4177, "lr": 0.0005488151196287882, "epoch": 10.440251572327044, "percentage": 52.2, "elapsed_time": "0:50:57", "remaining_time": "0:46:39", "throughput": 4246.61, "total_tokens": 12982728} {"current_steps": 19925, "total_steps": 38160, "loss": 0.35, "lr": 0.0005485875213194184, "epoch": 10.44287211740042, "percentage": 52.21, "elapsed_time": "0:50:57", "remaining_time": "0:46:38", "throughput": 4246.74, "total_tokens": 12986472} {"current_steps": 19930, "total_steps": 38160, "loss": 0.3922, "lr": 0.0005483599128460935, "epoch": 10.445492662473795, "percentage": 52.23, "elapsed_time": "0:50:58", "remaining_time": "0:46:37", "throughput": 4246.91, "total_tokens": 12990600} {"current_steps": 19935, "total_steps": 38160, "loss": 0.5552, "lr": 0.0005481322942564266, "epoch": 10.44811320754717, "percentage": 52.24, "elapsed_time": "0:50:59", "remaining_time": "0:46:37", "throughput": 4247.02, "total_tokens": 12994216} {"current_steps": 19940, "total_steps": 38160, "loss": 0.4677, "lr": 0.0005479046655980327, "epoch": 10.450733752620545, "percentage": 52.25, "elapsed_time": "0:51:00", "remaining_time": "0:46:36", "throughput": 4247.05, "total_tokens": 12997256} {"current_steps": 19945, "total_steps": 38160, "loss": 0.4125, "lr": 0.0005476770269185295, "epoch": 10.45335429769392, "percentage": 52.27, "elapsed_time": "0:51:01", "remaining_time": "0:46:35", "throughput": 4247.21, "total_tokens": 13001384} {"current_steps": 19950, "total_steps": 38160, "loss": 0.6228, "lr": 0.0005474493782655361, "epoch": 10.455974842767295, "percentage": 52.28, "elapsed_time": "0:51:01", "remaining_time": "0:46:34", "throughput": 4247.2, "total_tokens": 13004232} {"current_steps": 19955, "total_steps": 38160, "loss": 0.4135, "lr": 0.0005472217196866742, "epoch": 10.45859538784067, "percentage": 52.29, "elapsed_time": "0:51:02", "remaining_time": "0:46:33", "throughput": 4247.22, "total_tokens": 13007208} {"current_steps": 19960, "total_steps": 38160, "loss": 0.4581, "lr": 0.0005469940512295671, "epoch": 10.461215932914046, "percentage": 52.31, "elapsed_time": "0:51:03", "remaining_time": "0:46:33", "throughput": 4247.32, "total_tokens": 13010696} {"current_steps": 19965, "total_steps": 38160, "loss": 0.5106, "lr": 0.0005467663729418406, "epoch": 10.463836477987421, "percentage": 52.32, "elapsed_time": "0:51:03", "remaining_time": "0:46:32", "throughput": 4247.3, "total_tokens": 13013416} {"current_steps": 19970, "total_steps": 38160, "loss": 0.4322, "lr": 0.0005465386848711225, "epoch": 10.466457023060796, "percentage": 52.33, "elapsed_time": "0:51:04", "remaining_time": "0:46:31", "throughput": 4247.4, "total_tokens": 13016904} {"current_steps": 19975, "total_steps": 38160, "loss": 0.4566, "lr": 0.0005463109870650426, "epoch": 10.469077568134171, "percentage": 52.35, "elapsed_time": "0:51:05", "remaining_time": "0:46:30", "throughput": 4247.34, "total_tokens": 13019496} {"current_steps": 19980, "total_steps": 38160, "loss": 0.503, "lr": 0.0005460832795712323, "epoch": 10.471698113207546, "percentage": 52.36, "elapsed_time": "0:51:05", "remaining_time": "0:46:29", "throughput": 4247.31, "total_tokens": 13022184} {"current_steps": 19985, "total_steps": 38160, "loss": 0.5204, "lr": 0.0005458555624373258, "epoch": 10.474318658280922, "percentage": 52.37, "elapsed_time": "0:51:06", "remaining_time": "0:46:28", "throughput": 4247.3, "total_tokens": 13024968} {"current_steps": 19990, "total_steps": 38160, "loss": 0.4252, "lr": 0.0005456278357109589, "epoch": 10.476939203354299, "percentage": 52.38, "elapsed_time": "0:51:07", "remaining_time": "0:46:28", "throughput": 4247.37, "total_tokens": 13028328} {"current_steps": 19995, "total_steps": 38160, "loss": 0.4367, "lr": 0.0005454000994397691, "epoch": 10.479559748427674, "percentage": 52.4, "elapsed_time": "0:51:08", "remaining_time": "0:46:27", "throughput": 4247.49, "total_tokens": 13032040} {"current_steps": 20000, "total_steps": 38160, "loss": 0.4336, "lr": 0.0005451723536713965, "epoch": 10.482180293501049, "percentage": 52.41, "elapsed_time": "0:51:08", "remaining_time": "0:46:26", "throughput": 4247.64, "total_tokens": 13035944} {"current_steps": 20005, "total_steps": 38160, "loss": 0.5075, "lr": 0.0005449445984534828, "epoch": 10.484800838574424, "percentage": 52.42, "elapsed_time": "0:51:10", "remaining_time": "0:46:26", "throughput": 4248.16, "total_tokens": 13042856} {"current_steps": 20010, "total_steps": 38160, "loss": 0.4042, "lr": 0.0005447168338336721, "epoch": 10.4874213836478, "percentage": 52.44, "elapsed_time": "0:51:11", "remaining_time": "0:46:25", "throughput": 4248.32, "total_tokens": 13046792} {"current_steps": 20015, "total_steps": 38160, "loss": 0.3938, "lr": 0.0005444890598596098, "epoch": 10.490041928721174, "percentage": 52.45, "elapsed_time": "0:51:11", "remaining_time": "0:46:24", "throughput": 4248.49, "total_tokens": 13050920} {"current_steps": 20020, "total_steps": 38160, "loss": 0.4158, "lr": 0.0005442612765789437, "epoch": 10.49266247379455, "percentage": 52.46, "elapsed_time": "0:51:13", "remaining_time": "0:46:24", "throughput": 4249.15, "total_tokens": 13058664} {"current_steps": 20025, "total_steps": 38160, "loss": 0.4727, "lr": 0.0005440334840393235, "epoch": 10.495283018867925, "percentage": 52.48, "elapsed_time": "0:51:14", "remaining_time": "0:46:23", "throughput": 4249.35, "total_tokens": 13062952} {"current_steps": 20030, "total_steps": 38160, "loss": 0.2743, "lr": 0.0005438056822884007, "epoch": 10.4979035639413, "percentage": 52.49, "elapsed_time": "0:51:14", "remaining_time": "0:46:23", "throughput": 4249.35, "total_tokens": 13065768} {"current_steps": 20035, "total_steps": 38160, "loss": 0.5013, "lr": 0.0005435778713738292, "epoch": 10.500524109014675, "percentage": 52.5, "elapsed_time": "0:51:15", "remaining_time": "0:46:22", "throughput": 4249.43, "total_tokens": 13069160} {"current_steps": 20040, "total_steps": 38160, "loss": 0.3924, "lr": 0.0005433500513432639, "epoch": 10.50314465408805, "percentage": 52.52, "elapsed_time": "0:51:16", "remaining_time": "0:46:21", "throughput": 4249.46, "total_tokens": 13072168} {"current_steps": 20045, "total_steps": 38160, "loss": 0.3846, "lr": 0.0005431222222443626, "epoch": 10.505765199161425, "percentage": 52.53, "elapsed_time": "0:51:16", "remaining_time": "0:46:20", "throughput": 4249.44, "total_tokens": 13074888} {"current_steps": 20050, "total_steps": 38160, "loss": 0.6713, "lr": 0.0005428943841247843, "epoch": 10.5083857442348, "percentage": 52.54, "elapsed_time": "0:51:17", "remaining_time": "0:46:19", "throughput": 4249.51, "total_tokens": 13078280} {"current_steps": 20055, "total_steps": 38160, "loss": 0.5074, "lr": 0.0005426665370321901, "epoch": 10.511006289308176, "percentage": 52.56, "elapsed_time": "0:51:18", "remaining_time": "0:46:19", "throughput": 4249.57, "total_tokens": 13081544} {"current_steps": 20060, "total_steps": 38160, "loss": 0.4876, "lr": 0.0005424386810142433, "epoch": 10.51362683438155, "percentage": 52.57, "elapsed_time": "0:51:18", "remaining_time": "0:46:18", "throughput": 4249.57, "total_tokens": 13084360} {"current_steps": 20065, "total_steps": 38160, "loss": 0.5616, "lr": 0.0005422108161186086, "epoch": 10.516247379454926, "percentage": 52.58, "elapsed_time": "0:51:19", "remaining_time": "0:46:17", "throughput": 4249.61, "total_tokens": 13087464} {"current_steps": 20070, "total_steps": 38160, "loss": 0.3733, "lr": 0.0005419829423929525, "epoch": 10.518867924528301, "percentage": 52.59, "elapsed_time": "0:51:20", "remaining_time": "0:46:16", "throughput": 4249.74, "total_tokens": 13091112} {"current_steps": 20075, "total_steps": 38160, "loss": 0.5343, "lr": 0.0005417550598849441, "epoch": 10.521488469601676, "percentage": 52.61, "elapsed_time": "0:51:21", "remaining_time": "0:46:15", "throughput": 4249.85, "total_tokens": 13094824} {"current_steps": 20080, "total_steps": 38160, "loss": 0.393, "lr": 0.0005415271686422534, "epoch": 10.524109014675052, "percentage": 52.62, "elapsed_time": "0:51:21", "remaining_time": "0:46:14", "throughput": 4249.86, "total_tokens": 13097768} {"current_steps": 20085, "total_steps": 38160, "loss": 0.5072, "lr": 0.0005412992687125527, "epoch": 10.526729559748428, "percentage": 52.63, "elapsed_time": "0:51:22", "remaining_time": "0:46:14", "throughput": 4249.88, "total_tokens": 13100712} {"current_steps": 20090, "total_steps": 38160, "loss": 0.3739, "lr": 0.0005410713601435164, "epoch": 10.529350104821804, "percentage": 52.65, "elapsed_time": "0:51:23", "remaining_time": "0:46:13", "throughput": 4249.87, "total_tokens": 13103464} {"current_steps": 20095, "total_steps": 38160, "loss": 0.4082, "lr": 0.0005408434429828199, "epoch": 10.531970649895179, "percentage": 52.66, "elapsed_time": "0:51:23", "remaining_time": "0:46:12", "throughput": 4249.87, "total_tokens": 13106312} {"current_steps": 20100, "total_steps": 38160, "loss": 0.4246, "lr": 0.0005406155172781412, "epoch": 10.534591194968554, "percentage": 52.67, "elapsed_time": "0:51:24", "remaining_time": "0:46:11", "throughput": 4249.83, "total_tokens": 13108936} {"current_steps": 20105, "total_steps": 38160, "loss": 0.3905, "lr": 0.0005403875830771596, "epoch": 10.53721174004193, "percentage": 52.69, "elapsed_time": "0:51:25", "remaining_time": "0:46:10", "throughput": 4250.11, "total_tokens": 13113544} {"current_steps": 20110, "total_steps": 38160, "loss": 0.548, "lr": 0.0005401596404275564, "epoch": 10.539832285115304, "percentage": 52.7, "elapsed_time": "0:51:26", "remaining_time": "0:46:10", "throughput": 4250.14, "total_tokens": 13116648} {"current_steps": 20115, "total_steps": 38160, "loss": 0.2908, "lr": 0.0005399316893770147, "epoch": 10.54245283018868, "percentage": 52.71, "elapsed_time": "0:51:26", "remaining_time": "0:46:09", "throughput": 4250.18, "total_tokens": 13119816} {"current_steps": 20120, "total_steps": 38160, "loss": 0.7114, "lr": 0.0005397037299732189, "epoch": 10.545073375262055, "percentage": 52.73, "elapsed_time": "0:51:27", "remaining_time": "0:46:08", "throughput": 4250.33, "total_tokens": 13123656} {"current_steps": 20125, "total_steps": 38160, "loss": 0.379, "lr": 0.000539475762263856, "epoch": 10.54769392033543, "percentage": 52.74, "elapsed_time": "0:51:28", "remaining_time": "0:46:07", "throughput": 4250.27, "total_tokens": 13126120} {"current_steps": 20130, "total_steps": 38160, "loss": 0.5349, "lr": 0.0005392477862966138, "epoch": 10.550314465408805, "percentage": 52.75, "elapsed_time": "0:51:28", "remaining_time": "0:46:06", "throughput": 4250.28, "total_tokens": 13128968} {"current_steps": 20135, "total_steps": 38160, "loss": 0.3864, "lr": 0.0005390198021191827, "epoch": 10.55293501048218, "percentage": 52.76, "elapsed_time": "0:51:29", "remaining_time": "0:46:05", "throughput": 4250.34, "total_tokens": 13132168} {"current_steps": 20140, "total_steps": 38160, "loss": 0.5063, "lr": 0.000538791809779254, "epoch": 10.555555555555555, "percentage": 52.78, "elapsed_time": "0:51:30", "remaining_time": "0:46:05", "throughput": 4250.43, "total_tokens": 13135560} {"current_steps": 20145, "total_steps": 38160, "loss": 0.472, "lr": 0.0005385638093245213, "epoch": 10.55817610062893, "percentage": 52.79, "elapsed_time": "0:51:31", "remaining_time": "0:46:04", "throughput": 4250.58, "total_tokens": 13139400} {"current_steps": 20150, "total_steps": 38160, "loss": 0.5146, "lr": 0.0005383358008026795, "epoch": 10.560796645702306, "percentage": 52.8, "elapsed_time": "0:51:32", "remaining_time": "0:46:03", "throughput": 4250.87, "total_tokens": 13144232} {"current_steps": 20155, "total_steps": 38160, "loss": 0.3399, "lr": 0.0005381077842614257, "epoch": 10.56341719077568, "percentage": 52.82, "elapsed_time": "0:51:32", "remaining_time": "0:46:02", "throughput": 4250.93, "total_tokens": 13147432} {"current_steps": 20160, "total_steps": 38160, "loss": 0.3536, "lr": 0.0005378797597484582, "epoch": 10.566037735849056, "percentage": 52.83, "elapsed_time": "0:51:33", "remaining_time": "0:46:02", "throughput": 4250.98, "total_tokens": 13150632} {"current_steps": 20165, "total_steps": 38160, "loss": 0.4286, "lr": 0.0005376517273114771, "epoch": 10.568658280922431, "percentage": 52.84, "elapsed_time": "0:51:34", "remaining_time": "0:46:01", "throughput": 4251.09, "total_tokens": 13154152} {"current_steps": 20170, "total_steps": 38160, "loss": 0.3226, "lr": 0.0005374236869981841, "epoch": 10.571278825995806, "percentage": 52.86, "elapsed_time": "0:51:35", "remaining_time": "0:46:00", "throughput": 4251.57, "total_tokens": 13160552} {"current_steps": 20175, "total_steps": 38160, "loss": 0.453, "lr": 0.0005371956388562827, "epoch": 10.573899371069182, "percentage": 52.87, "elapsed_time": "0:51:36", "remaining_time": "0:46:00", "throughput": 4251.55, "total_tokens": 13163208} {"current_steps": 20180, "total_steps": 38160, "loss": 0.5055, "lr": 0.0005369675829334782, "epoch": 10.576519916142558, "percentage": 52.88, "elapsed_time": "0:51:36", "remaining_time": "0:45:59", "throughput": 4251.55, "total_tokens": 13166056} {"current_steps": 20185, "total_steps": 38160, "loss": 0.4038, "lr": 0.0005367395192774769, "epoch": 10.579140461215934, "percentage": 52.9, "elapsed_time": "0:51:37", "remaining_time": "0:45:58", "throughput": 4251.52, "total_tokens": 13168712} {"current_steps": 20190, "total_steps": 38160, "loss": 0.4596, "lr": 0.0005365114479359875, "epoch": 10.581761006289309, "percentage": 52.91, "elapsed_time": "0:51:38", "remaining_time": "0:45:57", "throughput": 4251.49, "total_tokens": 13171400} {"current_steps": 20195, "total_steps": 38160, "loss": 0.4289, "lr": 0.0005362833689567197, "epoch": 10.584381551362684, "percentage": 52.92, "elapsed_time": "0:51:38", "remaining_time": "0:45:56", "throughput": 4251.6, "total_tokens": 13174888} {"current_steps": 20200, "total_steps": 38160, "loss": 0.4322, "lr": 0.0005360552823873849, "epoch": 10.58700209643606, "percentage": 52.94, "elapsed_time": "0:51:39", "remaining_time": "0:45:55", "throughput": 4251.76, "total_tokens": 13178920} {"current_steps": 20205, "total_steps": 38160, "loss": 0.4829, "lr": 0.0005358271882756966, "epoch": 10.589622641509434, "percentage": 52.95, "elapsed_time": "0:51:40", "remaining_time": "0:45:55", "throughput": 4251.97, "total_tokens": 13183176} {"current_steps": 20210, "total_steps": 38160, "loss": 0.396, "lr": 0.0005355990866693689, "epoch": 10.59224318658281, "percentage": 52.96, "elapsed_time": "0:51:41", "remaining_time": "0:45:54", "throughput": 4252.07, "total_tokens": 13186760} {"current_steps": 20215, "total_steps": 38160, "loss": 0.3737, "lr": 0.0005353709776161187, "epoch": 10.594863731656185, "percentage": 52.97, "elapsed_time": "0:51:41", "remaining_time": "0:45:53", "throughput": 4252.05, "total_tokens": 13189544} {"current_steps": 20220, "total_steps": 38160, "loss": 0.4441, "lr": 0.0005351428611636636, "epoch": 10.59748427672956, "percentage": 52.99, "elapsed_time": "0:51:42", "remaining_time": "0:45:52", "throughput": 4252.17, "total_tokens": 13193096} {"current_steps": 20225, "total_steps": 38160, "loss": 0.3536, "lr": 0.0005349147373597226, "epoch": 10.600104821802935, "percentage": 53.0, "elapsed_time": "0:51:43", "remaining_time": "0:45:51", "throughput": 4252.17, "total_tokens": 13195944} {"current_steps": 20230, "total_steps": 38160, "loss": 0.3847, "lr": 0.000534686606252017, "epoch": 10.60272536687631, "percentage": 53.01, "elapsed_time": "0:51:44", "remaining_time": "0:45:51", "throughput": 4252.17, "total_tokens": 13198760} {"current_steps": 20235, "total_steps": 38160, "loss": 0.4291, "lr": 0.0005344584678882692, "epoch": 10.605345911949685, "percentage": 53.03, "elapsed_time": "0:51:44", "remaining_time": "0:45:50", "throughput": 4252.17, "total_tokens": 13201704} {"current_steps": 20240, "total_steps": 38160, "loss": 0.4868, "lr": 0.0005342303223162027, "epoch": 10.60796645702306, "percentage": 53.04, "elapsed_time": "0:51:45", "remaining_time": "0:45:49", "throughput": 4252.22, "total_tokens": 13204872} {"current_steps": 20245, "total_steps": 38160, "loss": 0.4087, "lr": 0.0005340021695835437, "epoch": 10.610587002096436, "percentage": 53.05, "elapsed_time": "0:51:46", "remaining_time": "0:45:48", "throughput": 4252.27, "total_tokens": 13208200} {"current_steps": 20250, "total_steps": 38160, "loss": 0.3697, "lr": 0.0005337740097380184, "epoch": 10.61320754716981, "percentage": 53.07, "elapsed_time": "0:51:46", "remaining_time": "0:45:47", "throughput": 4252.37, "total_tokens": 13211848} {"current_steps": 20255, "total_steps": 38160, "loss": 0.4159, "lr": 0.0005335458428273557, "epoch": 10.615828092243186, "percentage": 53.08, "elapsed_time": "0:51:47", "remaining_time": "0:45:47", "throughput": 4252.38, "total_tokens": 13214760} {"current_steps": 20260, "total_steps": 38160, "loss": 0.3976, "lr": 0.0005333176688992855, "epoch": 10.618448637316561, "percentage": 53.09, "elapsed_time": "0:51:48", "remaining_time": "0:45:46", "throughput": 4252.58, "total_tokens": 13219016} {"current_steps": 20265, "total_steps": 38160, "loss": 0.3467, "lr": 0.000533089488001539, "epoch": 10.621069182389936, "percentage": 53.11, "elapsed_time": "0:51:49", "remaining_time": "0:45:45", "throughput": 4252.56, "total_tokens": 13221800} {"current_steps": 20270, "total_steps": 38160, "loss": 0.4171, "lr": 0.0005328613001818492, "epoch": 10.623689727463312, "percentage": 53.12, "elapsed_time": "0:51:49", "remaining_time": "0:45:44", "throughput": 4252.59, "total_tokens": 13224936} {"current_steps": 20275, "total_steps": 38160, "loss": 0.4354, "lr": 0.0005326331054879502, "epoch": 10.626310272536688, "percentage": 53.13, "elapsed_time": "0:51:50", "remaining_time": "0:45:43", "throughput": 4252.55, "total_tokens": 13227560} {"current_steps": 20280, "total_steps": 38160, "loss": 0.4019, "lr": 0.0005324049039675778, "epoch": 10.628930817610064, "percentage": 53.14, "elapsed_time": "0:51:51", "remaining_time": "0:45:43", "throughput": 4252.61, "total_tokens": 13230888} {"current_steps": 20285, "total_steps": 38160, "loss": 0.5, "lr": 0.0005321766956684693, "epoch": 10.631551362683439, "percentage": 53.16, "elapsed_time": "0:51:51", "remaining_time": "0:45:42", "throughput": 4252.66, "total_tokens": 13234152} {"current_steps": 20290, "total_steps": 38160, "loss": 0.4511, "lr": 0.0005319484806383631, "epoch": 10.634171907756814, "percentage": 53.17, "elapsed_time": "0:51:52", "remaining_time": "0:45:41", "throughput": 4252.7, "total_tokens": 13237352} {"current_steps": 20295, "total_steps": 38160, "loss": 0.4549, "lr": 0.0005317202589249991, "epoch": 10.63679245283019, "percentage": 53.18, "elapsed_time": "0:51:53", "remaining_time": "0:45:40", "throughput": 4252.7, "total_tokens": 13240264} {"current_steps": 20300, "total_steps": 38160, "loss": 0.4094, "lr": 0.0005314920305761191, "epoch": 10.639412997903564, "percentage": 53.2, "elapsed_time": "0:51:54", "remaining_time": "0:45:39", "throughput": 4252.76, "total_tokens": 13243528} {"current_steps": 20305, "total_steps": 38160, "loss": 0.5026, "lr": 0.0005312637956394654, "epoch": 10.64203354297694, "percentage": 53.21, "elapsed_time": "0:51:55", "remaining_time": "0:45:39", "throughput": 4253.09, "total_tokens": 13248712} {"current_steps": 20310, "total_steps": 38160, "loss": 0.4954, "lr": 0.0005310355541627824, "epoch": 10.644654088050315, "percentage": 53.22, "elapsed_time": "0:51:55", "remaining_time": "0:45:38", "throughput": 4253.26, "total_tokens": 13252712} {"current_steps": 20315, "total_steps": 38160, "loss": 0.4513, "lr": 0.0005308073061938153, "epoch": 10.64727463312369, "percentage": 53.24, "elapsed_time": "0:51:56", "remaining_time": "0:45:37", "throughput": 4253.4, "total_tokens": 13256392} {"current_steps": 20320, "total_steps": 38160, "loss": 0.4981, "lr": 0.0005305790517803115, "epoch": 10.649895178197065, "percentage": 53.25, "elapsed_time": "0:51:57", "remaining_time": "0:45:36", "throughput": 4253.39, "total_tokens": 13259240} {"current_steps": 20325, "total_steps": 38160, "loss": 0.452, "lr": 0.0005303507909700189, "epoch": 10.65251572327044, "percentage": 53.26, "elapsed_time": "0:51:58", "remaining_time": "0:45:36", "throughput": 4253.55, "total_tokens": 13263176} {"current_steps": 20330, "total_steps": 38160, "loss": 0.5146, "lr": 0.000530122523810687, "epoch": 10.655136268343815, "percentage": 53.28, "elapsed_time": "0:51:58", "remaining_time": "0:45:35", "throughput": 4253.65, "total_tokens": 13266696} {"current_steps": 20335, "total_steps": 38160, "loss": 0.3923, "lr": 0.0005298942503500668, "epoch": 10.65775681341719, "percentage": 53.29, "elapsed_time": "0:51:59", "remaining_time": "0:45:34", "throughput": 4253.63, "total_tokens": 13269512} {"current_steps": 20340, "total_steps": 38160, "loss": 0.3213, "lr": 0.0005296659706359105, "epoch": 10.660377358490566, "percentage": 53.3, "elapsed_time": "0:52:00", "remaining_time": "0:45:33", "throughput": 4253.59, "total_tokens": 13272072} {"current_steps": 20345, "total_steps": 38160, "loss": 0.4529, "lr": 0.0005294376847159716, "epoch": 10.66299790356394, "percentage": 53.31, "elapsed_time": "0:52:00", "remaining_time": "0:45:32", "throughput": 4253.73, "total_tokens": 13275848} {"current_steps": 20350, "total_steps": 38160, "loss": 0.5319, "lr": 0.0005292093926380049, "epoch": 10.665618448637316, "percentage": 53.33, "elapsed_time": "0:52:01", "remaining_time": "0:45:32", "throughput": 4253.69, "total_tokens": 13278440} {"current_steps": 20355, "total_steps": 38160, "loss": 0.3975, "lr": 0.0005289810944497663, "epoch": 10.668238993710691, "percentage": 53.34, "elapsed_time": "0:52:02", "remaining_time": "0:45:31", "throughput": 4253.72, "total_tokens": 13281576} {"current_steps": 20360, "total_steps": 38160, "loss": 0.4602, "lr": 0.0005287527901990137, "epoch": 10.670859538784066, "percentage": 53.35, "elapsed_time": "0:52:03", "remaining_time": "0:45:30", "throughput": 4253.65, "total_tokens": 13284168} {"current_steps": 20365, "total_steps": 38160, "loss": 0.4668, "lr": 0.0005285244799335053, "epoch": 10.673480083857442, "percentage": 53.37, "elapsed_time": "0:52:03", "remaining_time": "0:45:29", "throughput": 4253.6, "total_tokens": 13286760} {"current_steps": 20370, "total_steps": 38160, "loss": 0.5156, "lr": 0.0005282961637010009, "epoch": 10.676100628930818, "percentage": 53.38, "elapsed_time": "0:52:04", "remaining_time": "0:45:28", "throughput": 4253.6, "total_tokens": 13289672} {"current_steps": 20375, "total_steps": 38160, "loss": 0.5485, "lr": 0.0005280678415492621, "epoch": 10.678721174004194, "percentage": 53.39, "elapsed_time": "0:52:05", "remaining_time": "0:45:27", "throughput": 4253.6, "total_tokens": 13292616} {"current_steps": 20380, "total_steps": 38160, "loss": 0.5094, "lr": 0.0005278395135260512, "epoch": 10.681341719077569, "percentage": 53.41, "elapsed_time": "0:52:05", "remaining_time": "0:45:27", "throughput": 4253.73, "total_tokens": 13296424} {"current_steps": 20385, "total_steps": 38160, "loss": 0.3836, "lr": 0.0005276111796791314, "epoch": 10.683962264150944, "percentage": 53.42, "elapsed_time": "0:52:06", "remaining_time": "0:45:26", "throughput": 4253.7, "total_tokens": 13299048} {"current_steps": 20390, "total_steps": 38160, "loss": 0.4258, "lr": 0.000527382840056268, "epoch": 10.68658280922432, "percentage": 53.43, "elapsed_time": "0:52:07", "remaining_time": "0:45:25", "throughput": 4253.73, "total_tokens": 13302152} {"current_steps": 20395, "total_steps": 38160, "loss": 0.3379, "lr": 0.0005271544947052267, "epoch": 10.689203354297694, "percentage": 53.45, "elapsed_time": "0:52:07", "remaining_time": "0:45:24", "throughput": 4253.69, "total_tokens": 13304840} {"current_steps": 20400, "total_steps": 38160, "loss": 0.3697, "lr": 0.000526926143673775, "epoch": 10.69182389937107, "percentage": 53.46, "elapsed_time": "0:52:08", "remaining_time": "0:45:23", "throughput": 4253.73, "total_tokens": 13307976} {"current_steps": 20405, "total_steps": 38160, "loss": 0.4403, "lr": 0.0005266977870096813, "epoch": 10.694444444444445, "percentage": 53.47, "elapsed_time": "0:52:09", "remaining_time": "0:45:22", "throughput": 4253.72, "total_tokens": 13310856} {"current_steps": 20410, "total_steps": 38160, "loss": 0.4412, "lr": 0.000526469424760715, "epoch": 10.69706498951782, "percentage": 53.49, "elapsed_time": "0:52:09", "remaining_time": "0:45:21", "throughput": 4253.68, "total_tokens": 13313448} {"current_steps": 20415, "total_steps": 38160, "loss": 0.5126, "lr": 0.0005262410569746471, "epoch": 10.699685534591195, "percentage": 53.5, "elapsed_time": "0:52:10", "remaining_time": "0:45:21", "throughput": 4253.75, "total_tokens": 13316776} {"current_steps": 20420, "total_steps": 38160, "loss": 0.544, "lr": 0.0005260126836992495, "epoch": 10.70230607966457, "percentage": 53.51, "elapsed_time": "0:52:11", "remaining_time": "0:45:20", "throughput": 4253.74, "total_tokens": 13319560} {"current_steps": 20425, "total_steps": 38160, "loss": 0.4471, "lr": 0.000525784304982295, "epoch": 10.704926624737945, "percentage": 53.52, "elapsed_time": "0:52:11", "remaining_time": "0:45:19", "throughput": 4253.73, "total_tokens": 13322440} {"current_steps": 20430, "total_steps": 38160, "loss": 0.4027, "lr": 0.0005255559208715585, "epoch": 10.70754716981132, "percentage": 53.54, "elapsed_time": "0:52:12", "remaining_time": "0:45:18", "throughput": 4253.76, "total_tokens": 13325448} {"current_steps": 20435, "total_steps": 38160, "loss": 0.3599, "lr": 0.0005253275314148145, "epoch": 10.710167714884696, "percentage": 53.55, "elapsed_time": "0:52:13", "remaining_time": "0:45:17", "throughput": 4253.79, "total_tokens": 13328520} {"current_steps": 20440, "total_steps": 38160, "loss": 0.3529, "lr": 0.0005250991366598401, "epoch": 10.71278825995807, "percentage": 53.56, "elapsed_time": "0:52:14", "remaining_time": "0:45:16", "throughput": 4253.82, "total_tokens": 13331560} {"current_steps": 20445, "total_steps": 38160, "loss": 0.4653, "lr": 0.0005248707366544126, "epoch": 10.715408805031446, "percentage": 53.58, "elapsed_time": "0:52:14", "remaining_time": "0:45:16", "throughput": 4253.78, "total_tokens": 13334216} {"current_steps": 20450, "total_steps": 38160, "loss": 0.5188, "lr": 0.0005246423314463106, "epoch": 10.718029350104821, "percentage": 53.59, "elapsed_time": "0:52:15", "remaining_time": "0:45:15", "throughput": 4253.89, "total_tokens": 13337768} {"current_steps": 20455, "total_steps": 38160, "loss": 0.4559, "lr": 0.000524413921083314, "epoch": 10.720649895178196, "percentage": 53.6, "elapsed_time": "0:52:16", "remaining_time": "0:45:14", "throughput": 4253.94, "total_tokens": 13341064} {"current_steps": 20460, "total_steps": 38160, "loss": 0.3759, "lr": 0.0005241855056132039, "epoch": 10.723270440251572, "percentage": 53.62, "elapsed_time": "0:52:16", "remaining_time": "0:45:13", "throughput": 4253.89, "total_tokens": 13343688} {"current_steps": 20465, "total_steps": 38160, "loss": 0.4216, "lr": 0.0005239570850837617, "epoch": 10.725890985324948, "percentage": 53.63, "elapsed_time": "0:52:17", "remaining_time": "0:45:12", "throughput": 4253.95, "total_tokens": 13347048} {"current_steps": 20470, "total_steps": 38160, "loss": 0.4555, "lr": 0.0005237286595427709, "epoch": 10.728511530398324, "percentage": 53.64, "elapsed_time": "0:52:18", "remaining_time": "0:45:12", "throughput": 4254.1, "total_tokens": 13350952} {"current_steps": 20475, "total_steps": 38160, "loss": 0.4652, "lr": 0.000523500229038015, "epoch": 10.731132075471699, "percentage": 53.66, "elapsed_time": "0:52:19", "remaining_time": "0:45:11", "throughput": 4254.07, "total_tokens": 13353672} {"current_steps": 20480, "total_steps": 38160, "loss": 0.5402, "lr": 0.0005232717936172794, "epoch": 10.733752620545074, "percentage": 53.67, "elapsed_time": "0:52:19", "remaining_time": "0:45:10", "throughput": 4254.22, "total_tokens": 13357544} {"current_steps": 20485, "total_steps": 38160, "loss": 0.3878, "lr": 0.0005230433533283498, "epoch": 10.73637316561845, "percentage": 53.68, "elapsed_time": "0:52:20", "remaining_time": "0:45:09", "throughput": 4254.4, "total_tokens": 13361544} {"current_steps": 20490, "total_steps": 38160, "loss": 0.5238, "lr": 0.0005228149082190139, "epoch": 10.738993710691824, "percentage": 53.69, "elapsed_time": "0:52:21", "remaining_time": "0:45:09", "throughput": 4254.54, "total_tokens": 13365480} {"current_steps": 20495, "total_steps": 38160, "loss": 0.3718, "lr": 0.0005225864583370594, "epoch": 10.7416142557652, "percentage": 53.71, "elapsed_time": "0:52:22", "remaining_time": "0:45:08", "throughput": 4254.51, "total_tokens": 13368072} {"current_steps": 20500, "total_steps": 38160, "loss": 0.4508, "lr": 0.0005223580037302754, "epoch": 10.744234800838575, "percentage": 53.72, "elapsed_time": "0:52:22", "remaining_time": "0:45:07", "throughput": 4254.51, "total_tokens": 13370920} {"current_steps": 20505, "total_steps": 38160, "loss": 0.729, "lr": 0.0005221295444464522, "epoch": 10.74685534591195, "percentage": 53.73, "elapsed_time": "0:52:23", "remaining_time": "0:45:06", "throughput": 4254.51, "total_tokens": 13373832} {"current_steps": 20510, "total_steps": 38160, "loss": 0.4051, "lr": 0.0005219010805333807, "epoch": 10.749475890985325, "percentage": 53.75, "elapsed_time": "0:52:24", "remaining_time": "0:45:05", "throughput": 4254.51, "total_tokens": 13376712} {"current_steps": 20515, "total_steps": 38160, "loss": 0.4726, "lr": 0.000521672612038853, "epoch": 10.7520964360587, "percentage": 53.76, "elapsed_time": "0:52:24", "remaining_time": "0:45:04", "throughput": 4254.5, "total_tokens": 13379496} {"current_steps": 20520, "total_steps": 38160, "loss": 0.3788, "lr": 0.0005214441390106624, "epoch": 10.754716981132075, "percentage": 53.77, "elapsed_time": "0:52:25", "remaining_time": "0:45:04", "throughput": 4254.69, "total_tokens": 13383688} {"current_steps": 20525, "total_steps": 38160, "loss": 0.4092, "lr": 0.0005212156614966022, "epoch": 10.75733752620545, "percentage": 53.79, "elapsed_time": "0:52:26", "remaining_time": "0:45:03", "throughput": 4254.78, "total_tokens": 13387112} {"current_steps": 20530, "total_steps": 38160, "loss": 0.4523, "lr": 0.0005209871795444678, "epoch": 10.759958071278826, "percentage": 53.8, "elapsed_time": "0:52:27", "remaining_time": "0:45:02", "throughput": 4254.93, "total_tokens": 13391048} {"current_steps": 20535, "total_steps": 38160, "loss": 0.4284, "lr": 0.000520758693202055, "epoch": 10.7625786163522, "percentage": 53.81, "elapsed_time": "0:52:27", "remaining_time": "0:45:01", "throughput": 4254.86, "total_tokens": 13393448} {"current_steps": 20540, "total_steps": 38160, "loss": 0.542, "lr": 0.0005205302025171601, "epoch": 10.765199161425576, "percentage": 53.83, "elapsed_time": "0:52:28", "remaining_time": "0:45:00", "throughput": 4254.82, "total_tokens": 13396040} {"current_steps": 20545, "total_steps": 38160, "loss": 0.4808, "lr": 0.0005203017075375812, "epoch": 10.767819706498951, "percentage": 53.84, "elapsed_time": "0:52:29", "remaining_time": "0:45:00", "throughput": 4254.8, "total_tokens": 13398824} {"current_steps": 20550, "total_steps": 38160, "loss": 0.4327, "lr": 0.0005200732083111169, "epoch": 10.770440251572326, "percentage": 53.85, "elapsed_time": "0:52:29", "remaining_time": "0:44:59", "throughput": 4255.04, "total_tokens": 13403368} {"current_steps": 20555, "total_steps": 38160, "loss": 0.4769, "lr": 0.000519844704885566, "epoch": 10.773060796645701, "percentage": 53.87, "elapsed_time": "0:52:30", "remaining_time": "0:44:58", "throughput": 4255.06, "total_tokens": 13406376} {"current_steps": 20560, "total_steps": 38160, "loss": 0.5482, "lr": 0.0005196161973087297, "epoch": 10.775681341719078, "percentage": 53.88, "elapsed_time": "0:52:31", "remaining_time": "0:44:57", "throughput": 4255.36, "total_tokens": 13411208} {"current_steps": 20565, "total_steps": 38160, "loss": 0.3623, "lr": 0.0005193876856284084, "epoch": 10.778301886792454, "percentage": 53.89, "elapsed_time": "0:52:32", "remaining_time": "0:44:56", "throughput": 4255.31, "total_tokens": 13413704} {"current_steps": 20570, "total_steps": 38160, "loss": 0.4763, "lr": 0.0005191591698924046, "epoch": 10.780922431865829, "percentage": 53.9, "elapsed_time": "0:52:32", "remaining_time": "0:44:56", "throughput": 4255.39, "total_tokens": 13417128} {"current_steps": 20575, "total_steps": 38160, "loss": 0.4612, "lr": 0.0005189306501485211, "epoch": 10.783542976939204, "percentage": 53.92, "elapsed_time": "0:52:33", "remaining_time": "0:44:55", "throughput": 4255.41, "total_tokens": 13420136} {"current_steps": 20580, "total_steps": 38160, "loss": 0.5215, "lr": 0.0005187021264445613, "epoch": 10.786163522012579, "percentage": 53.93, "elapsed_time": "0:52:34", "remaining_time": "0:44:54", "throughput": 4255.33, "total_tokens": 13422472} {"current_steps": 20585, "total_steps": 38160, "loss": 0.3217, "lr": 0.0005184735988283302, "epoch": 10.788784067085954, "percentage": 53.94, "elapsed_time": "0:52:35", "remaining_time": "0:44:53", "throughput": 4255.47, "total_tokens": 13426280} {"current_steps": 20590, "total_steps": 38160, "loss": 0.4168, "lr": 0.000518245067347633, "epoch": 10.79140461215933, "percentage": 53.96, "elapsed_time": "0:52:35", "remaining_time": "0:44:52", "throughput": 4255.5, "total_tokens": 13429416} {"current_steps": 20595, "total_steps": 38160, "loss": 0.4658, "lr": 0.0005180165320502756, "epoch": 10.794025157232705, "percentage": 53.97, "elapsed_time": "0:52:36", "remaining_time": "0:44:52", "throughput": 4255.56, "total_tokens": 13432776} {"current_steps": 20600, "total_steps": 38160, "loss": 0.4354, "lr": 0.0005177879929840655, "epoch": 10.79664570230608, "percentage": 53.98, "elapsed_time": "0:52:37", "remaining_time": "0:44:51", "throughput": 4255.61, "total_tokens": 13435976} {"current_steps": 20605, "total_steps": 38160, "loss": 0.4397, "lr": 0.0005175594501968103, "epoch": 10.799266247379455, "percentage": 54.0, "elapsed_time": "0:52:37", "remaining_time": "0:44:50", "throughput": 4255.66, "total_tokens": 13439208} {"current_steps": 20610, "total_steps": 38160, "loss": 0.3837, "lr": 0.0005173309037363182, "epoch": 10.80188679245283, "percentage": 54.01, "elapsed_time": "0:52:38", "remaining_time": "0:44:49", "throughput": 4255.64, "total_tokens": 13441928} {"current_steps": 20615, "total_steps": 38160, "loss": 0.4386, "lr": 0.0005171023536503991, "epoch": 10.804507337526205, "percentage": 54.02, "elapsed_time": "0:52:39", "remaining_time": "0:44:48", "throughput": 4255.66, "total_tokens": 13445000} {"current_steps": 20620, "total_steps": 38160, "loss": 0.532, "lr": 0.0005168737999868624, "epoch": 10.80712788259958, "percentage": 54.04, "elapsed_time": "0:52:40", "remaining_time": "0:44:48", "throughput": 4255.83, "total_tokens": 13449032} {"current_steps": 20625, "total_steps": 38160, "loss": 0.4447, "lr": 0.0005166452427935193, "epoch": 10.809748427672956, "percentage": 54.05, "elapsed_time": "0:52:40", "remaining_time": "0:44:47", "throughput": 4255.91, "total_tokens": 13452392} {"current_steps": 20630, "total_steps": 38160, "loss": 0.6985, "lr": 0.0005164166821181814, "epoch": 10.81236897274633, "percentage": 54.06, "elapsed_time": "0:52:41", "remaining_time": "0:44:46", "throughput": 4255.97, "total_tokens": 13455784} {"current_steps": 20635, "total_steps": 38160, "loss": 0.4136, "lr": 0.0005161881180086607, "epoch": 10.814989517819706, "percentage": 54.07, "elapsed_time": "0:52:42", "remaining_time": "0:44:45", "throughput": 4256.07, "total_tokens": 13459368} {"current_steps": 20640, "total_steps": 38160, "loss": 0.4203, "lr": 0.0005159595505127705, "epoch": 10.817610062893081, "percentage": 54.09, "elapsed_time": "0:52:43", "remaining_time": "0:44:44", "throughput": 4256.14, "total_tokens": 13462664} {"current_steps": 20645, "total_steps": 38160, "loss": 0.5018, "lr": 0.0005157309796783246, "epoch": 10.820230607966456, "percentage": 54.1, "elapsed_time": "0:52:43", "remaining_time": "0:44:44", "throughput": 4256.03, "total_tokens": 13464872} {"current_steps": 20650, "total_steps": 38160, "loss": 0.3011, "lr": 0.000515502405553137, "epoch": 10.822851153039831, "percentage": 54.11, "elapsed_time": "0:52:44", "remaining_time": "0:44:43", "throughput": 4256.01, "total_tokens": 13467624} {"current_steps": 20655, "total_steps": 38160, "loss": 0.527, "lr": 0.0005152738281850231, "epoch": 10.825471698113208, "percentage": 54.13, "elapsed_time": "0:52:45", "remaining_time": "0:44:42", "throughput": 4256.05, "total_tokens": 13470856} {"current_steps": 20660, "total_steps": 38160, "loss": 0.3851, "lr": 0.0005150452476217986, "epoch": 10.828092243186584, "percentage": 54.14, "elapsed_time": "0:52:45", "remaining_time": "0:44:41", "throughput": 4256.1, "total_tokens": 13474024} {"current_steps": 20665, "total_steps": 38160, "loss": 0.4898, "lr": 0.0005148166639112799, "epoch": 10.830712788259959, "percentage": 54.15, "elapsed_time": "0:52:46", "remaining_time": "0:44:40", "throughput": 4256.31, "total_tokens": 13478376} {"current_steps": 20670, "total_steps": 38160, "loss": 0.4195, "lr": 0.0005145880771012842, "epoch": 10.833333333333334, "percentage": 54.17, "elapsed_time": "0:52:47", "remaining_time": "0:44:40", "throughput": 4256.33, "total_tokens": 13481480} {"current_steps": 20675, "total_steps": 38160, "loss": 0.376, "lr": 0.0005143594872396291, "epoch": 10.835953878406709, "percentage": 54.18, "elapsed_time": "0:52:48", "remaining_time": "0:44:39", "throughput": 4256.33, "total_tokens": 13484456} {"current_steps": 20680, "total_steps": 38160, "loss": 0.4716, "lr": 0.0005141308943741333, "epoch": 10.838574423480084, "percentage": 54.19, "elapsed_time": "0:52:48", "remaining_time": "0:44:38", "throughput": 4256.37, "total_tokens": 13487560} {"current_steps": 20685, "total_steps": 38160, "loss": 0.4594, "lr": 0.0005139022985526154, "epoch": 10.84119496855346, "percentage": 54.21, "elapsed_time": "0:52:49", "remaining_time": "0:44:37", "throughput": 4256.49, "total_tokens": 13491272} {"current_steps": 20690, "total_steps": 38160, "loss": 0.3758, "lr": 0.0005136736998228952, "epoch": 10.843815513626835, "percentage": 54.22, "elapsed_time": "0:52:50", "remaining_time": "0:44:36", "throughput": 4256.47, "total_tokens": 13493992} {"current_steps": 20695, "total_steps": 38160, "loss": 0.4851, "lr": 0.0005134450982327933, "epoch": 10.84643605870021, "percentage": 54.23, "elapsed_time": "0:52:50", "remaining_time": "0:44:36", "throughput": 4256.47, "total_tokens": 13496968} {"current_steps": 20700, "total_steps": 38160, "loss": 0.5827, "lr": 0.0005132164938301299, "epoch": 10.849056603773585, "percentage": 54.25, "elapsed_time": "0:52:51", "remaining_time": "0:44:35", "throughput": 4256.63, "total_tokens": 13501032} {"current_steps": 20705, "total_steps": 38160, "loss": 0.6255, "lr": 0.0005129878866627271, "epoch": 10.85167714884696, "percentage": 54.26, "elapsed_time": "0:52:52", "remaining_time": "0:44:34", "throughput": 4256.49, "total_tokens": 13502984} {"current_steps": 20710, "total_steps": 38160, "loss": 0.4424, "lr": 0.0005127592767784063, "epoch": 10.854297693920335, "percentage": 54.27, "elapsed_time": "0:52:53", "remaining_time": "0:44:33", "throughput": 4256.76, "total_tokens": 13507816} {"current_steps": 20715, "total_steps": 38160, "loss": 0.4719, "lr": 0.0005125306642249905, "epoch": 10.85691823899371, "percentage": 54.28, "elapsed_time": "0:52:54", "remaining_time": "0:44:32", "throughput": 4256.86, "total_tokens": 13511368} {"current_steps": 20720, "total_steps": 38160, "loss": 0.506, "lr": 0.0005123020490503027, "epoch": 10.859538784067086, "percentage": 54.3, "elapsed_time": "0:52:54", "remaining_time": "0:44:32", "throughput": 4257.07, "total_tokens": 13515720} {"current_steps": 20725, "total_steps": 38160, "loss": 0.4911, "lr": 0.0005120734313021665, "epoch": 10.86215932914046, "percentage": 54.31, "elapsed_time": "0:52:55", "remaining_time": "0:44:31", "throughput": 4257.24, "total_tokens": 13519784} {"current_steps": 20730, "total_steps": 38160, "loss": 0.3886, "lr": 0.0005118448110284063, "epoch": 10.864779874213836, "percentage": 54.32, "elapsed_time": "0:52:56", "remaining_time": "0:44:30", "throughput": 4257.33, "total_tokens": 13523304} {"current_steps": 20735, "total_steps": 38160, "loss": 0.7238, "lr": 0.0005116161882768469, "epoch": 10.867400419287211, "percentage": 54.34, "elapsed_time": "0:52:57", "remaining_time": "0:44:29", "throughput": 4257.34, "total_tokens": 13526120} {"current_steps": 20740, "total_steps": 38160, "loss": 0.4086, "lr": 0.0005113875630953131, "epoch": 10.870020964360586, "percentage": 54.35, "elapsed_time": "0:52:57", "remaining_time": "0:44:29", "throughput": 4257.34, "total_tokens": 13529128} {"current_steps": 20745, "total_steps": 38160, "loss": 0.5197, "lr": 0.0005111589355316314, "epoch": 10.872641509433961, "percentage": 54.36, "elapsed_time": "0:52:58", "remaining_time": "0:44:28", "throughput": 4257.43, "total_tokens": 13532584} {"current_steps": 20750, "total_steps": 38160, "loss": 0.4355, "lr": 0.0005109303056336274, "epoch": 10.875262054507338, "percentage": 54.38, "elapsed_time": "0:52:59", "remaining_time": "0:44:27", "throughput": 4257.53, "total_tokens": 13536104} {"current_steps": 20755, "total_steps": 38160, "loss": 0.3561, "lr": 0.0005107016734491281, "epoch": 10.877882599580714, "percentage": 54.39, "elapsed_time": "0:53:00", "remaining_time": "0:44:26", "throughput": 4257.59, "total_tokens": 13539528} {"current_steps": 20760, "total_steps": 38160, "loss": 0.4899, "lr": 0.0005104730390259611, "epoch": 10.880503144654089, "percentage": 54.4, "elapsed_time": "0:53:00", "remaining_time": "0:44:25", "throughput": 4257.62, "total_tokens": 13542600} {"current_steps": 20765, "total_steps": 38160, "loss": 0.3258, "lr": 0.0005102444024119537, "epoch": 10.883123689727464, "percentage": 54.42, "elapsed_time": "0:53:01", "remaining_time": "0:44:25", "throughput": 4257.66, "total_tokens": 13545704} {"current_steps": 20770, "total_steps": 38160, "loss": 0.4315, "lr": 0.0005100157636549342, "epoch": 10.885744234800839, "percentage": 54.43, "elapsed_time": "0:53:02", "remaining_time": "0:44:24", "throughput": 4257.72, "total_tokens": 13549096} {"current_steps": 20775, "total_steps": 38160, "loss": 0.4966, "lr": 0.0005097871228027312, "epoch": 10.888364779874214, "percentage": 54.44, "elapsed_time": "0:53:02", "remaining_time": "0:44:23", "throughput": 4257.75, "total_tokens": 13552232} {"current_steps": 20780, "total_steps": 38160, "loss": 0.5201, "lr": 0.0005095584799031736, "epoch": 10.89098532494759, "percentage": 54.45, "elapsed_time": "0:53:03", "remaining_time": "0:44:22", "throughput": 4257.73, "total_tokens": 13554984} {"current_steps": 20785, "total_steps": 38160, "loss": 0.2687, "lr": 0.0005093298350040912, "epoch": 10.893605870020965, "percentage": 54.47, "elapsed_time": "0:53:04", "remaining_time": "0:44:22", "throughput": 4258.14, "total_tokens": 13561288} {"current_steps": 20790, "total_steps": 38160, "loss": 0.4371, "lr": 0.0005091011881533139, "epoch": 10.89622641509434, "percentage": 54.48, "elapsed_time": "0:53:05", "remaining_time": "0:44:21", "throughput": 4258.13, "total_tokens": 13564072} {"current_steps": 20795, "total_steps": 38160, "loss": 0.4344, "lr": 0.0005088725393986716, "epoch": 10.898846960167715, "percentage": 54.49, "elapsed_time": "0:53:06", "remaining_time": "0:44:20", "throughput": 4258.11, "total_tokens": 13566856} {"current_steps": 20800, "total_steps": 38160, "loss": 0.4712, "lr": 0.0005086438887879955, "epoch": 10.90146750524109, "percentage": 54.51, "elapsed_time": "0:53:06", "remaining_time": "0:44:19", "throughput": 4258.24, "total_tokens": 13570696} {"current_steps": 20805, "total_steps": 38160, "loss": 0.3336, "lr": 0.0005084152363691164, "epoch": 10.904088050314465, "percentage": 54.52, "elapsed_time": "0:53:07", "remaining_time": "0:44:19", "throughput": 4258.22, "total_tokens": 13573416} {"current_steps": 20810, "total_steps": 38160, "loss": 0.5357, "lr": 0.0005081865821898658, "epoch": 10.90670859538784, "percentage": 54.53, "elapsed_time": "0:53:08", "remaining_time": "0:44:18", "throughput": 4258.22, "total_tokens": 13576392} {"current_steps": 20815, "total_steps": 38160, "loss": 0.5184, "lr": 0.0005079579262980756, "epoch": 10.909329140461216, "percentage": 54.55, "elapsed_time": "0:53:08", "remaining_time": "0:44:17", "throughput": 4258.19, "total_tokens": 13579048} {"current_steps": 20820, "total_steps": 38160, "loss": 0.6064, "lr": 0.0005077292687415781, "epoch": 10.91194968553459, "percentage": 54.56, "elapsed_time": "0:53:09", "remaining_time": "0:44:16", "throughput": 4258.32, "total_tokens": 13582920} {"current_steps": 20825, "total_steps": 38160, "loss": 0.3453, "lr": 0.0005075006095682056, "epoch": 10.914570230607966, "percentage": 54.57, "elapsed_time": "0:53:10", "remaining_time": "0:44:15", "throughput": 4258.29, "total_tokens": 13585576} {"current_steps": 20830, "total_steps": 38160, "loss": 0.4364, "lr": 0.0005072719488257914, "epoch": 10.917190775681341, "percentage": 54.59, "elapsed_time": "0:53:11", "remaining_time": "0:44:14", "throughput": 4258.28, "total_tokens": 13588360} {"current_steps": 20835, "total_steps": 38160, "loss": 0.5323, "lr": 0.0005070432865621683, "epoch": 10.919811320754716, "percentage": 54.6, "elapsed_time": "0:53:11", "remaining_time": "0:44:14", "throughput": 4258.28, "total_tokens": 13591272} {"current_steps": 20840, "total_steps": 38160, "loss": 0.3697, "lr": 0.00050681462282517, "epoch": 10.922431865828091, "percentage": 54.61, "elapsed_time": "0:53:12", "remaining_time": "0:44:13", "throughput": 4258.29, "total_tokens": 13594184} {"current_steps": 20845, "total_steps": 38160, "loss": 0.4749, "lr": 0.0005065859576626304, "epoch": 10.925052410901468, "percentage": 54.63, "elapsed_time": "0:53:13", "remaining_time": "0:44:12", "throughput": 4258.33, "total_tokens": 13597352} {"current_steps": 20850, "total_steps": 38160, "loss": 0.4917, "lr": 0.0005063572911223836, "epoch": 10.927672955974844, "percentage": 54.64, "elapsed_time": "0:53:13", "remaining_time": "0:44:11", "throughput": 4258.3, "total_tokens": 13600008} {"current_steps": 20855, "total_steps": 38160, "loss": 0.3877, "lr": 0.0005061286232522639, "epoch": 10.930293501048219, "percentage": 54.65, "elapsed_time": "0:53:14", "remaining_time": "0:44:10", "throughput": 4258.4, "total_tokens": 13603656} {"current_steps": 20860, "total_steps": 38160, "loss": 0.4937, "lr": 0.0005058999541001064, "epoch": 10.932914046121594, "percentage": 54.66, "elapsed_time": "0:53:15", "remaining_time": "0:44:09", "throughput": 4258.49, "total_tokens": 13607176} {"current_steps": 20865, "total_steps": 38160, "loss": 0.5866, "lr": 0.0005056712837137456, "epoch": 10.935534591194969, "percentage": 54.68, "elapsed_time": "0:53:16", "remaining_time": "0:44:09", "throughput": 4258.56, "total_tokens": 13610600} {"current_steps": 20870, "total_steps": 38160, "loss": 0.4049, "lr": 0.000505442612141017, "epoch": 10.938155136268344, "percentage": 54.69, "elapsed_time": "0:53:16", "remaining_time": "0:44:08", "throughput": 4258.7, "total_tokens": 13614472} {"current_steps": 20875, "total_steps": 38160, "loss": 0.357, "lr": 0.000505213939429756, "epoch": 10.94077568134172, "percentage": 54.7, "elapsed_time": "0:53:17", "remaining_time": "0:44:07", "throughput": 4258.69, "total_tokens": 13617384} {"current_steps": 20880, "total_steps": 38160, "loss": 0.4923, "lr": 0.0005049852656277984, "epoch": 10.943396226415095, "percentage": 54.72, "elapsed_time": "0:53:18", "remaining_time": "0:44:06", "throughput": 4258.79, "total_tokens": 13620968} {"current_steps": 20885, "total_steps": 38160, "loss": 0.5495, "lr": 0.0005047565907829801, "epoch": 10.94601677148847, "percentage": 54.73, "elapsed_time": "0:53:18", "remaining_time": "0:44:06", "throughput": 4258.77, "total_tokens": 13623752} {"current_steps": 20890, "total_steps": 38160, "loss": 0.4722, "lr": 0.0005045279149431374, "epoch": 10.948637316561845, "percentage": 54.74, "elapsed_time": "0:53:19", "remaining_time": "0:44:05", "throughput": 4259.07, "total_tokens": 13629000} {"current_steps": 20895, "total_steps": 38160, "loss": 0.4143, "lr": 0.0005042992381561063, "epoch": 10.95125786163522, "percentage": 54.76, "elapsed_time": "0:53:20", "remaining_time": "0:44:04", "throughput": 4259.12, "total_tokens": 13632200} {"current_steps": 20900, "total_steps": 38160, "loss": 0.4154, "lr": 0.0005040705604697238, "epoch": 10.953878406708595, "percentage": 54.77, "elapsed_time": "0:53:21", "remaining_time": "0:44:03", "throughput": 4259.03, "total_tokens": 13634536} {"current_steps": 20905, "total_steps": 38160, "loss": 0.4445, "lr": 0.0005038418819318265, "epoch": 10.95649895178197, "percentage": 54.78, "elapsed_time": "0:53:22", "remaining_time": "0:44:03", "throughput": 4259.21, "total_tokens": 13638760} {"current_steps": 20910, "total_steps": 38160, "loss": 0.4405, "lr": 0.0005036132025902511, "epoch": 10.959119496855346, "percentage": 54.8, "elapsed_time": "0:53:22", "remaining_time": "0:44:02", "throughput": 4259.16, "total_tokens": 13641256} {"current_steps": 20915, "total_steps": 38160, "loss": 0.4276, "lr": 0.0005033845224928352, "epoch": 10.96174004192872, "percentage": 54.81, "elapsed_time": "0:53:23", "remaining_time": "0:44:01", "throughput": 4259.27, "total_tokens": 13644808} {"current_steps": 20920, "total_steps": 38160, "loss": 0.4777, "lr": 0.0005031558416874156, "epoch": 10.964360587002096, "percentage": 54.82, "elapsed_time": "0:53:24", "remaining_time": "0:44:00", "throughput": 4259.34, "total_tokens": 13648168} {"current_steps": 20925, "total_steps": 38160, "loss": 0.5109, "lr": 0.0005029271602218301, "epoch": 10.966981132075471, "percentage": 54.83, "elapsed_time": "0:53:25", "remaining_time": "0:43:59", "throughput": 4259.54, "total_tokens": 13652520} {"current_steps": 20930, "total_steps": 38160, "loss": 0.4538, "lr": 0.0005026984781439162, "epoch": 10.969601677148846, "percentage": 54.85, "elapsed_time": "0:53:25", "remaining_time": "0:43:59", "throughput": 4259.58, "total_tokens": 13655656} {"current_steps": 20935, "total_steps": 38160, "loss": 0.5027, "lr": 0.0005024697955015112, "epoch": 10.972222222222221, "percentage": 54.86, "elapsed_time": "0:53:26", "remaining_time": "0:43:58", "throughput": 4259.58, "total_tokens": 13658440} {"current_steps": 20940, "total_steps": 38160, "loss": 0.3601, "lr": 0.0005022411123424532, "epoch": 10.974842767295598, "percentage": 54.87, "elapsed_time": "0:53:27", "remaining_time": "0:43:57", "throughput": 4259.55, "total_tokens": 13661160} {"current_steps": 20945, "total_steps": 38160, "loss": 0.4323, "lr": 0.00050201242871458, "epoch": 10.977463312368974, "percentage": 54.89, "elapsed_time": "0:53:27", "remaining_time": "0:43:56", "throughput": 4259.67, "total_tokens": 13664936} {"current_steps": 20950, "total_steps": 38160, "loss": 0.5121, "lr": 0.0005017837446657298, "epoch": 10.980083857442349, "percentage": 54.9, "elapsed_time": "0:53:28", "remaining_time": "0:43:55", "throughput": 4259.71, "total_tokens": 13668072} {"current_steps": 20955, "total_steps": 38160, "loss": 0.3919, "lr": 0.0005015550602437405, "epoch": 10.982704402515724, "percentage": 54.91, "elapsed_time": "0:53:29", "remaining_time": "0:43:55", "throughput": 4259.68, "total_tokens": 13670856} {"current_steps": 20960, "total_steps": 38160, "loss": 0.4154, "lr": 0.0005013263754964504, "epoch": 10.985324947589099, "percentage": 54.93, "elapsed_time": "0:53:30", "remaining_time": "0:43:54", "throughput": 4259.83, "total_tokens": 13674792} {"current_steps": 20965, "total_steps": 38160, "loss": 0.4789, "lr": 0.0005010976904716977, "epoch": 10.987945492662474, "percentage": 54.94, "elapsed_time": "0:53:30", "remaining_time": "0:43:53", "throughput": 4259.8, "total_tokens": 13677544} {"current_steps": 20970, "total_steps": 38160, "loss": 0.4509, "lr": 0.0005008690052173206, "epoch": 10.99056603773585, "percentage": 54.95, "elapsed_time": "0:53:31", "remaining_time": "0:43:52", "throughput": 4260.01, "total_tokens": 13681896} {"current_steps": 20975, "total_steps": 38160, "loss": 0.3438, "lr": 0.0005006403197811575, "epoch": 10.993186582809225, "percentage": 54.97, "elapsed_time": "0:53:32", "remaining_time": "0:43:51", "throughput": 4260.07, "total_tokens": 13685256} {"current_steps": 20980, "total_steps": 38160, "loss": 0.5057, "lr": 0.0005004116342110469, "epoch": 10.9958071278826, "percentage": 54.98, "elapsed_time": "0:53:33", "remaining_time": "0:43:51", "throughput": 4260.04, "total_tokens": 13688072} {"current_steps": 20985, "total_steps": 38160, "loss": 0.3744, "lr": 0.0005001829485548272, "epoch": 10.998427672955975, "percentage": 54.99, "elapsed_time": "0:53:33", "remaining_time": "0:43:50", "throughput": 4260.02, "total_tokens": 13690824} {"current_steps": 20988, "total_steps": 38160, "eval_loss": 0.455534964799881, "epoch": 11.0, "percentage": 55.0, "elapsed_time": "0:53:47", "remaining_time": "0:44:00", "throughput": 4241.89, "total_tokens": 13691904} {"current_steps": 20990, "total_steps": 38160, "loss": 0.5478, "lr": 0.0004999542628603364, "epoch": 11.00104821802935, "percentage": 55.01, "elapsed_time": "0:53:49", "remaining_time": "0:44:02", "throughput": 4239.54, "total_tokens": 13692896} {"current_steps": 20995, "total_steps": 38160, "loss": 0.3445, "lr": 0.0004997255771754136, "epoch": 11.003668763102725, "percentage": 55.02, "elapsed_time": "0:53:50", "remaining_time": "0:44:01", "throughput": 4239.58, "total_tokens": 13696160} {"current_steps": 21000, "total_steps": 38160, "loss": 0.5265, "lr": 0.0004994968915478969, "epoch": 11.0062893081761, "percentage": 55.03, "elapsed_time": "0:53:51", "remaining_time": "0:44:00", "throughput": 4239.6, "total_tokens": 13699136} {"current_steps": 21005, "total_steps": 38160, "loss": 0.404, "lr": 0.0004992682060256246, "epoch": 11.008909853249476, "percentage": 55.04, "elapsed_time": "0:53:51", "remaining_time": "0:43:59", "throughput": 4239.67, "total_tokens": 13702496} {"current_steps": 21010, "total_steps": 38160, "loss": 0.4461, "lr": 0.0004990395206564353, "epoch": 11.01153039832285, "percentage": 55.06, "elapsed_time": "0:53:52", "remaining_time": "0:43:58", "throughput": 4239.77, "total_tokens": 13706048} {"current_steps": 21015, "total_steps": 38160, "loss": 0.5214, "lr": 0.0004988108354881674, "epoch": 11.014150943396226, "percentage": 55.07, "elapsed_time": "0:53:53", "remaining_time": "0:43:57", "throughput": 4239.73, "total_tokens": 13708640} {"current_steps": 21020, "total_steps": 38160, "loss": 0.3506, "lr": 0.0004985821505686591, "epoch": 11.016771488469601, "percentage": 55.08, "elapsed_time": "0:53:54", "remaining_time": "0:43:57", "throughput": 4239.8, "total_tokens": 13712000} {"current_steps": 21025, "total_steps": 38160, "loss": 0.4265, "lr": 0.0004983534659457489, "epoch": 11.019392033542976, "percentage": 55.1, "elapsed_time": "0:53:54", "remaining_time": "0:43:56", "throughput": 4239.85, "total_tokens": 13715232} {"current_steps": 21030, "total_steps": 38160, "loss": 0.7968, "lr": 0.0004981247816672745, "epoch": 11.022012578616351, "percentage": 55.11, "elapsed_time": "0:53:55", "remaining_time": "0:43:55", "throughput": 4239.89, "total_tokens": 13718368} {"current_steps": 21035, "total_steps": 38160, "loss": 0.4526, "lr": 0.0004978960977810746, "epoch": 11.024633123689727, "percentage": 55.12, "elapsed_time": "0:53:56", "remaining_time": "0:43:54", "throughput": 4239.96, "total_tokens": 13721824} {"current_steps": 21040, "total_steps": 38160, "loss": 0.4727, "lr": 0.0004976674143349869, "epoch": 11.027253668763104, "percentage": 55.14, "elapsed_time": "0:53:56", "remaining_time": "0:43:53", "throughput": 4239.93, "total_tokens": 13724480} {"current_steps": 21045, "total_steps": 38160, "loss": 0.3922, "lr": 0.0004974387313768497, "epoch": 11.029874213836479, "percentage": 55.15, "elapsed_time": "0:53:57", "remaining_time": "0:43:52", "throughput": 4239.82, "total_tokens": 13726656} {"current_steps": 21050, "total_steps": 38160, "loss": 0.3869, "lr": 0.0004972100489545007, "epoch": 11.032494758909854, "percentage": 55.16, "elapsed_time": "0:53:58", "remaining_time": "0:43:52", "throughput": 4239.78, "total_tokens": 13729184} {"current_steps": 21055, "total_steps": 38160, "loss": 0.4385, "lr": 0.0004969813671157774, "epoch": 11.035115303983229, "percentage": 55.18, "elapsed_time": "0:53:59", "remaining_time": "0:43:51", "throughput": 4240.0, "total_tokens": 13733600} {"current_steps": 21060, "total_steps": 38160, "loss": 0.5345, "lr": 0.0004967526859085177, "epoch": 11.037735849056604, "percentage": 55.19, "elapsed_time": "0:53:59", "remaining_time": "0:43:50", "throughput": 4240.04, "total_tokens": 13736832} {"current_steps": 21065, "total_steps": 38160, "loss": 0.4574, "lr": 0.0004965240053805591, "epoch": 11.04035639412998, "percentage": 55.2, "elapsed_time": "0:54:00", "remaining_time": "0:43:49", "throughput": 4239.98, "total_tokens": 13739360} {"current_steps": 21070, "total_steps": 38160, "loss": 0.3567, "lr": 0.000496295325579739, "epoch": 11.042976939203355, "percentage": 55.21, "elapsed_time": "0:54:01", "remaining_time": "0:43:48", "throughput": 4240.13, "total_tokens": 13743296} {"current_steps": 21075, "total_steps": 38160, "loss": 0.3472, "lr": 0.0004960666465538945, "epoch": 11.04559748427673, "percentage": 55.23, "elapsed_time": "0:54:02", "remaining_time": "0:43:48", "throughput": 4240.26, "total_tokens": 13747072} {"current_steps": 21080, "total_steps": 38160, "loss": 0.4254, "lr": 0.0004958379683508627, "epoch": 11.048218029350105, "percentage": 55.24, "elapsed_time": "0:54:02", "remaining_time": "0:43:47", "throughput": 4240.29, "total_tokens": 13750208} {"current_steps": 21085, "total_steps": 38160, "loss": 0.4385, "lr": 0.0004956092910184803, "epoch": 11.05083857442348, "percentage": 55.25, "elapsed_time": "0:54:03", "remaining_time": "0:43:46", "throughput": 4240.27, "total_tokens": 13752928} {"current_steps": 21090, "total_steps": 38160, "loss": 0.3809, "lr": 0.0004953806146045843, "epoch": 11.053459119496855, "percentage": 55.27, "elapsed_time": "0:54:04", "remaining_time": "0:43:45", "throughput": 4240.41, "total_tokens": 13756736} {"current_steps": 21095, "total_steps": 38160, "loss": 0.4463, "lr": 0.0004951519391570108, "epoch": 11.05607966457023, "percentage": 55.28, "elapsed_time": "0:54:04", "remaining_time": "0:43:44", "throughput": 4240.38, "total_tokens": 13759520} {"current_steps": 21100, "total_steps": 38160, "loss": 0.4357, "lr": 0.0004949232647235964, "epoch": 11.058700209643606, "percentage": 55.29, "elapsed_time": "0:54:05", "remaining_time": "0:43:44", "throughput": 4240.39, "total_tokens": 13762592} {"current_steps": 21105, "total_steps": 38160, "loss": 0.5407, "lr": 0.0004946945913521771, "epoch": 11.06132075471698, "percentage": 55.31, "elapsed_time": "0:54:06", "remaining_time": "0:43:43", "throughput": 4240.54, "total_tokens": 13766464} {"current_steps": 21110, "total_steps": 38160, "loss": 0.4123, "lr": 0.0004944659190905889, "epoch": 11.063941299790356, "percentage": 55.32, "elapsed_time": "0:54:07", "remaining_time": "0:43:42", "throughput": 4240.94, "total_tokens": 13772672} {"current_steps": 21115, "total_steps": 38160, "loss": 0.4642, "lr": 0.0004942372479866674, "epoch": 11.066561844863731, "percentage": 55.33, "elapsed_time": "0:54:08", "remaining_time": "0:43:42", "throughput": 4241.0, "total_tokens": 13776000} {"current_steps": 21120, "total_steps": 38160, "loss": 0.7058, "lr": 0.0004940085780882475, "epoch": 11.069182389937106, "percentage": 55.35, "elapsed_time": "0:54:08", "remaining_time": "0:43:41", "throughput": 4240.93, "total_tokens": 13778464} {"current_steps": 21125, "total_steps": 38160, "loss": 0.4601, "lr": 0.0004937799094431649, "epoch": 11.071802935010481, "percentage": 55.36, "elapsed_time": "0:54:09", "remaining_time": "0:43:40", "throughput": 4240.95, "total_tokens": 13781536} {"current_steps": 21130, "total_steps": 38160, "loss": 0.3976, "lr": 0.0004935512420992542, "epoch": 11.074423480083857, "percentage": 55.37, "elapsed_time": "0:54:10", "remaining_time": "0:43:39", "throughput": 4241.0, "total_tokens": 13784800} {"current_steps": 21135, "total_steps": 38160, "loss": 0.478, "lr": 0.0004933225761043502, "epoch": 11.077044025157234, "percentage": 55.39, "elapsed_time": "0:54:11", "remaining_time": "0:43:38", "throughput": 4241.08, "total_tokens": 13788384} {"current_steps": 21140, "total_steps": 38160, "loss": 0.5572, "lr": 0.0004930939115062872, "epoch": 11.079664570230609, "percentage": 55.4, "elapsed_time": "0:54:11", "remaining_time": "0:43:38", "throughput": 4241.13, "total_tokens": 13791744} {"current_steps": 21145, "total_steps": 38160, "loss": 0.3569, "lr": 0.0004928652483528989, "epoch": 11.082285115303984, "percentage": 55.41, "elapsed_time": "0:54:13", "remaining_time": "0:43:37", "throughput": 4241.61, "total_tokens": 13798304} {"current_steps": 21150, "total_steps": 38160, "loss": 0.4119, "lr": 0.0004926365866920193, "epoch": 11.084905660377359, "percentage": 55.42, "elapsed_time": "0:54:13", "remaining_time": "0:43:36", "throughput": 4241.6, "total_tokens": 13801184} {"current_steps": 21155, "total_steps": 38160, "loss": 0.3981, "lr": 0.0004924079265714817, "epoch": 11.087526205450734, "percentage": 55.44, "elapsed_time": "0:54:14", "remaining_time": "0:43:36", "throughput": 4241.75, "total_tokens": 13805120} {"current_steps": 21160, "total_steps": 38160, "loss": 0.4001, "lr": 0.0004921792680391193, "epoch": 11.09014675052411, "percentage": 55.45, "elapsed_time": "0:54:15", "remaining_time": "0:43:35", "throughput": 4241.81, "total_tokens": 13808448} {"current_steps": 21165, "total_steps": 38160, "loss": 0.42, "lr": 0.0004919506111427649, "epoch": 11.092767295597485, "percentage": 55.46, "elapsed_time": "0:54:16", "remaining_time": "0:43:34", "throughput": 4241.94, "total_tokens": 13812320} {"current_steps": 21170, "total_steps": 38160, "loss": 0.3671, "lr": 0.0004917219559302507, "epoch": 11.09538784067086, "percentage": 55.48, "elapsed_time": "0:54:16", "remaining_time": "0:43:33", "throughput": 4241.94, "total_tokens": 13815168} {"current_steps": 21175, "total_steps": 38160, "loss": 0.4875, "lr": 0.0004914933024494089, "epoch": 11.098008385744235, "percentage": 55.49, "elapsed_time": "0:54:17", "remaining_time": "0:43:32", "throughput": 4241.88, "total_tokens": 13817696} {"current_steps": 21180, "total_steps": 38160, "loss": 0.5289, "lr": 0.0004912646507480713, "epoch": 11.10062893081761, "percentage": 55.5, "elapsed_time": "0:54:18", "remaining_time": "0:43:32", "throughput": 4241.85, "total_tokens": 13820320} {"current_steps": 21185, "total_steps": 38160, "loss": 0.4591, "lr": 0.0004910360008740689, "epoch": 11.103249475890985, "percentage": 55.52, "elapsed_time": "0:54:18", "remaining_time": "0:43:31", "throughput": 4241.9, "total_tokens": 13823680} {"current_steps": 21190, "total_steps": 38160, "loss": 0.4583, "lr": 0.0004908073528752329, "epoch": 11.10587002096436, "percentage": 55.53, "elapsed_time": "0:54:19", "remaining_time": "0:43:30", "throughput": 4241.82, "total_tokens": 13826016} {"current_steps": 21195, "total_steps": 38160, "loss": 0.5079, "lr": 0.0004905787067993941, "epoch": 11.108490566037736, "percentage": 55.54, "elapsed_time": "0:54:20", "remaining_time": "0:43:29", "throughput": 4241.74, "total_tokens": 13828416} {"current_steps": 21200, "total_steps": 38160, "loss": 0.4821, "lr": 0.000490350062694382, "epoch": 11.11111111111111, "percentage": 55.56, "elapsed_time": "0:54:20", "remaining_time": "0:43:28", "throughput": 4241.69, "total_tokens": 13830976} {"current_steps": 21205, "total_steps": 38160, "loss": 0.493, "lr": 0.0004901214206080269, "epoch": 11.113731656184486, "percentage": 55.57, "elapsed_time": "0:54:21", "remaining_time": "0:43:27", "throughput": 4241.7, "total_tokens": 13833952} {"current_steps": 21210, "total_steps": 38160, "loss": 0.3507, "lr": 0.0004898927805881577, "epoch": 11.116352201257861, "percentage": 55.58, "elapsed_time": "0:54:22", "remaining_time": "0:43:26", "throughput": 4241.61, "total_tokens": 13836224} {"current_steps": 21215, "total_steps": 38160, "loss": 0.4081, "lr": 0.0004896641426826036, "epoch": 11.118972746331236, "percentage": 55.59, "elapsed_time": "0:54:22", "remaining_time": "0:43:26", "throughput": 4241.78, "total_tokens": 13840416} {"current_steps": 21220, "total_steps": 38160, "loss": 0.3769, "lr": 0.0004894355069391931, "epoch": 11.121593291404611, "percentage": 55.61, "elapsed_time": "0:54:23", "remaining_time": "0:43:25", "throughput": 4241.72, "total_tokens": 13843072} {"current_steps": 21225, "total_steps": 38160, "loss": 0.5689, "lr": 0.0004892068734057538, "epoch": 11.124213836477987, "percentage": 55.62, "elapsed_time": "0:54:24", "remaining_time": "0:43:24", "throughput": 4241.69, "total_tokens": 13845728} {"current_steps": 21230, "total_steps": 38160, "loss": 0.3716, "lr": 0.0004889782421301134, "epoch": 11.126834381551364, "percentage": 55.63, "elapsed_time": "0:54:24", "remaining_time": "0:43:23", "throughput": 4241.8, "total_tokens": 13849472} {"current_steps": 21235, "total_steps": 38160, "loss": 0.3957, "lr": 0.0004887496131600991, "epoch": 11.129454926624739, "percentage": 55.65, "elapsed_time": "0:54:25", "remaining_time": "0:43:22", "throughput": 4241.85, "total_tokens": 13852704} {"current_steps": 21240, "total_steps": 38160, "loss": 0.5054, "lr": 0.0004885209865435373, "epoch": 11.132075471698114, "percentage": 55.66, "elapsed_time": "0:54:26", "remaining_time": "0:43:22", "throughput": 4241.91, "total_tokens": 13856000} {"current_steps": 21245, "total_steps": 38160, "loss": 0.44, "lr": 0.0004882923623282543, "epoch": 11.134696016771489, "percentage": 55.67, "elapsed_time": "0:54:27", "remaining_time": "0:43:21", "throughput": 4241.92, "total_tokens": 13858944} {"current_steps": 21250, "total_steps": 38160, "loss": 0.4472, "lr": 0.0004880637405620756, "epoch": 11.137316561844864, "percentage": 55.69, "elapsed_time": "0:54:27", "remaining_time": "0:43:20", "throughput": 4241.87, "total_tokens": 13861504} {"current_steps": 21255, "total_steps": 38160, "loss": 0.4542, "lr": 0.00048783512129282604, "epoch": 11.13993710691824, "percentage": 55.7, "elapsed_time": "0:54:28", "remaining_time": "0:43:19", "throughput": 4241.96, "total_tokens": 13865088} {"current_steps": 21260, "total_steps": 38160, "loss": 0.459, "lr": 0.00048760650456833033, "epoch": 11.142557651991615, "percentage": 55.71, "elapsed_time": "0:54:29", "remaining_time": "0:43:18", "throughput": 4241.89, "total_tokens": 13867488} {"current_steps": 21265, "total_steps": 38160, "loss": 0.4798, "lr": 0.0004873778904364125, "epoch": 11.14517819706499, "percentage": 55.73, "elapsed_time": "0:54:29", "remaining_time": "0:43:17", "throughput": 4241.97, "total_tokens": 13870912} {"current_steps": 21270, "total_steps": 38160, "loss": 0.4265, "lr": 0.00048714927894489597, "epoch": 11.147798742138365, "percentage": 55.74, "elapsed_time": "0:54:30", "remaining_time": "0:43:17", "throughput": 4242.01, "total_tokens": 13874080} {"current_steps": 21275, "total_steps": 38160, "loss": 0.5401, "lr": 0.00048692067014160357, "epoch": 11.15041928721174, "percentage": 55.75, "elapsed_time": "0:54:31", "remaining_time": "0:43:16", "throughput": 4242.14, "total_tokens": 13877920} {"current_steps": 21280, "total_steps": 38160, "loss": 0.5061, "lr": 0.00048669206407435806, "epoch": 11.153039832285115, "percentage": 55.77, "elapsed_time": "0:54:32", "remaining_time": "0:43:15", "throughput": 4242.11, "total_tokens": 13880608} {"current_steps": 21285, "total_steps": 38160, "loss": 0.6067, "lr": 0.00048646346079098075, "epoch": 11.15566037735849, "percentage": 55.78, "elapsed_time": "0:54:32", "remaining_time": "0:43:14", "throughput": 4242.18, "total_tokens": 13883936} {"current_steps": 21290, "total_steps": 38160, "loss": 0.5501, "lr": 0.0004862348603392929, "epoch": 11.158280922431866, "percentage": 55.79, "elapsed_time": "0:54:33", "remaining_time": "0:43:13", "throughput": 4242.29, "total_tokens": 13887680} {"current_steps": 21295, "total_steps": 38160, "loss": 0.4716, "lr": 0.0004860062627671154, "epoch": 11.16090146750524, "percentage": 55.8, "elapsed_time": "0:54:34", "remaining_time": "0:43:13", "throughput": 4242.3, "total_tokens": 13890592} {"current_steps": 21300, "total_steps": 38160, "loss": 0.4795, "lr": 0.0004857776681222679, "epoch": 11.163522012578616, "percentage": 55.82, "elapsed_time": "0:54:34", "remaining_time": "0:43:12", "throughput": 4242.18, "total_tokens": 13892704} {"current_steps": 21305, "total_steps": 38160, "loss": 0.3469, "lr": 0.00048554907645257024, "epoch": 11.166142557651991, "percentage": 55.83, "elapsed_time": "0:54:35", "remaining_time": "0:43:11", "throughput": 4242.17, "total_tokens": 13895616} {"current_steps": 21310, "total_steps": 38160, "loss": 0.5298, "lr": 0.0004853204878058407, "epoch": 11.168763102725366, "percentage": 55.84, "elapsed_time": "0:54:36", "remaining_time": "0:43:10", "throughput": 4242.19, "total_tokens": 13898688} {"current_steps": 21315, "total_steps": 38160, "loss": 0.4224, "lr": 0.0004850919022298977, "epoch": 11.171383647798741, "percentage": 55.86, "elapsed_time": "0:54:37", "remaining_time": "0:43:09", "throughput": 4242.22, "total_tokens": 13901760} {"current_steps": 21320, "total_steps": 38160, "loss": 0.5675, "lr": 0.0004848633197725586, "epoch": 11.174004192872117, "percentage": 55.87, "elapsed_time": "0:54:37", "remaining_time": "0:43:08", "throughput": 4242.17, "total_tokens": 13904416} {"current_steps": 21325, "total_steps": 38160, "loss": 0.4411, "lr": 0.0004846347404816404, "epoch": 11.176624737945493, "percentage": 55.88, "elapsed_time": "0:54:38", "remaining_time": "0:43:08", "throughput": 4242.29, "total_tokens": 13908192} {"current_steps": 21330, "total_steps": 38160, "loss": 0.5655, "lr": 0.0004844061644049591, "epoch": 11.179245283018869, "percentage": 55.9, "elapsed_time": "0:54:39", "remaining_time": "0:43:07", "throughput": 4242.34, "total_tokens": 13911392} {"current_steps": 21335, "total_steps": 38160, "loss": 0.3238, "lr": 0.0004841775915903305, "epoch": 11.181865828092244, "percentage": 55.91, "elapsed_time": "0:54:39", "remaining_time": "0:43:06", "throughput": 4242.35, "total_tokens": 13914368} {"current_steps": 21340, "total_steps": 38160, "loss": 0.4058, "lr": 0.00048394902208556917, "epoch": 11.184486373165619, "percentage": 55.92, "elapsed_time": "0:54:40", "remaining_time": "0:43:05", "throughput": 4242.23, "total_tokens": 13916544} {"current_steps": 21345, "total_steps": 38160, "loss": 0.4949, "lr": 0.0004837204559384892, "epoch": 11.187106918238994, "percentage": 55.94, "elapsed_time": "0:54:41", "remaining_time": "0:43:04", "throughput": 4242.24, "total_tokens": 13919520} {"current_steps": 21350, "total_steps": 38160, "loss": 0.3755, "lr": 0.0004834918931969042, "epoch": 11.18972746331237, "percentage": 55.95, "elapsed_time": "0:54:41", "remaining_time": "0:43:03", "throughput": 4242.25, "total_tokens": 13922496} {"current_steps": 21355, "total_steps": 38160, "loss": 0.421, "lr": 0.0004832633339086267, "epoch": 11.192348008385745, "percentage": 55.96, "elapsed_time": "0:54:42", "remaining_time": "0:43:03", "throughput": 4242.25, "total_tokens": 13925440} {"current_steps": 21360, "total_steps": 38160, "loss": 0.4816, "lr": 0.0004830347781214689, "epoch": 11.19496855345912, "percentage": 55.97, "elapsed_time": "0:54:43", "remaining_time": "0:43:02", "throughput": 4242.28, "total_tokens": 13928544} {"current_steps": 21365, "total_steps": 38160, "loss": 0.4289, "lr": 0.0004828062258832421, "epoch": 11.197589098532495, "percentage": 55.99, "elapsed_time": "0:54:43", "remaining_time": "0:43:01", "throughput": 4242.25, "total_tokens": 13931200} {"current_steps": 21370, "total_steps": 38160, "loss": 0.4798, "lr": 0.0004825776772417564, "epoch": 11.20020964360587, "percentage": 56.0, "elapsed_time": "0:54:44", "remaining_time": "0:43:00", "throughput": 4242.24, "total_tokens": 13933984} {"current_steps": 21375, "total_steps": 38160, "loss": 0.4351, "lr": 0.00048234913224482205, "epoch": 11.202830188679245, "percentage": 56.01, "elapsed_time": "0:54:45", "remaining_time": "0:42:59", "throughput": 4242.3, "total_tokens": 13937184} {"current_steps": 21380, "total_steps": 38160, "loss": 0.4647, "lr": 0.00048212059094024774, "epoch": 11.20545073375262, "percentage": 56.03, "elapsed_time": "0:54:46", "remaining_time": "0:42:59", "throughput": 4242.42, "total_tokens": 13940864} {"current_steps": 21385, "total_steps": 38160, "loss": 0.532, "lr": 0.0004818920533758418, "epoch": 11.208071278825996, "percentage": 56.04, "elapsed_time": "0:54:46", "remaining_time": "0:42:58", "throughput": 4242.45, "total_tokens": 13943904} {"current_steps": 21390, "total_steps": 38160, "loss": 0.3944, "lr": 0.00048166351959941185, "epoch": 11.21069182389937, "percentage": 56.05, "elapsed_time": "0:54:47", "remaining_time": "0:42:57", "throughput": 4242.65, "total_tokens": 13948192} {"current_steps": 21395, "total_steps": 38160, "loss": 0.2956, "lr": 0.0004814349896587645, "epoch": 11.213312368972746, "percentage": 56.07, "elapsed_time": "0:54:48", "remaining_time": "0:42:56", "throughput": 4242.62, "total_tokens": 13950912} {"current_steps": 21400, "total_steps": 38160, "loss": 0.4247, "lr": 0.0004812064636017053, "epoch": 11.215932914046121, "percentage": 56.08, "elapsed_time": "0:54:48", "remaining_time": "0:42:55", "throughput": 4242.6, "total_tokens": 13953664} {"current_steps": 21405, "total_steps": 38160, "loss": 0.4284, "lr": 0.0004809779414760396, "epoch": 11.218553459119496, "percentage": 56.09, "elapsed_time": "0:54:49", "remaining_time": "0:42:54", "throughput": 4242.61, "total_tokens": 13956576} {"current_steps": 21410, "total_steps": 38160, "loss": 0.4299, "lr": 0.00048074942332957136, "epoch": 11.221174004192871, "percentage": 56.11, "elapsed_time": "0:54:50", "remaining_time": "0:42:54", "throughput": 4242.61, "total_tokens": 13959520} {"current_steps": 21415, "total_steps": 38160, "loss": 0.4793, "lr": 0.00048052090921010435, "epoch": 11.223794549266247, "percentage": 56.12, "elapsed_time": "0:54:51", "remaining_time": "0:42:53", "throughput": 4242.78, "total_tokens": 13963552} {"current_steps": 21420, "total_steps": 38160, "loss": 0.5664, "lr": 0.00048029239916544094, "epoch": 11.226415094339623, "percentage": 56.13, "elapsed_time": "0:54:51", "remaining_time": "0:42:52", "throughput": 4242.86, "total_tokens": 13967072} {"current_steps": 21425, "total_steps": 38160, "loss": 0.3735, "lr": 0.0004800638932433826, "epoch": 11.229035639412999, "percentage": 56.15, "elapsed_time": "0:54:52", "remaining_time": "0:42:51", "throughput": 4242.94, "total_tokens": 13970592} {"current_steps": 21430, "total_steps": 38160, "loss": 0.4891, "lr": 0.00047983539149173043, "epoch": 11.231656184486374, "percentage": 56.16, "elapsed_time": "0:54:53", "remaining_time": "0:42:51", "throughput": 4242.97, "total_tokens": 13973696} {"current_steps": 21435, "total_steps": 38160, "loss": 0.4737, "lr": 0.0004796068939582843, "epoch": 11.234276729559749, "percentage": 56.17, "elapsed_time": "0:54:54", "remaining_time": "0:42:50", "throughput": 4243.06, "total_tokens": 13977248} {"current_steps": 21440, "total_steps": 38160, "loss": 0.5296, "lr": 0.00047937840069084333, "epoch": 11.236897274633124, "percentage": 56.18, "elapsed_time": "0:54:54", "remaining_time": "0:42:49", "throughput": 4243.14, "total_tokens": 13980704} {"current_steps": 21445, "total_steps": 38160, "loss": 0.4996, "lr": 0.0004791499117372056, "epoch": 11.2395178197065, "percentage": 56.2, "elapsed_time": "0:54:55", "remaining_time": "0:42:48", "throughput": 4243.04, "total_tokens": 13982976} {"current_steps": 21450, "total_steps": 38160, "loss": 0.5918, "lr": 0.0004789214271451686, "epoch": 11.242138364779874, "percentage": 56.21, "elapsed_time": "0:54:56", "remaining_time": "0:42:47", "throughput": 4243.05, "total_tokens": 13985888} {"current_steps": 21455, "total_steps": 38160, "loss": 0.4126, "lr": 0.00047869294696252854, "epoch": 11.24475890985325, "percentage": 56.22, "elapsed_time": "0:54:57", "remaining_time": "0:42:47", "throughput": 4243.21, "total_tokens": 13990048} {"current_steps": 21460, "total_steps": 38160, "loss": 0.3949, "lr": 0.0004784644712370807, "epoch": 11.247379454926625, "percentage": 56.24, "elapsed_time": "0:54:57", "remaining_time": "0:42:46", "throughput": 4243.24, "total_tokens": 13993152} {"current_steps": 21465, "total_steps": 38160, "loss": 0.5264, "lr": 0.00047823600001661984, "epoch": 11.25, "percentage": 56.25, "elapsed_time": "0:54:58", "remaining_time": "0:42:45", "throughput": 4243.2, "total_tokens": 13995776} {"current_steps": 21470, "total_steps": 38160, "loss": 0.599, "lr": 0.0004780075333489396, "epoch": 11.252620545073375, "percentage": 56.26, "elapsed_time": "0:54:59", "remaining_time": "0:42:44", "throughput": 4243.28, "total_tokens": 13999168} {"current_steps": 21475, "total_steps": 38160, "loss": 0.4078, "lr": 0.00047777907128183233, "epoch": 11.25524109014675, "percentage": 56.28, "elapsed_time": "0:54:59", "remaining_time": "0:42:43", "throughput": 4243.28, "total_tokens": 14002048} {"current_steps": 21480, "total_steps": 38160, "loss": 0.4416, "lr": 0.0004775506138630901, "epoch": 11.257861635220126, "percentage": 56.29, "elapsed_time": "0:55:00", "remaining_time": "0:42:42", "throughput": 4243.27, "total_tokens": 14004864} {"current_steps": 21485, "total_steps": 38160, "loss": 0.3311, "lr": 0.0004773221611405032, "epoch": 11.2604821802935, "percentage": 56.3, "elapsed_time": "0:55:01", "remaining_time": "0:42:42", "throughput": 4243.36, "total_tokens": 14008352} {"current_steps": 21490, "total_steps": 38160, "loss": 0.3936, "lr": 0.0004770937131618614, "epoch": 11.263102725366876, "percentage": 56.32, "elapsed_time": "0:55:01", "remaining_time": "0:42:41", "throughput": 4243.36, "total_tokens": 14011232} {"current_steps": 21495, "total_steps": 38160, "loss": 0.4375, "lr": 0.0004768652699749535, "epoch": 11.265723270440251, "percentage": 56.33, "elapsed_time": "0:55:02", "remaining_time": "0:42:40", "throughput": 4243.46, "total_tokens": 14014848} {"current_steps": 21500, "total_steps": 38160, "loss": 0.4174, "lr": 0.00047663683162756717, "epoch": 11.268343815513626, "percentage": 56.34, "elapsed_time": "0:55:03", "remaining_time": "0:42:39", "throughput": 4243.44, "total_tokens": 14017536} {"current_steps": 21505, "total_steps": 38160, "loss": 0.392, "lr": 0.00047640839816748926, "epoch": 11.270964360587001, "percentage": 56.35, "elapsed_time": "0:55:04", "remaining_time": "0:42:38", "throughput": 4243.57, "total_tokens": 14021376} {"current_steps": 21510, "total_steps": 38160, "loss": 0.4758, "lr": 0.00047617996964250525, "epoch": 11.273584905660377, "percentage": 56.37, "elapsed_time": "0:55:04", "remaining_time": "0:42:38", "throughput": 4243.56, "total_tokens": 14024224} {"current_steps": 21515, "total_steps": 38160, "loss": 0.3866, "lr": 0.0004759515461003997, "epoch": 11.276205450733753, "percentage": 56.38, "elapsed_time": "0:55:05", "remaining_time": "0:42:37", "throughput": 4243.54, "total_tokens": 14026848} {"current_steps": 21520, "total_steps": 38160, "loss": 0.3491, "lr": 0.00047572312758895654, "epoch": 11.278825995807129, "percentage": 56.39, "elapsed_time": "0:55:06", "remaining_time": "0:42:36", "throughput": 4243.67, "total_tokens": 14030720} {"current_steps": 21525, "total_steps": 38160, "loss": 0.4, "lr": 0.0004754947141559579, "epoch": 11.281446540880504, "percentage": 56.41, "elapsed_time": "0:55:06", "remaining_time": "0:42:35", "throughput": 4243.67, "total_tokens": 14033632} {"current_steps": 21530, "total_steps": 38160, "loss": 0.4431, "lr": 0.0004752663058491856, "epoch": 11.284067085953879, "percentage": 56.42, "elapsed_time": "0:55:07", "remaining_time": "0:42:34", "throughput": 4243.74, "total_tokens": 14036960} {"current_steps": 21535, "total_steps": 38160, "loss": 0.4644, "lr": 0.0004750379027164201, "epoch": 11.286687631027254, "percentage": 56.43, "elapsed_time": "0:55:08", "remaining_time": "0:42:34", "throughput": 4243.69, "total_tokens": 14039648} {"current_steps": 21540, "total_steps": 38160, "loss": 0.5615, "lr": 0.00047480950480544037, "epoch": 11.28930817610063, "percentage": 56.45, "elapsed_time": "0:55:09", "remaining_time": "0:42:33", "throughput": 4243.85, "total_tokens": 14043840} {"current_steps": 21545, "total_steps": 38160, "loss": 0.4903, "lr": 0.00047458111216402483, "epoch": 11.291928721174004, "percentage": 56.46, "elapsed_time": "0:55:09", "remaining_time": "0:42:32", "throughput": 4243.91, "total_tokens": 14047200} {"current_steps": 21550, "total_steps": 38160, "loss": 0.3946, "lr": 0.00047435272483995074, "epoch": 11.29454926624738, "percentage": 56.47, "elapsed_time": "0:55:10", "remaining_time": "0:42:31", "throughput": 4243.94, "total_tokens": 14050336} {"current_steps": 21555, "total_steps": 38160, "loss": 0.501, "lr": 0.00047412434288099386, "epoch": 11.297169811320755, "percentage": 56.49, "elapsed_time": "0:55:11", "remaining_time": "0:42:30", "throughput": 4243.95, "total_tokens": 14053312} {"current_steps": 21560, "total_steps": 38160, "loss": 0.3425, "lr": 0.0004738959663349294, "epoch": 11.29979035639413, "percentage": 56.5, "elapsed_time": "0:55:12", "remaining_time": "0:42:30", "throughput": 4243.95, "total_tokens": 14056256} {"current_steps": 21565, "total_steps": 38160, "loss": 0.5125, "lr": 0.0004736675952495311, "epoch": 11.302410901467505, "percentage": 56.51, "elapsed_time": "0:55:12", "remaining_time": "0:42:29", "throughput": 4243.94, "total_tokens": 14059168} {"current_steps": 21570, "total_steps": 38160, "loss": 0.3975, "lr": 0.0004734392296725712, "epoch": 11.30503144654088, "percentage": 56.53, "elapsed_time": "0:55:13", "remaining_time": "0:42:28", "throughput": 4244.03, "total_tokens": 14062720} {"current_steps": 21575, "total_steps": 38160, "loss": 0.4067, "lr": 0.00047321086965182153, "epoch": 11.307651991614255, "percentage": 56.54, "elapsed_time": "0:55:14", "remaining_time": "0:42:27", "throughput": 4244.09, "total_tokens": 14065952} {"current_steps": 21580, "total_steps": 38160, "loss": 0.4604, "lr": 0.0004729825152350522, "epoch": 11.31027253668763, "percentage": 56.55, "elapsed_time": "0:55:15", "remaining_time": "0:42:26", "throughput": 4244.19, "total_tokens": 14069664} {"current_steps": 21585, "total_steps": 38160, "loss": 0.4472, "lr": 0.00047275416647003256, "epoch": 11.312893081761006, "percentage": 56.56, "elapsed_time": "0:55:15", "remaining_time": "0:42:26", "throughput": 4244.26, "total_tokens": 14073024} {"current_steps": 21590, "total_steps": 38160, "loss": 0.4266, "lr": 0.0004725258234045306, "epoch": 11.315513626834381, "percentage": 56.58, "elapsed_time": "0:55:16", "remaining_time": "0:42:25", "throughput": 4244.36, "total_tokens": 14076576} {"current_steps": 21595, "total_steps": 38160, "loss": 0.5238, "lr": 0.0004722974860863127, "epoch": 11.318134171907756, "percentage": 56.59, "elapsed_time": "0:55:17", "remaining_time": "0:42:24", "throughput": 4244.46, "total_tokens": 14080128} {"current_steps": 21600, "total_steps": 38160, "loss": 0.4569, "lr": 0.00047206915456314476, "epoch": 11.320754716981131, "percentage": 56.6, "elapsed_time": "0:55:18", "remaining_time": "0:42:23", "throughput": 4244.65, "total_tokens": 14084320} {"current_steps": 21605, "total_steps": 38160, "loss": 0.3501, "lr": 0.00047184082888279097, "epoch": 11.323375262054507, "percentage": 56.62, "elapsed_time": "0:55:18", "remaining_time": "0:42:23", "throughput": 4244.62, "total_tokens": 14087008} {"current_steps": 21610, "total_steps": 38160, "loss": 0.3964, "lr": 0.00047161250909301454, "epoch": 11.325995807127883, "percentage": 56.63, "elapsed_time": "0:55:19", "remaining_time": "0:42:22", "throughput": 4244.67, "total_tokens": 14090208} {"current_steps": 21615, "total_steps": 38160, "loss": 0.3103, "lr": 0.00047138419524157734, "epoch": 11.328616352201259, "percentage": 56.64, "elapsed_time": "0:55:20", "remaining_time": "0:42:21", "throughput": 4244.69, "total_tokens": 14093184} {"current_steps": 21620, "total_steps": 38160, "loss": 0.4802, "lr": 0.0004711558873762402, "epoch": 11.331236897274634, "percentage": 56.66, "elapsed_time": "0:55:21", "remaining_time": "0:42:21", "throughput": 4245.17, "total_tokens": 14100064} {"current_steps": 21625, "total_steps": 38160, "loss": 0.425, "lr": 0.0004709275855447621, "epoch": 11.333857442348009, "percentage": 56.67, "elapsed_time": "0:55:22", "remaining_time": "0:42:20", "throughput": 4245.19, "total_tokens": 14103104} {"current_steps": 21630, "total_steps": 38160, "loss": 0.378, "lr": 0.0004706992897949016, "epoch": 11.336477987421384, "percentage": 56.68, "elapsed_time": "0:55:22", "remaining_time": "0:42:19", "throughput": 4245.26, "total_tokens": 14106496} {"current_steps": 21635, "total_steps": 38160, "loss": 0.5507, "lr": 0.00047047100017441525, "epoch": 11.33909853249476, "percentage": 56.7, "elapsed_time": "0:55:23", "remaining_time": "0:42:18", "throughput": 4245.4, "total_tokens": 14110368} {"current_steps": 21640, "total_steps": 38160, "loss": 0.6335, "lr": 0.0004702427167310589, "epoch": 11.341719077568134, "percentage": 56.71, "elapsed_time": "0:55:24", "remaining_time": "0:42:17", "throughput": 4245.64, "total_tokens": 14114944} {"current_steps": 21645, "total_steps": 38160, "loss": 0.39, "lr": 0.0004700144395125866, "epoch": 11.34433962264151, "percentage": 56.72, "elapsed_time": "0:55:25", "remaining_time": "0:42:17", "throughput": 4245.7, "total_tokens": 14118272} {"current_steps": 21650, "total_steps": 38160, "loss": 0.4282, "lr": 0.00046978616856675173, "epoch": 11.346960167714885, "percentage": 56.73, "elapsed_time": "0:55:26", "remaining_time": "0:42:16", "throughput": 4245.75, "total_tokens": 14121472} {"current_steps": 21655, "total_steps": 38160, "loss": 0.362, "lr": 0.0004695579039413055, "epoch": 11.34958071278826, "percentage": 56.75, "elapsed_time": "0:55:26", "remaining_time": "0:42:15", "throughput": 4245.67, "total_tokens": 14123808} {"current_steps": 21660, "total_steps": 38160, "loss": 0.4755, "lr": 0.0004693296456839984, "epoch": 11.352201257861635, "percentage": 56.76, "elapsed_time": "0:55:27", "remaining_time": "0:42:14", "throughput": 4245.6, "total_tokens": 14126144} {"current_steps": 21665, "total_steps": 38160, "loss": 0.4726, "lr": 0.0004691013938425796, "epoch": 11.35482180293501, "percentage": 56.77, "elapsed_time": "0:55:28", "remaining_time": "0:42:13", "throughput": 4245.72, "total_tokens": 14129888} {"current_steps": 21670, "total_steps": 38160, "loss": 0.3588, "lr": 0.00046887314846479663, "epoch": 11.357442348008385, "percentage": 56.79, "elapsed_time": "0:55:28", "remaining_time": "0:42:12", "throughput": 4245.68, "total_tokens": 14132448} {"current_steps": 21675, "total_steps": 38160, "loss": 0.3821, "lr": 0.000468644909598396, "epoch": 11.36006289308176, "percentage": 56.8, "elapsed_time": "0:55:29", "remaining_time": "0:42:12", "throughput": 4245.88, "total_tokens": 14136736} {"current_steps": 21680, "total_steps": 38160, "loss": 0.5074, "lr": 0.00046841667729112264, "epoch": 11.362683438155136, "percentage": 56.81, "elapsed_time": "0:55:30", "remaining_time": "0:42:11", "throughput": 4245.91, "total_tokens": 14139840} {"current_steps": 21685, "total_steps": 38160, "loss": 0.4101, "lr": 0.00046818845159071987, "epoch": 11.365303983228511, "percentage": 56.83, "elapsed_time": "0:55:30", "remaining_time": "0:42:10", "throughput": 4245.89, "total_tokens": 14142528} {"current_steps": 21690, "total_steps": 38160, "loss": 0.3693, "lr": 0.0004679602325449302, "epoch": 11.367924528301886, "percentage": 56.84, "elapsed_time": "0:55:31", "remaining_time": "0:42:09", "throughput": 4245.98, "total_tokens": 14145984} {"current_steps": 21695, "total_steps": 38160, "loss": 0.5398, "lr": 0.00046773202020149423, "epoch": 11.370545073375261, "percentage": 56.85, "elapsed_time": "0:55:32", "remaining_time": "0:42:08", "throughput": 4246.03, "total_tokens": 14149120} {"current_steps": 21700, "total_steps": 38160, "loss": 0.4304, "lr": 0.0004675038146081516, "epoch": 11.373165618448636, "percentage": 56.87, "elapsed_time": "0:55:32", "remaining_time": "0:42:08", "throughput": 4246.02, "total_tokens": 14151936} {"current_steps": 21705, "total_steps": 38160, "loss": 0.4676, "lr": 0.0004672756158126403, "epoch": 11.375786163522013, "percentage": 56.88, "elapsed_time": "0:55:33", "remaining_time": "0:42:07", "throughput": 4246.06, "total_tokens": 14155040} {"current_steps": 21710, "total_steps": 38160, "loss": 0.4607, "lr": 0.0004670474238626968, "epoch": 11.378406708595389, "percentage": 56.89, "elapsed_time": "0:55:34", "remaining_time": "0:42:06", "throughput": 4246.14, "total_tokens": 14158336} {"current_steps": 21715, "total_steps": 38160, "loss": 0.3963, "lr": 0.00046681923880605614, "epoch": 11.381027253668764, "percentage": 56.91, "elapsed_time": "0:55:35", "remaining_time": "0:42:05", "throughput": 4246.13, "total_tokens": 14161248} {"current_steps": 21720, "total_steps": 38160, "loss": 0.4603, "lr": 0.0004665910606904523, "epoch": 11.383647798742139, "percentage": 56.92, "elapsed_time": "0:55:35", "remaining_time": "0:42:04", "throughput": 4246.24, "total_tokens": 14164960} {"current_steps": 21725, "total_steps": 38160, "loss": 0.3892, "lr": 0.0004663628895636173, "epoch": 11.386268343815514, "percentage": 56.93, "elapsed_time": "0:55:36", "remaining_time": "0:42:04", "throughput": 4246.21, "total_tokens": 14167584} {"current_steps": 21730, "total_steps": 38160, "loss": 0.361, "lr": 0.0004661347254732822, "epoch": 11.38888888888889, "percentage": 56.94, "elapsed_time": "0:55:37", "remaining_time": "0:42:03", "throughput": 4246.13, "total_tokens": 14169888} {"current_steps": 21735, "total_steps": 38160, "loss": 0.4128, "lr": 0.0004659065684671762, "epoch": 11.391509433962264, "percentage": 56.96, "elapsed_time": "0:55:37", "remaining_time": "0:42:02", "throughput": 4246.18, "total_tokens": 14173024} {"current_steps": 21740, "total_steps": 38160, "loss": 0.3703, "lr": 0.00046567841859302696, "epoch": 11.39412997903564, "percentage": 56.97, "elapsed_time": "0:55:38", "remaining_time": "0:42:01", "throughput": 4246.28, "total_tokens": 14176576} {"current_steps": 21745, "total_steps": 38160, "loss": 0.4839, "lr": 0.0004654502758985611, "epoch": 11.396750524109015, "percentage": 56.98, "elapsed_time": "0:55:39", "remaining_time": "0:42:00", "throughput": 4246.37, "total_tokens": 14180064} {"current_steps": 21750, "total_steps": 38160, "loss": 0.4403, "lr": 0.00046522214043150323, "epoch": 11.39937106918239, "percentage": 57.0, "elapsed_time": "0:55:40", "remaining_time": "0:42:00", "throughput": 4246.44, "total_tokens": 14183456} {"current_steps": 21755, "total_steps": 38160, "loss": 0.3624, "lr": 0.00046499401223957696, "epoch": 11.401991614255765, "percentage": 57.01, "elapsed_time": "0:55:40", "remaining_time": "0:41:59", "throughput": 4246.5, "total_tokens": 14186752} {"current_steps": 21760, "total_steps": 38160, "loss": 0.3023, "lr": 0.0004647658913705038, "epoch": 11.40461215932914, "percentage": 57.02, "elapsed_time": "0:55:41", "remaining_time": "0:41:58", "throughput": 4246.45, "total_tokens": 14189280} {"current_steps": 21765, "total_steps": 38160, "loss": 0.4068, "lr": 0.00046453777787200444, "epoch": 11.407232704402515, "percentage": 57.04, "elapsed_time": "0:55:42", "remaining_time": "0:41:57", "throughput": 4246.59, "total_tokens": 14193120} {"current_steps": 21770, "total_steps": 38160, "loss": 0.5519, "lr": 0.0004643096717917973, "epoch": 11.40985324947589, "percentage": 57.05, "elapsed_time": "0:55:42", "remaining_time": "0:41:56", "throughput": 4246.63, "total_tokens": 14196352} {"current_steps": 21775, "total_steps": 38160, "loss": 0.4315, "lr": 0.0004640815731775995, "epoch": 11.412473794549266, "percentage": 57.06, "elapsed_time": "0:55:43", "remaining_time": "0:41:56", "throughput": 4246.67, "total_tokens": 14199456} {"current_steps": 21780, "total_steps": 38160, "loss": 0.4353, "lr": 0.0004638534820771267, "epoch": 11.415094339622641, "percentage": 57.08, "elapsed_time": "0:55:44", "remaining_time": "0:41:55", "throughput": 4246.56, "total_tokens": 14201600} {"current_steps": 21785, "total_steps": 38160, "loss": 0.4487, "lr": 0.0004636253985380934, "epoch": 11.417714884696016, "percentage": 57.09, "elapsed_time": "0:55:44", "remaining_time": "0:41:54", "throughput": 4246.6, "total_tokens": 14204672} {"current_steps": 21790, "total_steps": 38160, "loss": 0.4887, "lr": 0.00046339732260821173, "epoch": 11.420335429769391, "percentage": 57.1, "elapsed_time": "0:55:45", "remaining_time": "0:41:53", "throughput": 4246.8, "total_tokens": 14208928} {"current_steps": 21795, "total_steps": 38160, "loss": 0.2897, "lr": 0.0004631692543351924, "epoch": 11.422955974842766, "percentage": 57.11, "elapsed_time": "0:55:46", "remaining_time": "0:41:52", "throughput": 4247.09, "total_tokens": 14213888} {"current_steps": 21800, "total_steps": 38160, "loss": 0.3318, "lr": 0.00046294119376674486, "epoch": 11.425576519916142, "percentage": 57.13, "elapsed_time": "0:55:47", "remaining_time": "0:41:52", "throughput": 4247.08, "total_tokens": 14216704} {"current_steps": 21805, "total_steps": 38160, "loss": 0.4706, "lr": 0.0004627131409505768, "epoch": 11.428197064989519, "percentage": 57.14, "elapsed_time": "0:55:48", "remaining_time": "0:41:51", "throughput": 4247.09, "total_tokens": 14219616} {"current_steps": 21810, "total_steps": 38160, "loss": 0.3301, "lr": 0.0004624850959343944, "epoch": 11.430817610062894, "percentage": 57.15, "elapsed_time": "0:55:48", "remaining_time": "0:41:50", "throughput": 4247.07, "total_tokens": 14222368} {"current_steps": 21815, "total_steps": 38160, "loss": 0.4301, "lr": 0.00046225705876590175, "epoch": 11.433438155136269, "percentage": 57.17, "elapsed_time": "0:55:50", "remaining_time": "0:41:50", "throughput": 4247.64, "total_tokens": 14229888} {"current_steps": 21820, "total_steps": 38160, "loss": 0.4259, "lr": 0.00046202902949280206, "epoch": 11.436058700209644, "percentage": 57.18, "elapsed_time": "0:55:50", "remaining_time": "0:41:49", "throughput": 4247.74, "total_tokens": 14233440} {"current_steps": 21825, "total_steps": 38160, "loss": 0.4504, "lr": 0.00046180100816279614, "epoch": 11.43867924528302, "percentage": 57.19, "elapsed_time": "0:55:51", "remaining_time": "0:41:48", "throughput": 4247.62, "total_tokens": 14235488} {"current_steps": 21830, "total_steps": 38160, "loss": 0.4566, "lr": 0.0004615729948235833, "epoch": 11.441299790356394, "percentage": 57.21, "elapsed_time": "0:55:52", "remaining_time": "0:41:47", "throughput": 4247.86, "total_tokens": 14240128} {"current_steps": 21835, "total_steps": 38160, "loss": 0.3331, "lr": 0.00046134498952286174, "epoch": 11.44392033542977, "percentage": 57.22, "elapsed_time": "0:55:53", "remaining_time": "0:41:46", "throughput": 4247.88, "total_tokens": 14243264} {"current_steps": 21840, "total_steps": 38160, "loss": 0.5301, "lr": 0.00046111699230832727, "epoch": 11.446540880503145, "percentage": 57.23, "elapsed_time": "0:55:53", "remaining_time": "0:41:46", "throughput": 4248.1, "total_tokens": 14247712} {"current_steps": 21845, "total_steps": 38160, "loss": 0.4621, "lr": 0.00046088900322767434, "epoch": 11.44916142557652, "percentage": 57.25, "elapsed_time": "0:55:54", "remaining_time": "0:41:45", "throughput": 4248.22, "total_tokens": 14251360} {"current_steps": 21850, "total_steps": 38160, "loss": 0.4184, "lr": 0.0004606610223285961, "epoch": 11.451781970649895, "percentage": 57.26, "elapsed_time": "0:55:55", "remaining_time": "0:41:44", "throughput": 4248.24, "total_tokens": 14254432} {"current_steps": 21855, "total_steps": 38160, "loss": 0.3695, "lr": 0.00046043304965878284, "epoch": 11.45440251572327, "percentage": 57.27, "elapsed_time": "0:55:56", "remaining_time": "0:41:43", "throughput": 4248.28, "total_tokens": 14257664} {"current_steps": 21860, "total_steps": 38160, "loss": 0.3804, "lr": 0.00046020508526592425, "epoch": 11.457023060796645, "percentage": 57.29, "elapsed_time": "0:55:56", "remaining_time": "0:41:43", "throughput": 4248.33, "total_tokens": 14260960} {"current_steps": 21865, "total_steps": 38160, "loss": 0.5566, "lr": 0.0004599771291977079, "epoch": 11.45964360587002, "percentage": 57.3, "elapsed_time": "0:55:57", "remaining_time": "0:41:42", "throughput": 4248.49, "total_tokens": 14264960} {"current_steps": 21870, "total_steps": 38160, "loss": 0.4551, "lr": 0.0004597491815018194, "epoch": 11.462264150943396, "percentage": 57.31, "elapsed_time": "0:55:58", "remaining_time": "0:41:41", "throughput": 4248.49, "total_tokens": 14267840} {"current_steps": 21875, "total_steps": 38160, "loss": 0.462, "lr": 0.0004595212422259431, "epoch": 11.464884696016771, "percentage": 57.32, "elapsed_time": "0:55:58", "remaining_time": "0:41:40", "throughput": 4248.46, "total_tokens": 14270368} {"current_steps": 21880, "total_steps": 38160, "loss": 0.3474, "lr": 0.00045929331141776104, "epoch": 11.467505241090146, "percentage": 57.34, "elapsed_time": "0:55:59", "remaining_time": "0:41:39", "throughput": 4248.46, "total_tokens": 14273248} {"current_steps": 21885, "total_steps": 38160, "loss": 0.4365, "lr": 0.0004590653891249537, "epoch": 11.470125786163521, "percentage": 57.35, "elapsed_time": "0:56:01", "remaining_time": "0:41:39", "throughput": 4249.12, "total_tokens": 14281472} {"current_steps": 21890, "total_steps": 38160, "loss": 0.5274, "lr": 0.0004588374753952001, "epoch": 11.472746331236896, "percentage": 57.36, "elapsed_time": "0:56:01", "remaining_time": "0:41:38", "throughput": 4249.2, "total_tokens": 14284864} {"current_steps": 21895, "total_steps": 38160, "loss": 0.4758, "lr": 0.0004586095702761769, "epoch": 11.475366876310272, "percentage": 57.38, "elapsed_time": "0:56:02", "remaining_time": "0:41:37", "throughput": 4249.23, "total_tokens": 14287968} {"current_steps": 21900, "total_steps": 38160, "loss": 0.5597, "lr": 0.0004583816738155595, "epoch": 11.477987421383649, "percentage": 57.39, "elapsed_time": "0:56:03", "remaining_time": "0:41:37", "throughput": 4249.31, "total_tokens": 14291392} {"current_steps": 21905, "total_steps": 38160, "loss": 0.4156, "lr": 0.0004581537860610213, "epoch": 11.480607966457024, "percentage": 57.4, "elapsed_time": "0:56:03", "remaining_time": "0:41:36", "throughput": 4249.33, "total_tokens": 14294432} {"current_steps": 21910, "total_steps": 38160, "loss": 0.3278, "lr": 0.0004579259070602333, "epoch": 11.483228511530399, "percentage": 57.42, "elapsed_time": "0:56:04", "remaining_time": "0:41:35", "throughput": 4249.58, "total_tokens": 14299328} {"current_steps": 21915, "total_steps": 38160, "loss": 0.3914, "lr": 0.0004576980368608658, "epoch": 11.485849056603774, "percentage": 57.43, "elapsed_time": "0:56:05", "remaining_time": "0:41:34", "throughput": 4249.59, "total_tokens": 14302272} {"current_steps": 21920, "total_steps": 38160, "loss": 0.453, "lr": 0.0004574701755105862, "epoch": 11.48846960167715, "percentage": 57.44, "elapsed_time": "0:56:06", "remaining_time": "0:41:34", "throughput": 4249.77, "total_tokens": 14306432} {"current_steps": 21925, "total_steps": 38160, "loss": 0.5852, "lr": 0.00045724232305706066, "epoch": 11.491090146750524, "percentage": 57.46, "elapsed_time": "0:56:07", "remaining_time": "0:41:33", "throughput": 4250.06, "total_tokens": 14311680} {"current_steps": 21930, "total_steps": 38160, "loss": 0.5088, "lr": 0.00045701447954795343, "epoch": 11.4937106918239, "percentage": 57.47, "elapsed_time": "0:56:08", "remaining_time": "0:41:32", "throughput": 4250.01, "total_tokens": 14314208} {"current_steps": 21935, "total_steps": 38160, "loss": 0.5988, "lr": 0.0004567866450309268, "epoch": 11.496331236897275, "percentage": 57.48, "elapsed_time": "0:56:08", "remaining_time": "0:41:31", "throughput": 4250.1, "total_tokens": 14317696} {"current_steps": 21940, "total_steps": 38160, "loss": 0.4862, "lr": 0.00045655881955364086, "epoch": 11.49895178197065, "percentage": 57.49, "elapsed_time": "0:56:09", "remaining_time": "0:41:31", "throughput": 4250.14, "total_tokens": 14320864} {"current_steps": 21945, "total_steps": 38160, "loss": 0.4587, "lr": 0.0004563310031637543, "epoch": 11.501572327044025, "percentage": 57.51, "elapsed_time": "0:56:10", "remaining_time": "0:41:30", "throughput": 4250.12, "total_tokens": 14323520} {"current_steps": 21950, "total_steps": 38160, "loss": 0.558, "lr": 0.00045610319590892365, "epoch": 11.5041928721174, "percentage": 57.52, "elapsed_time": "0:56:10", "remaining_time": "0:41:29", "throughput": 4250.13, "total_tokens": 14326400} {"current_steps": 21955, "total_steps": 38160, "loss": 0.3354, "lr": 0.00045587539783680366, "epoch": 11.506813417190775, "percentage": 57.53, "elapsed_time": "0:56:11", "remaining_time": "0:41:28", "throughput": 4250.09, "total_tokens": 14328992} {"current_steps": 21960, "total_steps": 38160, "loss": 0.459, "lr": 0.00045564760899504715, "epoch": 11.50943396226415, "percentage": 57.55, "elapsed_time": "0:56:12", "remaining_time": "0:41:27", "throughput": 4250.04, "total_tokens": 14331584} {"current_steps": 21965, "total_steps": 38160, "loss": 0.4596, "lr": 0.00045541982943130466, "epoch": 11.512054507337526, "percentage": 57.56, "elapsed_time": "0:56:12", "remaining_time": "0:41:26", "throughput": 4250.16, "total_tokens": 14335360} {"current_steps": 21970, "total_steps": 38160, "loss": 0.5468, "lr": 0.00045519205919322534, "epoch": 11.514675052410901, "percentage": 57.57, "elapsed_time": "0:56:13", "remaining_time": "0:41:26", "throughput": 4250.3, "total_tokens": 14339360} {"current_steps": 21975, "total_steps": 38160, "loss": 0.4828, "lr": 0.00045496429832845594, "epoch": 11.517295597484276, "percentage": 57.59, "elapsed_time": "0:56:14", "remaining_time": "0:41:25", "throughput": 4250.28, "total_tokens": 14342112} {"current_steps": 21980, "total_steps": 38160, "loss": 0.3619, "lr": 0.0004547365468846416, "epoch": 11.519916142557651, "percentage": 57.6, "elapsed_time": "0:56:15", "remaining_time": "0:41:24", "throughput": 4250.29, "total_tokens": 14344960} {"current_steps": 21985, "total_steps": 38160, "loss": 0.433, "lr": 0.0004545088049094252, "epoch": 11.522536687631026, "percentage": 57.61, "elapsed_time": "0:56:15", "remaining_time": "0:41:23", "throughput": 4250.34, "total_tokens": 14348384} {"current_steps": 21990, "total_steps": 38160, "loss": 0.5784, "lr": 0.00045428107245044805, "epoch": 11.525157232704402, "percentage": 57.63, "elapsed_time": "0:56:16", "remaining_time": "0:41:22", "throughput": 4250.4, "total_tokens": 14351616} {"current_steps": 21995, "total_steps": 38160, "loss": 0.4518, "lr": 0.0004540533495553488, "epoch": 11.527777777777779, "percentage": 57.64, "elapsed_time": "0:56:17", "remaining_time": "0:41:22", "throughput": 4250.45, "total_tokens": 14354848} {"current_steps": 22000, "total_steps": 38160, "loss": 0.4675, "lr": 0.00045382563627176454, "epoch": 11.530398322851154, "percentage": 57.65, "elapsed_time": "0:56:18", "remaining_time": "0:41:21", "throughput": 4250.56, "total_tokens": 14358496} {"current_steps": 22005, "total_steps": 38160, "loss": 0.4605, "lr": 0.0004535979326473304, "epoch": 11.533018867924529, "percentage": 57.67, "elapsed_time": "0:56:18", "remaining_time": "0:41:20", "throughput": 4250.61, "total_tokens": 14361728} {"current_steps": 22010, "total_steps": 38160, "loss": 0.3267, "lr": 0.00045337023872967945, "epoch": 11.535639412997904, "percentage": 57.68, "elapsed_time": "0:56:19", "remaining_time": "0:41:19", "throughput": 4250.7, "total_tokens": 14365248} {"current_steps": 22015, "total_steps": 38160, "loss": 0.4533, "lr": 0.0004531425545664425, "epoch": 11.53825995807128, "percentage": 57.69, "elapsed_time": "0:56:20", "remaining_time": "0:41:18", "throughput": 4250.74, "total_tokens": 14368416} {"current_steps": 22020, "total_steps": 38160, "loss": 0.5493, "lr": 0.0004529148802052488, "epoch": 11.540880503144654, "percentage": 57.7, "elapsed_time": "0:56:20", "remaining_time": "0:41:18", "throughput": 4250.76, "total_tokens": 14371424} {"current_steps": 22025, "total_steps": 38160, "loss": 0.4264, "lr": 0.00045268721569372483, "epoch": 11.54350104821803, "percentage": 57.72, "elapsed_time": "0:56:21", "remaining_time": "0:41:17", "throughput": 4250.8, "total_tokens": 14374592} {"current_steps": 22030, "total_steps": 38160, "loss": 0.4144, "lr": 0.00045245956107949547, "epoch": 11.546121593291405, "percentage": 57.73, "elapsed_time": "0:56:22", "remaining_time": "0:41:16", "throughput": 4250.81, "total_tokens": 14377504} {"current_steps": 22035, "total_steps": 38160, "loss": 0.4449, "lr": 0.0004522319164101837, "epoch": 11.54874213836478, "percentage": 57.74, "elapsed_time": "0:56:23", "remaining_time": "0:41:15", "throughput": 4250.89, "total_tokens": 14380960} {"current_steps": 22040, "total_steps": 38160, "loss": 0.4168, "lr": 0.00045200428173340987, "epoch": 11.551362683438155, "percentage": 57.76, "elapsed_time": "0:56:23", "remaining_time": "0:41:14", "throughput": 4251.0, "total_tokens": 14384608} {"current_steps": 22045, "total_steps": 38160, "loss": 0.3427, "lr": 0.00045177665709679286, "epoch": 11.55398322851153, "percentage": 57.77, "elapsed_time": "0:56:24", "remaining_time": "0:41:14", "throughput": 4251.09, "total_tokens": 14388160} {"current_steps": 22050, "total_steps": 38160, "loss": 0.53, "lr": 0.0004515490425479492, "epoch": 11.556603773584905, "percentage": 57.78, "elapsed_time": "0:56:25", "remaining_time": "0:41:13", "throughput": 4251.14, "total_tokens": 14391296} {"current_steps": 22055, "total_steps": 38160, "loss": 0.2976, "lr": 0.0004513214381344928, "epoch": 11.55922431865828, "percentage": 57.8, "elapsed_time": "0:56:26", "remaining_time": "0:41:12", "throughput": 4251.23, "total_tokens": 14394752} {"current_steps": 22060, "total_steps": 38160, "loss": 0.391, "lr": 0.00045109384390403635, "epoch": 11.561844863731656, "percentage": 57.81, "elapsed_time": "0:56:26", "remaining_time": "0:41:11", "throughput": 4251.2, "total_tokens": 14397376} {"current_steps": 22065, "total_steps": 38160, "loss": 0.4523, "lr": 0.0004508662599041896, "epoch": 11.564465408805031, "percentage": 57.82, "elapsed_time": "0:56:27", "remaining_time": "0:41:10", "throughput": 4251.15, "total_tokens": 14399872} {"current_steps": 22070, "total_steps": 38160, "loss": 0.4942, "lr": 0.0004506386861825609, "epoch": 11.567085953878406, "percentage": 57.84, "elapsed_time": "0:56:28", "remaining_time": "0:41:10", "throughput": 4251.26, "total_tokens": 14403552} {"current_steps": 22075, "total_steps": 38160, "loss": 0.4289, "lr": 0.00045041112278675603, "epoch": 11.569706498951781, "percentage": 57.85, "elapsed_time": "0:56:28", "remaining_time": "0:41:09", "throughput": 4251.41, "total_tokens": 14407552} {"current_steps": 22080, "total_steps": 38160, "loss": 0.4247, "lr": 0.00045018356976437836, "epoch": 11.572327044025156, "percentage": 57.86, "elapsed_time": "0:56:29", "remaining_time": "0:41:08", "throughput": 4251.47, "total_tokens": 14410912} {"current_steps": 22085, "total_steps": 38160, "loss": 0.4926, "lr": 0.0004499560271630295, "epoch": 11.574947589098532, "percentage": 57.87, "elapsed_time": "0:56:30", "remaining_time": "0:41:07", "throughput": 4251.43, "total_tokens": 14413440} {"current_steps": 22090, "total_steps": 38160, "loss": 0.3534, "lr": 0.00044972849503030894, "epoch": 11.577568134171909, "percentage": 57.89, "elapsed_time": "0:56:31", "remaining_time": "0:41:06", "throughput": 4251.6, "total_tokens": 14417568} {"current_steps": 22095, "total_steps": 38160, "loss": 0.4072, "lr": 0.00044950097341381356, "epoch": 11.580188679245284, "percentage": 57.9, "elapsed_time": "0:56:31", "remaining_time": "0:41:06", "throughput": 4251.64, "total_tokens": 14420736} {"current_steps": 22100, "total_steps": 38160, "loss": 0.4377, "lr": 0.0004492734623611385, "epoch": 11.582809224318659, "percentage": 57.91, "elapsed_time": "0:56:32", "remaining_time": "0:41:05", "throughput": 4251.72, "total_tokens": 14424224} {"current_steps": 22105, "total_steps": 38160, "loss": 0.3987, "lr": 0.0004490459619198766, "epoch": 11.585429769392034, "percentage": 57.93, "elapsed_time": "0:56:33", "remaining_time": "0:41:04", "throughput": 4251.74, "total_tokens": 14427264} {"current_steps": 22110, "total_steps": 38160, "loss": 0.5332, "lr": 0.00044881847213761787, "epoch": 11.58805031446541, "percentage": 57.94, "elapsed_time": "0:56:33", "remaining_time": "0:41:03", "throughput": 4251.66, "total_tokens": 14429504} {"current_steps": 22115, "total_steps": 38160, "loss": 0.4922, "lr": 0.000448590993061951, "epoch": 11.590670859538784, "percentage": 57.95, "elapsed_time": "0:56:34", "remaining_time": "0:41:02", "throughput": 4251.69, "total_tokens": 14432672} {"current_steps": 22120, "total_steps": 38160, "loss": 0.4552, "lr": 0.00044836352474046177, "epoch": 11.59329140461216, "percentage": 57.97, "elapsed_time": "0:56:35", "remaining_time": "0:41:01", "throughput": 4251.62, "total_tokens": 14435072} {"current_steps": 22125, "total_steps": 38160, "loss": 0.3688, "lr": 0.00044813606722073415, "epoch": 11.595911949685535, "percentage": 57.98, "elapsed_time": "0:56:36", "remaining_time": "0:41:01", "throughput": 4251.81, "total_tokens": 14439424} {"current_steps": 22130, "total_steps": 38160, "loss": 0.4703, "lr": 0.00044790862055034945, "epoch": 11.59853249475891, "percentage": 57.99, "elapsed_time": "0:56:36", "remaining_time": "0:41:00", "throughput": 4251.76, "total_tokens": 14441888} {"current_steps": 22135, "total_steps": 38160, "loss": 0.4735, "lr": 0.00044768118477688727, "epoch": 11.601153039832285, "percentage": 58.01, "elapsed_time": "0:56:37", "remaining_time": "0:40:59", "throughput": 4251.78, "total_tokens": 14444896} {"current_steps": 22140, "total_steps": 38160, "loss": 0.4262, "lr": 0.00044745375994792425, "epoch": 11.60377358490566, "percentage": 58.02, "elapsed_time": "0:56:38", "remaining_time": "0:40:58", "throughput": 4251.8, "total_tokens": 14447904} {"current_steps": 22145, "total_steps": 38160, "loss": 0.4711, "lr": 0.00044722634611103507, "epoch": 11.606394129979035, "percentage": 58.03, "elapsed_time": "0:56:38", "remaining_time": "0:40:57", "throughput": 4251.78, "total_tokens": 14450624} {"current_steps": 22150, "total_steps": 38160, "loss": 0.441, "lr": 0.0004469989433137923, "epoch": 11.60901467505241, "percentage": 58.05, "elapsed_time": "0:56:39", "remaining_time": "0:40:57", "throughput": 4251.89, "total_tokens": 14454240} {"current_steps": 22155, "total_steps": 38160, "loss": 0.3876, "lr": 0.00044677155160376586, "epoch": 11.611635220125786, "percentage": 58.06, "elapsed_time": "0:56:40", "remaining_time": "0:40:56", "throughput": 4251.89, "total_tokens": 14457088} {"current_steps": 22160, "total_steps": 38160, "loss": 0.4473, "lr": 0.00044654417102852375, "epoch": 11.614255765199161, "percentage": 58.07, "elapsed_time": "0:56:40", "remaining_time": "0:40:55", "throughput": 4251.98, "total_tokens": 14460608} {"current_steps": 22165, "total_steps": 38160, "loss": 0.5397, "lr": 0.0004463168016356309, "epoch": 11.616876310272536, "percentage": 58.08, "elapsed_time": "0:56:41", "remaining_time": "0:40:54", "throughput": 4252.07, "total_tokens": 14464064} {"current_steps": 22170, "total_steps": 38160, "loss": 0.4729, "lr": 0.00044608944347265095, "epoch": 11.619496855345911, "percentage": 58.1, "elapsed_time": "0:56:42", "remaining_time": "0:40:53", "throughput": 4252.16, "total_tokens": 14467584} {"current_steps": 22175, "total_steps": 38160, "loss": 0.4144, "lr": 0.0004458620965871442, "epoch": 11.622117400419286, "percentage": 58.11, "elapsed_time": "0:56:43", "remaining_time": "0:40:53", "throughput": 4252.28, "total_tokens": 14471328} {"current_steps": 22180, "total_steps": 38160, "loss": 0.291, "lr": 0.00044563476102666935, "epoch": 11.624737945492662, "percentage": 58.12, "elapsed_time": "0:56:43", "remaining_time": "0:40:52", "throughput": 4252.38, "total_tokens": 14475072} {"current_steps": 22185, "total_steps": 38160, "loss": 0.4281, "lr": 0.0004454074368387821, "epoch": 11.627358490566039, "percentage": 58.14, "elapsed_time": "0:56:44", "remaining_time": "0:40:51", "throughput": 4252.38, "total_tokens": 14477984} {"current_steps": 22190, "total_steps": 38160, "loss": 0.2446, "lr": 0.0004451801240710365, "epoch": 11.629979035639414, "percentage": 58.15, "elapsed_time": "0:56:45", "remaining_time": "0:40:50", "throughput": 4252.53, "total_tokens": 14481984} {"current_steps": 22195, "total_steps": 38160, "loss": 0.4411, "lr": 0.0004449528227709834, "epoch": 11.632599580712789, "percentage": 58.16, "elapsed_time": "0:56:46", "remaining_time": "0:40:50", "throughput": 4252.66, "total_tokens": 14485760} {"current_steps": 22200, "total_steps": 38160, "loss": 0.4907, "lr": 0.0004447255329861716, "epoch": 11.635220125786164, "percentage": 58.18, "elapsed_time": "0:56:47", "remaining_time": "0:40:49", "throughput": 4252.8, "total_tokens": 14489664} {"current_steps": 22205, "total_steps": 38160, "loss": 0.3189, "lr": 0.0004444982547641479, "epoch": 11.63784067085954, "percentage": 58.19, "elapsed_time": "0:56:47", "remaining_time": "0:40:48", "throughput": 4252.88, "total_tokens": 14493056} {"current_steps": 22210, "total_steps": 38160, "loss": 0.3221, "lr": 0.00044427098815245594, "epoch": 11.640461215932914, "percentage": 58.2, "elapsed_time": "0:56:48", "remaining_time": "0:40:47", "throughput": 4252.84, "total_tokens": 14495680} {"current_steps": 22215, "total_steps": 38160, "loss": 0.393, "lr": 0.00044404373319863763, "epoch": 11.64308176100629, "percentage": 58.22, "elapsed_time": "0:56:49", "remaining_time": "0:40:46", "throughput": 4252.86, "total_tokens": 14498592} {"current_steps": 22220, "total_steps": 38160, "loss": 0.416, "lr": 0.000443816489950232, "epoch": 11.645702306079665, "percentage": 58.23, "elapsed_time": "0:56:49", "remaining_time": "0:40:46", "throughput": 4252.92, "total_tokens": 14501888} {"current_steps": 22225, "total_steps": 38160, "loss": 0.4891, "lr": 0.00044358925845477547, "epoch": 11.64832285115304, "percentage": 58.24, "elapsed_time": "0:56:50", "remaining_time": "0:40:45", "throughput": 4252.97, "total_tokens": 14505088} {"current_steps": 22230, "total_steps": 38160, "loss": 0.4135, "lr": 0.0004433620387598027, "epoch": 11.650943396226415, "percentage": 58.25, "elapsed_time": "0:56:51", "remaining_time": "0:40:44", "throughput": 4252.94, "total_tokens": 14507744} {"current_steps": 22235, "total_steps": 38160, "loss": 0.4179, "lr": 0.00044313483091284507, "epoch": 11.65356394129979, "percentage": 58.27, "elapsed_time": "0:56:51", "remaining_time": "0:40:43", "throughput": 4252.93, "total_tokens": 14510560} {"current_steps": 22240, "total_steps": 38160, "loss": 0.4665, "lr": 0.0004429076349614321, "epoch": 11.656184486373165, "percentage": 58.28, "elapsed_time": "0:56:52", "remaining_time": "0:40:42", "throughput": 4253.06, "total_tokens": 14514432} {"current_steps": 22245, "total_steps": 38160, "loss": 0.4875, "lr": 0.0004426804509530907, "epoch": 11.65880503144654, "percentage": 58.29, "elapsed_time": "0:56:53", "remaining_time": "0:40:42", "throughput": 4253.12, "total_tokens": 14517664} {"current_steps": 22250, "total_steps": 38160, "loss": 0.5195, "lr": 0.000442453278935345, "epoch": 11.661425576519916, "percentage": 58.31, "elapsed_time": "0:56:54", "remaining_time": "0:40:41", "throughput": 4253.14, "total_tokens": 14520704} {"current_steps": 22255, "total_steps": 38160, "loss": 0.3605, "lr": 0.0004422261189557167, "epoch": 11.664046121593291, "percentage": 58.32, "elapsed_time": "0:56:54", "remaining_time": "0:40:40", "throughput": 4253.34, "total_tokens": 14525152} {"current_steps": 22260, "total_steps": 38160, "loss": 0.4483, "lr": 0.00044199897106172526, "epoch": 11.666666666666666, "percentage": 58.33, "elapsed_time": "0:56:55", "remaining_time": "0:40:39", "throughput": 4253.59, "total_tokens": 14529824} {"current_steps": 22265, "total_steps": 38160, "loss": 0.4354, "lr": 0.0004417718353008873, "epoch": 11.669287211740041, "percentage": 58.35, "elapsed_time": "0:56:56", "remaining_time": "0:40:39", "throughput": 4253.54, "total_tokens": 14532416} {"current_steps": 22270, "total_steps": 38160, "loss": 0.5281, "lr": 0.0004415447117207172, "epoch": 11.671907756813416, "percentage": 58.36, "elapsed_time": "0:56:57", "remaining_time": "0:40:38", "throughput": 4253.62, "total_tokens": 14535776} {"current_steps": 22275, "total_steps": 38160, "loss": 0.5512, "lr": 0.00044131760036872657, "epoch": 11.674528301886792, "percentage": 58.37, "elapsed_time": "0:56:57", "remaining_time": "0:40:37", "throughput": 4253.6, "total_tokens": 14538624} {"current_steps": 22280, "total_steps": 38160, "loss": 0.3731, "lr": 0.00044109050129242434, "epoch": 11.677148846960169, "percentage": 58.39, "elapsed_time": "0:56:58", "remaining_time": "0:40:36", "throughput": 4253.68, "total_tokens": 14542112} {"current_steps": 22285, "total_steps": 38160, "loss": 0.3963, "lr": 0.00044086341453931715, "epoch": 11.679769392033544, "percentage": 58.4, "elapsed_time": "0:56:59", "remaining_time": "0:40:35", "throughput": 4253.69, "total_tokens": 14545024} {"current_steps": 22290, "total_steps": 38160, "loss": 0.4068, "lr": 0.00044063634015690893, "epoch": 11.682389937106919, "percentage": 58.41, "elapsed_time": "0:57:00", "remaining_time": "0:40:35", "throughput": 4253.88, "total_tokens": 14549440} {"current_steps": 22295, "total_steps": 38160, "loss": 0.431, "lr": 0.0004404092781927012, "epoch": 11.685010482180294, "percentage": 58.43, "elapsed_time": "0:57:00", "remaining_time": "0:40:34", "throughput": 4253.85, "total_tokens": 14552224} {"current_steps": 22300, "total_steps": 38160, "loss": 0.4176, "lr": 0.00044018222869419255, "epoch": 11.68763102725367, "percentage": 58.44, "elapsed_time": "0:57:01", "remaining_time": "0:40:33", "throughput": 4253.83, "total_tokens": 14555040} {"current_steps": 22305, "total_steps": 38160, "loss": 0.387, "lr": 0.00043995519170887936, "epoch": 11.690251572327044, "percentage": 58.45, "elapsed_time": "0:57:02", "remaining_time": "0:40:32", "throughput": 4253.83, "total_tokens": 14558016} {"current_steps": 22310, "total_steps": 38160, "loss": 0.4349, "lr": 0.00043972816728425504, "epoch": 11.69287211740042, "percentage": 58.46, "elapsed_time": "0:57:02", "remaining_time": "0:40:31", "throughput": 4253.79, "total_tokens": 14560640} {"current_steps": 22315, "total_steps": 38160, "loss": 0.3483, "lr": 0.0004395011554678103, "epoch": 11.695492662473795, "percentage": 58.48, "elapsed_time": "0:57:03", "remaining_time": "0:40:30", "throughput": 4253.76, "total_tokens": 14563264} {"current_steps": 22320, "total_steps": 38160, "loss": 0.4426, "lr": 0.00043927415630703364, "epoch": 11.69811320754717, "percentage": 58.49, "elapsed_time": "0:57:04", "remaining_time": "0:40:30", "throughput": 4253.79, "total_tokens": 14566432} {"current_steps": 22325, "total_steps": 38160, "loss": 0.4035, "lr": 0.0004390471698494108, "epoch": 11.700733752620545, "percentage": 58.5, "elapsed_time": "0:57:05", "remaining_time": "0:40:29", "throughput": 4253.91, "total_tokens": 14570176} {"current_steps": 22330, "total_steps": 38160, "loss": 0.5142, "lr": 0.0004388201961424248, "epoch": 11.70335429769392, "percentage": 58.52, "elapsed_time": "0:57:05", "remaining_time": "0:40:28", "throughput": 4253.97, "total_tokens": 14573536} {"current_steps": 22335, "total_steps": 38160, "loss": 0.3858, "lr": 0.0004385932352335555, "epoch": 11.705974842767295, "percentage": 58.53, "elapsed_time": "0:57:06", "remaining_time": "0:40:27", "throughput": 4254.01, "total_tokens": 14576672} {"current_steps": 22340, "total_steps": 38160, "loss": 0.3979, "lr": 0.000438366287170281, "epoch": 11.70859538784067, "percentage": 58.54, "elapsed_time": "0:57:07", "remaining_time": "0:40:27", "throughput": 4254.0, "total_tokens": 14579584} {"current_steps": 22345, "total_steps": 38160, "loss": 0.4608, "lr": 0.0004381393520000759, "epoch": 11.711215932914046, "percentage": 58.56, "elapsed_time": "0:57:07", "remaining_time": "0:40:26", "throughput": 4254.01, "total_tokens": 14582528} {"current_steps": 22350, "total_steps": 38160, "loss": 0.4578, "lr": 0.0004379124297704127, "epoch": 11.713836477987421, "percentage": 58.57, "elapsed_time": "0:57:08", "remaining_time": "0:40:25", "throughput": 4254.16, "total_tokens": 14586464} {"current_steps": 22355, "total_steps": 38160, "loss": 0.417, "lr": 0.0004376855205287609, "epoch": 11.716457023060796, "percentage": 58.58, "elapsed_time": "0:57:09", "remaining_time": "0:40:24", "throughput": 4254.15, "total_tokens": 14589440} {"current_steps": 22360, "total_steps": 38160, "loss": 0.4762, "lr": 0.0004374586243225874, "epoch": 11.719077568134171, "percentage": 58.6, "elapsed_time": "0:57:10", "remaining_time": "0:40:23", "throughput": 4254.28, "total_tokens": 14593280} {"current_steps": 22365, "total_steps": 38160, "loss": 0.4413, "lr": 0.00043723174119935607, "epoch": 11.721698113207546, "percentage": 58.61, "elapsed_time": "0:57:11", "remaining_time": "0:40:23", "throughput": 4254.37, "total_tokens": 14596800} {"current_steps": 22370, "total_steps": 38160, "loss": 0.5775, "lr": 0.00043700487120652826, "epoch": 11.724318658280922, "percentage": 58.62, "elapsed_time": "0:57:11", "remaining_time": "0:40:22", "throughput": 4254.35, "total_tokens": 14599552} {"current_steps": 22375, "total_steps": 38160, "loss": 0.42, "lr": 0.00043677801439156284, "epoch": 11.726939203354299, "percentage": 58.63, "elapsed_time": "0:57:12", "remaining_time": "0:40:21", "throughput": 4254.27, "total_tokens": 14601952} {"current_steps": 22380, "total_steps": 38160, "loss": 0.4109, "lr": 0.00043655117080191545, "epoch": 11.729559748427674, "percentage": 58.65, "elapsed_time": "0:57:13", "remaining_time": "0:40:20", "throughput": 4254.48, "total_tokens": 14606336} {"current_steps": 22385, "total_steps": 38160, "loss": 0.3297, "lr": 0.00043632434048503934, "epoch": 11.732180293501049, "percentage": 58.66, "elapsed_time": "0:57:13", "remaining_time": "0:40:19", "throughput": 4254.42, "total_tokens": 14608864} {"current_steps": 22390, "total_steps": 38160, "loss": 0.316, "lr": 0.00043609752348838484, "epoch": 11.734800838574424, "percentage": 58.67, "elapsed_time": "0:57:14", "remaining_time": "0:40:18", "throughput": 4254.38, "total_tokens": 14611488} {"current_steps": 22395, "total_steps": 38160, "loss": 0.3946, "lr": 0.0004358707198593992, "epoch": 11.7374213836478, "percentage": 58.69, "elapsed_time": "0:57:15", "remaining_time": "0:40:18", "throughput": 4254.5, "total_tokens": 14615296} {"current_steps": 22400, "total_steps": 38160, "loss": 0.4193, "lr": 0.0004356439296455273, "epoch": 11.740041928721174, "percentage": 58.7, "elapsed_time": "0:57:16", "remaining_time": "0:40:17", "throughput": 4254.77, "total_tokens": 14620096} {"current_steps": 22405, "total_steps": 38160, "loss": 0.6266, "lr": 0.0004354171528942113, "epoch": 11.74266247379455, "percentage": 58.71, "elapsed_time": "0:57:16", "remaining_time": "0:40:16", "throughput": 4254.75, "total_tokens": 14622912} {"current_steps": 22410, "total_steps": 38160, "loss": 0.5293, "lr": 0.00043519038965288994, "epoch": 11.745283018867925, "percentage": 58.73, "elapsed_time": "0:57:17", "remaining_time": "0:40:15", "throughput": 4254.7, "total_tokens": 14625568} {"current_steps": 22415, "total_steps": 38160, "loss": 0.5051, "lr": 0.0004349636399689998, "epoch": 11.7479035639413, "percentage": 58.74, "elapsed_time": "0:57:18", "remaining_time": "0:40:15", "throughput": 4254.72, "total_tokens": 14628576} {"current_steps": 22420, "total_steps": 38160, "loss": 0.4123, "lr": 0.00043473690388997434, "epoch": 11.750524109014675, "percentage": 58.75, "elapsed_time": "0:57:18", "remaining_time": "0:40:14", "throughput": 4254.81, "total_tokens": 14632096} {"current_steps": 22425, "total_steps": 38160, "loss": 0.2961, "lr": 0.0004345101814632438, "epoch": 11.75314465408805, "percentage": 58.77, "elapsed_time": "0:57:19", "remaining_time": "0:40:13", "throughput": 4254.96, "total_tokens": 14636192} {"current_steps": 22430, "total_steps": 38160, "loss": 0.4105, "lr": 0.0004342834727362362, "epoch": 11.755765199161425, "percentage": 58.78, "elapsed_time": "0:57:20", "remaining_time": "0:40:12", "throughput": 4254.93, "total_tokens": 14638944} {"current_steps": 22435, "total_steps": 38160, "loss": 0.4082, "lr": 0.00043405677775637633, "epoch": 11.7583857442348, "percentage": 58.79, "elapsed_time": "0:57:21", "remaining_time": "0:40:11", "throughput": 4254.83, "total_tokens": 14641088} {"current_steps": 22440, "total_steps": 38160, "loss": 0.339, "lr": 0.0004338300965710863, "epoch": 11.761006289308176, "percentage": 58.81, "elapsed_time": "0:57:21", "remaining_time": "0:40:11", "throughput": 4254.97, "total_tokens": 14644992} {"current_steps": 22445, "total_steps": 38160, "loss": 0.4648, "lr": 0.0004336034292277853, "epoch": 11.76362683438155, "percentage": 58.82, "elapsed_time": "0:57:22", "remaining_time": "0:40:10", "throughput": 4254.98, "total_tokens": 14648000} {"current_steps": 22450, "total_steps": 38160, "loss": 0.56, "lr": 0.00043337677577388916, "epoch": 11.766247379454926, "percentage": 58.83, "elapsed_time": "0:57:23", "remaining_time": "0:40:09", "throughput": 4255.0, "total_tokens": 14651168} {"current_steps": 22455, "total_steps": 38160, "loss": 0.463, "lr": 0.0004331501362568116, "epoch": 11.768867924528301, "percentage": 58.84, "elapsed_time": "0:57:24", "remaining_time": "0:40:08", "throughput": 4255.07, "total_tokens": 14654528} {"current_steps": 22460, "total_steps": 38160, "loss": 0.4502, "lr": 0.00043292351072396273, "epoch": 11.771488469601676, "percentage": 58.86, "elapsed_time": "0:57:24", "remaining_time": "0:40:07", "throughput": 4255.02, "total_tokens": 14657088} {"current_steps": 22465, "total_steps": 38160, "loss": 0.3865, "lr": 0.0004326968992227503, "epoch": 11.774109014675052, "percentage": 58.87, "elapsed_time": "0:57:25", "remaining_time": "0:40:07", "throughput": 4255.08, "total_tokens": 14660352} {"current_steps": 22470, "total_steps": 38160, "loss": 0.5278, "lr": 0.0004324703018005786, "epoch": 11.776729559748428, "percentage": 58.88, "elapsed_time": "0:57:26", "remaining_time": "0:40:06", "throughput": 4255.21, "total_tokens": 14664288} {"current_steps": 22475, "total_steps": 38160, "loss": 0.6907, "lr": 0.00043224371850484955, "epoch": 11.779350104821804, "percentage": 58.9, "elapsed_time": "0:57:26", "remaining_time": "0:40:05", "throughput": 4255.32, "total_tokens": 14668000} {"current_steps": 22480, "total_steps": 38160, "loss": 0.3951, "lr": 0.0004320171493829614, "epoch": 11.781970649895179, "percentage": 58.91, "elapsed_time": "0:57:27", "remaining_time": "0:40:04", "throughput": 4255.36, "total_tokens": 14671328} {"current_steps": 22485, "total_steps": 38160, "loss": 0.4493, "lr": 0.00043179059448231004, "epoch": 11.784591194968554, "percentage": 58.92, "elapsed_time": "0:57:28", "remaining_time": "0:40:04", "throughput": 4255.35, "total_tokens": 14674272} {"current_steps": 22490, "total_steps": 38160, "loss": 0.497, "lr": 0.0004315640538502881, "epoch": 11.78721174004193, "percentage": 58.94, "elapsed_time": "0:57:29", "remaining_time": "0:40:03", "throughput": 4255.3, "total_tokens": 14676896} {"current_steps": 22495, "total_steps": 38160, "loss": 0.4738, "lr": 0.00043133752753428547, "epoch": 11.789832285115304, "percentage": 58.95, "elapsed_time": "0:57:29", "remaining_time": "0:40:02", "throughput": 4255.31, "total_tokens": 14679840} {"current_steps": 22500, "total_steps": 38160, "loss": 0.444, "lr": 0.0004311110155816886, "epoch": 11.79245283018868, "percentage": 58.96, "elapsed_time": "0:57:30", "remaining_time": "0:40:01", "throughput": 4255.38, "total_tokens": 14683456} {"current_steps": 22505, "total_steps": 38160, "loss": 0.5423, "lr": 0.00043088451803988153, "epoch": 11.795073375262055, "percentage": 58.98, "elapsed_time": "0:57:31", "remaining_time": "0:40:00", "throughput": 4255.34, "total_tokens": 14686112} {"current_steps": 22510, "total_steps": 38160, "loss": 0.313, "lr": 0.00043065803495624465, "epoch": 11.79769392033543, "percentage": 58.99, "elapsed_time": "0:57:31", "remaining_time": "0:39:59", "throughput": 4255.35, "total_tokens": 14689024} {"current_steps": 22515, "total_steps": 38160, "loss": 0.4606, "lr": 0.00043043156637815575, "epoch": 11.800314465408805, "percentage": 59.0, "elapsed_time": "0:57:32", "remaining_time": "0:39:59", "throughput": 4255.33, "total_tokens": 14691712} {"current_steps": 22520, "total_steps": 38160, "loss": 0.5716, "lr": 0.00043020511235298956, "epoch": 11.80293501048218, "percentage": 59.01, "elapsed_time": "0:57:33", "remaining_time": "0:39:58", "throughput": 4255.39, "total_tokens": 14695104} {"current_steps": 22525, "total_steps": 38160, "loss": 0.4309, "lr": 0.00042997867292811744, "epoch": 11.805555555555555, "percentage": 59.03, "elapsed_time": "0:57:33", "remaining_time": "0:39:57", "throughput": 4255.37, "total_tokens": 14697952} {"current_steps": 22530, "total_steps": 38160, "loss": 0.3832, "lr": 0.00042975224815090834, "epoch": 11.80817610062893, "percentage": 59.04, "elapsed_time": "0:57:34", "remaining_time": "0:39:56", "throughput": 4255.34, "total_tokens": 14700704} {"current_steps": 22535, "total_steps": 38160, "loss": 0.4354, "lr": 0.0004295258380687274, "epoch": 11.810796645702306, "percentage": 59.05, "elapsed_time": "0:57:35", "remaining_time": "0:39:55", "throughput": 4255.33, "total_tokens": 14703488} {"current_steps": 22540, "total_steps": 38160, "loss": 0.5048, "lr": 0.000429299442728937, "epoch": 11.81341719077568, "percentage": 59.07, "elapsed_time": "0:57:36", "remaining_time": "0:39:55", "throughput": 4255.38, "total_tokens": 14706752} {"current_steps": 22545, "total_steps": 38160, "loss": 0.3485, "lr": 0.0004290730621788967, "epoch": 11.816037735849056, "percentage": 59.08, "elapsed_time": "0:57:36", "remaining_time": "0:39:54", "throughput": 4255.45, "total_tokens": 14710176} {"current_steps": 22550, "total_steps": 38160, "loss": 0.5266, "lr": 0.0004288466964659625, "epoch": 11.818658280922431, "percentage": 59.09, "elapsed_time": "0:57:37", "remaining_time": "0:39:53", "throughput": 4255.49, "total_tokens": 14713376} {"current_steps": 22555, "total_steps": 38160, "loss": 0.4775, "lr": 0.0004286203456374877, "epoch": 11.821278825995806, "percentage": 59.11, "elapsed_time": "0:57:38", "remaining_time": "0:39:52", "throughput": 4255.56, "total_tokens": 14716864} {"current_steps": 22560, "total_steps": 38160, "loss": 0.3017, "lr": 0.0004283940097408224, "epoch": 11.823899371069182, "percentage": 59.12, "elapsed_time": "0:57:38", "remaining_time": "0:39:51", "throughput": 4255.57, "total_tokens": 14719776} {"current_steps": 22565, "total_steps": 38160, "loss": 0.4728, "lr": 0.00042816768882331324, "epoch": 11.826519916142558, "percentage": 59.13, "elapsed_time": "0:57:39", "remaining_time": "0:39:51", "throughput": 4255.8, "total_tokens": 14724512} {"current_steps": 22570, "total_steps": 38160, "loss": 0.4436, "lr": 0.000427941382932304, "epoch": 11.829140461215934, "percentage": 59.15, "elapsed_time": "0:57:40", "remaining_time": "0:39:50", "throughput": 4255.76, "total_tokens": 14727168} {"current_steps": 22575, "total_steps": 38160, "loss": 0.3258, "lr": 0.0004277150921151354, "epoch": 11.831761006289309, "percentage": 59.16, "elapsed_time": "0:57:41", "remaining_time": "0:39:49", "throughput": 4255.76, "total_tokens": 14730112} {"current_steps": 22580, "total_steps": 38160, "loss": 0.4424, "lr": 0.0004274888164191448, "epoch": 11.834381551362684, "percentage": 59.17, "elapsed_time": "0:57:41", "remaining_time": "0:39:48", "throughput": 4255.81, "total_tokens": 14733312} {"current_steps": 22585, "total_steps": 38160, "loss": 0.4505, "lr": 0.00042726255589166666, "epoch": 11.83700209643606, "percentage": 59.19, "elapsed_time": "0:57:42", "remaining_time": "0:39:47", "throughput": 4255.96, "total_tokens": 14737440} {"current_steps": 22590, "total_steps": 38160, "loss": 0.4736, "lr": 0.0004270363105800321, "epoch": 11.839622641509434, "percentage": 59.2, "elapsed_time": "0:57:43", "remaining_time": "0:39:47", "throughput": 4256.0, "total_tokens": 14740672} {"current_steps": 22595, "total_steps": 38160, "loss": 0.4578, "lr": 0.0004268100805315688, "epoch": 11.84224318658281, "percentage": 59.21, "elapsed_time": "0:57:44", "remaining_time": "0:39:46", "throughput": 4256.0, "total_tokens": 14743552} {"current_steps": 22600, "total_steps": 38160, "loss": 0.4449, "lr": 0.00042658386579360165, "epoch": 11.844863731656185, "percentage": 59.22, "elapsed_time": "0:57:44", "remaining_time": "0:39:45", "throughput": 4256.04, "total_tokens": 14746816} {"current_steps": 22605, "total_steps": 38160, "loss": 0.438, "lr": 0.00042635766641345213, "epoch": 11.84748427672956, "percentage": 59.24, "elapsed_time": "0:57:45", "remaining_time": "0:39:44", "throughput": 4256.04, "total_tokens": 14749696} {"current_steps": 22610, "total_steps": 38160, "loss": 0.6201, "lr": 0.0004261314824384388, "epoch": 11.850104821802935, "percentage": 59.25, "elapsed_time": "0:57:46", "remaining_time": "0:39:43", "throughput": 4256.14, "total_tokens": 14753376} {"current_steps": 22615, "total_steps": 38160, "loss": 0.5553, "lr": 0.00042590531391587666, "epoch": 11.85272536687631, "percentage": 59.26, "elapsed_time": "0:57:47", "remaining_time": "0:39:43", "throughput": 4256.17, "total_tokens": 14756576} {"current_steps": 22620, "total_steps": 38160, "loss": 0.465, "lr": 0.00042567916089307733, "epoch": 11.855345911949685, "percentage": 59.28, "elapsed_time": "0:57:47", "remaining_time": "0:39:42", "throughput": 4256.18, "total_tokens": 14759552} {"current_steps": 22625, "total_steps": 38160, "loss": 0.4774, "lr": 0.00042545302341734977, "epoch": 11.85796645702306, "percentage": 59.29, "elapsed_time": "0:57:48", "remaining_time": "0:39:41", "throughput": 4256.31, "total_tokens": 14763424} {"current_steps": 22630, "total_steps": 38160, "loss": 0.4655, "lr": 0.0004252269015359991, "epoch": 11.860587002096436, "percentage": 59.3, "elapsed_time": "0:57:49", "remaining_time": "0:39:40", "throughput": 4256.46, "total_tokens": 14767392} {"current_steps": 22635, "total_steps": 38160, "loss": 0.5425, "lr": 0.00042500079529632763, "epoch": 11.86320754716981, "percentage": 59.32, "elapsed_time": "0:57:50", "remaining_time": "0:39:40", "throughput": 4256.44, "total_tokens": 14770272} {"current_steps": 22640, "total_steps": 38160, "loss": 0.4454, "lr": 0.0004247747047456342, "epoch": 11.865828092243186, "percentage": 59.33, "elapsed_time": "0:57:50", "remaining_time": "0:39:39", "throughput": 4256.51, "total_tokens": 14773664} {"current_steps": 22645, "total_steps": 38160, "loss": 0.3499, "lr": 0.0004245486299312144, "epoch": 11.868448637316561, "percentage": 59.34, "elapsed_time": "0:57:51", "remaining_time": "0:39:38", "throughput": 4256.51, "total_tokens": 14776640} {"current_steps": 22650, "total_steps": 38160, "loss": 0.4691, "lr": 0.0004243225709003602, "epoch": 11.871069182389936, "percentage": 59.36, "elapsed_time": "0:57:52", "remaining_time": "0:39:37", "throughput": 4256.5, "total_tokens": 14779584} {"current_steps": 22655, "total_steps": 38160, "loss": 0.5427, "lr": 0.000424096527700361, "epoch": 11.873689727463312, "percentage": 59.37, "elapsed_time": "0:57:52", "remaining_time": "0:39:36", "throughput": 4256.54, "total_tokens": 14782784} {"current_steps": 22660, "total_steps": 38160, "loss": 0.6191, "lr": 0.0004238705003785021, "epoch": 11.876310272536688, "percentage": 59.38, "elapsed_time": "0:57:53", "remaining_time": "0:39:36", "throughput": 4256.71, "total_tokens": 14787040} {"current_steps": 22665, "total_steps": 38160, "loss": 0.455, "lr": 0.0004236444889820661, "epoch": 11.878930817610064, "percentage": 59.39, "elapsed_time": "0:57:54", "remaining_time": "0:39:35", "throughput": 4256.79, "total_tokens": 14790560} {"current_steps": 22670, "total_steps": 38160, "loss": 0.5027, "lr": 0.0004234184935583318, "epoch": 11.881551362683439, "percentage": 59.41, "elapsed_time": "0:57:55", "remaining_time": "0:39:34", "throughput": 4256.99, "total_tokens": 14794976} {"current_steps": 22675, "total_steps": 38160, "loss": 0.4681, "lr": 0.00042319251415457517, "epoch": 11.884171907756814, "percentage": 59.42, "elapsed_time": "0:57:56", "remaining_time": "0:39:33", "throughput": 4257.06, "total_tokens": 14798368} {"current_steps": 22680, "total_steps": 38160, "loss": 0.4236, "lr": 0.0004229665508180681, "epoch": 11.88679245283019, "percentage": 59.43, "elapsed_time": "0:57:56", "remaining_time": "0:39:33", "throughput": 4257.08, "total_tokens": 14801536} {"current_steps": 22685, "total_steps": 38160, "loss": 0.3399, "lr": 0.0004227406035960798, "epoch": 11.889412997903564, "percentage": 59.45, "elapsed_time": "0:57:57", "remaining_time": "0:39:32", "throughput": 4257.1, "total_tokens": 14804544} {"current_steps": 22690, "total_steps": 38160, "loss": 0.3305, "lr": 0.0004225146725358758, "epoch": 11.89203354297694, "percentage": 59.46, "elapsed_time": "0:57:58", "remaining_time": "0:39:31", "throughput": 4257.09, "total_tokens": 14807328} {"current_steps": 22695, "total_steps": 38160, "loss": 0.4008, "lr": 0.0004222887576847183, "epoch": 11.894654088050315, "percentage": 59.47, "elapsed_time": "0:57:58", "remaining_time": "0:39:30", "throughput": 4257.13, "total_tokens": 14810464} {"current_steps": 22700, "total_steps": 38160, "loss": 0.4954, "lr": 0.00042206285908986626, "epoch": 11.89727463312369, "percentage": 59.49, "elapsed_time": "0:57:59", "remaining_time": "0:39:29", "throughput": 4257.23, "total_tokens": 14814080} {"current_steps": 22705, "total_steps": 38160, "loss": 0.5774, "lr": 0.00042183697679857484, "epoch": 11.899895178197065, "percentage": 59.5, "elapsed_time": "0:58:00", "remaining_time": "0:39:29", "throughput": 4257.42, "total_tokens": 14818368} {"current_steps": 22710, "total_steps": 38160, "loss": 0.4135, "lr": 0.00042161111085809604, "epoch": 11.90251572327044, "percentage": 59.51, "elapsed_time": "0:58:01", "remaining_time": "0:39:28", "throughput": 4257.43, "total_tokens": 14821344} {"current_steps": 22715, "total_steps": 38160, "loss": 0.356, "lr": 0.00042138526131567855, "epoch": 11.905136268343815, "percentage": 59.53, "elapsed_time": "0:58:01", "remaining_time": "0:39:27", "throughput": 4257.45, "total_tokens": 14824352} {"current_steps": 22720, "total_steps": 38160, "loss": 0.4461, "lr": 0.0004211594282185677, "epoch": 11.90775681341719, "percentage": 59.54, "elapsed_time": "0:58:02", "remaining_time": "0:39:26", "throughput": 4257.65, "total_tokens": 14828704} {"current_steps": 22725, "total_steps": 38160, "loss": 0.4768, "lr": 0.0004209336116140048, "epoch": 11.910377358490566, "percentage": 59.55, "elapsed_time": "0:58:03", "remaining_time": "0:39:26", "throughput": 4257.62, "total_tokens": 14831456} {"current_steps": 22730, "total_steps": 38160, "loss": 0.4083, "lr": 0.00042070781154922857, "epoch": 11.91299790356394, "percentage": 59.56, "elapsed_time": "0:58:04", "remaining_time": "0:39:25", "throughput": 4257.55, "total_tokens": 14833856} {"current_steps": 22735, "total_steps": 38160, "loss": 0.309, "lr": 0.0004204820280714734, "epoch": 11.915618448637316, "percentage": 59.58, "elapsed_time": "0:58:04", "remaining_time": "0:39:24", "throughput": 4257.6, "total_tokens": 14837120} {"current_steps": 22740, "total_steps": 38160, "loss": 0.4435, "lr": 0.00042025626122797066, "epoch": 11.918238993710691, "percentage": 59.59, "elapsed_time": "0:58:05", "remaining_time": "0:39:23", "throughput": 4257.75, "total_tokens": 14841056} {"current_steps": 22745, "total_steps": 38160, "loss": 0.4415, "lr": 0.0004200305110659484, "epoch": 11.920859538784066, "percentage": 59.6, "elapsed_time": "0:58:06", "remaining_time": "0:39:22", "throughput": 4257.76, "total_tokens": 14844064} {"current_steps": 22750, "total_steps": 38160, "loss": 0.4565, "lr": 0.0004198047776326308, "epoch": 11.923480083857442, "percentage": 59.62, "elapsed_time": "0:58:06", "remaining_time": "0:39:21", "throughput": 4257.72, "total_tokens": 14846656} {"current_steps": 22755, "total_steps": 38160, "loss": 0.5028, "lr": 0.00041957906097523897, "epoch": 11.926100628930818, "percentage": 59.63, "elapsed_time": "0:58:07", "remaining_time": "0:39:21", "throughput": 4257.68, "total_tokens": 14849248} {"current_steps": 22760, "total_steps": 38160, "loss": 0.4526, "lr": 0.00041935336114099013, "epoch": 11.928721174004194, "percentage": 59.64, "elapsed_time": "0:58:08", "remaining_time": "0:39:20", "throughput": 4257.71, "total_tokens": 14852384} {"current_steps": 22765, "total_steps": 38160, "loss": 0.3801, "lr": 0.0004191276781770979, "epoch": 11.931341719077569, "percentage": 59.66, "elapsed_time": "0:58:08", "remaining_time": "0:39:19", "throughput": 4257.64, "total_tokens": 14854720} {"current_steps": 22770, "total_steps": 38160, "loss": 0.4557, "lr": 0.00041890201213077286, "epoch": 11.933962264150944, "percentage": 59.67, "elapsed_time": "0:58:09", "remaining_time": "0:39:18", "throughput": 4257.64, "total_tokens": 14857696} {"current_steps": 22775, "total_steps": 38160, "loss": 0.5389, "lr": 0.00041867636304922153, "epoch": 11.93658280922432, "percentage": 59.68, "elapsed_time": "0:58:10", "remaining_time": "0:39:17", "throughput": 4257.71, "total_tokens": 14861216} {"current_steps": 22780, "total_steps": 38160, "loss": 0.452, "lr": 0.00041845073097964737, "epoch": 11.939203354297694, "percentage": 59.7, "elapsed_time": "0:58:11", "remaining_time": "0:39:17", "throughput": 4257.71, "total_tokens": 14864064} {"current_steps": 22785, "total_steps": 38160, "loss": 0.4536, "lr": 0.0004182251159692498, "epoch": 11.94182389937107, "percentage": 59.71, "elapsed_time": "0:58:11", "remaining_time": "0:39:16", "throughput": 4257.68, "total_tokens": 14866784} {"current_steps": 22790, "total_steps": 38160, "loss": 0.3728, "lr": 0.0004179995180652253, "epoch": 11.944444444444445, "percentage": 59.72, "elapsed_time": "0:58:12", "remaining_time": "0:39:15", "throughput": 4257.67, "total_tokens": 14869664} {"current_steps": 22795, "total_steps": 38160, "loss": 0.4623, "lr": 0.00041777393731476587, "epoch": 11.94706498951782, "percentage": 59.74, "elapsed_time": "0:58:13", "remaining_time": "0:39:14", "throughput": 4257.69, "total_tokens": 14872640} {"current_steps": 22800, "total_steps": 38160, "loss": 0.4321, "lr": 0.0004175483737650608, "epoch": 11.949685534591195, "percentage": 59.75, "elapsed_time": "0:58:13", "remaining_time": "0:39:13", "throughput": 4257.81, "total_tokens": 14876512} {"current_steps": 22805, "total_steps": 38160, "loss": 0.5124, "lr": 0.0004173228274632951, "epoch": 11.95230607966457, "percentage": 59.76, "elapsed_time": "0:58:14", "remaining_time": "0:39:13", "throughput": 4257.87, "total_tokens": 14879776} {"current_steps": 22810, "total_steps": 38160, "loss": 0.3505, "lr": 0.00041709729845665084, "epoch": 11.954926624737945, "percentage": 59.77, "elapsed_time": "0:58:15", "remaining_time": "0:39:12", "throughput": 4257.98, "total_tokens": 14883552} {"current_steps": 22815, "total_steps": 38160, "loss": 0.4351, "lr": 0.0004168717867923061, "epoch": 11.95754716981132, "percentage": 59.79, "elapsed_time": "0:58:16", "remaining_time": "0:39:11", "throughput": 4257.91, "total_tokens": 14885984} {"current_steps": 22820, "total_steps": 38160, "loss": 0.4873, "lr": 0.00041664629251743487, "epoch": 11.960167714884696, "percentage": 59.8, "elapsed_time": "0:58:16", "remaining_time": "0:39:10", "throughput": 4257.92, "total_tokens": 14888992} {"current_steps": 22825, "total_steps": 38160, "loss": 0.4068, "lr": 0.0004164208156792084, "epoch": 11.96278825995807, "percentage": 59.81, "elapsed_time": "0:58:17", "remaining_time": "0:39:09", "throughput": 4257.89, "total_tokens": 14891744} {"current_steps": 22830, "total_steps": 38160, "loss": 0.5988, "lr": 0.00041619535632479374, "epoch": 11.965408805031446, "percentage": 59.83, "elapsed_time": "0:58:18", "remaining_time": "0:39:08", "throughput": 4257.92, "total_tokens": 14894880} {"current_steps": 22835, "total_steps": 38160, "loss": 0.4284, "lr": 0.00041596991450135445, "epoch": 11.968029350104821, "percentage": 59.84, "elapsed_time": "0:58:18", "remaining_time": "0:39:08", "throughput": 4257.9, "total_tokens": 14897760} {"current_steps": 22840, "total_steps": 38160, "loss": 0.4491, "lr": 0.0004157444902560504, "epoch": 11.970649895178196, "percentage": 59.85, "elapsed_time": "0:58:19", "remaining_time": "0:39:07", "throughput": 4257.91, "total_tokens": 14900736} {"current_steps": 22845, "total_steps": 38160, "loss": 0.4006, "lr": 0.00041551908363603786, "epoch": 11.973270440251572, "percentage": 59.87, "elapsed_time": "0:58:20", "remaining_time": "0:39:06", "throughput": 4258.04, "total_tokens": 14904544} {"current_steps": 22850, "total_steps": 38160, "loss": 0.5122, "lr": 0.00041529369468846914, "epoch": 11.975890985324948, "percentage": 59.88, "elapsed_time": "0:58:21", "remaining_time": "0:39:05", "throughput": 4258.07, "total_tokens": 14907648} {"current_steps": 22855, "total_steps": 38160, "loss": 0.3354, "lr": 0.00041506832346049303, "epoch": 11.978511530398324, "percentage": 59.89, "elapsed_time": "0:58:21", "remaining_time": "0:39:04", "throughput": 4258.1, "total_tokens": 14910816} {"current_steps": 22860, "total_steps": 38160, "loss": 0.3654, "lr": 0.00041484296999925476, "epoch": 11.981132075471699, "percentage": 59.91, "elapsed_time": "0:58:22", "remaining_time": "0:39:04", "throughput": 4258.08, "total_tokens": 14913632} {"current_steps": 22865, "total_steps": 38160, "loss": 0.443, "lr": 0.00041461763435189555, "epoch": 11.983752620545074, "percentage": 59.92, "elapsed_time": "0:58:23", "remaining_time": "0:39:03", "throughput": 4258.1, "total_tokens": 14916768} {"current_steps": 22870, "total_steps": 38160, "loss": 0.3665, "lr": 0.00041439231656555315, "epoch": 11.98637316561845, "percentage": 59.93, "elapsed_time": "0:58:23", "remaining_time": "0:39:02", "throughput": 4258.27, "total_tokens": 14920896} {"current_steps": 22875, "total_steps": 38160, "loss": 0.4037, "lr": 0.0004141670166873617, "epoch": 11.988993710691824, "percentage": 59.94, "elapsed_time": "0:58:24", "remaining_time": "0:39:01", "throughput": 4258.32, "total_tokens": 14924192} {"current_steps": 22880, "total_steps": 38160, "loss": 0.4526, "lr": 0.00041394173476445097, "epoch": 11.9916142557652, "percentage": 59.96, "elapsed_time": "0:58:25", "remaining_time": "0:39:00", "throughput": 4258.28, "total_tokens": 14926784} {"current_steps": 22885, "total_steps": 38160, "loss": 0.499, "lr": 0.00041371647084394744, "epoch": 11.994234800838575, "percentage": 59.97, "elapsed_time": "0:58:26", "remaining_time": "0:39:00", "throughput": 4258.36, "total_tokens": 14930432} {"current_steps": 22890, "total_steps": 38160, "loss": 0.5295, "lr": 0.00041349122497297394, "epoch": 11.99685534591195, "percentage": 59.98, "elapsed_time": "0:58:26", "remaining_time": "0:38:59", "throughput": 4258.4, "total_tokens": 14933664} {"current_steps": 22895, "total_steps": 38160, "loss": 0.4353, "lr": 0.0004132659971986491, "epoch": 11.999475890985325, "percentage": 60.0, "elapsed_time": "0:58:27", "remaining_time": "0:38:58", "throughput": 4258.48, "total_tokens": 14937088} {"current_steps": 22896, "total_steps": 38160, "eval_loss": 0.45972055196762085, "epoch": 12.0, "percentage": 60.0, "elapsed_time": "0:58:41", "remaining_time": "0:39:07", "throughput": 4241.88, "total_tokens": 14937216} {"current_steps": 22900, "total_steps": 38160, "loss": 0.4365, "lr": 0.00041304078756808837, "epoch": 12.0020964360587, "percentage": 60.01, "elapsed_time": "0:58:43", "remaining_time": "0:39:07", "throughput": 4240.07, "total_tokens": 14939712} {"current_steps": 22905, "total_steps": 38160, "loss": 0.461, "lr": 0.0004128155961284027, "epoch": 12.004716981132075, "percentage": 60.02, "elapsed_time": "0:58:44", "remaining_time": "0:39:07", "throughput": 4240.03, "total_tokens": 14942272} {"current_steps": 22910, "total_steps": 38160, "loss": 0.5216, "lr": 0.0004125904229266996, "epoch": 12.00733752620545, "percentage": 60.04, "elapsed_time": "0:58:44", "remaining_time": "0:39:06", "throughput": 4240.09, "total_tokens": 14945632} {"current_steps": 22915, "total_steps": 38160, "loss": 0.6418, "lr": 0.0004123652680100828, "epoch": 12.009958071278826, "percentage": 60.05, "elapsed_time": "0:58:45", "remaining_time": "0:39:05", "throughput": 4240.21, "total_tokens": 14949376} {"current_steps": 22920, "total_steps": 38160, "loss": 0.4902, "lr": 0.0004121401314256521, "epoch": 12.0125786163522, "percentage": 60.06, "elapsed_time": "0:58:46", "remaining_time": "0:39:04", "throughput": 4240.15, "total_tokens": 14951840} {"current_steps": 22925, "total_steps": 38160, "loss": 0.3243, "lr": 0.00041191501322050363, "epoch": 12.015199161425576, "percentage": 60.08, "elapsed_time": "0:58:47", "remaining_time": "0:39:04", "throughput": 4240.41, "total_tokens": 14956768} {"current_steps": 22930, "total_steps": 38160, "loss": 0.3588, "lr": 0.0004116899134417296, "epoch": 12.017819706498951, "percentage": 60.09, "elapsed_time": "0:58:47", "remaining_time": "0:39:03", "throughput": 4240.51, "total_tokens": 14960384} {"current_steps": 22935, "total_steps": 38160, "loss": 0.3649, "lr": 0.00041146483213641793, "epoch": 12.020440251572326, "percentage": 60.1, "elapsed_time": "0:58:48", "remaining_time": "0:39:02", "throughput": 4240.52, "total_tokens": 14963392} {"current_steps": 22940, "total_steps": 38160, "loss": 0.4234, "lr": 0.00041123976935165355, "epoch": 12.023060796645701, "percentage": 60.12, "elapsed_time": "0:58:49", "remaining_time": "0:39:01", "throughput": 4240.67, "total_tokens": 14967392} {"current_steps": 22945, "total_steps": 38160, "loss": 0.432, "lr": 0.0004110147251345165, "epoch": 12.025681341719078, "percentage": 60.13, "elapsed_time": "0:58:50", "remaining_time": "0:39:01", "throughput": 4240.98, "total_tokens": 14972704} {"current_steps": 22950, "total_steps": 38160, "loss": 0.383, "lr": 0.0004107896995320839, "epoch": 12.028301886792454, "percentage": 60.14, "elapsed_time": "0:58:51", "remaining_time": "0:39:00", "throughput": 4240.99, "total_tokens": 14975744} {"current_steps": 22955, "total_steps": 38160, "loss": 0.4466, "lr": 0.0004105646925914284, "epoch": 12.030922431865829, "percentage": 60.15, "elapsed_time": "0:58:51", "remaining_time": "0:38:59", "throughput": 4241.05, "total_tokens": 14979104} {"current_steps": 22960, "total_steps": 38160, "loss": 0.5187, "lr": 0.00041033970435961904, "epoch": 12.033542976939204, "percentage": 60.17, "elapsed_time": "0:58:52", "remaining_time": "0:38:58", "throughput": 4241.0, "total_tokens": 14981600} {"current_steps": 22965, "total_steps": 38160, "loss": 0.4048, "lr": 0.00041011473488372044, "epoch": 12.036163522012579, "percentage": 60.18, "elapsed_time": "0:58:53", "remaining_time": "0:38:57", "throughput": 4241.09, "total_tokens": 14985152} {"current_steps": 22970, "total_steps": 38160, "loss": 0.3256, "lr": 0.0004098897842107939, "epoch": 12.038784067085954, "percentage": 60.19, "elapsed_time": "0:58:54", "remaining_time": "0:38:57", "throughput": 4241.28, "total_tokens": 14989568} {"current_steps": 22975, "total_steps": 38160, "loss": 0.4446, "lr": 0.00040966485238789634, "epoch": 12.04140461215933, "percentage": 60.21, "elapsed_time": "0:58:54", "remaining_time": "0:38:56", "throughput": 4241.29, "total_tokens": 14992352} {"current_steps": 22980, "total_steps": 38160, "loss": 0.3498, "lr": 0.00040943993946208126, "epoch": 12.044025157232705, "percentage": 60.22, "elapsed_time": "0:58:55", "remaining_time": "0:38:55", "throughput": 4241.27, "total_tokens": 14995168} {"current_steps": 22985, "total_steps": 38160, "loss": 0.5716, "lr": 0.00040921504548039765, "epoch": 12.04664570230608, "percentage": 60.23, "elapsed_time": "0:58:56", "remaining_time": "0:38:54", "throughput": 4241.29, "total_tokens": 14998240} {"current_steps": 22990, "total_steps": 38160, "loss": 0.4735, "lr": 0.00040899017048989073, "epoch": 12.049266247379455, "percentage": 60.25, "elapsed_time": "0:58:56", "remaining_time": "0:38:53", "throughput": 4241.3, "total_tokens": 15001248} {"current_steps": 22995, "total_steps": 38160, "loss": 0.5159, "lr": 0.00040876531453760186, "epoch": 12.05188679245283, "percentage": 60.26, "elapsed_time": "0:58:57", "remaining_time": "0:38:53", "throughput": 4241.33, "total_tokens": 15004352} {"current_steps": 23000, "total_steps": 38160, "loss": 0.3923, "lr": 0.00040854047767056824, "epoch": 12.054507337526205, "percentage": 60.27, "elapsed_time": "0:58:58", "remaining_time": "0:38:52", "throughput": 4241.43, "total_tokens": 15007968} {"current_steps": 23005, "total_steps": 38160, "loss": 0.3887, "lr": 0.00040831565993582335, "epoch": 12.05712788259958, "percentage": 60.29, "elapsed_time": "0:58:59", "remaining_time": "0:38:51", "throughput": 4241.54, "total_tokens": 15011648} {"current_steps": 23010, "total_steps": 38160, "loss": 0.4027, "lr": 0.0004080908613803964, "epoch": 12.059748427672956, "percentage": 60.3, "elapsed_time": "0:58:59", "remaining_time": "0:38:50", "throughput": 4241.48, "total_tokens": 15014176} {"current_steps": 23015, "total_steps": 38160, "loss": 0.4793, "lr": 0.0004078660820513128, "epoch": 12.06236897274633, "percentage": 60.31, "elapsed_time": "0:59:00", "remaining_time": "0:38:49", "throughput": 4241.5, "total_tokens": 15017184} {"current_steps": 23020, "total_steps": 38160, "loss": 0.3679, "lr": 0.0004076413219955937, "epoch": 12.064989517819706, "percentage": 60.32, "elapsed_time": "0:59:01", "remaining_time": "0:38:49", "throughput": 4241.55, "total_tokens": 15020416} {"current_steps": 23025, "total_steps": 38160, "loss": 0.3905, "lr": 0.00040741658126025614, "epoch": 12.067610062893081, "percentage": 60.34, "elapsed_time": "0:59:02", "remaining_time": "0:38:48", "throughput": 4241.76, "total_tokens": 15024800} {"current_steps": 23030, "total_steps": 38160, "loss": 0.3399, "lr": 0.0004071918598923136, "epoch": 12.070230607966456, "percentage": 60.35, "elapsed_time": "0:59:02", "remaining_time": "0:38:47", "throughput": 4241.72, "total_tokens": 15027456} {"current_steps": 23035, "total_steps": 38160, "loss": 0.5479, "lr": 0.0004069671579387753, "epoch": 12.072851153039831, "percentage": 60.36, "elapsed_time": "0:59:03", "remaining_time": "0:38:46", "throughput": 4241.7, "total_tokens": 15030208} {"current_steps": 23040, "total_steps": 38160, "loss": 0.3814, "lr": 0.000406742475446646, "epoch": 12.075471698113208, "percentage": 60.38, "elapsed_time": "0:59:04", "remaining_time": "0:38:45", "throughput": 4241.69, "total_tokens": 15033120} {"current_steps": 23045, "total_steps": 38160, "loss": 0.4861, "lr": 0.0004065178124629272, "epoch": 12.078092243186584, "percentage": 60.39, "elapsed_time": "0:59:04", "remaining_time": "0:38:45", "throughput": 4241.81, "total_tokens": 15036960} {"current_steps": 23050, "total_steps": 38160, "loss": 0.4285, "lr": 0.0004062931690346153, "epoch": 12.080712788259959, "percentage": 60.4, "elapsed_time": "0:59:05", "remaining_time": "0:38:44", "throughput": 4241.96, "total_tokens": 15040992} {"current_steps": 23055, "total_steps": 38160, "loss": 0.4371, "lr": 0.0004060685452087034, "epoch": 12.083333333333334, "percentage": 60.42, "elapsed_time": "0:59:06", "remaining_time": "0:38:43", "throughput": 4241.98, "total_tokens": 15044096} {"current_steps": 23060, "total_steps": 38160, "loss": 0.4651, "lr": 0.00040584394103218026, "epoch": 12.085953878406709, "percentage": 60.43, "elapsed_time": "0:59:07", "remaining_time": "0:38:42", "throughput": 4242.07, "total_tokens": 15047680} {"current_steps": 23065, "total_steps": 38160, "loss": 0.3653, "lr": 0.0004056193565520304, "epoch": 12.088574423480084, "percentage": 60.44, "elapsed_time": "0:59:08", "remaining_time": "0:38:42", "throughput": 4242.16, "total_tokens": 15051328} {"current_steps": 23070, "total_steps": 38160, "loss": 0.3715, "lr": 0.0004053947918152344, "epoch": 12.09119496855346, "percentage": 60.46, "elapsed_time": "0:59:08", "remaining_time": "0:38:41", "throughput": 4242.21, "total_tokens": 15054560} {"current_steps": 23075, "total_steps": 38160, "loss": 0.4491, "lr": 0.0004051702468687688, "epoch": 12.093815513626835, "percentage": 60.47, "elapsed_time": "0:59:09", "remaining_time": "0:38:40", "throughput": 4242.29, "total_tokens": 15057888} {"current_steps": 23080, "total_steps": 38160, "loss": 0.4924, "lr": 0.0004049457217596055, "epoch": 12.09643605870021, "percentage": 60.48, "elapsed_time": "0:59:10", "remaining_time": "0:38:39", "throughput": 4242.33, "total_tokens": 15061120} {"current_steps": 23085, "total_steps": 38160, "loss": 0.4407, "lr": 0.0004047212165347129, "epoch": 12.099056603773585, "percentage": 60.5, "elapsed_time": "0:59:10", "remaining_time": "0:38:38", "throughput": 4242.36, "total_tokens": 15064224} {"current_steps": 23090, "total_steps": 38160, "loss": 0.4178, "lr": 0.00040449673124105464, "epoch": 12.10167714884696, "percentage": 60.51, "elapsed_time": "0:59:11", "remaining_time": "0:38:38", "throughput": 4242.4, "total_tokens": 15067360} {"current_steps": 23095, "total_steps": 38160, "loss": 0.3697, "lr": 0.00040427226592559064, "epoch": 12.104297693920335, "percentage": 60.52, "elapsed_time": "0:59:12", "remaining_time": "0:38:37", "throughput": 4242.45, "total_tokens": 15070688} {"current_steps": 23100, "total_steps": 38160, "loss": 0.421, "lr": 0.00040404782063527684, "epoch": 12.10691823899371, "percentage": 60.53, "elapsed_time": "0:59:13", "remaining_time": "0:38:36", "throughput": 4242.53, "total_tokens": 15074304} {"current_steps": 23105, "total_steps": 38160, "loss": 0.4695, "lr": 0.00040382339541706393, "epoch": 12.109538784067086, "percentage": 60.55, "elapsed_time": "0:59:13", "remaining_time": "0:38:35", "throughput": 4242.47, "total_tokens": 15076768} {"current_steps": 23110, "total_steps": 38160, "loss": 0.4235, "lr": 0.0004035989903178995, "epoch": 12.11215932914046, "percentage": 60.56, "elapsed_time": "0:59:14", "remaining_time": "0:38:34", "throughput": 4242.41, "total_tokens": 15079232} {"current_steps": 23115, "total_steps": 38160, "loss": 0.356, "lr": 0.0004033746053847266, "epoch": 12.114779874213836, "percentage": 60.57, "elapsed_time": "0:59:15", "remaining_time": "0:38:33", "throughput": 4242.48, "total_tokens": 15082688} {"current_steps": 23120, "total_steps": 38160, "loss": 0.3729, "lr": 0.00040315024066448374, "epoch": 12.117400419287211, "percentage": 60.59, "elapsed_time": "0:59:15", "remaining_time": "0:38:33", "throughput": 4242.57, "total_tokens": 15086400} {"current_steps": 23125, "total_steps": 38160, "loss": 0.3867, "lr": 0.00040292589620410577, "epoch": 12.120020964360586, "percentage": 60.6, "elapsed_time": "0:59:16", "remaining_time": "0:38:32", "throughput": 4242.55, "total_tokens": 15089184} {"current_steps": 23130, "total_steps": 38160, "loss": 0.331, "lr": 0.0004027015720505229, "epoch": 12.122641509433961, "percentage": 60.61, "elapsed_time": "0:59:17", "remaining_time": "0:38:31", "throughput": 4242.58, "total_tokens": 15092384} {"current_steps": 23135, "total_steps": 38160, "loss": 0.4275, "lr": 0.0004024772682506609, "epoch": 12.125262054507338, "percentage": 60.63, "elapsed_time": "0:59:18", "remaining_time": "0:38:30", "throughput": 4242.64, "total_tokens": 15095776} {"current_steps": 23140, "total_steps": 38160, "loss": 0.5171, "lr": 0.0004022529848514419, "epoch": 12.127882599580714, "percentage": 60.64, "elapsed_time": "0:59:18", "remaining_time": "0:38:29", "throughput": 4242.63, "total_tokens": 15098624} {"current_steps": 23145, "total_steps": 38160, "loss": 0.4417, "lr": 0.00040202872189978324, "epoch": 12.130503144654089, "percentage": 60.65, "elapsed_time": "0:59:19", "remaining_time": "0:38:29", "throughput": 4242.55, "total_tokens": 15100992} {"current_steps": 23150, "total_steps": 38160, "loss": 0.339, "lr": 0.0004018044794425983, "epoch": 12.133123689727464, "percentage": 60.67, "elapsed_time": "0:59:20", "remaining_time": "0:38:28", "throughput": 4242.59, "total_tokens": 15104352} {"current_steps": 23155, "total_steps": 38160, "loss": 0.4115, "lr": 0.00040158025752679596, "epoch": 12.135744234800839, "percentage": 60.68, "elapsed_time": "0:59:20", "remaining_time": "0:38:27", "throughput": 4242.59, "total_tokens": 15107200} {"current_steps": 23160, "total_steps": 38160, "loss": 0.5506, "lr": 0.0004013560561992811, "epoch": 12.138364779874214, "percentage": 60.69, "elapsed_time": "0:59:21", "remaining_time": "0:38:26", "throughput": 4242.71, "total_tokens": 15111008} {"current_steps": 23165, "total_steps": 38160, "loss": 0.4476, "lr": 0.0004011318755069537, "epoch": 12.14098532494759, "percentage": 60.7, "elapsed_time": "0:59:22", "remaining_time": "0:38:25", "throughput": 4242.65, "total_tokens": 15113440} {"current_steps": 23170, "total_steps": 38160, "loss": 0.43, "lr": 0.00040090771549670994, "epoch": 12.143605870020965, "percentage": 60.72, "elapsed_time": "0:59:22", "remaining_time": "0:38:25", "throughput": 4242.63, "total_tokens": 15116256} {"current_steps": 23175, "total_steps": 38160, "loss": 0.4576, "lr": 0.00040068357621544167, "epoch": 12.14622641509434, "percentage": 60.73, "elapsed_time": "0:59:23", "remaining_time": "0:38:24", "throughput": 4242.65, "total_tokens": 15119296} {"current_steps": 23180, "total_steps": 38160, "loss": 0.3395, "lr": 0.00040045945771003625, "epoch": 12.148846960167715, "percentage": 60.74, "elapsed_time": "0:59:24", "remaining_time": "0:38:23", "throughput": 4242.82, "total_tokens": 15123584} {"current_steps": 23185, "total_steps": 38160, "loss": 0.4197, "lr": 0.0004002353600273767, "epoch": 12.15146750524109, "percentage": 60.76, "elapsed_time": "0:59:25", "remaining_time": "0:38:22", "throughput": 4242.89, "total_tokens": 15127008} {"current_steps": 23190, "total_steps": 38160, "loss": 0.4162, "lr": 0.0004000112832143415, "epoch": 12.154088050314465, "percentage": 60.77, "elapsed_time": "0:59:25", "remaining_time": "0:38:21", "throughput": 4242.87, "total_tokens": 15129728} {"current_steps": 23195, "total_steps": 38160, "loss": 0.479, "lr": 0.00039978722731780523, "epoch": 12.15670859538784, "percentage": 60.78, "elapsed_time": "0:59:26", "remaining_time": "0:38:21", "throughput": 4242.94, "total_tokens": 15133152} {"current_steps": 23200, "total_steps": 38160, "loss": 0.4822, "lr": 0.00039956319238463754, "epoch": 12.159329140461216, "percentage": 60.8, "elapsed_time": "0:59:27", "remaining_time": "0:38:20", "throughput": 4243.05, "total_tokens": 15136960} {"current_steps": 23205, "total_steps": 38160, "loss": 0.4559, "lr": 0.00039933917846170436, "epoch": 12.16194968553459, "percentage": 60.81, "elapsed_time": "0:59:28", "remaining_time": "0:38:19", "throughput": 4243.1, "total_tokens": 15140128} {"current_steps": 23210, "total_steps": 38160, "loss": 0.4251, "lr": 0.0003991151855958665, "epoch": 12.164570230607966, "percentage": 60.82, "elapsed_time": "0:59:29", "remaining_time": "0:38:18", "throughput": 4243.23, "total_tokens": 15144128} {"current_steps": 23215, "total_steps": 38160, "loss": 0.448, "lr": 0.00039889121383398113, "epoch": 12.167190775681341, "percentage": 60.84, "elapsed_time": "0:59:29", "remaining_time": "0:38:18", "throughput": 4243.37, "total_tokens": 15147968} {"current_steps": 23220, "total_steps": 38160, "loss": 0.3529, "lr": 0.00039866726322290014, "epoch": 12.169811320754716, "percentage": 60.85, "elapsed_time": "0:59:30", "remaining_time": "0:38:17", "throughput": 4243.38, "total_tokens": 15150976} {"current_steps": 23225, "total_steps": 38160, "loss": 0.6012, "lr": 0.0003984433338094715, "epoch": 12.172431865828091, "percentage": 60.86, "elapsed_time": "0:59:31", "remaining_time": "0:38:16", "throughput": 4243.44, "total_tokens": 15154368} {"current_steps": 23230, "total_steps": 38160, "loss": 0.4658, "lr": 0.000398219425640539, "epoch": 12.175052410901468, "percentage": 60.88, "elapsed_time": "0:59:32", "remaining_time": "0:38:15", "throughput": 4243.53, "total_tokens": 15157984} {"current_steps": 23235, "total_steps": 38160, "loss": 0.5087, "lr": 0.0003979955387629413, "epoch": 12.177672955974844, "percentage": 60.89, "elapsed_time": "0:59:32", "remaining_time": "0:38:15", "throughput": 4243.69, "total_tokens": 15162208} {"current_steps": 23240, "total_steps": 38160, "loss": 0.4283, "lr": 0.0003977716732235133, "epoch": 12.180293501048219, "percentage": 60.9, "elapsed_time": "0:59:33", "remaining_time": "0:38:14", "throughput": 4243.7, "total_tokens": 15165088} {"current_steps": 23245, "total_steps": 38160, "loss": 0.3354, "lr": 0.000397547829069085, "epoch": 12.182914046121594, "percentage": 60.91, "elapsed_time": "0:59:34", "remaining_time": "0:38:13", "throughput": 4243.59, "total_tokens": 15167200} {"current_steps": 23250, "total_steps": 38160, "loss": 0.4986, "lr": 0.000397324006346482, "epoch": 12.185534591194969, "percentage": 60.93, "elapsed_time": "0:59:34", "remaining_time": "0:38:12", "throughput": 4243.62, "total_tokens": 15170304} {"current_steps": 23255, "total_steps": 38160, "loss": 0.4516, "lr": 0.0003971002051025253, "epoch": 12.188155136268344, "percentage": 60.94, "elapsed_time": "0:59:35", "remaining_time": "0:38:11", "throughput": 4243.58, "total_tokens": 15173024} {"current_steps": 23260, "total_steps": 38160, "loss": 0.5371, "lr": 0.000396876425384032, "epoch": 12.19077568134172, "percentage": 60.95, "elapsed_time": "0:59:36", "remaining_time": "0:38:10", "throughput": 4243.72, "total_tokens": 15176960} {"current_steps": 23265, "total_steps": 38160, "loss": 0.4434, "lr": 0.00039665266723781377, "epoch": 12.193396226415095, "percentage": 60.97, "elapsed_time": "0:59:37", "remaining_time": "0:38:10", "throughput": 4244.26, "total_tokens": 15184576} {"current_steps": 23270, "total_steps": 38160, "loss": 0.4765, "lr": 0.00039642893071067877, "epoch": 12.19601677148847, "percentage": 60.98, "elapsed_time": "0:59:38", "remaining_time": "0:38:09", "throughput": 4244.3, "total_tokens": 15187840} {"current_steps": 23275, "total_steps": 38160, "loss": 0.3812, "lr": 0.0003962052158494298, "epoch": 12.198637316561845, "percentage": 60.99, "elapsed_time": "0:59:39", "remaining_time": "0:38:08", "throughput": 4244.36, "total_tokens": 15191072} {"current_steps": 23280, "total_steps": 38160, "loss": 0.4022, "lr": 0.00039598152270086534, "epoch": 12.20125786163522, "percentage": 61.01, "elapsed_time": "0:59:39", "remaining_time": "0:38:08", "throughput": 4244.43, "total_tokens": 15194592} {"current_steps": 23285, "total_steps": 38160, "loss": 0.4183, "lr": 0.00039575785131177975, "epoch": 12.203878406708595, "percentage": 61.02, "elapsed_time": "0:59:40", "remaining_time": "0:38:07", "throughput": 4244.54, "total_tokens": 15198240} {"current_steps": 23290, "total_steps": 38160, "loss": 0.4754, "lr": 0.0003955342017289624, "epoch": 12.20649895178197, "percentage": 61.03, "elapsed_time": "0:59:41", "remaining_time": "0:38:06", "throughput": 4244.52, "total_tokens": 15201056} {"current_steps": 23295, "total_steps": 38160, "loss": 0.4722, "lr": 0.0003953105739991982, "epoch": 12.209119496855346, "percentage": 61.05, "elapsed_time": "0:59:42", "remaining_time": "0:38:05", "throughput": 4244.56, "total_tokens": 15204320} {"current_steps": 23300, "total_steps": 38160, "loss": 0.4227, "lr": 0.0003950869681692678, "epoch": 12.21174004192872, "percentage": 61.06, "elapsed_time": "0:59:42", "remaining_time": "0:38:04", "throughput": 4244.58, "total_tokens": 15207264} {"current_steps": 23305, "total_steps": 38160, "loss": 0.3438, "lr": 0.0003948633842859465, "epoch": 12.214360587002096, "percentage": 61.07, "elapsed_time": "0:59:43", "remaining_time": "0:38:04", "throughput": 4244.57, "total_tokens": 15210112} {"current_steps": 23310, "total_steps": 38160, "loss": 0.3426, "lr": 0.00039463982239600575, "epoch": 12.216981132075471, "percentage": 61.08, "elapsed_time": "0:59:44", "remaining_time": "0:38:03", "throughput": 4244.64, "total_tokens": 15213504} {"current_steps": 23315, "total_steps": 38160, "loss": 0.458, "lr": 0.00039441628254621215, "epoch": 12.219601677148846, "percentage": 61.1, "elapsed_time": "0:59:44", "remaining_time": "0:38:02", "throughput": 4244.56, "total_tokens": 15215808} {"current_steps": 23320, "total_steps": 38160, "loss": 0.5023, "lr": 0.00039419276478332773, "epoch": 12.222222222222221, "percentage": 61.11, "elapsed_time": "0:59:45", "remaining_time": "0:38:01", "throughput": 4244.5, "total_tokens": 15218304} {"current_steps": 23325, "total_steps": 38160, "loss": 0.5874, "lr": 0.0003939692691541097, "epoch": 12.224842767295598, "percentage": 61.12, "elapsed_time": "0:59:46", "remaining_time": "0:38:00", "throughput": 4244.48, "total_tokens": 15221024} {"current_steps": 23330, "total_steps": 38160, "loss": 0.4286, "lr": 0.00039374579570531114, "epoch": 12.227463312368974, "percentage": 61.14, "elapsed_time": "0:59:46", "remaining_time": "0:37:59", "throughput": 4244.47, "total_tokens": 15223872} {"current_steps": 23335, "total_steps": 38160, "loss": 0.3845, "lr": 0.0003935223444836797, "epoch": 12.230083857442349, "percentage": 61.15, "elapsed_time": "0:59:47", "remaining_time": "0:37:59", "throughput": 4244.52, "total_tokens": 15227168} {"current_steps": 23340, "total_steps": 38160, "loss": 0.44, "lr": 0.0003932989155359591, "epoch": 12.232704402515724, "percentage": 61.16, "elapsed_time": "0:59:48", "remaining_time": "0:37:58", "throughput": 4244.61, "total_tokens": 15230816} {"current_steps": 23345, "total_steps": 38160, "loss": 0.4287, "lr": 0.000393075508908888, "epoch": 12.235324947589099, "percentage": 61.18, "elapsed_time": "0:59:48", "remaining_time": "0:37:57", "throughput": 4244.59, "total_tokens": 15233568} {"current_steps": 23350, "total_steps": 38160, "loss": 0.3287, "lr": 0.00039285212464920064, "epoch": 12.237945492662474, "percentage": 61.19, "elapsed_time": "0:59:49", "remaining_time": "0:37:56", "throughput": 4244.53, "total_tokens": 15236064} {"current_steps": 23355, "total_steps": 38160, "loss": 0.3825, "lr": 0.0003926287628036265, "epoch": 12.24056603773585, "percentage": 61.2, "elapsed_time": "0:59:50", "remaining_time": "0:37:55", "throughput": 4244.56, "total_tokens": 15239168} {"current_steps": 23360, "total_steps": 38160, "loss": 0.393, "lr": 0.00039240542341889003, "epoch": 12.243186582809225, "percentage": 61.22, "elapsed_time": "0:59:50", "remaining_time": "0:37:55", "throughput": 4244.56, "total_tokens": 15241984} {"current_steps": 23365, "total_steps": 38160, "loss": 0.4415, "lr": 0.0003921821065417116, "epoch": 12.2458071278826, "percentage": 61.23, "elapsed_time": "0:59:51", "remaining_time": "0:37:54", "throughput": 4244.55, "total_tokens": 15244800} {"current_steps": 23370, "total_steps": 38160, "loss": 0.362, "lr": 0.0003919588122188063, "epoch": 12.248427672955975, "percentage": 61.24, "elapsed_time": "0:59:52", "remaining_time": "0:37:53", "throughput": 4244.65, "total_tokens": 15248416} {"current_steps": 23375, "total_steps": 38160, "loss": 0.4136, "lr": 0.000391735540496885, "epoch": 12.25104821802935, "percentage": 61.26, "elapsed_time": "0:59:53", "remaining_time": "0:37:52", "throughput": 4244.62, "total_tokens": 15251008} {"current_steps": 23380, "total_steps": 38160, "loss": 0.4758, "lr": 0.00039151229142265337, "epoch": 12.253668763102725, "percentage": 61.27, "elapsed_time": "0:59:54", "remaining_time": "0:37:52", "throughput": 4244.96, "total_tokens": 15256992} {"current_steps": 23385, "total_steps": 38160, "loss": 0.3518, "lr": 0.00039128906504281295, "epoch": 12.2562893081761, "percentage": 61.28, "elapsed_time": "0:59:54", "remaining_time": "0:37:51", "throughput": 4244.96, "total_tokens": 15259712} {"current_steps": 23390, "total_steps": 38160, "loss": 0.5392, "lr": 0.00039106586140405964, "epoch": 12.258909853249476, "percentage": 61.29, "elapsed_time": "0:59:55", "remaining_time": "0:37:50", "throughput": 4245.0, "total_tokens": 15262880} {"current_steps": 23395, "total_steps": 38160, "loss": 0.448, "lr": 0.00039084268055308537, "epoch": 12.26153039832285, "percentage": 61.31, "elapsed_time": "0:59:56", "remaining_time": "0:37:49", "throughput": 4245.04, "total_tokens": 15266048} {"current_steps": 23400, "total_steps": 38160, "loss": 0.4583, "lr": 0.00039061952253657703, "epoch": 12.264150943396226, "percentage": 61.32, "elapsed_time": "0:59:56", "remaining_time": "0:37:48", "throughput": 4245.04, "total_tokens": 15268928} {"current_steps": 23405, "total_steps": 38160, "loss": 0.5595, "lr": 0.0003903963874012166, "epoch": 12.266771488469601, "percentage": 61.33, "elapsed_time": "0:59:57", "remaining_time": "0:37:47", "throughput": 4245.04, "total_tokens": 15271872} {"current_steps": 23410, "total_steps": 38160, "loss": 0.4636, "lr": 0.0003901732751936815, "epoch": 12.269392033542976, "percentage": 61.35, "elapsed_time": "0:59:58", "remaining_time": "0:37:47", "throughput": 4245.29, "total_tokens": 15276704} {"current_steps": 23415, "total_steps": 38160, "loss": 0.4146, "lr": 0.00038995018596064447, "epoch": 12.272012578616351, "percentage": 61.36, "elapsed_time": "0:59:59", "remaining_time": "0:37:46", "throughput": 4245.3, "total_tokens": 15279648} {"current_steps": 23420, "total_steps": 38160, "loss": 0.4293, "lr": 0.00038972711974877294, "epoch": 12.274633123689728, "percentage": 61.37, "elapsed_time": "0:59:59", "remaining_time": "0:37:45", "throughput": 4245.25, "total_tokens": 15282176} {"current_steps": 23425, "total_steps": 38160, "loss": 0.3889, "lr": 0.0003895040766047298, "epoch": 12.277253668763104, "percentage": 61.39, "elapsed_time": "1:00:00", "remaining_time": "0:37:44", "throughput": 4245.2, "total_tokens": 15284640} {"current_steps": 23430, "total_steps": 38160, "loss": 0.3998, "lr": 0.0003892810565751733, "epoch": 12.279874213836479, "percentage": 61.4, "elapsed_time": "1:00:01", "remaining_time": "0:37:43", "throughput": 4245.23, "total_tokens": 15287712} {"current_steps": 23435, "total_steps": 38160, "loss": 0.3908, "lr": 0.0003890580597067566, "epoch": 12.282494758909854, "percentage": 61.41, "elapsed_time": "1:00:01", "remaining_time": "0:37:43", "throughput": 4245.32, "total_tokens": 15291296} {"current_steps": 23440, "total_steps": 38160, "loss": 0.4184, "lr": 0.0003888350860461281, "epoch": 12.285115303983229, "percentage": 61.43, "elapsed_time": "1:00:02", "remaining_time": "0:37:42", "throughput": 4245.36, "total_tokens": 15294464} {"current_steps": 23445, "total_steps": 38160, "loss": 0.2636, "lr": 0.0003886121356399315, "epoch": 12.287735849056604, "percentage": 61.44, "elapsed_time": "1:00:03", "remaining_time": "0:37:41", "throughput": 4245.59, "total_tokens": 15299392} {"current_steps": 23450, "total_steps": 38160, "loss": 0.46, "lr": 0.0003883892085348052, "epoch": 12.29035639412998, "percentage": 61.45, "elapsed_time": "1:00:04", "remaining_time": "0:37:40", "throughput": 4245.62, "total_tokens": 15302496} {"current_steps": 23455, "total_steps": 38160, "loss": 0.5132, "lr": 0.0003881663047773832, "epoch": 12.292976939203355, "percentage": 61.46, "elapsed_time": "1:00:05", "remaining_time": "0:37:40", "throughput": 4245.77, "total_tokens": 15306464} {"current_steps": 23460, "total_steps": 38160, "loss": 0.394, "lr": 0.00038794342441429426, "epoch": 12.29559748427673, "percentage": 61.48, "elapsed_time": "1:00:05", "remaining_time": "0:37:39", "throughput": 4245.84, "total_tokens": 15309792} {"current_steps": 23465, "total_steps": 38160, "loss": 0.4492, "lr": 0.00038772056749216267, "epoch": 12.298218029350105, "percentage": 61.49, "elapsed_time": "1:00:06", "remaining_time": "0:37:38", "throughput": 4245.83, "total_tokens": 15312576} {"current_steps": 23470, "total_steps": 38160, "loss": 0.4247, "lr": 0.00038749773405760744, "epoch": 12.30083857442348, "percentage": 61.5, "elapsed_time": "1:00:07", "remaining_time": "0:37:37", "throughput": 4245.81, "total_tokens": 15315296} {"current_steps": 23475, "total_steps": 38160, "loss": 0.4625, "lr": 0.00038727492415724265, "epoch": 12.303459119496855, "percentage": 61.52, "elapsed_time": "1:00:07", "remaining_time": "0:37:36", "throughput": 4245.8, "total_tokens": 15318112} {"current_steps": 23480, "total_steps": 38160, "loss": 0.4699, "lr": 0.00038705213783767767, "epoch": 12.30607966457023, "percentage": 61.53, "elapsed_time": "1:00:08", "remaining_time": "0:37:36", "throughput": 4245.79, "total_tokens": 15320896} {"current_steps": 23485, "total_steps": 38160, "loss": 0.3165, "lr": 0.00038682937514551686, "epoch": 12.308700209643606, "percentage": 61.54, "elapsed_time": "1:00:09", "remaining_time": "0:37:35", "throughput": 4245.81, "total_tokens": 15323904} {"current_steps": 23490, "total_steps": 38160, "loss": 0.5175, "lr": 0.0003866066361273596, "epoch": 12.31132075471698, "percentage": 61.56, "elapsed_time": "1:00:09", "remaining_time": "0:37:34", "throughput": 4245.82, "total_tokens": 15326944} {"current_steps": 23495, "total_steps": 38160, "loss": 0.4365, "lr": 0.00038638392082980056, "epoch": 12.313941299790356, "percentage": 61.57, "elapsed_time": "1:00:10", "remaining_time": "0:37:33", "throughput": 4246.05, "total_tokens": 15331776} {"current_steps": 23500, "total_steps": 38160, "loss": 0.4143, "lr": 0.0003861612292994292, "epoch": 12.316561844863731, "percentage": 61.58, "elapsed_time": "1:00:11", "remaining_time": "0:37:32", "throughput": 4246.04, "total_tokens": 15334624} {"current_steps": 23505, "total_steps": 38160, "loss": 0.454, "lr": 0.0003859385615828297, "epoch": 12.319182389937106, "percentage": 61.6, "elapsed_time": "1:00:12", "remaining_time": "0:37:32", "throughput": 4246.24, "total_tokens": 15339072} {"current_steps": 23510, "total_steps": 38160, "loss": 0.3993, "lr": 0.00038571591772658186, "epoch": 12.321802935010481, "percentage": 61.61, "elapsed_time": "1:00:13", "remaining_time": "0:37:31", "throughput": 4246.27, "total_tokens": 15342240} {"current_steps": 23515, "total_steps": 38160, "loss": 0.4008, "lr": 0.0003854932977772602, "epoch": 12.324423480083858, "percentage": 61.62, "elapsed_time": "1:00:13", "remaining_time": "0:37:30", "throughput": 4246.47, "total_tokens": 15346528} {"current_steps": 23520, "total_steps": 38160, "loss": 0.4392, "lr": 0.00038527070178143435, "epoch": 12.327044025157234, "percentage": 61.64, "elapsed_time": "1:00:14", "remaining_time": "0:37:29", "throughput": 4246.57, "total_tokens": 15350144} {"current_steps": 23525, "total_steps": 38160, "loss": 0.3596, "lr": 0.00038504812978566873, "epoch": 12.329664570230609, "percentage": 61.65, "elapsed_time": "1:00:15", "remaining_time": "0:37:29", "throughput": 4246.54, "total_tokens": 15352832} {"current_steps": 23530, "total_steps": 38160, "loss": 0.4853, "lr": 0.00038482558183652307, "epoch": 12.332285115303984, "percentage": 61.66, "elapsed_time": "1:00:16", "remaining_time": "0:37:28", "throughput": 4246.51, "total_tokens": 15355392} {"current_steps": 23535, "total_steps": 38160, "loss": 0.3462, "lr": 0.00038460305798055164, "epoch": 12.334905660377359, "percentage": 61.67, "elapsed_time": "1:00:16", "remaining_time": "0:37:27", "throughput": 4246.4, "total_tokens": 15357504} {"current_steps": 23540, "total_steps": 38160, "loss": 0.3345, "lr": 0.00038438055826430385, "epoch": 12.337526205450734, "percentage": 61.69, "elapsed_time": "1:00:17", "remaining_time": "0:37:26", "throughput": 4246.44, "total_tokens": 15360672} {"current_steps": 23545, "total_steps": 38160, "loss": 0.628, "lr": 0.0003841580827343243, "epoch": 12.34014675052411, "percentage": 61.7, "elapsed_time": "1:00:18", "remaining_time": "0:37:25", "throughput": 4246.5, "total_tokens": 15364128} {"current_steps": 23550, "total_steps": 38160, "loss": 0.4646, "lr": 0.00038393563143715215, "epoch": 12.342767295597485, "percentage": 61.71, "elapsed_time": "1:00:18", "remaining_time": "0:37:25", "throughput": 4246.51, "total_tokens": 15367072} {"current_steps": 23555, "total_steps": 38160, "loss": 0.3447, "lr": 0.00038371320441932195, "epoch": 12.34538784067086, "percentage": 61.73, "elapsed_time": "1:00:19", "remaining_time": "0:37:24", "throughput": 4246.62, "total_tokens": 15370848} {"current_steps": 23560, "total_steps": 38160, "loss": 0.4041, "lr": 0.00038349080172736267, "epoch": 12.348008385744235, "percentage": 61.74, "elapsed_time": "1:00:20", "remaining_time": "0:37:23", "throughput": 4246.85, "total_tokens": 15375680} {"current_steps": 23565, "total_steps": 38160, "loss": 0.5243, "lr": 0.00038326842340779833, "epoch": 12.35062893081761, "percentage": 61.75, "elapsed_time": "1:00:21", "remaining_time": "0:37:22", "throughput": 4246.89, "total_tokens": 15378784} {"current_steps": 23570, "total_steps": 38160, "loss": 0.4355, "lr": 0.00038304606950714803, "epoch": 12.353249475890985, "percentage": 61.77, "elapsed_time": "1:00:21", "remaining_time": "0:37:21", "throughput": 4246.91, "total_tokens": 15381856} {"current_steps": 23575, "total_steps": 38160, "loss": 0.5033, "lr": 0.0003828237400719259, "epoch": 12.35587002096436, "percentage": 61.78, "elapsed_time": "1:00:22", "remaining_time": "0:37:21", "throughput": 4246.98, "total_tokens": 15385376} {"current_steps": 23580, "total_steps": 38160, "loss": 0.3806, "lr": 0.00038260143514864037, "epoch": 12.358490566037736, "percentage": 61.79, "elapsed_time": "1:00:23", "remaining_time": "0:37:20", "throughput": 4247.15, "total_tokens": 15389568} {"current_steps": 23585, "total_steps": 38160, "loss": 0.3465, "lr": 0.0003823791547837955, "epoch": 12.36111111111111, "percentage": 61.81, "elapsed_time": "1:00:24", "remaining_time": "0:37:19", "throughput": 4247.12, "total_tokens": 15392160} {"current_steps": 23590, "total_steps": 38160, "loss": 0.5233, "lr": 0.0003821568990238894, "epoch": 12.363731656184486, "percentage": 61.82, "elapsed_time": "1:00:24", "remaining_time": "0:37:18", "throughput": 4247.17, "total_tokens": 15395520} {"current_steps": 23595, "total_steps": 38160, "loss": 0.5261, "lr": 0.0003819346679154155, "epoch": 12.366352201257861, "percentage": 61.83, "elapsed_time": "1:00:25", "remaining_time": "0:37:18", "throughput": 4247.21, "total_tokens": 15398592} {"current_steps": 23600, "total_steps": 38160, "loss": 0.4551, "lr": 0.0003817124615048623, "epoch": 12.368972746331236, "percentage": 61.84, "elapsed_time": "1:00:26", "remaining_time": "0:37:17", "throughput": 4247.25, "total_tokens": 15401824} {"current_steps": 23605, "total_steps": 38160, "loss": 0.4618, "lr": 0.00038149027983871243, "epoch": 12.371593291404611, "percentage": 61.86, "elapsed_time": "1:00:27", "remaining_time": "0:37:16", "throughput": 4247.35, "total_tokens": 15405536} {"current_steps": 23610, "total_steps": 38160, "loss": 0.482, "lr": 0.00038126812296344415, "epoch": 12.374213836477987, "percentage": 61.87, "elapsed_time": "1:00:27", "remaining_time": "0:37:15", "throughput": 4247.4, "total_tokens": 15408800} {"current_steps": 23615, "total_steps": 38160, "loss": 0.5398, "lr": 0.0003810459909255301, "epoch": 12.376834381551364, "percentage": 61.88, "elapsed_time": "1:00:28", "remaining_time": "0:37:14", "throughput": 4247.37, "total_tokens": 15411392} {"current_steps": 23620, "total_steps": 38160, "loss": 0.5452, "lr": 0.0003808238837714374, "epoch": 12.379454926624739, "percentage": 61.9, "elapsed_time": "1:00:29", "remaining_time": "0:37:14", "throughput": 4247.34, "total_tokens": 15414144} {"current_steps": 23625, "total_steps": 38160, "loss": 0.525, "lr": 0.0003806018015476287, "epoch": 12.382075471698114, "percentage": 61.91, "elapsed_time": "1:00:29", "remaining_time": "0:37:13", "throughput": 4247.46, "total_tokens": 15417984} {"current_steps": 23630, "total_steps": 38160, "loss": 0.3711, "lr": 0.0003803797443005609, "epoch": 12.384696016771489, "percentage": 61.92, "elapsed_time": "1:00:30", "remaining_time": "0:37:12", "throughput": 4247.51, "total_tokens": 15421280} {"current_steps": 23635, "total_steps": 38160, "loss": 0.5364, "lr": 0.0003801577120766859, "epoch": 12.387316561844864, "percentage": 61.94, "elapsed_time": "1:00:31", "remaining_time": "0:37:11", "throughput": 4247.47, "total_tokens": 15423872} {"current_steps": 23640, "total_steps": 38160, "loss": 0.4102, "lr": 0.0003799357049224505, "epoch": 12.38993710691824, "percentage": 61.95, "elapsed_time": "1:00:32", "remaining_time": "0:37:10", "throughput": 4247.5, "total_tokens": 15426976} {"current_steps": 23645, "total_steps": 38160, "loss": 0.4098, "lr": 0.0003797137228842956, "epoch": 12.392557651991615, "percentage": 61.96, "elapsed_time": "1:00:32", "remaining_time": "0:37:10", "throughput": 4247.54, "total_tokens": 15430240} {"current_steps": 23650, "total_steps": 38160, "loss": 0.3328, "lr": 0.0003794917660086576, "epoch": 12.39517819706499, "percentage": 61.98, "elapsed_time": "1:00:33", "remaining_time": "0:37:09", "throughput": 4247.61, "total_tokens": 15433664} {"current_steps": 23655, "total_steps": 38160, "loss": 0.4222, "lr": 0.0003792698343419674, "epoch": 12.397798742138365, "percentage": 61.99, "elapsed_time": "1:00:34", "remaining_time": "0:37:08", "throughput": 4247.69, "total_tokens": 15437088} {"current_steps": 23660, "total_steps": 38160, "loss": 0.4694, "lr": 0.0003790479279306505, "epoch": 12.40041928721174, "percentage": 62.0, "elapsed_time": "1:00:34", "remaining_time": "0:37:07", "throughput": 4247.7, "total_tokens": 15440096} {"current_steps": 23665, "total_steps": 38160, "loss": 0.4321, "lr": 0.0003788260468211271, "epoch": 12.403039832285115, "percentage": 62.02, "elapsed_time": "1:00:35", "remaining_time": "0:37:06", "throughput": 4247.87, "total_tokens": 15444352} {"current_steps": 23670, "total_steps": 38160, "loss": 0.4359, "lr": 0.0003786041910598125, "epoch": 12.40566037735849, "percentage": 62.03, "elapsed_time": "1:00:36", "remaining_time": "0:37:06", "throughput": 4248.04, "total_tokens": 15448736} {"current_steps": 23675, "total_steps": 38160, "loss": 0.3888, "lr": 0.0003783823606931159, "epoch": 12.408280922431866, "percentage": 62.04, "elapsed_time": "1:00:37", "remaining_time": "0:37:05", "throughput": 4248.05, "total_tokens": 15451712} {"current_steps": 23680, "total_steps": 38160, "loss": 0.3723, "lr": 0.0003781605557674421, "epoch": 12.41090146750524, "percentage": 62.05, "elapsed_time": "1:00:37", "remaining_time": "0:37:04", "throughput": 4248.01, "total_tokens": 15454272} {"current_steps": 23685, "total_steps": 38160, "loss": 0.4202, "lr": 0.0003779387763291899, "epoch": 12.413522012578616, "percentage": 62.07, "elapsed_time": "1:00:38", "remaining_time": "0:37:03", "throughput": 4248.11, "total_tokens": 15457856} {"current_steps": 23690, "total_steps": 38160, "loss": 0.3629, "lr": 0.0003777170224247533, "epoch": 12.416142557651991, "percentage": 62.08, "elapsed_time": "1:00:39", "remaining_time": "0:37:03", "throughput": 4248.2, "total_tokens": 15461408} {"current_steps": 23695, "total_steps": 38160, "loss": 0.4792, "lr": 0.0003774952941005204, "epoch": 12.418763102725366, "percentage": 62.09, "elapsed_time": "1:00:40", "remaining_time": "0:37:02", "throughput": 4248.3, "total_tokens": 15464992} {"current_steps": 23700, "total_steps": 38160, "loss": 0.4734, "lr": 0.00037727359140287455, "epoch": 12.421383647798741, "percentage": 62.11, "elapsed_time": "1:00:40", "remaining_time": "0:37:01", "throughput": 4248.32, "total_tokens": 15468096} {"current_steps": 23705, "total_steps": 38160, "loss": 0.3784, "lr": 0.00037705191437819316, "epoch": 12.424004192872117, "percentage": 62.12, "elapsed_time": "1:00:41", "remaining_time": "0:37:00", "throughput": 4248.29, "total_tokens": 15470752} {"current_steps": 23710, "total_steps": 38160, "loss": 0.4823, "lr": 0.00037683026307284853, "epoch": 12.426624737945493, "percentage": 62.13, "elapsed_time": "1:00:42", "remaining_time": "0:36:59", "throughput": 4248.33, "total_tokens": 15473952} {"current_steps": 23715, "total_steps": 38160, "loss": 0.3424, "lr": 0.0003766086375332077, "epoch": 12.429245283018869, "percentage": 62.15, "elapsed_time": "1:00:43", "remaining_time": "0:36:59", "throughput": 4248.45, "total_tokens": 15477760} {"current_steps": 23720, "total_steps": 38160, "loss": 0.3968, "lr": 0.0003763870378056321, "epoch": 12.431865828092244, "percentage": 62.16, "elapsed_time": "1:00:43", "remaining_time": "0:36:58", "throughput": 4248.43, "total_tokens": 15480384} {"current_steps": 23725, "total_steps": 38160, "loss": 0.4313, "lr": 0.00037616546393647824, "epoch": 12.434486373165619, "percentage": 62.17, "elapsed_time": "1:00:44", "remaining_time": "0:36:57", "throughput": 4248.39, "total_tokens": 15482976} {"current_steps": 23730, "total_steps": 38160, "loss": 0.337, "lr": 0.0003759439159720962, "epoch": 12.437106918238994, "percentage": 62.19, "elapsed_time": "1:00:45", "remaining_time": "0:36:56", "throughput": 4248.41, "total_tokens": 15486016} {"current_steps": 23735, "total_steps": 38160, "loss": 0.3647, "lr": 0.0003757223939588318, "epoch": 12.43972746331237, "percentage": 62.2, "elapsed_time": "1:00:45", "remaining_time": "0:36:55", "throughput": 4248.49, "total_tokens": 15489472} {"current_steps": 23740, "total_steps": 38160, "loss": 0.5173, "lr": 0.00037550089794302464, "epoch": 12.442348008385745, "percentage": 62.21, "elapsed_time": "1:00:46", "remaining_time": "0:36:55", "throughput": 4248.6, "total_tokens": 15493120} {"current_steps": 23745, "total_steps": 38160, "loss": 0.4583, "lr": 0.0003752794279710094, "epoch": 12.44496855345912, "percentage": 62.22, "elapsed_time": "1:00:47", "remaining_time": "0:36:54", "throughput": 4248.58, "total_tokens": 15495968} {"current_steps": 23750, "total_steps": 38160, "loss": 0.477, "lr": 0.0003750579840891148, "epoch": 12.447589098532495, "percentage": 62.24, "elapsed_time": "1:00:47", "remaining_time": "0:36:53", "throughput": 4248.57, "total_tokens": 15498784} {"current_steps": 23755, "total_steps": 38160, "loss": 0.5424, "lr": 0.0003748365663436647, "epoch": 12.45020964360587, "percentage": 62.25, "elapsed_time": "1:00:48", "remaining_time": "0:36:52", "throughput": 4248.72, "total_tokens": 15502784} {"current_steps": 23760, "total_steps": 38160, "loss": 0.4203, "lr": 0.0003746151747809769, "epoch": 12.452830188679245, "percentage": 62.26, "elapsed_time": "1:00:49", "remaining_time": "0:36:51", "throughput": 4248.75, "total_tokens": 15505952} {"current_steps": 23765, "total_steps": 38160, "loss": 0.415, "lr": 0.000374393809447364, "epoch": 12.45545073375262, "percentage": 62.28, "elapsed_time": "1:00:50", "remaining_time": "0:36:51", "throughput": 4248.82, "total_tokens": 15509344} {"current_steps": 23770, "total_steps": 38160, "loss": 0.5151, "lr": 0.0003741724703891333, "epoch": 12.458071278825996, "percentage": 62.29, "elapsed_time": "1:00:50", "remaining_time": "0:36:50", "throughput": 4248.88, "total_tokens": 15512544} {"current_steps": 23775, "total_steps": 38160, "loss": 0.5129, "lr": 0.00037395115765258616, "epoch": 12.46069182389937, "percentage": 62.3, "elapsed_time": "1:00:52", "remaining_time": "0:36:49", "throughput": 4249.27, "total_tokens": 15519104} {"current_steps": 23780, "total_steps": 38160, "loss": 0.4578, "lr": 0.0003737298712840188, "epoch": 12.463312368972746, "percentage": 62.32, "elapsed_time": "1:00:52", "remaining_time": "0:36:48", "throughput": 4249.34, "total_tokens": 15522528} {"current_steps": 23785, "total_steps": 38160, "loss": 0.4807, "lr": 0.000373508611329722, "epoch": 12.465932914046121, "percentage": 62.33, "elapsed_time": "1:00:53", "remaining_time": "0:36:48", "throughput": 4249.35, "total_tokens": 15525440} {"current_steps": 23790, "total_steps": 38160, "loss": 0.4359, "lr": 0.00037328737783598036, "epoch": 12.468553459119496, "percentage": 62.34, "elapsed_time": "1:00:54", "remaining_time": "0:36:47", "throughput": 4249.36, "total_tokens": 15528448} {"current_steps": 23795, "total_steps": 38160, "loss": 0.3802, "lr": 0.0003730661708490738, "epoch": 12.471174004192871, "percentage": 62.36, "elapsed_time": "1:00:54", "remaining_time": "0:36:46", "throughput": 4249.38, "total_tokens": 15531392} {"current_steps": 23800, "total_steps": 38160, "loss": 0.295, "lr": 0.0003728449904152761, "epoch": 12.473794549266247, "percentage": 62.37, "elapsed_time": "1:00:55", "remaining_time": "0:36:45", "throughput": 4249.44, "total_tokens": 15534784} {"current_steps": 23805, "total_steps": 38160, "loss": 0.395, "lr": 0.00037262383658085563, "epoch": 12.476415094339623, "percentage": 62.38, "elapsed_time": "1:00:56", "remaining_time": "0:36:44", "throughput": 4249.5, "total_tokens": 15538144} {"current_steps": 23810, "total_steps": 38160, "loss": 0.3625, "lr": 0.00037240270939207555, "epoch": 12.479035639412999, "percentage": 62.4, "elapsed_time": "1:00:57", "remaining_time": "0:36:44", "throughput": 4249.56, "total_tokens": 15541600} {"current_steps": 23815, "total_steps": 38160, "loss": 0.5324, "lr": 0.000372181608895193, "epoch": 12.481656184486374, "percentage": 62.41, "elapsed_time": "1:00:58", "remaining_time": "0:36:43", "throughput": 4249.72, "total_tokens": 15545728} {"current_steps": 23820, "total_steps": 38160, "loss": 0.3684, "lr": 0.00037196053513645957, "epoch": 12.484276729559749, "percentage": 62.42, "elapsed_time": "1:00:58", "remaining_time": "0:36:42", "throughput": 4249.63, "total_tokens": 15548000} {"current_steps": 23825, "total_steps": 38160, "loss": 0.369, "lr": 0.00037173948816212146, "epoch": 12.486897274633124, "percentage": 62.43, "elapsed_time": "1:00:59", "remaining_time": "0:36:41", "throughput": 4249.58, "total_tokens": 15550496} {"current_steps": 23830, "total_steps": 38160, "loss": 0.4411, "lr": 0.00037151846801841904, "epoch": 12.4895178197065, "percentage": 62.45, "elapsed_time": "1:01:00", "remaining_time": "0:36:40", "throughput": 4249.69, "total_tokens": 15554304} {"current_steps": 23835, "total_steps": 38160, "loss": 0.432, "lr": 0.00037129747475158736, "epoch": 12.492138364779874, "percentage": 62.46, "elapsed_time": "1:01:00", "remaining_time": "0:36:40", "throughput": 4249.78, "total_tokens": 15557824} {"current_steps": 23840, "total_steps": 38160, "loss": 0.4265, "lr": 0.0003710765084078558, "epoch": 12.49475890985325, "percentage": 62.47, "elapsed_time": "1:01:01", "remaining_time": "0:36:39", "throughput": 4249.77, "total_tokens": 15560704} {"current_steps": 23845, "total_steps": 38160, "loss": 0.4471, "lr": 0.0003708555690334477, "epoch": 12.497379454926625, "percentage": 62.49, "elapsed_time": "1:01:02", "remaining_time": "0:36:38", "throughput": 4249.92, "total_tokens": 15564832} {"current_steps": 23850, "total_steps": 38160, "loss": 0.3485, "lr": 0.00037063465667458125, "epoch": 12.5, "percentage": 62.5, "elapsed_time": "1:01:03", "remaining_time": "0:36:37", "throughput": 4249.94, "total_tokens": 15567904} {"current_steps": 23855, "total_steps": 38160, "loss": 0.5175, "lr": 0.0003704137713774686, "epoch": 12.502620545073375, "percentage": 62.51, "elapsed_time": "1:01:03", "remaining_time": "0:36:37", "throughput": 4249.99, "total_tokens": 15571168} {"current_steps": 23860, "total_steps": 38160, "loss": 0.3666, "lr": 0.0003701929131883167, "epoch": 12.50524109014675, "percentage": 62.53, "elapsed_time": "1:01:04", "remaining_time": "0:36:36", "throughput": 4250.01, "total_tokens": 15574144} {"current_steps": 23865, "total_steps": 38160, "loss": 0.4889, "lr": 0.0003699720821533264, "epoch": 12.507861635220126, "percentage": 62.54, "elapsed_time": "1:01:05", "remaining_time": "0:36:35", "throughput": 4249.88, "total_tokens": 15576160} {"current_steps": 23870, "total_steps": 38160, "loss": 0.4143, "lr": 0.00036975127831869326, "epoch": 12.5104821802935, "percentage": 62.55, "elapsed_time": "1:01:05", "remaining_time": "0:36:34", "throughput": 4249.93, "total_tokens": 15579424} {"current_steps": 23875, "total_steps": 38160, "loss": 0.2656, "lr": 0.0003695305017306066, "epoch": 12.513102725366876, "percentage": 62.57, "elapsed_time": "1:01:06", "remaining_time": "0:36:33", "throughput": 4250.13, "total_tokens": 15584032} {"current_steps": 23880, "total_steps": 38160, "loss": 0.498, "lr": 0.00036930975243525046, "epoch": 12.515723270440251, "percentage": 62.58, "elapsed_time": "1:01:07", "remaining_time": "0:36:33", "throughput": 4250.31, "total_tokens": 15588544} {"current_steps": 23885, "total_steps": 38160, "loss": 0.3786, "lr": 0.00036908903047880304, "epoch": 12.518343815513626, "percentage": 62.59, "elapsed_time": "1:01:08", "remaining_time": "0:36:32", "throughput": 4250.64, "total_tokens": 15594336} {"current_steps": 23890, "total_steps": 38160, "loss": 0.4795, "lr": 0.00036886833590743707, "epoch": 12.520964360587001, "percentage": 62.6, "elapsed_time": "1:01:09", "remaining_time": "0:36:31", "throughput": 4250.71, "total_tokens": 15597760} {"current_steps": 23895, "total_steps": 38160, "loss": 0.3953, "lr": 0.00036864766876731913, "epoch": 12.523584905660378, "percentage": 62.62, "elapsed_time": "1:01:10", "remaining_time": "0:36:31", "throughput": 4250.86, "total_tokens": 15601824} {"current_steps": 23900, "total_steps": 38160, "loss": 0.5386, "lr": 0.00036842702910461054, "epoch": 12.526205450733752, "percentage": 62.63, "elapsed_time": "1:01:11", "remaining_time": "0:36:30", "throughput": 4250.99, "total_tokens": 15605824} {"current_steps": 23905, "total_steps": 38160, "loss": 0.3989, "lr": 0.0003682064169654663, "epoch": 12.528825995807129, "percentage": 62.64, "elapsed_time": "1:01:11", "remaining_time": "0:36:29", "throughput": 4251.07, "total_tokens": 15609312} {"current_steps": 23910, "total_steps": 38160, "loss": 0.5887, "lr": 0.00036798583239603587, "epoch": 12.531446540880504, "percentage": 62.66, "elapsed_time": "1:01:12", "remaining_time": "0:36:28", "throughput": 4251.2, "total_tokens": 15613216} {"current_steps": 23915, "total_steps": 38160, "loss": 0.3321, "lr": 0.0003677652754424634, "epoch": 12.534067085953879, "percentage": 62.67, "elapsed_time": "1:01:13", "remaining_time": "0:36:28", "throughput": 4251.22, "total_tokens": 15616352} {"current_steps": 23920, "total_steps": 38160, "loss": 0.4605, "lr": 0.0003675447461508865, "epoch": 12.536687631027254, "percentage": 62.68, "elapsed_time": "1:01:14", "remaining_time": "0:36:27", "throughput": 4251.19, "total_tokens": 15619072} {"current_steps": 23925, "total_steps": 38160, "loss": 0.425, "lr": 0.00036732424456743784, "epoch": 12.53930817610063, "percentage": 62.7, "elapsed_time": "1:01:14", "remaining_time": "0:36:26", "throughput": 4251.23, "total_tokens": 15622144} {"current_steps": 23930, "total_steps": 38160, "loss": 0.427, "lr": 0.0003671037707382435, "epoch": 12.541928721174004, "percentage": 62.71, "elapsed_time": "1:01:15", "remaining_time": "0:36:25", "throughput": 4251.24, "total_tokens": 15625152} {"current_steps": 23935, "total_steps": 38160, "loss": 0.4709, "lr": 0.000366883324709424, "epoch": 12.54454926624738, "percentage": 62.72, "elapsed_time": "1:01:16", "remaining_time": "0:36:24", "throughput": 4251.26, "total_tokens": 15628128} {"current_steps": 23940, "total_steps": 38160, "loss": 0.5115, "lr": 0.00036666290652709446, "epoch": 12.547169811320755, "percentage": 62.74, "elapsed_time": "1:01:16", "remaining_time": "0:36:23", "throughput": 4251.3, "total_tokens": 15631328} {"current_steps": 23945, "total_steps": 38160, "loss": 0.5097, "lr": 0.0003664425162373635, "epoch": 12.54979035639413, "percentage": 62.75, "elapsed_time": "1:01:17", "remaining_time": "0:36:23", "throughput": 4251.31, "total_tokens": 15634304} {"current_steps": 23950, "total_steps": 38160, "loss": 0.3046, "lr": 0.0003662221538863346, "epoch": 12.552410901467505, "percentage": 62.76, "elapsed_time": "1:01:18", "remaining_time": "0:36:22", "throughput": 4251.41, "total_tokens": 15637984} {"current_steps": 23955, "total_steps": 38160, "loss": 0.3661, "lr": 0.0003660018195201049, "epoch": 12.55503144654088, "percentage": 62.78, "elapsed_time": "1:01:18", "remaining_time": "0:36:21", "throughput": 4251.37, "total_tokens": 15640672} {"current_steps": 23960, "total_steps": 38160, "loss": 0.4151, "lr": 0.0003657815131847657, "epoch": 12.557651991614255, "percentage": 62.79, "elapsed_time": "1:01:19", "remaining_time": "0:36:20", "throughput": 4251.44, "total_tokens": 15644096} {"current_steps": 23965, "total_steps": 38160, "loss": 0.4729, "lr": 0.0003655612349264027, "epoch": 12.56027253668763, "percentage": 62.8, "elapsed_time": "1:01:20", "remaining_time": "0:36:19", "throughput": 4251.45, "total_tokens": 15647040} {"current_steps": 23970, "total_steps": 38160, "loss": 0.4148, "lr": 0.0003653409847910957, "epoch": 12.562893081761006, "percentage": 62.81, "elapsed_time": "1:01:21", "remaining_time": "0:36:19", "throughput": 4251.44, "total_tokens": 15649824} {"current_steps": 23975, "total_steps": 38160, "loss": 0.3434, "lr": 0.0003651207628249182, "epoch": 12.565513626834381, "percentage": 62.83, "elapsed_time": "1:01:21", "remaining_time": "0:36:18", "throughput": 4251.46, "total_tokens": 15652992} {"current_steps": 23980, "total_steps": 38160, "loss": 0.4445, "lr": 0.0003649005690739386, "epoch": 12.568134171907756, "percentage": 62.84, "elapsed_time": "1:01:22", "remaining_time": "0:36:17", "throughput": 4251.43, "total_tokens": 15655680} {"current_steps": 23985, "total_steps": 38160, "loss": 0.3347, "lr": 0.0003646804035842187, "epoch": 12.570754716981131, "percentage": 62.85, "elapsed_time": "1:01:23", "remaining_time": "0:36:16", "throughput": 4251.43, "total_tokens": 15658496} {"current_steps": 23990, "total_steps": 38160, "loss": 0.5978, "lr": 0.0003644602664018143, "epoch": 12.573375262054507, "percentage": 62.87, "elapsed_time": "1:01:23", "remaining_time": "0:36:15", "throughput": 4251.41, "total_tokens": 15661248} {"current_steps": 23995, "total_steps": 38160, "loss": 0.4552, "lr": 0.000364240157572776, "epoch": 12.575995807127882, "percentage": 62.88, "elapsed_time": "1:01:24", "remaining_time": "0:36:15", "throughput": 4251.37, "total_tokens": 15663840} {"current_steps": 24000, "total_steps": 38160, "loss": 0.5045, "lr": 0.0003640200771431478, "epoch": 12.578616352201259, "percentage": 62.89, "elapsed_time": "1:01:25", "remaining_time": "0:36:14", "throughput": 4251.5, "total_tokens": 15667744} {"current_steps": 24005, "total_steps": 38160, "loss": 0.4629, "lr": 0.0003638000251589683, "epoch": 12.581236897274634, "percentage": 62.91, "elapsed_time": "1:01:25", "remaining_time": "0:36:13", "throughput": 4251.5, "total_tokens": 15670592} {"current_steps": 24010, "total_steps": 38160, "loss": 0.4574, "lr": 0.0003635800016662696, "epoch": 12.583857442348009, "percentage": 62.92, "elapsed_time": "1:01:26", "remaining_time": "0:36:12", "throughput": 4251.65, "total_tokens": 15674688} {"current_steps": 24015, "total_steps": 38160, "loss": 0.4387, "lr": 0.00036336000671107816, "epoch": 12.586477987421384, "percentage": 62.93, "elapsed_time": "1:01:27", "remaining_time": "0:36:11", "throughput": 4251.63, "total_tokens": 15677440} {"current_steps": 24020, "total_steps": 38160, "loss": 0.4743, "lr": 0.00036314004033941445, "epoch": 12.58909853249476, "percentage": 62.95, "elapsed_time": "1:01:28", "remaining_time": "0:36:11", "throughput": 4251.64, "total_tokens": 15680416} {"current_steps": 24025, "total_steps": 38160, "loss": 0.4472, "lr": 0.00036292010259729283, "epoch": 12.591719077568134, "percentage": 62.96, "elapsed_time": "1:01:28", "remaining_time": "0:36:10", "throughput": 4251.84, "total_tokens": 15684800} {"current_steps": 24030, "total_steps": 38160, "loss": 0.4839, "lr": 0.000362700193530722, "epoch": 12.59433962264151, "percentage": 62.97, "elapsed_time": "1:01:29", "remaining_time": "0:36:09", "throughput": 4251.88, "total_tokens": 15687936} {"current_steps": 24035, "total_steps": 38160, "loss": 0.3217, "lr": 0.0003624803131857042, "epoch": 12.596960167714885, "percentage": 62.98, "elapsed_time": "1:01:30", "remaining_time": "0:36:08", "throughput": 4251.91, "total_tokens": 15691104} {"current_steps": 24040, "total_steps": 38160, "loss": 0.4892, "lr": 0.0003622604616082361, "epoch": 12.59958071278826, "percentage": 63.0, "elapsed_time": "1:01:31", "remaining_time": "0:36:07", "throughput": 4251.97, "total_tokens": 15694432} {"current_steps": 24045, "total_steps": 38160, "loss": 0.4765, "lr": 0.0003620406388443078, "epoch": 12.602201257861635, "percentage": 63.01, "elapsed_time": "1:01:31", "remaining_time": "0:36:07", "throughput": 4251.99, "total_tokens": 15697504} {"current_steps": 24050, "total_steps": 38160, "loss": 0.4967, "lr": 0.00036182084493990407, "epoch": 12.60482180293501, "percentage": 63.02, "elapsed_time": "1:01:32", "remaining_time": "0:36:06", "throughput": 4252.16, "total_tokens": 15701824} {"current_steps": 24055, "total_steps": 38160, "loss": 0.4123, "lr": 0.0003616010799410031, "epoch": 12.607442348008385, "percentage": 63.04, "elapsed_time": "1:01:33", "remaining_time": "0:36:05", "throughput": 4252.16, "total_tokens": 15704736} {"current_steps": 24060, "total_steps": 38160, "loss": 0.3552, "lr": 0.0003613813438935773, "epoch": 12.61006289308176, "percentage": 63.05, "elapsed_time": "1:01:34", "remaining_time": "0:36:04", "throughput": 4252.17, "total_tokens": 15707744} {"current_steps": 24065, "total_steps": 38160, "loss": 0.5075, "lr": 0.0003611616368435928, "epoch": 12.612683438155136, "percentage": 63.06, "elapsed_time": "1:01:34", "remaining_time": "0:36:03", "throughput": 4252.11, "total_tokens": 15710208} {"current_steps": 24070, "total_steps": 38160, "loss": 0.4548, "lr": 0.0003609419588370102, "epoch": 12.615303983228511, "percentage": 63.08, "elapsed_time": "1:01:35", "remaining_time": "0:36:03", "throughput": 4252.2, "total_tokens": 15713792} {"current_steps": 24075, "total_steps": 38160, "loss": 0.4447, "lr": 0.00036072230991978326, "epoch": 12.617924528301886, "percentage": 63.09, "elapsed_time": "1:01:36", "remaining_time": "0:36:02", "throughput": 4252.34, "total_tokens": 15717792} {"current_steps": 24080, "total_steps": 38160, "loss": 0.4356, "lr": 0.00036050269013785996, "epoch": 12.620545073375261, "percentage": 63.1, "elapsed_time": "1:01:36", "remaining_time": "0:36:01", "throughput": 4252.38, "total_tokens": 15720896} {"current_steps": 24085, "total_steps": 38160, "loss": 0.3074, "lr": 0.0003602830995371825, "epoch": 12.623165618448636, "percentage": 63.12, "elapsed_time": "1:01:37", "remaining_time": "0:36:00", "throughput": 4252.39, "total_tokens": 15723904} {"current_steps": 24090, "total_steps": 38160, "loss": 0.4754, "lr": 0.0003600635381636866, "epoch": 12.625786163522012, "percentage": 63.13, "elapsed_time": "1:01:38", "remaining_time": "0:36:00", "throughput": 4252.43, "total_tokens": 15727168} {"current_steps": 24095, "total_steps": 38160, "loss": 0.616, "lr": 0.0003598440060633022, "epoch": 12.628406708595389, "percentage": 63.14, "elapsed_time": "1:01:39", "remaining_time": "0:35:59", "throughput": 4252.52, "total_tokens": 15730688} {"current_steps": 24100, "total_steps": 38160, "loss": 0.5177, "lr": 0.00035962450328195264, "epoch": 12.631027253668764, "percentage": 63.16, "elapsed_time": "1:01:39", "remaining_time": "0:35:58", "throughput": 4252.54, "total_tokens": 15733664} {"current_steps": 24105, "total_steps": 38160, "loss": 0.4931, "lr": 0.00035940502986555543, "epoch": 12.633647798742139, "percentage": 63.17, "elapsed_time": "1:01:40", "remaining_time": "0:35:57", "throughput": 4252.53, "total_tokens": 15736352} {"current_steps": 24110, "total_steps": 38160, "loss": 0.3494, "lr": 0.00035918558586002205, "epoch": 12.636268343815514, "percentage": 63.18, "elapsed_time": "1:01:41", "remaining_time": "0:35:56", "throughput": 4252.58, "total_tokens": 15739648} {"current_steps": 24115, "total_steps": 38160, "loss": 0.4538, "lr": 0.0003589661713112575, "epoch": 12.63888888888889, "percentage": 63.19, "elapsed_time": "1:01:41", "remaining_time": "0:35:56", "throughput": 4252.57, "total_tokens": 15742464} {"current_steps": 24120, "total_steps": 38160, "loss": 0.4652, "lr": 0.000358746786265161, "epoch": 12.641509433962264, "percentage": 63.21, "elapsed_time": "1:01:42", "remaining_time": "0:35:55", "throughput": 4252.65, "total_tokens": 15745984} {"current_steps": 24125, "total_steps": 38160, "loss": 0.3703, "lr": 0.0003585274307676254, "epoch": 12.64412997903564, "percentage": 63.22, "elapsed_time": "1:01:43", "remaining_time": "0:35:54", "throughput": 4252.61, "total_tokens": 15748608} {"current_steps": 24130, "total_steps": 38160, "loss": 0.4569, "lr": 0.00035830810486453725, "epoch": 12.646750524109015, "percentage": 63.23, "elapsed_time": "1:01:43", "remaining_time": "0:35:53", "throughput": 4252.62, "total_tokens": 15751520} {"current_steps": 24135, "total_steps": 38160, "loss": 0.4089, "lr": 0.00035808880860177696, "epoch": 12.64937106918239, "percentage": 63.25, "elapsed_time": "1:01:44", "remaining_time": "0:35:52", "throughput": 4252.68, "total_tokens": 15754912} {"current_steps": 24140, "total_steps": 38160, "loss": 0.6009, "lr": 0.00035786954202521895, "epoch": 12.651991614255765, "percentage": 63.26, "elapsed_time": "1:01:45", "remaining_time": "0:35:52", "throughput": 4252.79, "total_tokens": 15758688} {"current_steps": 24145, "total_steps": 38160, "loss": 0.3364, "lr": 0.00035765030518073116, "epoch": 12.65461215932914, "percentage": 63.27, "elapsed_time": "1:01:46", "remaining_time": "0:35:51", "throughput": 4252.76, "total_tokens": 15761248} {"current_steps": 24150, "total_steps": 38160, "loss": 0.5584, "lr": 0.0003574310981141756, "epoch": 12.657232704402515, "percentage": 63.29, "elapsed_time": "1:01:46", "remaining_time": "0:35:50", "throughput": 4252.86, "total_tokens": 15765088} {"current_steps": 24155, "total_steps": 38160, "loss": 0.4695, "lr": 0.00035721192087140796, "epoch": 12.65985324947589, "percentage": 63.3, "elapsed_time": "1:01:47", "remaining_time": "0:35:49", "throughput": 4252.99, "total_tokens": 15768896} {"current_steps": 24160, "total_steps": 38160, "loss": 0.3737, "lr": 0.00035699277349827724, "epoch": 12.662473794549266, "percentage": 63.31, "elapsed_time": "1:01:48", "remaining_time": "0:35:48", "throughput": 4252.96, "total_tokens": 15771584} {"current_steps": 24165, "total_steps": 38160, "loss": 0.5475, "lr": 0.0003567736560406269, "epoch": 12.665094339622641, "percentage": 63.33, "elapsed_time": "1:01:49", "remaining_time": "0:35:48", "throughput": 4252.9, "total_tokens": 15774080} {"current_steps": 24170, "total_steps": 38160, "loss": 0.5807, "lr": 0.0003565545685442936, "epoch": 12.667714884696016, "percentage": 63.34, "elapsed_time": "1:01:49", "remaining_time": "0:35:47", "throughput": 4252.94, "total_tokens": 15777280} {"current_steps": 24175, "total_steps": 38160, "loss": 0.5781, "lr": 0.00035633551105510806, "epoch": 12.670335429769391, "percentage": 63.35, "elapsed_time": "1:01:50", "remaining_time": "0:35:46", "throughput": 4252.99, "total_tokens": 15780544} {"current_steps": 24180, "total_steps": 38160, "loss": 0.5136, "lr": 0.00035611648361889457, "epoch": 12.672955974842766, "percentage": 63.36, "elapsed_time": "1:01:51", "remaining_time": "0:35:45", "throughput": 4253.01, "total_tokens": 15783680} {"current_steps": 24185, "total_steps": 38160, "loss": 0.3965, "lr": 0.00035589748628147145, "epoch": 12.675576519916142, "percentage": 63.38, "elapsed_time": "1:01:51", "remaining_time": "0:35:44", "throughput": 4253.03, "total_tokens": 15786752} {"current_steps": 24190, "total_steps": 38160, "loss": 0.3907, "lr": 0.00035567851908865, "epoch": 12.678197064989519, "percentage": 63.39, "elapsed_time": "1:01:52", "remaining_time": "0:35:44", "throughput": 4253.12, "total_tokens": 15790368} {"current_steps": 24195, "total_steps": 38160, "loss": 0.4791, "lr": 0.0003554595820862358, "epoch": 12.680817610062894, "percentage": 63.4, "elapsed_time": "1:01:53", "remaining_time": "0:35:43", "throughput": 4253.1, "total_tokens": 15793120} {"current_steps": 24200, "total_steps": 38160, "loss": 0.3627, "lr": 0.00035524067532002803, "epoch": 12.683438155136269, "percentage": 63.42, "elapsed_time": "1:01:54", "remaining_time": "0:35:42", "throughput": 4253.29, "total_tokens": 15797600} {"current_steps": 24205, "total_steps": 38160, "loss": 0.4338, "lr": 0.00035502179883581956, "epoch": 12.686058700209644, "percentage": 63.43, "elapsed_time": "1:01:55", "remaining_time": "0:35:41", "throughput": 4253.5, "total_tokens": 15802304} {"current_steps": 24210, "total_steps": 38160, "loss": 0.419, "lr": 0.0003548029526793969, "epoch": 12.68867924528302, "percentage": 63.44, "elapsed_time": "1:01:55", "remaining_time": "0:35:41", "throughput": 4253.44, "total_tokens": 15804672} {"current_steps": 24215, "total_steps": 38160, "loss": 0.4119, "lr": 0.0003545841368965398, "epoch": 12.691299790356394, "percentage": 63.46, "elapsed_time": "1:01:56", "remaining_time": "0:35:40", "throughput": 4253.39, "total_tokens": 15807168} {"current_steps": 24220, "total_steps": 38160, "loss": 0.3235, "lr": 0.00035436535153302235, "epoch": 12.69392033542977, "percentage": 63.47, "elapsed_time": "1:01:57", "remaining_time": "0:35:39", "throughput": 4253.36, "total_tokens": 15809824} {"current_steps": 24225, "total_steps": 38160, "loss": 0.5405, "lr": 0.0003541465966346118, "epoch": 12.696540880503145, "percentage": 63.48, "elapsed_time": "1:01:57", "remaining_time": "0:35:38", "throughput": 4253.46, "total_tokens": 15813408} {"current_steps": 24230, "total_steps": 38160, "loss": 0.4683, "lr": 0.00035392787224706936, "epoch": 12.69916142557652, "percentage": 63.5, "elapsed_time": "1:01:58", "remaining_time": "0:35:37", "throughput": 4253.44, "total_tokens": 15816096} {"current_steps": 24235, "total_steps": 38160, "loss": 0.319, "lr": 0.0003537091784161495, "epoch": 12.701781970649895, "percentage": 63.51, "elapsed_time": "1:01:59", "remaining_time": "0:35:36", "throughput": 4253.48, "total_tokens": 15819328} {"current_steps": 24240, "total_steps": 38160, "loss": 0.4072, "lr": 0.0003534905151876007, "epoch": 12.70440251572327, "percentage": 63.52, "elapsed_time": "1:01:59", "remaining_time": "0:35:36", "throughput": 4253.48, "total_tokens": 15822176} {"current_steps": 24245, "total_steps": 38160, "loss": 0.639, "lr": 0.0003532718826071646, "epoch": 12.707023060796645, "percentage": 63.54, "elapsed_time": "1:02:00", "remaining_time": "0:35:35", "throughput": 4253.45, "total_tokens": 15824768} {"current_steps": 24250, "total_steps": 38160, "loss": 0.5266, "lr": 0.00035305328072057654, "epoch": 12.70964360587002, "percentage": 63.55, "elapsed_time": "1:02:01", "remaining_time": "0:35:34", "throughput": 4253.57, "total_tokens": 15828608} {"current_steps": 24255, "total_steps": 38160, "loss": 0.4551, "lr": 0.00035283470957356576, "epoch": 12.712264150943396, "percentage": 63.56, "elapsed_time": "1:02:01", "remaining_time": "0:35:33", "throughput": 4253.49, "total_tokens": 15830880} {"current_steps": 24260, "total_steps": 38160, "loss": 0.4776, "lr": 0.0003526161692118548, "epoch": 12.714884696016771, "percentage": 63.57, "elapsed_time": "1:02:02", "remaining_time": "0:35:32", "throughput": 4253.53, "total_tokens": 15834112} {"current_steps": 24265, "total_steps": 38160, "loss": 0.3232, "lr": 0.0003523976596811597, "epoch": 12.717505241090146, "percentage": 63.59, "elapsed_time": "1:02:03", "remaining_time": "0:35:32", "throughput": 4253.51, "total_tokens": 15836832} {"current_steps": 24270, "total_steps": 38160, "loss": 0.3771, "lr": 0.0003521791810271906, "epoch": 12.720125786163521, "percentage": 63.6, "elapsed_time": "1:02:03", "remaining_time": "0:35:31", "throughput": 4253.52, "total_tokens": 15839840} {"current_steps": 24275, "total_steps": 38160, "loss": 0.4327, "lr": 0.0003519607332956501, "epoch": 12.722746331236896, "percentage": 63.61, "elapsed_time": "1:02:04", "remaining_time": "0:35:30", "throughput": 4253.53, "total_tokens": 15842848} {"current_steps": 24280, "total_steps": 38160, "loss": 0.4981, "lr": 0.0003517423165322353, "epoch": 12.725366876310272, "percentage": 63.63, "elapsed_time": "1:02:05", "remaining_time": "0:35:29", "throughput": 4253.63, "total_tokens": 15846496} {"current_steps": 24285, "total_steps": 38160, "loss": 0.4769, "lr": 0.0003515239307826366, "epoch": 12.727987421383649, "percentage": 63.64, "elapsed_time": "1:02:06", "remaining_time": "0:35:29", "throughput": 4254.01, "total_tokens": 15852832} {"current_steps": 24290, "total_steps": 38160, "loss": 0.4156, "lr": 0.00035130557609253744, "epoch": 12.730607966457024, "percentage": 63.65, "elapsed_time": "1:02:07", "remaining_time": "0:35:28", "throughput": 4254.1, "total_tokens": 15856416} {"current_steps": 24295, "total_steps": 38160, "loss": 0.4808, "lr": 0.00035108725250761566, "epoch": 12.733228511530399, "percentage": 63.67, "elapsed_time": "1:02:07", "remaining_time": "0:35:27", "throughput": 4254.08, "total_tokens": 15859104} {"current_steps": 24300, "total_steps": 38160, "loss": 0.3467, "lr": 0.0003508689600735416, "epoch": 12.735849056603774, "percentage": 63.68, "elapsed_time": "1:02:08", "remaining_time": "0:35:26", "throughput": 4254.05, "total_tokens": 15861792} {"current_steps": 24305, "total_steps": 38160, "loss": 0.5027, "lr": 0.0003506506988359797, "epoch": 12.73846960167715, "percentage": 63.69, "elapsed_time": "1:02:09", "remaining_time": "0:35:25", "throughput": 4254.01, "total_tokens": 15864320} {"current_steps": 24310, "total_steps": 38160, "loss": 0.2949, "lr": 0.0003504324688405878, "epoch": 12.741090146750524, "percentage": 63.71, "elapsed_time": "1:02:09", "remaining_time": "0:35:25", "throughput": 4254.0, "total_tokens": 15867168} {"current_steps": 24315, "total_steps": 38160, "loss": 0.4304, "lr": 0.000350214270133017, "epoch": 12.7437106918239, "percentage": 63.72, "elapsed_time": "1:02:10", "remaining_time": "0:35:24", "throughput": 4253.99, "total_tokens": 15870048} {"current_steps": 24320, "total_steps": 38160, "loss": 0.4234, "lr": 0.00034999610275891204, "epoch": 12.746331236897275, "percentage": 63.73, "elapsed_time": "1:02:11", "remaining_time": "0:35:23", "throughput": 4254.0, "total_tokens": 15873024} {"current_steps": 24325, "total_steps": 38160, "loss": 0.4444, "lr": 0.0003497779667639113, "epoch": 12.74895178197065, "percentage": 63.74, "elapsed_time": "1:02:11", "remaining_time": "0:35:22", "throughput": 4253.96, "total_tokens": 15875648} {"current_steps": 24330, "total_steps": 38160, "loss": 0.3312, "lr": 0.0003495598621936458, "epoch": 12.751572327044025, "percentage": 63.76, "elapsed_time": "1:02:12", "remaining_time": "0:35:21", "throughput": 4253.92, "total_tokens": 15878240} {"current_steps": 24335, "total_steps": 38160, "loss": 0.4918, "lr": 0.00034934178909374084, "epoch": 12.7541928721174, "percentage": 63.77, "elapsed_time": "1:02:13", "remaining_time": "0:35:20", "throughput": 4253.92, "total_tokens": 15881152} {"current_steps": 24340, "total_steps": 38160, "loss": 0.4564, "lr": 0.0003491237475098148, "epoch": 12.756813417190775, "percentage": 63.78, "elapsed_time": "1:02:14", "remaining_time": "0:35:20", "throughput": 4253.97, "total_tokens": 15884384} {"current_steps": 24345, "total_steps": 38160, "loss": 0.5981, "lr": 0.00034890573748747945, "epoch": 12.75943396226415, "percentage": 63.8, "elapsed_time": "1:02:14", "remaining_time": "0:35:19", "throughput": 4253.95, "total_tokens": 15887232} {"current_steps": 24350, "total_steps": 38160, "loss": 0.4067, "lr": 0.00034868775907234017, "epoch": 12.762054507337526, "percentage": 63.81, "elapsed_time": "1:02:15", "remaining_time": "0:35:18", "throughput": 4253.86, "total_tokens": 15889344} {"current_steps": 24355, "total_steps": 38160, "loss": 0.6466, "lr": 0.0003484698123099956, "epoch": 12.764675052410901, "percentage": 63.82, "elapsed_time": "1:02:16", "remaining_time": "0:35:17", "throughput": 4253.92, "total_tokens": 15892704} {"current_steps": 24360, "total_steps": 38160, "loss": 0.6598, "lr": 0.00034825189724603723, "epoch": 12.767295597484276, "percentage": 63.84, "elapsed_time": "1:02:16", "remaining_time": "0:35:16", "throughput": 4253.94, "total_tokens": 15895840} {"current_steps": 24365, "total_steps": 38160, "loss": 0.3946, "lr": 0.0003480340139260509, "epoch": 12.769916142557651, "percentage": 63.85, "elapsed_time": "1:02:17", "remaining_time": "0:35:16", "throughput": 4253.94, "total_tokens": 15898720} {"current_steps": 24370, "total_steps": 38160, "loss": 0.3147, "lr": 0.000347816162395615, "epoch": 12.772536687631026, "percentage": 63.86, "elapsed_time": "1:02:18", "remaining_time": "0:35:15", "throughput": 4253.9, "total_tokens": 15901408} {"current_steps": 24375, "total_steps": 38160, "loss": 0.4335, "lr": 0.00034759834270030185, "epoch": 12.775157232704402, "percentage": 63.88, "elapsed_time": "1:02:18", "remaining_time": "0:35:14", "throughput": 4253.88, "total_tokens": 15904160} {"current_steps": 24380, "total_steps": 38160, "loss": 0.4615, "lr": 0.0003473805548856768, "epoch": 12.777777777777779, "percentage": 63.89, "elapsed_time": "1:02:19", "remaining_time": "0:35:13", "throughput": 4253.93, "total_tokens": 15907488} {"current_steps": 24385, "total_steps": 38160, "loss": 0.3963, "lr": 0.00034716279899729826, "epoch": 12.780398322851154, "percentage": 63.9, "elapsed_time": "1:02:20", "remaining_time": "0:35:12", "throughput": 4253.98, "total_tokens": 15910784} {"current_steps": 24390, "total_steps": 38160, "loss": 0.4673, "lr": 0.00034694507508071864, "epoch": 12.783018867924529, "percentage": 63.92, "elapsed_time": "1:02:20", "remaining_time": "0:35:12", "throughput": 4254.03, "total_tokens": 15914016} {"current_steps": 24395, "total_steps": 38160, "loss": 0.4457, "lr": 0.00034672738318148303, "epoch": 12.785639412997904, "percentage": 63.93, "elapsed_time": "1:02:21", "remaining_time": "0:35:11", "throughput": 4253.99, "total_tokens": 15916672} {"current_steps": 24400, "total_steps": 38160, "loss": 0.4169, "lr": 0.00034650972334513043, "epoch": 12.78825995807128, "percentage": 63.94, "elapsed_time": "1:02:22", "remaining_time": "0:35:10", "throughput": 4254.09, "total_tokens": 15920288} {"current_steps": 24405, "total_steps": 38160, "loss": 0.5569, "lr": 0.00034629209561719244, "epoch": 12.790880503144654, "percentage": 63.95, "elapsed_time": "1:02:23", "remaining_time": "0:35:09", "throughput": 4254.29, "total_tokens": 15924736} {"current_steps": 24410, "total_steps": 38160, "loss": 0.3611, "lr": 0.0003460745000431946, "epoch": 12.79350104821803, "percentage": 63.97, "elapsed_time": "1:02:24", "remaining_time": "0:35:08", "throughput": 4254.4, "total_tokens": 15928544} {"current_steps": 24415, "total_steps": 38160, "loss": 0.3296, "lr": 0.00034585693666865525, "epoch": 12.796121593291405, "percentage": 63.98, "elapsed_time": "1:02:24", "remaining_time": "0:35:08", "throughput": 4254.58, "total_tokens": 15932864} {"current_steps": 24420, "total_steps": 38160, "loss": 0.379, "lr": 0.00034563940553908605, "epoch": 12.79874213836478, "percentage": 63.99, "elapsed_time": "1:02:25", "remaining_time": "0:35:07", "throughput": 4254.68, "total_tokens": 15936512} {"current_steps": 24425, "total_steps": 38160, "loss": 0.452, "lr": 0.00034542190669999216, "epoch": 12.801362683438155, "percentage": 64.01, "elapsed_time": "1:02:26", "remaining_time": "0:35:06", "throughput": 4254.68, "total_tokens": 15939392} {"current_steps": 24430, "total_steps": 38160, "loss": 0.3885, "lr": 0.000345204440196872, "epoch": 12.80398322851153, "percentage": 64.02, "elapsed_time": "1:02:26", "remaining_time": "0:35:05", "throughput": 4254.68, "total_tokens": 15942272} {"current_steps": 24435, "total_steps": 38160, "loss": 0.5127, "lr": 0.00034498700607521693, "epoch": 12.806603773584905, "percentage": 64.03, "elapsed_time": "1:02:27", "remaining_time": "0:35:05", "throughput": 4254.69, "total_tokens": 15945280} {"current_steps": 24440, "total_steps": 38160, "loss": 0.4416, "lr": 0.00034476960438051187, "epoch": 12.80922431865828, "percentage": 64.05, "elapsed_time": "1:02:28", "remaining_time": "0:35:04", "throughput": 4254.76, "total_tokens": 15948704} {"current_steps": 24445, "total_steps": 38160, "loss": 0.3869, "lr": 0.00034455223515823444, "epoch": 12.811844863731656, "percentage": 64.06, "elapsed_time": "1:02:29", "remaining_time": "0:35:03", "throughput": 4254.86, "total_tokens": 15952320} {"current_steps": 24450, "total_steps": 38160, "loss": 0.3875, "lr": 0.0003443348984538559, "epoch": 12.814465408805031, "percentage": 64.07, "elapsed_time": "1:02:30", "remaining_time": "0:35:02", "throughput": 4255.04, "total_tokens": 15956576} {"current_steps": 24455, "total_steps": 38160, "loss": 0.3814, "lr": 0.0003441175943128407, "epoch": 12.817085953878406, "percentage": 64.09, "elapsed_time": "1:02:30", "remaining_time": "0:35:01", "throughput": 4255.02, "total_tokens": 15959232} {"current_steps": 24460, "total_steps": 38160, "loss": 0.4037, "lr": 0.0003439003227806464, "epoch": 12.819706498951781, "percentage": 64.1, "elapsed_time": "1:02:31", "remaining_time": "0:35:01", "throughput": 4255.1, "total_tokens": 15962720} {"current_steps": 24465, "total_steps": 38160, "loss": 0.3838, "lr": 0.00034368308390272386, "epoch": 12.822327044025156, "percentage": 64.11, "elapsed_time": "1:02:32", "remaining_time": "0:35:00", "throughput": 4255.17, "total_tokens": 15966240} {"current_steps": 24470, "total_steps": 38160, "loss": 0.5359, "lr": 0.0003434658777245167, "epoch": 12.824947589098532, "percentage": 64.12, "elapsed_time": "1:02:32", "remaining_time": "0:34:59", "throughput": 4255.13, "total_tokens": 15968800} {"current_steps": 24475, "total_steps": 38160, "loss": 0.4668, "lr": 0.000343248704291462, "epoch": 12.827568134171909, "percentage": 64.14, "elapsed_time": "1:02:33", "remaining_time": "0:34:58", "throughput": 4255.12, "total_tokens": 15971680} {"current_steps": 24480, "total_steps": 38160, "loss": 0.5136, "lr": 0.00034303156364899016, "epoch": 12.830188679245284, "percentage": 64.15, "elapsed_time": "1:02:34", "remaining_time": "0:34:58", "throughput": 4255.24, "total_tokens": 15975552} {"current_steps": 24485, "total_steps": 38160, "loss": 0.4632, "lr": 0.00034281445584252425, "epoch": 12.832809224318659, "percentage": 64.16, "elapsed_time": "1:02:35", "remaining_time": "0:34:57", "throughput": 4255.28, "total_tokens": 15978656} {"current_steps": 24490, "total_steps": 38160, "loss": 0.4688, "lr": 0.00034259738091748103, "epoch": 12.835429769392034, "percentage": 64.18, "elapsed_time": "1:02:35", "remaining_time": "0:34:56", "throughput": 4255.32, "total_tokens": 15981856} {"current_steps": 24495, "total_steps": 38160, "loss": 0.5216, "lr": 0.00034238033891927013, "epoch": 12.83805031446541, "percentage": 64.19, "elapsed_time": "1:02:36", "remaining_time": "0:34:55", "throughput": 4255.33, "total_tokens": 15984736} {"current_steps": 24500, "total_steps": 38160, "loss": 0.3733, "lr": 0.00034216332989329387, "epoch": 12.840670859538784, "percentage": 64.2, "elapsed_time": "1:02:37", "remaining_time": "0:34:54", "throughput": 4255.3, "total_tokens": 15987424} {"current_steps": 24505, "total_steps": 38160, "loss": 0.6837, "lr": 0.00034194635388494835, "epoch": 12.84329140461216, "percentage": 64.22, "elapsed_time": "1:02:37", "remaining_time": "0:34:54", "throughput": 4255.43, "total_tokens": 15991296} {"current_steps": 24510, "total_steps": 38160, "loss": 0.5857, "lr": 0.00034172941093962237, "epoch": 12.845911949685535, "percentage": 64.23, "elapsed_time": "1:02:38", "remaining_time": "0:34:53", "throughput": 4255.38, "total_tokens": 15993760} {"current_steps": 24515, "total_steps": 38160, "loss": 0.3421, "lr": 0.00034151250110269805, "epoch": 12.84853249475891, "percentage": 64.24, "elapsed_time": "1:02:39", "remaining_time": "0:34:52", "throughput": 4255.34, "total_tokens": 15996288} {"current_steps": 24520, "total_steps": 38160, "loss": 0.4882, "lr": 0.00034129562441955044, "epoch": 12.851153039832285, "percentage": 64.26, "elapsed_time": "1:02:39", "remaining_time": "0:34:51", "throughput": 4255.37, "total_tokens": 15999328} {"current_steps": 24525, "total_steps": 38160, "loss": 0.4102, "lr": 0.00034107878093554765, "epoch": 12.85377358490566, "percentage": 64.27, "elapsed_time": "1:02:40", "remaining_time": "0:34:50", "throughput": 4255.39, "total_tokens": 16002336} {"current_steps": 24530, "total_steps": 38160, "loss": 0.2993, "lr": 0.00034086197069605064, "epoch": 12.856394129979035, "percentage": 64.28, "elapsed_time": "1:02:41", "remaining_time": "0:34:49", "throughput": 4255.42, "total_tokens": 16005440} {"current_steps": 24535, "total_steps": 38160, "loss": 0.5422, "lr": 0.0003406451937464139, "epoch": 12.85901467505241, "percentage": 64.3, "elapsed_time": "1:02:42", "remaining_time": "0:34:49", "throughput": 4255.55, "total_tokens": 16009376} {"current_steps": 24540, "total_steps": 38160, "loss": 0.4176, "lr": 0.0003404284501319845, "epoch": 12.861635220125786, "percentage": 64.31, "elapsed_time": "1:02:42", "remaining_time": "0:34:48", "throughput": 4255.6, "total_tokens": 16012768} {"current_steps": 24545, "total_steps": 38160, "loss": 0.4069, "lr": 0.00034021173989810306, "epoch": 12.864255765199161, "percentage": 64.32, "elapsed_time": "1:02:43", "remaining_time": "0:34:47", "throughput": 4255.54, "total_tokens": 16015136} {"current_steps": 24550, "total_steps": 38160, "loss": 0.4653, "lr": 0.0003399950630901025, "epoch": 12.866876310272536, "percentage": 64.33, "elapsed_time": "1:02:44", "remaining_time": "0:34:46", "throughput": 4255.63, "total_tokens": 16018688} {"current_steps": 24555, "total_steps": 38160, "loss": 0.6755, "lr": 0.0003397784197533095, "epoch": 12.869496855345911, "percentage": 64.35, "elapsed_time": "1:02:44", "remaining_time": "0:34:45", "throughput": 4255.62, "total_tokens": 16021504} {"current_steps": 24560, "total_steps": 38160, "loss": 0.4244, "lr": 0.0003395618099330431, "epoch": 12.872117400419286, "percentage": 64.36, "elapsed_time": "1:02:45", "remaining_time": "0:34:45", "throughput": 4255.65, "total_tokens": 16024736} {"current_steps": 24565, "total_steps": 38160, "loss": 0.4307, "lr": 0.0003393452336746156, "epoch": 12.874737945492662, "percentage": 64.37, "elapsed_time": "1:02:46", "remaining_time": "0:34:44", "throughput": 4255.62, "total_tokens": 16027296} {"current_steps": 24570, "total_steps": 38160, "loss": 0.3542, "lr": 0.00033912869102333237, "epoch": 12.877358490566039, "percentage": 64.39, "elapsed_time": "1:02:46", "remaining_time": "0:34:43", "throughput": 4255.58, "total_tokens": 16029920} {"current_steps": 24575, "total_steps": 38160, "loss": 0.373, "lr": 0.00033891218202449164, "epoch": 12.879979035639414, "percentage": 64.4, "elapsed_time": "1:02:47", "remaining_time": "0:34:42", "throughput": 4255.57, "total_tokens": 16032672} {"current_steps": 24580, "total_steps": 38160, "loss": 0.3284, "lr": 0.00033869570672338486, "epoch": 12.882599580712789, "percentage": 64.41, "elapsed_time": "1:02:48", "remaining_time": "0:34:41", "throughput": 4255.51, "total_tokens": 16035040} {"current_steps": 24585, "total_steps": 38160, "loss": 0.3766, "lr": 0.00033847926516529574, "epoch": 12.885220125786164, "percentage": 64.43, "elapsed_time": "1:02:49", "remaining_time": "0:34:41", "throughput": 4255.77, "total_tokens": 16040064} {"current_steps": 24590, "total_steps": 38160, "loss": 0.4138, "lr": 0.0003382628573955018, "epoch": 12.88784067085954, "percentage": 64.44, "elapsed_time": "1:02:49", "remaining_time": "0:34:40", "throughput": 4255.75, "total_tokens": 16042784} {"current_steps": 24595, "total_steps": 38160, "loss": 0.3703, "lr": 0.00033804648345927267, "epoch": 12.890461215932914, "percentage": 64.45, "elapsed_time": "1:02:50", "remaining_time": "0:34:39", "throughput": 4255.79, "total_tokens": 16045952} {"current_steps": 24600, "total_steps": 38160, "loss": 0.4401, "lr": 0.00033783014340187166, "epoch": 12.89308176100629, "percentage": 64.47, "elapsed_time": "1:02:51", "remaining_time": "0:34:38", "throughput": 4255.84, "total_tokens": 16049248} {"current_steps": 24605, "total_steps": 38160, "loss": 0.5119, "lr": 0.0003376138372685545, "epoch": 12.895702306079665, "percentage": 64.48, "elapsed_time": "1:02:51", "remaining_time": "0:34:37", "throughput": 4255.9, "total_tokens": 16052576} {"current_steps": 24610, "total_steps": 38160, "loss": 0.6587, "lr": 0.00033739756510457015, "epoch": 12.89832285115304, "percentage": 64.49, "elapsed_time": "1:02:52", "remaining_time": "0:34:37", "throughput": 4255.96, "total_tokens": 16055936} {"current_steps": 24615, "total_steps": 38160, "loss": 0.5539, "lr": 0.00033718132695516003, "epoch": 12.900943396226415, "percentage": 64.5, "elapsed_time": "1:02:53", "remaining_time": "0:34:36", "throughput": 4255.88, "total_tokens": 16058176} {"current_steps": 24620, "total_steps": 38160, "loss": 0.4822, "lr": 0.00033696512286555865, "epoch": 12.90356394129979, "percentage": 64.52, "elapsed_time": "1:02:53", "remaining_time": "0:34:35", "throughput": 4255.94, "total_tokens": 16061568} {"current_steps": 24625, "total_steps": 38160, "loss": 0.5082, "lr": 0.0003367489528809936, "epoch": 12.906184486373165, "percentage": 64.53, "elapsed_time": "1:02:54", "remaining_time": "0:34:34", "throughput": 4256.06, "total_tokens": 16065536} {"current_steps": 24630, "total_steps": 38160, "loss": 0.4811, "lr": 0.00033653281704668515, "epoch": 12.90880503144654, "percentage": 64.54, "elapsed_time": "1:02:55", "remaining_time": "0:34:33", "throughput": 4256.03, "total_tokens": 16068192} {"current_steps": 24635, "total_steps": 38160, "loss": 0.4642, "lr": 0.0003363167154078465, "epoch": 12.911425576519916, "percentage": 64.56, "elapsed_time": "1:02:56", "remaining_time": "0:34:33", "throughput": 4256.02, "total_tokens": 16071008} {"current_steps": 24640, "total_steps": 38160, "loss": 0.4206, "lr": 0.0003361006480096837, "epoch": 12.914046121593291, "percentage": 64.57, "elapsed_time": "1:02:56", "remaining_time": "0:34:32", "throughput": 4256.1, "total_tokens": 16074688} {"current_steps": 24645, "total_steps": 38160, "loss": 0.3964, "lr": 0.0003358846148973953, "epoch": 12.916666666666666, "percentage": 64.58, "elapsed_time": "1:02:57", "remaining_time": "0:34:31", "throughput": 4256.02, "total_tokens": 16076928} {"current_steps": 24650, "total_steps": 38160, "loss": 0.5312, "lr": 0.0003356686161161732, "epoch": 12.919287211740041, "percentage": 64.6, "elapsed_time": "1:02:58", "remaining_time": "0:34:30", "throughput": 4256.04, "total_tokens": 16079904} {"current_steps": 24655, "total_steps": 38160, "loss": 0.3497, "lr": 0.00033545265171120163, "epoch": 12.921907756813416, "percentage": 64.61, "elapsed_time": "1:02:58", "remaining_time": "0:34:29", "throughput": 4256.08, "total_tokens": 16083168} {"current_steps": 24660, "total_steps": 38160, "loss": 0.5554, "lr": 0.0003352367217276582, "epoch": 12.924528301886792, "percentage": 64.62, "elapsed_time": "1:02:59", "remaining_time": "0:34:29", "throughput": 4256.13, "total_tokens": 16086592} {"current_steps": 24665, "total_steps": 38160, "loss": 0.4836, "lr": 0.0003350208262107131, "epoch": 12.927148846960169, "percentage": 64.64, "elapsed_time": "1:03:00", "remaining_time": "0:34:28", "throughput": 4256.09, "total_tokens": 16089088} {"current_steps": 24670, "total_steps": 38160, "loss": 0.7884, "lr": 0.00033480496520552874, "epoch": 12.929769392033544, "percentage": 64.65, "elapsed_time": "1:03:00", "remaining_time": "0:34:27", "throughput": 4256.08, "total_tokens": 16091936} {"current_steps": 24675, "total_steps": 38160, "loss": 0.4347, "lr": 0.00033458913875726093, "epoch": 12.932389937106919, "percentage": 64.66, "elapsed_time": "1:03:01", "remaining_time": "0:34:26", "throughput": 4256.01, "total_tokens": 16094336} {"current_steps": 24680, "total_steps": 38160, "loss": 0.4265, "lr": 0.00033437334691105837, "epoch": 12.935010482180294, "percentage": 64.68, "elapsed_time": "1:03:02", "remaining_time": "0:34:25", "throughput": 4256.14, "total_tokens": 16098304} {"current_steps": 24685, "total_steps": 38160, "loss": 0.4267, "lr": 0.0003341575897120619, "epoch": 12.93763102725367, "percentage": 64.69, "elapsed_time": "1:03:03", "remaining_time": "0:34:25", "throughput": 4256.18, "total_tokens": 16101632} {"current_steps": 24690, "total_steps": 38160, "loss": 0.4002, "lr": 0.00033394186720540577, "epoch": 12.940251572327044, "percentage": 64.7, "elapsed_time": "1:03:03", "remaining_time": "0:34:24", "throughput": 4256.25, "total_tokens": 16105024} {"current_steps": 24695, "total_steps": 38160, "loss": 0.3602, "lr": 0.00033372617943621665, "epoch": 12.94287211740042, "percentage": 64.71, "elapsed_time": "1:03:04", "remaining_time": "0:34:23", "throughput": 4256.27, "total_tokens": 16108096} {"current_steps": 24700, "total_steps": 38160, "loss": 0.4372, "lr": 0.00033351052644961353, "epoch": 12.945492662473795, "percentage": 64.73, "elapsed_time": "1:03:05", "remaining_time": "0:34:22", "throughput": 4256.36, "total_tokens": 16111648} {"current_steps": 24705, "total_steps": 38160, "loss": 0.4999, "lr": 0.00033329490829070907, "epoch": 12.94811320754717, "percentage": 64.74, "elapsed_time": "1:03:06", "remaining_time": "0:34:21", "throughput": 4256.38, "total_tokens": 16114752} {"current_steps": 24710, "total_steps": 38160, "loss": 0.5385, "lr": 0.0003330793250046078, "epoch": 12.950733752620545, "percentage": 64.75, "elapsed_time": "1:03:06", "remaining_time": "0:34:21", "throughput": 4256.62, "total_tokens": 16119616} {"current_steps": 24715, "total_steps": 38160, "loss": 0.468, "lr": 0.0003328637766364075, "epoch": 12.95335429769392, "percentage": 64.77, "elapsed_time": "1:03:07", "remaining_time": "0:34:20", "throughput": 4256.71, "total_tokens": 16123232} {"current_steps": 24720, "total_steps": 38160, "loss": 0.464, "lr": 0.00033264826323119824, "epoch": 12.955974842767295, "percentage": 64.78, "elapsed_time": "1:03:08", "remaining_time": "0:34:19", "throughput": 4256.89, "total_tokens": 16127552} {"current_steps": 24725, "total_steps": 38160, "loss": 0.4159, "lr": 0.00033243278483406326, "epoch": 12.95859538784067, "percentage": 64.79, "elapsed_time": "1:03:09", "remaining_time": "0:34:18", "throughput": 4256.88, "total_tokens": 16130368} {"current_steps": 24730, "total_steps": 38160, "loss": 0.4007, "lr": 0.00033221734149007785, "epoch": 12.961215932914046, "percentage": 64.81, "elapsed_time": "1:03:10", "remaining_time": "0:34:18", "throughput": 4257.0, "total_tokens": 16134208} {"current_steps": 24735, "total_steps": 38160, "loss": 0.4159, "lr": 0.0003320019332443104, "epoch": 12.963836477987421, "percentage": 64.82, "elapsed_time": "1:03:10", "remaining_time": "0:34:17", "throughput": 4257.01, "total_tokens": 16137120} {"current_steps": 24740, "total_steps": 38160, "loss": 0.4989, "lr": 0.00033178656014182185, "epoch": 12.966457023060796, "percentage": 64.83, "elapsed_time": "1:03:11", "remaining_time": "0:34:16", "throughput": 4257.08, "total_tokens": 16140576} {"current_steps": 24745, "total_steps": 38160, "loss": 0.4891, "lr": 0.00033157122222766597, "epoch": 12.969077568134171, "percentage": 64.85, "elapsed_time": "1:03:12", "remaining_time": "0:34:15", "throughput": 4257.12, "total_tokens": 16143808} {"current_steps": 24750, "total_steps": 38160, "loss": 0.5541, "lr": 0.0003313559195468889, "epoch": 12.971698113207546, "percentage": 64.86, "elapsed_time": "1:03:12", "remaining_time": "0:34:15", "throughput": 4257.18, "total_tokens": 16147136} {"current_steps": 24755, "total_steps": 38160, "loss": 0.4189, "lr": 0.0003311406521445293, "epoch": 12.974318658280922, "percentage": 64.87, "elapsed_time": "1:03:13", "remaining_time": "0:34:14", "throughput": 4257.2, "total_tokens": 16150272} {"current_steps": 24760, "total_steps": 38160, "loss": 0.506, "lr": 0.000330925420065619, "epoch": 12.976939203354299, "percentage": 64.88, "elapsed_time": "1:03:14", "remaining_time": "0:34:13", "throughput": 4257.3, "total_tokens": 16153920} {"current_steps": 24765, "total_steps": 38160, "loss": 0.3731, "lr": 0.0003307102233551817, "epoch": 12.979559748427674, "percentage": 64.9, "elapsed_time": "1:03:15", "remaining_time": "0:34:12", "throughput": 4257.36, "total_tokens": 16157280} {"current_steps": 24770, "total_steps": 38160, "loss": 0.4751, "lr": 0.0003304950620582344, "epoch": 12.982180293501049, "percentage": 64.91, "elapsed_time": "1:03:15", "remaining_time": "0:34:11", "throughput": 4257.47, "total_tokens": 16161056} {"current_steps": 24775, "total_steps": 38160, "loss": 0.4683, "lr": 0.0003302799362197864, "epoch": 12.984800838574424, "percentage": 64.92, "elapsed_time": "1:03:16", "remaining_time": "0:34:11", "throughput": 4257.46, "total_tokens": 16163776} {"current_steps": 24780, "total_steps": 38160, "loss": 0.3902, "lr": 0.00033006484588483947, "epoch": 12.9874213836478, "percentage": 64.94, "elapsed_time": "1:03:17", "remaining_time": "0:34:10", "throughput": 4257.4, "total_tokens": 16166176} {"current_steps": 24785, "total_steps": 38160, "loss": 0.3613, "lr": 0.00032984979109838803, "epoch": 12.990041928721174, "percentage": 64.95, "elapsed_time": "1:03:17", "remaining_time": "0:34:09", "throughput": 4257.35, "total_tokens": 16168704} {"current_steps": 24790, "total_steps": 38160, "loss": 0.4408, "lr": 0.000329634771905419, "epoch": 12.99266247379455, "percentage": 64.96, "elapsed_time": "1:03:18", "remaining_time": "0:34:08", "throughput": 4257.35, "total_tokens": 16171584} {"current_steps": 24795, "total_steps": 38160, "loss": 0.5501, "lr": 0.0003294197883509122, "epoch": 12.995283018867925, "percentage": 64.98, "elapsed_time": "1:03:19", "remaining_time": "0:34:07", "throughput": 4257.37, "total_tokens": 16174656} {"current_steps": 24800, "total_steps": 38160, "loss": 0.5904, "lr": 0.00032920484047983947, "epoch": 12.9979035639413, "percentage": 64.99, "elapsed_time": "1:03:19", "remaining_time": "0:34:07", "throughput": 4257.35, "total_tokens": 16177344} {"current_steps": 24804, "total_steps": 38160, "eval_loss": 0.45868632197380066, "epoch": 13.0, "percentage": 65.0, "elapsed_time": "1:03:34", "remaining_time": "0:34:13", "throughput": 4242.04, "total_tokens": 16179624} {"current_steps": 24805, "total_steps": 38160, "loss": 0.4989, "lr": 0.0003289899283371657, "epoch": 13.000524109014675, "percentage": 65.0, "elapsed_time": "1:03:36", "remaining_time": "0:34:14", "throughput": 4239.78, "total_tokens": 16180040} {"current_steps": 24810, "total_steps": 38160, "loss": 0.4634, "lr": 0.00032877505196784795, "epoch": 13.00314465408805, "percentage": 65.02, "elapsed_time": "1:03:36", "remaining_time": "0:34:13", "throughput": 4239.81, "total_tokens": 16183176} {"current_steps": 24815, "total_steps": 38160, "loss": 0.4018, "lr": 0.0003285602114168358, "epoch": 13.005765199161425, "percentage": 65.03, "elapsed_time": "1:03:37", "remaining_time": "0:34:13", "throughput": 4239.79, "total_tokens": 16185928} {"current_steps": 24820, "total_steps": 38160, "loss": 0.5085, "lr": 0.00032834540672907144, "epoch": 13.0083857442348, "percentage": 65.04, "elapsed_time": "1:03:38", "remaining_time": "0:34:12", "throughput": 4239.83, "total_tokens": 16189160} {"current_steps": 24825, "total_steps": 38160, "loss": 0.2896, "lr": 0.00032813063794948983, "epoch": 13.011006289308176, "percentage": 65.06, "elapsed_time": "1:03:39", "remaining_time": "0:34:11", "throughput": 4239.84, "total_tokens": 16192392} {"current_steps": 24830, "total_steps": 38160, "loss": 0.4511, "lr": 0.00032791590512301784, "epoch": 13.01362683438155, "percentage": 65.07, "elapsed_time": "1:03:39", "remaining_time": "0:34:10", "throughput": 4239.9, "total_tokens": 16195752} {"current_steps": 24835, "total_steps": 38160, "loss": 0.3863, "lr": 0.00032770120829457534, "epoch": 13.016247379454926, "percentage": 65.08, "elapsed_time": "1:03:40", "remaining_time": "0:34:09", "throughput": 4239.96, "total_tokens": 16199176} {"current_steps": 24840, "total_steps": 38160, "loss": 0.5443, "lr": 0.00032748654750907447, "epoch": 13.018867924528301, "percentage": 65.09, "elapsed_time": "1:03:41", "remaining_time": "0:34:09", "throughput": 4239.92, "total_tokens": 16201768} {"current_steps": 24845, "total_steps": 38160, "loss": 0.391, "lr": 0.0003272719228114196, "epoch": 13.021488469601676, "percentage": 65.11, "elapsed_time": "1:03:41", "remaining_time": "0:34:08", "throughput": 4239.94, "total_tokens": 16204680} {"current_steps": 24850, "total_steps": 38160, "loss": 0.4469, "lr": 0.0003270573342465079, "epoch": 13.024109014675052, "percentage": 65.12, "elapsed_time": "1:03:42", "remaining_time": "0:34:07", "throughput": 4240.02, "total_tokens": 16208264} {"current_steps": 24855, "total_steps": 38160, "loss": 0.3676, "lr": 0.00032684278185922877, "epoch": 13.026729559748428, "percentage": 65.13, "elapsed_time": "1:03:43", "remaining_time": "0:34:06", "throughput": 4239.95, "total_tokens": 16210536} {"current_steps": 24860, "total_steps": 38160, "loss": 0.5692, "lr": 0.0003266282656944643, "epoch": 13.029350104821804, "percentage": 65.15, "elapsed_time": "1:03:44", "remaining_time": "0:34:05", "throughput": 4240.05, "total_tokens": 16214376} {"current_steps": 24865, "total_steps": 38160, "loss": 0.5512, "lr": 0.0003264137857970888, "epoch": 13.031970649895179, "percentage": 65.16, "elapsed_time": "1:03:44", "remaining_time": "0:34:05", "throughput": 4240.07, "total_tokens": 16217416} {"current_steps": 24870, "total_steps": 38160, "loss": 0.472, "lr": 0.0003261993422119688, "epoch": 13.034591194968554, "percentage": 65.17, "elapsed_time": "1:03:45", "remaining_time": "0:34:04", "throughput": 4240.09, "total_tokens": 16220584} {"current_steps": 24875, "total_steps": 38160, "loss": 0.3496, "lr": 0.00032598493498396365, "epoch": 13.03721174004193, "percentage": 65.19, "elapsed_time": "1:03:46", "remaining_time": "0:34:03", "throughput": 4240.16, "total_tokens": 16224040} {"current_steps": 24880, "total_steps": 38160, "loss": 0.4479, "lr": 0.0003257705641579247, "epoch": 13.039832285115304, "percentage": 65.2, "elapsed_time": "1:03:46", "remaining_time": "0:34:02", "throughput": 4240.17, "total_tokens": 16227016} {"current_steps": 24885, "total_steps": 38160, "loss": 0.4787, "lr": 0.00032555622977869614, "epoch": 13.04245283018868, "percentage": 65.21, "elapsed_time": "1:03:47", "remaining_time": "0:34:01", "throughput": 4240.15, "total_tokens": 16229768} {"current_steps": 24890, "total_steps": 38160, "loss": 0.3398, "lr": 0.00032534193189111407, "epoch": 13.045073375262055, "percentage": 65.23, "elapsed_time": "1:03:48", "remaining_time": "0:34:01", "throughput": 4240.22, "total_tokens": 16233224} {"current_steps": 24895, "total_steps": 38160, "loss": 0.3309, "lr": 0.0003251276705400074, "epoch": 13.04769392033543, "percentage": 65.24, "elapsed_time": "1:03:49", "remaining_time": "0:34:00", "throughput": 4240.24, "total_tokens": 16236264} {"current_steps": 24900, "total_steps": 38160, "loss": 0.3948, "lr": 0.0003249134457701968, "epoch": 13.050314465408805, "percentage": 65.25, "elapsed_time": "1:03:49", "remaining_time": "0:33:59", "throughput": 4240.22, "total_tokens": 16238984} {"current_steps": 24905, "total_steps": 38160, "loss": 0.3767, "lr": 0.000324699257626496, "epoch": 13.05293501048218, "percentage": 65.26, "elapsed_time": "1:03:50", "remaining_time": "0:33:58", "throughput": 4240.18, "total_tokens": 16241608} {"current_steps": 24910, "total_steps": 38160, "loss": 0.4519, "lr": 0.00032448510615371045, "epoch": 13.055555555555555, "percentage": 65.28, "elapsed_time": "1:03:51", "remaining_time": "0:33:57", "throughput": 4240.16, "total_tokens": 16244328} {"current_steps": 24915, "total_steps": 38160, "loss": 0.484, "lr": 0.0003242709913966384, "epoch": 13.05817610062893, "percentage": 65.29, "elapsed_time": "1:03:51", "remaining_time": "0:33:57", "throughput": 4240.24, "total_tokens": 16247912} {"current_steps": 24920, "total_steps": 38160, "loss": 0.4899, "lr": 0.00032405691340007, "epoch": 13.060796645702306, "percentage": 65.3, "elapsed_time": "1:03:52", "remaining_time": "0:33:56", "throughput": 4240.25, "total_tokens": 16250920} {"current_steps": 24925, "total_steps": 38160, "loss": 0.4772, "lr": 0.0003238428722087884, "epoch": 13.06341719077568, "percentage": 65.32, "elapsed_time": "1:03:53", "remaining_time": "0:33:55", "throughput": 4240.35, "total_tokens": 16254728} {"current_steps": 24930, "total_steps": 38160, "loss": 0.3624, "lr": 0.00032362886786756797, "epoch": 13.066037735849056, "percentage": 65.33, "elapsed_time": "1:03:54", "remaining_time": "0:33:54", "throughput": 4240.35, "total_tokens": 16257640} {"current_steps": 24935, "total_steps": 38160, "loss": 0.5078, "lr": 0.00032341490042117615, "epoch": 13.068658280922431, "percentage": 65.34, "elapsed_time": "1:03:54", "remaining_time": "0:33:53", "throughput": 4240.38, "total_tokens": 16260808} {"current_steps": 24940, "total_steps": 38160, "loss": 0.3766, "lr": 0.00032320096991437277, "epoch": 13.071278825995806, "percentage": 65.36, "elapsed_time": "1:03:55", "remaining_time": "0:33:53", "throughput": 4240.45, "total_tokens": 16264264} {"current_steps": 24945, "total_steps": 38160, "loss": 0.4104, "lr": 0.0003229870763919093, "epoch": 13.073899371069182, "percentage": 65.37, "elapsed_time": "1:03:56", "remaining_time": "0:33:52", "throughput": 4240.49, "total_tokens": 16267528} {"current_steps": 24950, "total_steps": 38160, "loss": 0.5571, "lr": 0.00032277321989853015, "epoch": 13.076519916142558, "percentage": 65.38, "elapsed_time": "1:03:56", "remaining_time": "0:33:51", "throughput": 4240.46, "total_tokens": 16270088} {"current_steps": 24955, "total_steps": 38160, "loss": 0.5233, "lr": 0.00032255940047897137, "epoch": 13.079140461215934, "percentage": 65.4, "elapsed_time": "1:03:57", "remaining_time": "0:33:50", "throughput": 4240.49, "total_tokens": 16273320} {"current_steps": 24960, "total_steps": 38160, "loss": 0.4398, "lr": 0.0003223456181779616, "epoch": 13.081761006289309, "percentage": 65.41, "elapsed_time": "1:03:58", "remaining_time": "0:33:49", "throughput": 4240.48, "total_tokens": 16276232} {"current_steps": 24965, "total_steps": 38160, "loss": 0.5193, "lr": 0.0003221318730402218, "epoch": 13.084381551362684, "percentage": 65.42, "elapsed_time": "1:03:59", "remaining_time": "0:33:49", "throughput": 4240.49, "total_tokens": 16279272} {"current_steps": 24970, "total_steps": 38160, "loss": 0.4098, "lr": 0.00032191816511046483, "epoch": 13.08700209643606, "percentage": 65.44, "elapsed_time": "1:03:59", "remaining_time": "0:33:48", "throughput": 4240.49, "total_tokens": 16282024} {"current_steps": 24975, "total_steps": 38160, "loss": 0.4231, "lr": 0.0003217044944333961, "epoch": 13.089622641509434, "percentage": 65.45, "elapsed_time": "1:04:00", "remaining_time": "0:33:47", "throughput": 4240.46, "total_tokens": 16284808} {"current_steps": 24980, "total_steps": 38160, "loss": 0.64, "lr": 0.00032149086105371315, "epoch": 13.09224318658281, "percentage": 65.46, "elapsed_time": "1:04:01", "remaining_time": "0:33:46", "throughput": 4240.52, "total_tokens": 16288200} {"current_steps": 24985, "total_steps": 38160, "loss": 0.4141, "lr": 0.00032127726501610554, "epoch": 13.094863731656185, "percentage": 65.47, "elapsed_time": "1:04:01", "remaining_time": "0:33:45", "throughput": 4240.53, "total_tokens": 16291176} {"current_steps": 24990, "total_steps": 38160, "loss": 0.4835, "lr": 0.00032106370636525493, "epoch": 13.09748427672956, "percentage": 65.49, "elapsed_time": "1:04:02", "remaining_time": "0:33:45", "throughput": 4240.51, "total_tokens": 16293896} {"current_steps": 24995, "total_steps": 38160, "loss": 0.3679, "lr": 0.00032085018514583564, "epoch": 13.100104821802935, "percentage": 65.5, "elapsed_time": "1:04:03", "remaining_time": "0:33:44", "throughput": 4240.57, "total_tokens": 16297192} {"current_steps": 25000, "total_steps": 38160, "loss": 0.493, "lr": 0.00032063670140251366, "epoch": 13.10272536687631, "percentage": 65.51, "elapsed_time": "1:04:03", "remaining_time": "0:33:43", "throughput": 4240.64, "total_tokens": 16300680} {"current_steps": 25005, "total_steps": 38160, "loss": 0.2395, "lr": 0.0003204232551799476, "epoch": 13.105345911949685, "percentage": 65.53, "elapsed_time": "1:04:04", "remaining_time": "0:33:42", "throughput": 4240.58, "total_tokens": 16303080} {"current_steps": 25010, "total_steps": 38160, "loss": 0.469, "lr": 0.00032020984652278797, "epoch": 13.10796645702306, "percentage": 65.54, "elapsed_time": "1:04:05", "remaining_time": "0:33:41", "throughput": 4240.49, "total_tokens": 16305224} {"current_steps": 25015, "total_steps": 38160, "loss": 0.5494, "lr": 0.000319996475475677, "epoch": 13.110587002096436, "percentage": 65.55, "elapsed_time": "1:04:05", "remaining_time": "0:33:40", "throughput": 4240.51, "total_tokens": 16308168} {"current_steps": 25020, "total_steps": 38160, "loss": 0.4656, "lr": 0.0003197831420832499, "epoch": 13.11320754716981, "percentage": 65.57, "elapsed_time": "1:04:06", "remaining_time": "0:33:40", "throughput": 4240.63, "total_tokens": 16312072} {"current_steps": 25025, "total_steps": 38160, "loss": 0.4813, "lr": 0.0003195698463901334, "epoch": 13.115828092243186, "percentage": 65.58, "elapsed_time": "1:04:07", "remaining_time": "0:33:39", "throughput": 4240.66, "total_tokens": 16315112} {"current_steps": 25030, "total_steps": 38160, "loss": 0.5548, "lr": 0.0003193565884409466, "epoch": 13.118448637316561, "percentage": 65.59, "elapsed_time": "1:04:07", "remaining_time": "0:33:38", "throughput": 4240.63, "total_tokens": 16317704} {"current_steps": 25035, "total_steps": 38160, "loss": 0.4347, "lr": 0.0003191433682803008, "epoch": 13.121069182389936, "percentage": 65.61, "elapsed_time": "1:04:08", "remaining_time": "0:33:37", "throughput": 4240.71, "total_tokens": 16321288} {"current_steps": 25040, "total_steps": 38160, "loss": 0.322, "lr": 0.00031893018595279877, "epoch": 13.123689727463312, "percentage": 65.62, "elapsed_time": "1:04:09", "remaining_time": "0:33:36", "throughput": 4240.75, "total_tokens": 16324360} {"current_steps": 25045, "total_steps": 38160, "loss": 0.3643, "lr": 0.00031871704150303624, "epoch": 13.126310272536688, "percentage": 65.63, "elapsed_time": "1:04:10", "remaining_time": "0:33:36", "throughput": 4240.82, "total_tokens": 16327784} {"current_steps": 25050, "total_steps": 38160, "loss": 0.5527, "lr": 0.00031850393497560034, "epoch": 13.128930817610064, "percentage": 65.64, "elapsed_time": "1:04:10", "remaining_time": "0:33:35", "throughput": 4240.97, "total_tokens": 16331848} {"current_steps": 25055, "total_steps": 38160, "loss": 0.4775, "lr": 0.00031829086641507054, "epoch": 13.131551362683439, "percentage": 65.66, "elapsed_time": "1:04:11", "remaining_time": "0:33:34", "throughput": 4241.08, "total_tokens": 16335592} {"current_steps": 25060, "total_steps": 38160, "loss": 0.5506, "lr": 0.00031807783586601865, "epoch": 13.134171907756814, "percentage": 65.67, "elapsed_time": "1:04:12", "remaining_time": "0:33:33", "throughput": 4241.29, "total_tokens": 16340200} {"current_steps": 25065, "total_steps": 38160, "loss": 0.4837, "lr": 0.00031786484337300805, "epoch": 13.13679245283019, "percentage": 65.68, "elapsed_time": "1:04:13", "remaining_time": "0:33:33", "throughput": 4241.29, "total_tokens": 16343208} {"current_steps": 25070, "total_steps": 38160, "loss": 0.3508, "lr": 0.0003176518889805941, "epoch": 13.139412997903564, "percentage": 65.7, "elapsed_time": "1:04:14", "remaining_time": "0:33:32", "throughput": 4241.3, "total_tokens": 16346088} {"current_steps": 25075, "total_steps": 38160, "loss": 0.4582, "lr": 0.0003174389727333248, "epoch": 13.14203354297694, "percentage": 65.71, "elapsed_time": "1:04:14", "remaining_time": "0:33:31", "throughput": 4241.39, "total_tokens": 16349768} {"current_steps": 25080, "total_steps": 38160, "loss": 0.44, "lr": 0.00031722609467573946, "epoch": 13.144654088050315, "percentage": 65.72, "elapsed_time": "1:04:15", "remaining_time": "0:33:30", "throughput": 4241.55, "total_tokens": 16353960} {"current_steps": 25085, "total_steps": 38160, "loss": 0.579, "lr": 0.0003170132548523701, "epoch": 13.14727463312369, "percentage": 65.74, "elapsed_time": "1:04:16", "remaining_time": "0:33:30", "throughput": 4241.56, "total_tokens": 16356904} {"current_steps": 25090, "total_steps": 38160, "loss": 0.368, "lr": 0.00031680045330774003, "epoch": 13.149895178197065, "percentage": 65.75, "elapsed_time": "1:04:17", "remaining_time": "0:33:29", "throughput": 4241.59, "total_tokens": 16360040} {"current_steps": 25095, "total_steps": 38160, "loss": 0.4377, "lr": 0.00031658769008636534, "epoch": 13.15251572327044, "percentage": 65.76, "elapsed_time": "1:04:17", "remaining_time": "0:33:28", "throughput": 4241.64, "total_tokens": 16363496} {"current_steps": 25100, "total_steps": 38160, "loss": 0.4494, "lr": 0.0003163749652327532, "epoch": 13.155136268343815, "percentage": 65.78, "elapsed_time": "1:04:18", "remaining_time": "0:33:27", "throughput": 4241.66, "total_tokens": 16366376} {"current_steps": 25105, "total_steps": 38160, "loss": 0.5176, "lr": 0.00031616227879140347, "epoch": 13.15775681341719, "percentage": 65.79, "elapsed_time": "1:04:19", "remaining_time": "0:33:26", "throughput": 4241.77, "total_tokens": 16370184} {"current_steps": 25110, "total_steps": 38160, "loss": 0.4041, "lr": 0.0003159496308068077, "epoch": 13.160377358490566, "percentage": 65.8, "elapsed_time": "1:04:20", "remaining_time": "0:33:26", "throughput": 4241.9, "total_tokens": 16374152} {"current_steps": 25115, "total_steps": 38160, "loss": 0.4344, "lr": 0.00031573702132344926, "epoch": 13.16299790356394, "percentage": 65.81, "elapsed_time": "1:04:20", "remaining_time": "0:33:25", "throughput": 4241.88, "total_tokens": 16376904} {"current_steps": 25120, "total_steps": 38160, "loss": 0.3872, "lr": 0.00031552445038580414, "epoch": 13.165618448637316, "percentage": 65.83, "elapsed_time": "1:04:21", "remaining_time": "0:33:24", "throughput": 4241.88, "total_tokens": 16379784} {"current_steps": 25125, "total_steps": 38160, "loss": 0.4323, "lr": 0.0003153119180383391, "epoch": 13.168238993710691, "percentage": 65.84, "elapsed_time": "1:04:22", "remaining_time": "0:33:23", "throughput": 4241.91, "total_tokens": 16382888} {"current_steps": 25130, "total_steps": 38160, "loss": 0.3843, "lr": 0.0003150994243255138, "epoch": 13.170859538784066, "percentage": 65.85, "elapsed_time": "1:04:22", "remaining_time": "0:33:22", "throughput": 4241.99, "total_tokens": 16386472} {"current_steps": 25135, "total_steps": 38160, "loss": 0.564, "lr": 0.00031488696929177944, "epoch": 13.173480083857442, "percentage": 65.87, "elapsed_time": "1:04:23", "remaining_time": "0:33:22", "throughput": 4242.01, "total_tokens": 16389608} {"current_steps": 25140, "total_steps": 38160, "loss": 0.353, "lr": 0.00031467455298157934, "epoch": 13.176100628930818, "percentage": 65.88, "elapsed_time": "1:04:24", "remaining_time": "0:33:21", "throughput": 4242.08, "total_tokens": 16393032} {"current_steps": 25145, "total_steps": 38160, "loss": 0.3613, "lr": 0.0003144621754393483, "epoch": 13.178721174004194, "percentage": 65.89, "elapsed_time": "1:04:25", "remaining_time": "0:33:20", "throughput": 4242.16, "total_tokens": 16396712} {"current_steps": 25150, "total_steps": 38160, "loss": 0.4972, "lr": 0.0003142498367095137, "epoch": 13.181341719077569, "percentage": 65.91, "elapsed_time": "1:04:25", "remaining_time": "0:33:19", "throughput": 4242.12, "total_tokens": 16399272} {"current_steps": 25155, "total_steps": 38160, "loss": 0.3959, "lr": 0.00031403753683649396, "epoch": 13.183962264150944, "percentage": 65.92, "elapsed_time": "1:04:26", "remaining_time": "0:33:18", "throughput": 4242.12, "total_tokens": 16402088} {"current_steps": 25160, "total_steps": 38160, "loss": 0.6086, "lr": 0.0003138252758646999, "epoch": 13.18658280922432, "percentage": 65.93, "elapsed_time": "1:04:27", "remaining_time": "0:33:18", "throughput": 4242.29, "total_tokens": 16406600} {"current_steps": 25165, "total_steps": 38160, "loss": 0.4022, "lr": 0.00031361305383853413, "epoch": 13.189203354297694, "percentage": 65.95, "elapsed_time": "1:04:28", "remaining_time": "0:33:17", "throughput": 4242.26, "total_tokens": 16409224} {"current_steps": 25170, "total_steps": 38160, "loss": 0.7269, "lr": 0.00031340087080239105, "epoch": 13.19182389937107, "percentage": 65.96, "elapsed_time": "1:04:28", "remaining_time": "0:33:16", "throughput": 4242.27, "total_tokens": 16412136} {"current_steps": 25175, "total_steps": 38160, "loss": 0.4119, "lr": 0.0003131887268006571, "epoch": 13.194444444444445, "percentage": 65.97, "elapsed_time": "1:04:29", "remaining_time": "0:33:15", "throughput": 4242.42, "total_tokens": 16416392} {"current_steps": 25180, "total_steps": 38160, "loss": 0.4705, "lr": 0.00031297662187771026, "epoch": 13.19706498951782, "percentage": 65.99, "elapsed_time": "1:04:30", "remaining_time": "0:33:15", "throughput": 4242.47, "total_tokens": 16419688} {"current_steps": 25185, "total_steps": 38160, "loss": 0.4492, "lr": 0.0003127645560779203, "epoch": 13.199685534591195, "percentage": 66.0, "elapsed_time": "1:04:31", "remaining_time": "0:33:14", "throughput": 4242.51, "total_tokens": 16422856} {"current_steps": 25190, "total_steps": 38160, "loss": 0.4466, "lr": 0.0003125525294456492, "epoch": 13.20230607966457, "percentage": 66.01, "elapsed_time": "1:04:31", "remaining_time": "0:33:13", "throughput": 4242.49, "total_tokens": 16425608} {"current_steps": 25195, "total_steps": 38160, "loss": 0.4108, "lr": 0.0003123405420252503, "epoch": 13.204926624737945, "percentage": 66.02, "elapsed_time": "1:04:32", "remaining_time": "0:33:12", "throughput": 4242.59, "total_tokens": 16429288} {"current_steps": 25200, "total_steps": 38160, "loss": 0.4758, "lr": 0.00031212859386106927, "epoch": 13.20754716981132, "percentage": 66.04, "elapsed_time": "1:04:33", "remaining_time": "0:33:11", "throughput": 4242.66, "total_tokens": 16432744} {"current_steps": 25205, "total_steps": 38160, "loss": 0.2952, "lr": 0.00031191668499744286, "epoch": 13.210167714884696, "percentage": 66.05, "elapsed_time": "1:04:33", "remaining_time": "0:33:11", "throughput": 4242.71, "total_tokens": 16435944} {"current_steps": 25210, "total_steps": 38160, "loss": 0.3296, "lr": 0.00031170481547870046, "epoch": 13.21278825995807, "percentage": 66.06, "elapsed_time": "1:04:34", "remaining_time": "0:33:10", "throughput": 4242.7, "total_tokens": 16438760} {"current_steps": 25215, "total_steps": 38160, "loss": 0.3922, "lr": 0.00031149298534916215, "epoch": 13.215408805031446, "percentage": 66.08, "elapsed_time": "1:04:35", "remaining_time": "0:33:09", "throughput": 4242.79, "total_tokens": 16442280} {"current_steps": 25220, "total_steps": 38160, "loss": 0.3508, "lr": 0.00031128119465314094, "epoch": 13.218029350104821, "percentage": 66.09, "elapsed_time": "1:04:36", "remaining_time": "0:33:08", "throughput": 4242.82, "total_tokens": 16445384} {"current_steps": 25225, "total_steps": 38160, "loss": 0.2925, "lr": 0.0003110694434349406, "epoch": 13.220649895178196, "percentage": 66.1, "elapsed_time": "1:04:36", "remaining_time": "0:33:07", "throughput": 4242.8, "total_tokens": 16448040} {"current_steps": 25230, "total_steps": 38160, "loss": 0.3971, "lr": 0.0003108577317388574, "epoch": 13.223270440251572, "percentage": 66.12, "elapsed_time": "1:04:37", "remaining_time": "0:33:07", "throughput": 4242.86, "total_tokens": 16451432} {"current_steps": 25235, "total_steps": 38160, "loss": 0.3711, "lr": 0.00031064605960917896, "epoch": 13.225890985324948, "percentage": 66.13, "elapsed_time": "1:04:38", "remaining_time": "0:33:06", "throughput": 4243.03, "total_tokens": 16455624} {"current_steps": 25240, "total_steps": 38160, "loss": 0.336, "lr": 0.00031043442709018446, "epoch": 13.228511530398324, "percentage": 66.14, "elapsed_time": "1:04:39", "remaining_time": "0:33:05", "throughput": 4243.09, "total_tokens": 16459112} {"current_steps": 25245, "total_steps": 38160, "loss": 0.4203, "lr": 0.0003102228342261451, "epoch": 13.231132075471699, "percentage": 66.16, "elapsed_time": "1:04:39", "remaining_time": "0:33:04", "throughput": 4243.12, "total_tokens": 16462312} {"current_steps": 25250, "total_steps": 38160, "loss": 0.5935, "lr": 0.0003100112810613237, "epoch": 13.233752620545074, "percentage": 66.17, "elapsed_time": "1:04:40", "remaining_time": "0:33:04", "throughput": 4243.11, "total_tokens": 16465128} {"current_steps": 25255, "total_steps": 38160, "loss": 0.386, "lr": 0.00030979976763997484, "epoch": 13.23637316561845, "percentage": 66.18, "elapsed_time": "1:04:41", "remaining_time": "0:33:03", "throughput": 4243.28, "total_tokens": 16469320} {"current_steps": 25260, "total_steps": 38160, "loss": 0.5704, "lr": 0.0003095882940063447, "epoch": 13.238993710691824, "percentage": 66.19, "elapsed_time": "1:04:41", "remaining_time": "0:33:02", "throughput": 4243.29, "total_tokens": 16472296} {"current_steps": 25265, "total_steps": 38160, "loss": 0.4911, "lr": 0.0003093768602046712, "epoch": 13.2416142557652, "percentage": 66.21, "elapsed_time": "1:04:42", "remaining_time": "0:33:01", "throughput": 4243.29, "total_tokens": 16475240} {"current_steps": 25270, "total_steps": 38160, "loss": 0.4707, "lr": 0.00030916546627918375, "epoch": 13.244234800838575, "percentage": 66.22, "elapsed_time": "1:04:43", "remaining_time": "0:33:00", "throughput": 4243.25, "total_tokens": 16477736} {"current_steps": 25275, "total_steps": 38160, "loss": 0.4881, "lr": 0.00030895411227410354, "epoch": 13.24685534591195, "percentage": 66.23, "elapsed_time": "1:04:43", "remaining_time": "0:33:00", "throughput": 4243.28, "total_tokens": 16480776} {"current_steps": 25280, "total_steps": 38160, "loss": 0.4188, "lr": 0.0003087427982336435, "epoch": 13.249475890985325, "percentage": 66.25, "elapsed_time": "1:04:44", "remaining_time": "0:32:59", "throughput": 4243.38, "total_tokens": 16484584} {"current_steps": 25285, "total_steps": 38160, "loss": 0.4129, "lr": 0.00030853152420200804, "epoch": 13.2520964360587, "percentage": 66.26, "elapsed_time": "1:04:45", "remaining_time": "0:32:58", "throughput": 4243.38, "total_tokens": 16487400} {"current_steps": 25290, "total_steps": 38160, "loss": 0.3981, "lr": 0.0003083202902233932, "epoch": 13.254716981132075, "percentage": 66.27, "elapsed_time": "1:04:46", "remaining_time": "0:32:57", "throughput": 4243.35, "total_tokens": 16490024} {"current_steps": 25295, "total_steps": 38160, "loss": 0.4537, "lr": 0.00030810909634198727, "epoch": 13.25733752620545, "percentage": 66.29, "elapsed_time": "1:04:46", "remaining_time": "0:32:56", "throughput": 4243.36, "total_tokens": 16493064} {"current_steps": 25300, "total_steps": 38160, "loss": 0.3641, "lr": 0.00030789794260196893, "epoch": 13.259958071278826, "percentage": 66.3, "elapsed_time": "1:04:47", "remaining_time": "0:32:56", "throughput": 4243.39, "total_tokens": 16496136} {"current_steps": 25305, "total_steps": 38160, "loss": 0.3836, "lr": 0.00030768682904750935, "epoch": 13.2625786163522, "percentage": 66.31, "elapsed_time": "1:04:48", "remaining_time": "0:32:55", "throughput": 4243.56, "total_tokens": 16500328} {"current_steps": 25310, "total_steps": 38160, "loss": 0.4545, "lr": 0.00030747575572277107, "epoch": 13.265199161425576, "percentage": 66.33, "elapsed_time": "1:04:49", "remaining_time": "0:32:54", "throughput": 4243.62, "total_tokens": 16503688} {"current_steps": 25315, "total_steps": 38160, "loss": 0.4427, "lr": 0.0003072647226719083, "epoch": 13.267819706498951, "percentage": 66.34, "elapsed_time": "1:04:49", "remaining_time": "0:32:53", "throughput": 4243.68, "total_tokens": 16507112} {"current_steps": 25320, "total_steps": 38160, "loss": 0.4518, "lr": 0.0003070537299390669, "epoch": 13.270440251572326, "percentage": 66.35, "elapsed_time": "1:04:50", "remaining_time": "0:32:52", "throughput": 4243.8, "total_tokens": 16510920} {"current_steps": 25325, "total_steps": 38160, "loss": 0.4569, "lr": 0.0003068427775683838, "epoch": 13.273060796645701, "percentage": 66.37, "elapsed_time": "1:04:51", "remaining_time": "0:32:52", "throughput": 4243.79, "total_tokens": 16513736} {"current_steps": 25330, "total_steps": 38160, "loss": 0.4766, "lr": 0.00030663186560398793, "epoch": 13.275681341719078, "percentage": 66.38, "elapsed_time": "1:04:51", "remaining_time": "0:32:51", "throughput": 4243.81, "total_tokens": 16516744} {"current_steps": 25335, "total_steps": 38160, "loss": 0.4835, "lr": 0.0003064209940899998, "epoch": 13.278301886792454, "percentage": 66.39, "elapsed_time": "1:04:52", "remaining_time": "0:32:50", "throughput": 4243.86, "total_tokens": 16519976} {"current_steps": 25340, "total_steps": 38160, "loss": 0.4234, "lr": 0.00030621016307053105, "epoch": 13.280922431865829, "percentage": 66.4, "elapsed_time": "1:04:53", "remaining_time": "0:32:49", "throughput": 4243.89, "total_tokens": 16523112} {"current_steps": 25345, "total_steps": 38160, "loss": 0.5294, "lr": 0.0003059993725896855, "epoch": 13.283542976939204, "percentage": 66.42, "elapsed_time": "1:04:54", "remaining_time": "0:32:48", "throughput": 4243.94, "total_tokens": 16526376} {"current_steps": 25350, "total_steps": 38160, "loss": 0.439, "lr": 0.0003057886226915581, "epoch": 13.286163522012579, "percentage": 66.43, "elapsed_time": "1:04:55", "remaining_time": "0:32:48", "throughput": 4244.35, "total_tokens": 16533160} {"current_steps": 25355, "total_steps": 38160, "loss": 0.3578, "lr": 0.00030557791342023476, "epoch": 13.288784067085954, "percentage": 66.44, "elapsed_time": "1:04:56", "remaining_time": "0:32:47", "throughput": 4244.42, "total_tokens": 16536680} {"current_steps": 25360, "total_steps": 38160, "loss": 0.394, "lr": 0.0003053672448197941, "epoch": 13.29140461215933, "percentage": 66.46, "elapsed_time": "1:04:56", "remaining_time": "0:32:46", "throughput": 4244.43, "total_tokens": 16539656} {"current_steps": 25365, "total_steps": 38160, "loss": 0.3916, "lr": 0.0003051566169343052, "epoch": 13.294025157232705, "percentage": 66.47, "elapsed_time": "1:04:57", "remaining_time": "0:32:46", "throughput": 4244.41, "total_tokens": 16542376} {"current_steps": 25370, "total_steps": 38160, "loss": 0.3956, "lr": 0.00030494602980782917, "epoch": 13.29664570230608, "percentage": 66.48, "elapsed_time": "1:04:58", "remaining_time": "0:32:45", "throughput": 4244.42, "total_tokens": 16545352} {"current_steps": 25375, "total_steps": 38160, "loss": 0.4939, "lr": 0.00030473548348441845, "epoch": 13.299266247379455, "percentage": 66.5, "elapsed_time": "1:04:58", "remaining_time": "0:32:44", "throughput": 4244.45, "total_tokens": 16548424} {"current_steps": 25380, "total_steps": 38160, "loss": 0.426, "lr": 0.000304524978008117, "epoch": 13.30188679245283, "percentage": 66.51, "elapsed_time": "1:04:59", "remaining_time": "0:32:43", "throughput": 4244.48, "total_tokens": 16551592} {"current_steps": 25385, "total_steps": 38160, "loss": 0.3387, "lr": 0.0003043145134229599, "epoch": 13.304507337526205, "percentage": 66.52, "elapsed_time": "1:05:00", "remaining_time": "0:32:42", "throughput": 4244.5, "total_tokens": 16554568} {"current_steps": 25390, "total_steps": 38160, "loss": 0.4126, "lr": 0.0003041040897729742, "epoch": 13.30712788259958, "percentage": 66.54, "elapsed_time": "1:05:00", "remaining_time": "0:32:41", "throughput": 4244.5, "total_tokens": 16557416} {"current_steps": 25395, "total_steps": 38160, "loss": 0.4341, "lr": 0.0003038937071021778, "epoch": 13.309748427672956, "percentage": 66.55, "elapsed_time": "1:05:01", "remaining_time": "0:32:41", "throughput": 4244.53, "total_tokens": 16560424} {"current_steps": 25400, "total_steps": 38160, "loss": 0.3527, "lr": 0.0003036833654545808, "epoch": 13.31236897274633, "percentage": 66.56, "elapsed_time": "1:05:02", "remaining_time": "0:32:40", "throughput": 4244.59, "total_tokens": 16563880} {"current_steps": 25405, "total_steps": 38160, "loss": 0.3698, "lr": 0.0003034730648741841, "epoch": 13.314989517819706, "percentage": 66.57, "elapsed_time": "1:05:03", "remaining_time": "0:32:39", "throughput": 4244.67, "total_tokens": 16567432} {"current_steps": 25410, "total_steps": 38160, "loss": 0.5441, "lr": 0.00030326280540497996, "epoch": 13.317610062893081, "percentage": 66.59, "elapsed_time": "1:05:03", "remaining_time": "0:32:38", "throughput": 4244.74, "total_tokens": 16570888} {"current_steps": 25415, "total_steps": 38160, "loss": 0.4149, "lr": 0.0003030525870909525, "epoch": 13.320230607966456, "percentage": 66.6, "elapsed_time": "1:05:04", "remaining_time": "0:32:38", "throughput": 4244.69, "total_tokens": 16573384} {"current_steps": 25420, "total_steps": 38160, "loss": 0.4701, "lr": 0.0003028424099760768, "epoch": 13.322851153039831, "percentage": 66.61, "elapsed_time": "1:05:05", "remaining_time": "0:32:37", "throughput": 4244.72, "total_tokens": 16576584} {"current_steps": 25425, "total_steps": 38160, "loss": 0.4538, "lr": 0.0003026322741043198, "epoch": 13.325471698113208, "percentage": 66.63, "elapsed_time": "1:05:06", "remaining_time": "0:32:36", "throughput": 4244.86, "total_tokens": 16580584} {"current_steps": 25430, "total_steps": 38160, "loss": 0.5105, "lr": 0.0003024221795196393, "epoch": 13.328092243186584, "percentage": 66.64, "elapsed_time": "1:05:06", "remaining_time": "0:32:35", "throughput": 4244.91, "total_tokens": 16583848} {"current_steps": 25435, "total_steps": 38160, "loss": 0.3254, "lr": 0.0003022121262659849, "epoch": 13.330712788259959, "percentage": 66.65, "elapsed_time": "1:05:07", "remaining_time": "0:32:34", "throughput": 4244.97, "total_tokens": 16587272} {"current_steps": 25440, "total_steps": 38160, "loss": 0.4169, "lr": 0.00030200211438729705, "epoch": 13.333333333333334, "percentage": 66.67, "elapsed_time": "1:05:08", "remaining_time": "0:32:34", "throughput": 4244.97, "total_tokens": 16590088} {"current_steps": 25445, "total_steps": 38160, "loss": 0.4165, "lr": 0.000301792143927508, "epoch": 13.335953878406709, "percentage": 66.68, "elapsed_time": "1:05:08", "remaining_time": "0:32:33", "throughput": 4245.0, "total_tokens": 16593320} {"current_steps": 25450, "total_steps": 38160, "loss": 0.4449, "lr": 0.0003015822149305411, "epoch": 13.338574423480084, "percentage": 66.69, "elapsed_time": "1:05:09", "remaining_time": "0:32:32", "throughput": 4245.03, "total_tokens": 16596328} {"current_steps": 25455, "total_steps": 38160, "loss": 0.5919, "lr": 0.0003013723274403113, "epoch": 13.34119496855346, "percentage": 66.71, "elapsed_time": "1:05:10", "remaining_time": "0:32:31", "throughput": 4245.01, "total_tokens": 16599080} {"current_steps": 25460, "total_steps": 38160, "loss": 0.3897, "lr": 0.00030116248150072444, "epoch": 13.343815513626835, "percentage": 66.72, "elapsed_time": "1:05:10", "remaining_time": "0:32:30", "throughput": 4245.03, "total_tokens": 16602056} {"current_steps": 25465, "total_steps": 38160, "loss": 0.4653, "lr": 0.00030095267715567816, "epoch": 13.34643605870021, "percentage": 66.73, "elapsed_time": "1:05:11", "remaining_time": "0:32:30", "throughput": 4245.17, "total_tokens": 16606216} {"current_steps": 25470, "total_steps": 38160, "loss": 0.3857, "lr": 0.00030074291444906085, "epoch": 13.349056603773585, "percentage": 66.75, "elapsed_time": "1:05:12", "remaining_time": "0:32:29", "throughput": 4245.18, "total_tokens": 16609064} {"current_steps": 25475, "total_steps": 38160, "loss": 0.5212, "lr": 0.00030053319342475247, "epoch": 13.35167714884696, "percentage": 66.76, "elapsed_time": "1:05:13", "remaining_time": "0:32:28", "throughput": 4245.13, "total_tokens": 16611560} {"current_steps": 25480, "total_steps": 38160, "loss": 0.3568, "lr": 0.00030032351412662465, "epoch": 13.354297693920335, "percentage": 66.77, "elapsed_time": "1:05:13", "remaining_time": "0:32:27", "throughput": 4245.12, "total_tokens": 16614408} {"current_steps": 25485, "total_steps": 38160, "loss": 0.4103, "lr": 0.0003001138765985394, "epoch": 13.35691823899371, "percentage": 66.78, "elapsed_time": "1:05:14", "remaining_time": "0:32:26", "throughput": 4245.12, "total_tokens": 16617256} {"current_steps": 25490, "total_steps": 38160, "loss": 0.4433, "lr": 0.00029990428088435097, "epoch": 13.359538784067086, "percentage": 66.8, "elapsed_time": "1:05:15", "remaining_time": "0:32:26", "throughput": 4245.13, "total_tokens": 16620232} {"current_steps": 25495, "total_steps": 38160, "loss": 0.4443, "lr": 0.000299694727027904, "epoch": 13.36215932914046, "percentage": 66.81, "elapsed_time": "1:05:15", "remaining_time": "0:32:25", "throughput": 4245.23, "total_tokens": 16623912} {"current_steps": 25500, "total_steps": 38160, "loss": 0.5486, "lr": 0.00029948521507303495, "epoch": 13.364779874213836, "percentage": 66.82, "elapsed_time": "1:05:16", "remaining_time": "0:32:24", "throughput": 4245.19, "total_tokens": 16626440} {"current_steps": 25505, "total_steps": 38160, "loss": 0.5887, "lr": 0.0002992757450635714, "epoch": 13.367400419287211, "percentage": 66.84, "elapsed_time": "1:05:17", "remaining_time": "0:32:23", "throughput": 4245.32, "total_tokens": 16630440} {"current_steps": 25510, "total_steps": 38160, "loss": 0.4174, "lr": 0.00029906631704333187, "epoch": 13.370020964360586, "percentage": 66.85, "elapsed_time": "1:05:18", "remaining_time": "0:32:22", "throughput": 4245.32, "total_tokens": 16633352} {"current_steps": 25515, "total_steps": 38160, "loss": 0.4742, "lr": 0.0002988569310561264, "epoch": 13.372641509433961, "percentage": 66.86, "elapsed_time": "1:05:18", "remaining_time": "0:32:22", "throughput": 4245.34, "total_tokens": 16636392} {"current_steps": 25520, "total_steps": 38160, "loss": 0.42, "lr": 0.0002986475871457566, "epoch": 13.375262054507338, "percentage": 66.88, "elapsed_time": "1:05:19", "remaining_time": "0:32:21", "throughput": 4245.39, "total_tokens": 16639688} {"current_steps": 25525, "total_steps": 38160, "loss": 0.3853, "lr": 0.000298438285356014, "epoch": 13.377882599580714, "percentage": 66.89, "elapsed_time": "1:05:20", "remaining_time": "0:32:20", "throughput": 4245.46, "total_tokens": 16643176} {"current_steps": 25530, "total_steps": 38160, "loss": 0.4273, "lr": 0.00029822902573068257, "epoch": 13.380503144654089, "percentage": 66.9, "elapsed_time": "1:05:21", "remaining_time": "0:32:19", "throughput": 4245.57, "total_tokens": 16646952} {"current_steps": 25535, "total_steps": 38160, "loss": 0.4151, "lr": 0.0002980198083135372, "epoch": 13.383123689727464, "percentage": 66.92, "elapsed_time": "1:05:21", "remaining_time": "0:32:19", "throughput": 4245.69, "total_tokens": 16650792} {"current_steps": 25540, "total_steps": 38160, "loss": 0.3828, "lr": 0.0002978106331483435, "epoch": 13.385744234800839, "percentage": 66.93, "elapsed_time": "1:05:22", "remaining_time": "0:32:18", "throughput": 4245.81, "total_tokens": 16654568} {"current_steps": 25545, "total_steps": 38160, "loss": 0.5038, "lr": 0.00029760150027885874, "epoch": 13.388364779874214, "percentage": 66.94, "elapsed_time": "1:05:23", "remaining_time": "0:32:17", "throughput": 4245.82, "total_tokens": 16657608} {"current_steps": 25550, "total_steps": 38160, "loss": 0.4382, "lr": 0.0002973924097488311, "epoch": 13.39098532494759, "percentage": 66.95, "elapsed_time": "1:05:23", "remaining_time": "0:32:16", "throughput": 4245.81, "total_tokens": 16660360} {"current_steps": 25555, "total_steps": 38160, "loss": 0.3509, "lr": 0.00029718336160199977, "epoch": 13.393605870020965, "percentage": 66.97, "elapsed_time": "1:05:24", "remaining_time": "0:32:15", "throughput": 4245.77, "total_tokens": 16663048} {"current_steps": 25560, "total_steps": 38160, "loss": 0.3869, "lr": 0.00029697435588209537, "epoch": 13.39622641509434, "percentage": 66.98, "elapsed_time": "1:05:25", "remaining_time": "0:32:15", "throughput": 4245.91, "total_tokens": 16667080} {"current_steps": 25565, "total_steps": 38160, "loss": 0.4187, "lr": 0.00029676539263283943, "epoch": 13.398846960167715, "percentage": 66.99, "elapsed_time": "1:05:26", "remaining_time": "0:32:14", "throughput": 4245.88, "total_tokens": 16669608} {"current_steps": 25570, "total_steps": 38160, "loss": 0.4076, "lr": 0.0002965564718979448, "epoch": 13.40146750524109, "percentage": 67.01, "elapsed_time": "1:05:27", "remaining_time": "0:32:13", "throughput": 4246.35, "total_tokens": 16676968} {"current_steps": 25575, "total_steps": 38160, "loss": 0.4364, "lr": 0.0002963475937211151, "epoch": 13.404088050314465, "percentage": 67.02, "elapsed_time": "1:05:28", "remaining_time": "0:32:12", "throughput": 4246.43, "total_tokens": 16680552} {"current_steps": 25580, "total_steps": 38160, "loss": 0.3872, "lr": 0.0002961387581460456, "epoch": 13.40670859538784, "percentage": 67.03, "elapsed_time": "1:05:28", "remaining_time": "0:32:12", "throughput": 4246.48, "total_tokens": 16683880} {"current_steps": 25585, "total_steps": 38160, "loss": 0.5126, "lr": 0.0002959299652164221, "epoch": 13.409329140461216, "percentage": 67.05, "elapsed_time": "1:05:29", "remaining_time": "0:32:11", "throughput": 4246.43, "total_tokens": 16686312} {"current_steps": 25590, "total_steps": 38160, "loss": 0.4318, "lr": 0.00029572121497592154, "epoch": 13.41194968553459, "percentage": 67.06, "elapsed_time": "1:05:30", "remaining_time": "0:32:10", "throughput": 4246.38, "total_tokens": 16688776} {"current_steps": 25595, "total_steps": 38160, "loss": 0.3188, "lr": 0.00029551250746821236, "epoch": 13.414570230607966, "percentage": 67.07, "elapsed_time": "1:05:30", "remaining_time": "0:32:09", "throughput": 4246.44, "total_tokens": 16692104} {"current_steps": 25600, "total_steps": 38160, "loss": 0.4166, "lr": 0.0002953038427369537, "epoch": 13.417190775681341, "percentage": 67.09, "elapsed_time": "1:05:31", "remaining_time": "0:32:08", "throughput": 4246.4, "total_tokens": 16694600} {"current_steps": 25605, "total_steps": 38160, "loss": 0.4028, "lr": 0.000295095220825796, "epoch": 13.419811320754716, "percentage": 67.1, "elapsed_time": "1:05:32", "remaining_time": "0:32:08", "throughput": 4246.39, "total_tokens": 16697384} {"current_steps": 25610, "total_steps": 38160, "loss": 0.4581, "lr": 0.00029488664177838023, "epoch": 13.422431865828091, "percentage": 67.11, "elapsed_time": "1:05:32", "remaining_time": "0:32:07", "throughput": 4246.45, "total_tokens": 16700776} {"current_steps": 25615, "total_steps": 38160, "loss": 0.4027, "lr": 0.0002946781056383391, "epoch": 13.425052410901468, "percentage": 67.13, "elapsed_time": "1:05:33", "remaining_time": "0:32:06", "throughput": 4246.4, "total_tokens": 16703272} {"current_steps": 25620, "total_steps": 38160, "loss": 0.3359, "lr": 0.0002944696124492956, "epoch": 13.427672955974844, "percentage": 67.14, "elapsed_time": "1:05:34", "remaining_time": "0:32:05", "throughput": 4246.43, "total_tokens": 16706440} {"current_steps": 25625, "total_steps": 38160, "loss": 0.4364, "lr": 0.0002942611622548645, "epoch": 13.430293501048219, "percentage": 67.15, "elapsed_time": "1:05:34", "remaining_time": "0:32:04", "throughput": 4246.43, "total_tokens": 16709256} {"current_steps": 25630, "total_steps": 38160, "loss": 0.3986, "lr": 0.00029405275509865103, "epoch": 13.432914046121594, "percentage": 67.16, "elapsed_time": "1:05:35", "remaining_time": "0:32:04", "throughput": 4246.5, "total_tokens": 16712712} {"current_steps": 25635, "total_steps": 38160, "loss": 0.4233, "lr": 0.00029384439102425174, "epoch": 13.435534591194969, "percentage": 67.18, "elapsed_time": "1:05:36", "remaining_time": "0:32:03", "throughput": 4246.49, "total_tokens": 16715464} {"current_steps": 25640, "total_steps": 38160, "loss": 0.6294, "lr": 0.0002936360700752539, "epoch": 13.438155136268344, "percentage": 67.19, "elapsed_time": "1:05:37", "remaining_time": "0:32:02", "throughput": 4246.59, "total_tokens": 16719304} {"current_steps": 25645, "total_steps": 38160, "loss": 0.4649, "lr": 0.00029342779229523573, "epoch": 13.44077568134172, "percentage": 67.2, "elapsed_time": "1:05:37", "remaining_time": "0:32:01", "throughput": 4246.66, "total_tokens": 16722760} {"current_steps": 25650, "total_steps": 38160, "loss": 0.4898, "lr": 0.00029321955772776675, "epoch": 13.443396226415095, "percentage": 67.22, "elapsed_time": "1:05:38", "remaining_time": "0:32:00", "throughput": 4246.72, "total_tokens": 16726152} {"current_steps": 25655, "total_steps": 38160, "loss": 0.4097, "lr": 0.00029301136641640723, "epoch": 13.44601677148847, "percentage": 67.23, "elapsed_time": "1:05:39", "remaining_time": "0:32:00", "throughput": 4246.69, "total_tokens": 16728808} {"current_steps": 25660, "total_steps": 38160, "loss": 0.4115, "lr": 0.0002928032184047085, "epoch": 13.448637316561845, "percentage": 67.24, "elapsed_time": "1:05:39", "remaining_time": "0:31:59", "throughput": 4246.64, "total_tokens": 16731240} {"current_steps": 25665, "total_steps": 38160, "loss": 0.5604, "lr": 0.0002925951137362126, "epoch": 13.45125786163522, "percentage": 67.26, "elapsed_time": "1:05:40", "remaining_time": "0:31:58", "throughput": 4246.74, "total_tokens": 16735112} {"current_steps": 25670, "total_steps": 38160, "loss": 0.4221, "lr": 0.00029238705245445264, "epoch": 13.453878406708595, "percentage": 67.27, "elapsed_time": "1:05:41", "remaining_time": "0:31:57", "throughput": 4246.81, "total_tokens": 16738568} {"current_steps": 25675, "total_steps": 38160, "loss": 0.4175, "lr": 0.0002921790346029527, "epoch": 13.45649895178197, "percentage": 67.28, "elapsed_time": "1:05:42", "remaining_time": "0:31:56", "throughput": 4246.88, "total_tokens": 16742056} {"current_steps": 25680, "total_steps": 38160, "loss": 0.4121, "lr": 0.0002919710602252279, "epoch": 13.459119496855346, "percentage": 67.3, "elapsed_time": "1:05:42", "remaining_time": "0:31:56", "throughput": 4246.85, "total_tokens": 16744616} {"current_steps": 25685, "total_steps": 38160, "loss": 0.5032, "lr": 0.0002917631293647838, "epoch": 13.46174004192872, "percentage": 67.31, "elapsed_time": "1:05:43", "remaining_time": "0:31:55", "throughput": 4246.85, "total_tokens": 16747464} {"current_steps": 25690, "total_steps": 38160, "loss": 0.4338, "lr": 0.0002915552420651176, "epoch": 13.464360587002096, "percentage": 67.32, "elapsed_time": "1:05:44", "remaining_time": "0:31:54", "throughput": 4247.04, "total_tokens": 16752104} {"current_steps": 25695, "total_steps": 38160, "loss": 0.3598, "lr": 0.00029134739836971657, "epoch": 13.466981132075471, "percentage": 67.33, "elapsed_time": "1:05:45", "remaining_time": "0:31:53", "throughput": 4247.13, "total_tokens": 16755720} {"current_steps": 25700, "total_steps": 38160, "loss": 0.5278, "lr": 0.0002911395983220595, "epoch": 13.469601677148846, "percentage": 67.35, "elapsed_time": "1:05:45", "remaining_time": "0:31:53", "throughput": 4247.13, "total_tokens": 16758600} {"current_steps": 25705, "total_steps": 38160, "loss": 0.4056, "lr": 0.0002909318419656154, "epoch": 13.472222222222221, "percentage": 67.36, "elapsed_time": "1:05:46", "remaining_time": "0:31:52", "throughput": 4247.12, "total_tokens": 16761352} {"current_steps": 25710, "total_steps": 38160, "loss": 0.5266, "lr": 0.00029072412934384484, "epoch": 13.474842767295598, "percentage": 67.37, "elapsed_time": "1:05:47", "remaining_time": "0:31:51", "throughput": 4247.29, "total_tokens": 16765512} {"current_steps": 25715, "total_steps": 38160, "loss": 0.5572, "lr": 0.00029051646050019884, "epoch": 13.477463312368974, "percentage": 67.39, "elapsed_time": "1:05:48", "remaining_time": "0:31:50", "throughput": 4247.36, "total_tokens": 16769064} {"current_steps": 25720, "total_steps": 38160, "loss": 0.5136, "lr": 0.00029030883547811966, "epoch": 13.480083857442349, "percentage": 67.4, "elapsed_time": "1:05:48", "remaining_time": "0:31:49", "throughput": 4247.4, "total_tokens": 16772232} {"current_steps": 25725, "total_steps": 38160, "loss": 0.3606, "lr": 0.0002901012543210397, "epoch": 13.482704402515724, "percentage": 67.41, "elapsed_time": "1:05:49", "remaining_time": "0:31:49", "throughput": 4247.57, "total_tokens": 16776616} {"current_steps": 25730, "total_steps": 38160, "loss": 0.4349, "lr": 0.00028989371707238264, "epoch": 13.485324947589099, "percentage": 67.43, "elapsed_time": "1:05:50", "remaining_time": "0:31:48", "throughput": 4247.58, "total_tokens": 16779496} {"current_steps": 25735, "total_steps": 38160, "loss": 0.3513, "lr": 0.00028968622377556285, "epoch": 13.487945492662474, "percentage": 67.44, "elapsed_time": "1:05:51", "remaining_time": "0:31:47", "throughput": 4247.71, "total_tokens": 16783368} {"current_steps": 25740, "total_steps": 38160, "loss": 0.4589, "lr": 0.00028947877447398567, "epoch": 13.49056603773585, "percentage": 67.45, "elapsed_time": "1:05:51", "remaining_time": "0:31:46", "throughput": 4247.67, "total_tokens": 16785928} {"current_steps": 25745, "total_steps": 38160, "loss": 0.4017, "lr": 0.00028927136921104733, "epoch": 13.493186582809225, "percentage": 67.47, "elapsed_time": "1:05:52", "remaining_time": "0:31:46", "throughput": 4247.74, "total_tokens": 16789320} {"current_steps": 25750, "total_steps": 38160, "loss": 0.4961, "lr": 0.00028906400803013446, "epoch": 13.4958071278826, "percentage": 67.48, "elapsed_time": "1:05:53", "remaining_time": "0:31:45", "throughput": 4247.92, "total_tokens": 16793928} {"current_steps": 25755, "total_steps": 38160, "loss": 0.4943, "lr": 0.00028885669097462435, "epoch": 13.498427672955975, "percentage": 67.49, "elapsed_time": "1:05:54", "remaining_time": "0:31:44", "throughput": 4247.93, "total_tokens": 16796872} {"current_steps": 25760, "total_steps": 38160, "loss": 0.3778, "lr": 0.0002886494180878857, "epoch": 13.50104821802935, "percentage": 67.51, "elapsed_time": "1:05:54", "remaining_time": "0:31:43", "throughput": 4248.02, "total_tokens": 16800552} {"current_steps": 25765, "total_steps": 38160, "loss": 0.413, "lr": 0.00028844218941327757, "epoch": 13.503668763102725, "percentage": 67.52, "elapsed_time": "1:05:55", "remaining_time": "0:31:42", "throughput": 4248.07, "total_tokens": 16803880} {"current_steps": 25770, "total_steps": 38160, "loss": 0.4172, "lr": 0.0002882350049941498, "epoch": 13.5062893081761, "percentage": 67.53, "elapsed_time": "1:05:56", "remaining_time": "0:31:42", "throughput": 4248.05, "total_tokens": 16806600} {"current_steps": 25775, "total_steps": 38160, "loss": 0.415, "lr": 0.0002880278648738432, "epoch": 13.508909853249476, "percentage": 67.54, "elapsed_time": "1:05:56", "remaining_time": "0:31:41", "throughput": 4248.06, "total_tokens": 16809576} {"current_steps": 25780, "total_steps": 38160, "loss": 0.4902, "lr": 0.0002878207690956891, "epoch": 13.51153039832285, "percentage": 67.56, "elapsed_time": "1:05:57", "remaining_time": "0:31:40", "throughput": 4248.09, "total_tokens": 16812776} {"current_steps": 25785, "total_steps": 38160, "loss": 0.3961, "lr": 0.00028761371770300915, "epoch": 13.514150943396226, "percentage": 67.57, "elapsed_time": "1:05:58", "remaining_time": "0:31:39", "throughput": 4248.07, "total_tokens": 16815496} {"current_steps": 25790, "total_steps": 38160, "loss": 0.4292, "lr": 0.0002874067107391164, "epoch": 13.516771488469601, "percentage": 67.58, "elapsed_time": "1:05:59", "remaining_time": "0:31:38", "throughput": 4248.15, "total_tokens": 16818984} {"current_steps": 25795, "total_steps": 38160, "loss": 0.3117, "lr": 0.00028719974824731445, "epoch": 13.519392033542976, "percentage": 67.6, "elapsed_time": "1:06:00", "remaining_time": "0:31:38", "throughput": 4248.52, "total_tokens": 16825096} {"current_steps": 25800, "total_steps": 38160, "loss": 0.5012, "lr": 0.0002869928302708975, "epoch": 13.522012578616351, "percentage": 67.61, "elapsed_time": "1:06:00", "remaining_time": "0:31:37", "throughput": 4248.51, "total_tokens": 16827880} {"current_steps": 25805, "total_steps": 38160, "loss": 0.5046, "lr": 0.00028678595685315044, "epoch": 13.524633123689728, "percentage": 67.62, "elapsed_time": "1:06:01", "remaining_time": "0:31:36", "throughput": 4248.48, "total_tokens": 16830504} {"current_steps": 25810, "total_steps": 38160, "loss": 0.3811, "lr": 0.00028657912803734854, "epoch": 13.527253668763104, "percentage": 67.64, "elapsed_time": "1:06:02", "remaining_time": "0:31:35", "throughput": 4248.45, "total_tokens": 16833128} {"current_steps": 25815, "total_steps": 38160, "loss": 0.4478, "lr": 0.00028637234386675816, "epoch": 13.529874213836479, "percentage": 67.65, "elapsed_time": "1:06:02", "remaining_time": "0:31:35", "throughput": 4248.4, "total_tokens": 16835592} {"current_steps": 25820, "total_steps": 38160, "loss": 0.5281, "lr": 0.00028616560438463626, "epoch": 13.532494758909854, "percentage": 67.66, "elapsed_time": "1:06:03", "remaining_time": "0:31:34", "throughput": 4248.56, "total_tokens": 16839752} {"current_steps": 25825, "total_steps": 38160, "loss": 0.4338, "lr": 0.00028595890963423057, "epoch": 13.535115303983229, "percentage": 67.68, "elapsed_time": "1:06:04", "remaining_time": "0:31:33", "throughput": 4248.56, "total_tokens": 16842568} {"current_steps": 25830, "total_steps": 38160, "loss": 0.4221, "lr": 0.0002857522596587789, "epoch": 13.537735849056604, "percentage": 67.69, "elapsed_time": "1:06:04", "remaining_time": "0:31:32", "throughput": 4248.55, "total_tokens": 16845320} {"current_steps": 25835, "total_steps": 38160, "loss": 0.4213, "lr": 0.00028554565450151045, "epoch": 13.54035639412998, "percentage": 67.7, "elapsed_time": "1:06:05", "remaining_time": "0:31:31", "throughput": 4248.59, "total_tokens": 16848552} {"current_steps": 25840, "total_steps": 38160, "loss": 0.5695, "lr": 0.00028533909420564417, "epoch": 13.542976939203355, "percentage": 67.71, "elapsed_time": "1:06:06", "remaining_time": "0:31:31", "throughput": 4248.83, "total_tokens": 16853608} {"current_steps": 25845, "total_steps": 38160, "loss": 0.4006, "lr": 0.00028513257881439047, "epoch": 13.54559748427673, "percentage": 67.73, "elapsed_time": "1:06:07", "remaining_time": "0:31:30", "throughput": 4248.85, "total_tokens": 16856648} {"current_steps": 25850, "total_steps": 38160, "loss": 0.4623, "lr": 0.00028492610837095003, "epoch": 13.548218029350105, "percentage": 67.74, "elapsed_time": "1:06:08", "remaining_time": "0:31:29", "throughput": 4249.11, "total_tokens": 16861864} {"current_steps": 25855, "total_steps": 38160, "loss": 0.4228, "lr": 0.00028471968291851407, "epoch": 13.55083857442348, "percentage": 67.75, "elapsed_time": "1:06:09", "remaining_time": "0:31:28", "throughput": 4249.16, "total_tokens": 16865256} {"current_steps": 25860, "total_steps": 38160, "loss": 0.4133, "lr": 0.0002845133025002645, "epoch": 13.553459119496855, "percentage": 67.77, "elapsed_time": "1:06:09", "remaining_time": "0:31:28", "throughput": 4249.26, "total_tokens": 16868936} {"current_steps": 25865, "total_steps": 38160, "loss": 0.4377, "lr": 0.0002843069671593734, "epoch": 13.55607966457023, "percentage": 67.78, "elapsed_time": "1:06:10", "remaining_time": "0:31:27", "throughput": 4249.32, "total_tokens": 16872200} {"current_steps": 25870, "total_steps": 38160, "loss": 0.4109, "lr": 0.000284100676939004, "epoch": 13.558700209643606, "percentage": 67.79, "elapsed_time": "1:06:11", "remaining_time": "0:31:26", "throughput": 4249.73, "total_tokens": 16878824} {"current_steps": 25875, "total_steps": 38160, "loss": 0.3637, "lr": 0.0002838944318823099, "epoch": 13.56132075471698, "percentage": 67.81, "elapsed_time": "1:06:12", "remaining_time": "0:31:26", "throughput": 4249.9, "total_tokens": 16883080} {"current_steps": 25880, "total_steps": 38160, "loss": 0.5524, "lr": 0.0002836882320324354, "epoch": 13.563941299790356, "percentage": 67.82, "elapsed_time": "1:06:13", "remaining_time": "0:31:25", "throughput": 4250.05, "total_tokens": 16887336} {"current_steps": 25885, "total_steps": 38160, "loss": 0.4727, "lr": 0.00028348207743251477, "epoch": 13.566561844863731, "percentage": 67.83, "elapsed_time": "1:06:14", "remaining_time": "0:31:24", "throughput": 4250.11, "total_tokens": 16890760} {"current_steps": 25890, "total_steps": 38160, "loss": 0.3744, "lr": 0.0002832759681256735, "epoch": 13.569182389937106, "percentage": 67.85, "elapsed_time": "1:06:14", "remaining_time": "0:31:23", "throughput": 4250.14, "total_tokens": 16893928} {"current_steps": 25895, "total_steps": 38160, "loss": 0.3282, "lr": 0.000283069904155027, "epoch": 13.571802935010481, "percentage": 67.86, "elapsed_time": "1:06:15", "remaining_time": "0:31:23", "throughput": 4250.17, "total_tokens": 16897032} {"current_steps": 25900, "total_steps": 38160, "loss": 0.3813, "lr": 0.0002828638855636817, "epoch": 13.574423480083858, "percentage": 67.87, "elapsed_time": "1:06:16", "remaining_time": "0:31:22", "throughput": 4250.25, "total_tokens": 16900648} {"current_steps": 25905, "total_steps": 38160, "loss": 0.538, "lr": 0.0002826579123947345, "epoch": 13.577044025157234, "percentage": 67.89, "elapsed_time": "1:06:17", "remaining_time": "0:31:21", "throughput": 4250.3, "total_tokens": 16903880} {"current_steps": 25910, "total_steps": 38160, "loss": 0.5017, "lr": 0.0002824519846912723, "epoch": 13.579664570230609, "percentage": 67.9, "elapsed_time": "1:06:17", "remaining_time": "0:31:20", "throughput": 4250.41, "total_tokens": 16907816} {"current_steps": 25915, "total_steps": 38160, "loss": 0.3594, "lr": 0.00028224610249637293, "epoch": 13.582285115303984, "percentage": 67.91, "elapsed_time": "1:06:18", "remaining_time": "0:31:19", "throughput": 4250.4, "total_tokens": 16910664} {"current_steps": 25920, "total_steps": 38160, "loss": 0.4773, "lr": 0.00028204026585310483, "epoch": 13.584905660377359, "percentage": 67.92, "elapsed_time": "1:06:19", "remaining_time": "0:31:19", "throughput": 4250.51, "total_tokens": 16914408} {"current_steps": 25925, "total_steps": 38160, "loss": 0.5621, "lr": 0.0002818344748045264, "epoch": 13.587526205450734, "percentage": 67.94, "elapsed_time": "1:06:20", "remaining_time": "0:31:18", "throughput": 4250.59, "total_tokens": 16918120} {"current_steps": 25930, "total_steps": 38160, "loss": 0.509, "lr": 0.0002816287293936868, "epoch": 13.59014675052411, "percentage": 67.95, "elapsed_time": "1:06:20", "remaining_time": "0:31:17", "throughput": 4250.55, "total_tokens": 16920680} {"current_steps": 25935, "total_steps": 38160, "loss": 0.4016, "lr": 0.0002814230296636259, "epoch": 13.592767295597485, "percentage": 67.96, "elapsed_time": "1:06:21", "remaining_time": "0:31:16", "throughput": 4250.55, "total_tokens": 16923592} {"current_steps": 25940, "total_steps": 38160, "loss": 0.3705, "lr": 0.0002812173756573734, "epoch": 13.59538784067086, "percentage": 67.98, "elapsed_time": "1:06:22", "remaining_time": "0:31:15", "throughput": 4250.59, "total_tokens": 16926920} {"current_steps": 25945, "total_steps": 38160, "loss": 0.4637, "lr": 0.00028101176741794984, "epoch": 13.598008385744235, "percentage": 67.99, "elapsed_time": "1:06:22", "remaining_time": "0:31:15", "throughput": 4250.62, "total_tokens": 16930056} {"current_steps": 25950, "total_steps": 38160, "loss": 0.4466, "lr": 0.0002808062049883664, "epoch": 13.60062893081761, "percentage": 68.0, "elapsed_time": "1:06:23", "remaining_time": "0:31:14", "throughput": 4250.56, "total_tokens": 16932424} {"current_steps": 25955, "total_steps": 38160, "loss": 0.368, "lr": 0.00028060068841162403, "epoch": 13.603249475890985, "percentage": 68.02, "elapsed_time": "1:06:24", "remaining_time": "0:31:13", "throughput": 4250.66, "total_tokens": 16936200} {"current_steps": 25960, "total_steps": 38160, "loss": 0.3936, "lr": 0.00028039521773071477, "epoch": 13.60587002096436, "percentage": 68.03, "elapsed_time": "1:06:25", "remaining_time": "0:31:12", "throughput": 4250.67, "total_tokens": 16939176} {"current_steps": 25965, "total_steps": 38160, "loss": 0.398, "lr": 0.0002801897929886204, "epoch": 13.608490566037736, "percentage": 68.04, "elapsed_time": "1:06:25", "remaining_time": "0:31:12", "throughput": 4250.79, "total_tokens": 16943048} {"current_steps": 25970, "total_steps": 38160, "loss": 0.4201, "lr": 0.0002799844142283135, "epoch": 13.61111111111111, "percentage": 68.06, "elapsed_time": "1:06:26", "remaining_time": "0:31:11", "throughput": 4250.8, "total_tokens": 16946056} {"current_steps": 25975, "total_steps": 38160, "loss": 0.4705, "lr": 0.00027977908149275733, "epoch": 13.613731656184486, "percentage": 68.07, "elapsed_time": "1:06:27", "remaining_time": "0:31:10", "throughput": 4250.77, "total_tokens": 16948712} {"current_steps": 25980, "total_steps": 38160, "loss": 0.4597, "lr": 0.00027957379482490476, "epoch": 13.616352201257861, "percentage": 68.08, "elapsed_time": "1:06:27", "remaining_time": "0:31:09", "throughput": 4250.85, "total_tokens": 16952168} {"current_steps": 25985, "total_steps": 38160, "loss": 0.4165, "lr": 0.0002793685542676997, "epoch": 13.618972746331236, "percentage": 68.09, "elapsed_time": "1:06:28", "remaining_time": "0:31:08", "throughput": 4250.91, "total_tokens": 16955496} {"current_steps": 25990, "total_steps": 38160, "loss": 0.4514, "lr": 0.0002791633598640758, "epoch": 13.621593291404611, "percentage": 68.11, "elapsed_time": "1:06:29", "remaining_time": "0:31:08", "throughput": 4250.92, "total_tokens": 16958472} {"current_steps": 25995, "total_steps": 38160, "loss": 0.3884, "lr": 0.0002789582116569576, "epoch": 13.624213836477988, "percentage": 68.12, "elapsed_time": "1:06:30", "remaining_time": "0:31:07", "throughput": 4250.97, "total_tokens": 16961832} {"current_steps": 26000, "total_steps": 38160, "loss": 0.352, "lr": 0.0002787531096892597, "epoch": 13.626834381551364, "percentage": 68.13, "elapsed_time": "1:06:30", "remaining_time": "0:31:06", "throughput": 4250.95, "total_tokens": 16964552} {"current_steps": 26005, "total_steps": 38160, "loss": 0.3903, "lr": 0.0002785480540038874, "epoch": 13.629454926624739, "percentage": 68.15, "elapsed_time": "1:06:31", "remaining_time": "0:31:05", "throughput": 4250.98, "total_tokens": 16967688} {"current_steps": 26010, "total_steps": 38160, "loss": 0.456, "lr": 0.0002783430446437355, "epoch": 13.632075471698114, "percentage": 68.16, "elapsed_time": "1:06:32", "remaining_time": "0:31:04", "throughput": 4251.04, "total_tokens": 16971176} {"current_steps": 26015, "total_steps": 38160, "loss": 0.3898, "lr": 0.00027813808165169006, "epoch": 13.634696016771489, "percentage": 68.17, "elapsed_time": "1:06:32", "remaining_time": "0:31:04", "throughput": 4251.11, "total_tokens": 16974568} {"current_steps": 26020, "total_steps": 38160, "loss": 0.4794, "lr": 0.00027793316507062667, "epoch": 13.637316561844864, "percentage": 68.19, "elapsed_time": "1:06:33", "remaining_time": "0:31:03", "throughput": 4251.26, "total_tokens": 16978728} {"current_steps": 26025, "total_steps": 38160, "loss": 0.3134, "lr": 0.00027772829494341163, "epoch": 13.63993710691824, "percentage": 68.2, "elapsed_time": "1:06:34", "remaining_time": "0:31:02", "throughput": 4251.3, "total_tokens": 16981928} {"current_steps": 26030, "total_steps": 38160, "loss": 0.4302, "lr": 0.00027752347131290147, "epoch": 13.642557651991615, "percentage": 68.21, "elapsed_time": "1:06:35", "remaining_time": "0:31:01", "throughput": 4251.22, "total_tokens": 16984104} {"current_steps": 26035, "total_steps": 38160, "loss": 0.4544, "lr": 0.0002773186942219431, "epoch": 13.64517819706499, "percentage": 68.23, "elapsed_time": "1:06:35", "remaining_time": "0:31:00", "throughput": 4251.22, "total_tokens": 16986952} {"current_steps": 26040, "total_steps": 38160, "loss": 0.3274, "lr": 0.0002771139637133735, "epoch": 13.647798742138365, "percentage": 68.24, "elapsed_time": "1:06:36", "remaining_time": "0:31:00", "throughput": 4251.55, "total_tokens": 16993160} {"current_steps": 26045, "total_steps": 38160, "loss": 0.4322, "lr": 0.00027690927983001966, "epoch": 13.65041928721174, "percentage": 68.25, "elapsed_time": "1:06:37", "remaining_time": "0:30:59", "throughput": 4251.49, "total_tokens": 16995560} {"current_steps": 26050, "total_steps": 38160, "loss": 0.4747, "lr": 0.00027670464261469937, "epoch": 13.653039832285115, "percentage": 68.27, "elapsed_time": "1:06:38", "remaining_time": "0:30:58", "throughput": 4251.55, "total_tokens": 16999016} {"current_steps": 26055, "total_steps": 38160, "loss": 0.3408, "lr": 0.0002765000521102203, "epoch": 13.65566037735849, "percentage": 68.28, "elapsed_time": "1:06:38", "remaining_time": "0:30:57", "throughput": 4251.56, "total_tokens": 17001960} {"current_steps": 26060, "total_steps": 38160, "loss": 0.5073, "lr": 0.0002762955083593807, "epoch": 13.658280922431866, "percentage": 68.29, "elapsed_time": "1:06:39", "remaining_time": "0:30:57", "throughput": 4251.57, "total_tokens": 17004936} {"current_steps": 26065, "total_steps": 38160, "loss": 0.3646, "lr": 0.0002760910114049686, "epoch": 13.66090146750524, "percentage": 68.3, "elapsed_time": "1:06:40", "remaining_time": "0:30:56", "throughput": 4251.66, "total_tokens": 17008584} {"current_steps": 26070, "total_steps": 38160, "loss": 0.463, "lr": 0.0002758865612897623, "epoch": 13.663522012578616, "percentage": 68.32, "elapsed_time": "1:06:41", "remaining_time": "0:30:55", "throughput": 4251.61, "total_tokens": 17011048} {"current_steps": 26075, "total_steps": 38160, "loss": 0.3482, "lr": 0.00027568215805653045, "epoch": 13.666142557651991, "percentage": 68.33, "elapsed_time": "1:06:41", "remaining_time": "0:30:54", "throughput": 4251.54, "total_tokens": 17013384} {"current_steps": 26080, "total_steps": 38160, "loss": 0.4047, "lr": 0.00027547780174803205, "epoch": 13.668763102725366, "percentage": 68.34, "elapsed_time": "1:06:42", "remaining_time": "0:30:53", "throughput": 4251.58, "total_tokens": 17016584} {"current_steps": 26085, "total_steps": 38160, "loss": 0.4789, "lr": 0.0002752734924070161, "epoch": 13.671383647798741, "percentage": 68.36, "elapsed_time": "1:06:43", "remaining_time": "0:30:53", "throughput": 4251.58, "total_tokens": 17019368} {"current_steps": 26090, "total_steps": 38160, "loss": 0.3794, "lr": 0.00027506923007622177, "epoch": 13.674004192872118, "percentage": 68.37, "elapsed_time": "1:06:43", "remaining_time": "0:30:52", "throughput": 4251.58, "total_tokens": 17022184} {"current_steps": 26095, "total_steps": 38160, "loss": 0.4117, "lr": 0.00027486501479837846, "epoch": 13.676624737945493, "percentage": 68.38, "elapsed_time": "1:06:44", "remaining_time": "0:30:51", "throughput": 4251.6, "total_tokens": 17025288} {"current_steps": 26100, "total_steps": 38160, "loss": 0.3838, "lr": 0.0002746608466162053, "epoch": 13.679245283018869, "percentage": 68.4, "elapsed_time": "1:06:45", "remaining_time": "0:30:50", "throughput": 4251.63, "total_tokens": 17028424} {"current_steps": 26105, "total_steps": 38160, "loss": 0.3276, "lr": 0.0002744567255724123, "epoch": 13.681865828092244, "percentage": 68.41, "elapsed_time": "1:06:45", "remaining_time": "0:30:49", "throughput": 4251.68, "total_tokens": 17031720} {"current_steps": 26110, "total_steps": 38160, "loss": 0.5021, "lr": 0.0002742526517096992, "epoch": 13.684486373165619, "percentage": 68.42, "elapsed_time": "1:06:46", "remaining_time": "0:30:49", "throughput": 4251.71, "total_tokens": 17034888} {"current_steps": 26115, "total_steps": 38160, "loss": 0.4406, "lr": 0.000274048625070756, "epoch": 13.687106918238994, "percentage": 68.44, "elapsed_time": "1:06:47", "remaining_time": "0:30:48", "throughput": 4252.08, "total_tokens": 17041576} {"current_steps": 26120, "total_steps": 38160, "loss": 0.4191, "lr": 0.0002738446456982627, "epoch": 13.68972746331237, "percentage": 68.45, "elapsed_time": "1:06:48", "remaining_time": "0:30:47", "throughput": 4252.07, "total_tokens": 17044424} {"current_steps": 26125, "total_steps": 38160, "loss": 0.3577, "lr": 0.0002736407136348892, "epoch": 13.692348008385745, "percentage": 68.46, "elapsed_time": "1:06:49", "remaining_time": "0:30:46", "throughput": 4252.15, "total_tokens": 17047976} {"current_steps": 26130, "total_steps": 38160, "loss": 0.5922, "lr": 0.0002734368289232959, "epoch": 13.69496855345912, "percentage": 68.47, "elapsed_time": "1:06:49", "remaining_time": "0:30:46", "throughput": 4252.19, "total_tokens": 17051208} {"current_steps": 26135, "total_steps": 38160, "loss": 0.3889, "lr": 0.00027323299160613335, "epoch": 13.697589098532495, "percentage": 68.49, "elapsed_time": "1:06:50", "remaining_time": "0:30:45", "throughput": 4252.14, "total_tokens": 17053640} {"current_steps": 26140, "total_steps": 38160, "loss": 0.3653, "lr": 0.00027302920172604173, "epoch": 13.70020964360587, "percentage": 68.5, "elapsed_time": "1:06:51", "remaining_time": "0:30:44", "throughput": 4252.19, "total_tokens": 17056968} {"current_steps": 26145, "total_steps": 38160, "loss": 0.4593, "lr": 0.00027282545932565214, "epoch": 13.702830188679245, "percentage": 68.51, "elapsed_time": "1:06:51", "remaining_time": "0:30:43", "throughput": 4252.17, "total_tokens": 17059688} {"current_steps": 26150, "total_steps": 38160, "loss": 0.4668, "lr": 0.00027262176444758435, "epoch": 13.70545073375262, "percentage": 68.53, "elapsed_time": "1:06:52", "remaining_time": "0:30:43", "throughput": 4252.41, "total_tokens": 17064712} {"current_steps": 26155, "total_steps": 38160, "loss": 0.3835, "lr": 0.00027241811713444935, "epoch": 13.708071278825996, "percentage": 68.54, "elapsed_time": "1:06:53", "remaining_time": "0:30:42", "throughput": 4252.4, "total_tokens": 17067528} {"current_steps": 26160, "total_steps": 38160, "loss": 0.3736, "lr": 0.0002722145174288478, "epoch": 13.71069182389937, "percentage": 68.55, "elapsed_time": "1:06:54", "remaining_time": "0:30:41", "throughput": 4252.47, "total_tokens": 17070952} {"current_steps": 26165, "total_steps": 38160, "loss": 0.5258, "lr": 0.0002720109653733706, "epoch": 13.713312368972746, "percentage": 68.57, "elapsed_time": "1:06:55", "remaining_time": "0:30:40", "throughput": 4252.49, "total_tokens": 17073992} {"current_steps": 26170, "total_steps": 38160, "loss": 0.4275, "lr": 0.00027180746101059856, "epoch": 13.715932914046121, "percentage": 68.58, "elapsed_time": "1:06:55", "remaining_time": "0:30:39", "throughput": 4252.66, "total_tokens": 17078376} {"current_steps": 26175, "total_steps": 38160, "loss": 0.4863, "lr": 0.0002716040043831023, "epoch": 13.718553459119496, "percentage": 68.59, "elapsed_time": "1:06:56", "remaining_time": "0:30:39", "throughput": 4252.86, "total_tokens": 17082952} {"current_steps": 26180, "total_steps": 38160, "loss": 0.4571, "lr": 0.0002714005955334424, "epoch": 13.721174004192871, "percentage": 68.61, "elapsed_time": "1:06:57", "remaining_time": "0:30:38", "throughput": 4252.85, "total_tokens": 17085640} {"current_steps": 26185, "total_steps": 38160, "loss": 0.3215, "lr": 0.00027119723450417, "epoch": 13.723794549266248, "percentage": 68.62, "elapsed_time": "1:06:58", "remaining_time": "0:30:37", "throughput": 4252.92, "total_tokens": 17089096} {"current_steps": 26190, "total_steps": 38160, "loss": 0.5921, "lr": 0.0002709939213378258, "epoch": 13.726415094339622, "percentage": 68.63, "elapsed_time": "1:06:58", "remaining_time": "0:30:36", "throughput": 4252.89, "total_tokens": 17091752} {"current_steps": 26195, "total_steps": 38160, "loss": 0.4604, "lr": 0.0002707906560769408, "epoch": 13.729035639412999, "percentage": 68.65, "elapsed_time": "1:06:59", "remaining_time": "0:30:35", "throughput": 4252.92, "total_tokens": 17094824} {"current_steps": 26200, "total_steps": 38160, "loss": 0.579, "lr": 0.0002705874387640354, "epoch": 13.731656184486374, "percentage": 68.66, "elapsed_time": "1:07:00", "remaining_time": "0:30:35", "throughput": 4252.95, "total_tokens": 17097992} {"current_steps": 26205, "total_steps": 38160, "loss": 0.544, "lr": 0.00027038426944162074, "epoch": 13.734276729559749, "percentage": 68.67, "elapsed_time": "1:07:00", "remaining_time": "0:30:34", "throughput": 4252.96, "total_tokens": 17100968} {"current_steps": 26210, "total_steps": 38160, "loss": 0.456, "lr": 0.0002701811481521971, "epoch": 13.736897274633124, "percentage": 68.68, "elapsed_time": "1:07:01", "remaining_time": "0:30:33", "throughput": 4252.92, "total_tokens": 17103496} {"current_steps": 26215, "total_steps": 38160, "loss": 0.4135, "lr": 0.0002699780749382554, "epoch": 13.7395178197065, "percentage": 68.7, "elapsed_time": "1:07:02", "remaining_time": "0:30:32", "throughput": 4252.98, "total_tokens": 17106920} {"current_steps": 26220, "total_steps": 38160, "loss": 0.378, "lr": 0.0002697750498422761, "epoch": 13.742138364779874, "percentage": 68.71, "elapsed_time": "1:07:03", "remaining_time": "0:30:32", "throughput": 4253.06, "total_tokens": 17110472} {"current_steps": 26225, "total_steps": 38160, "loss": 0.4785, "lr": 0.0002695720729067301, "epoch": 13.74475890985325, "percentage": 68.72, "elapsed_time": "1:07:03", "remaining_time": "0:30:31", "throughput": 4253.09, "total_tokens": 17113640} {"current_steps": 26230, "total_steps": 38160, "loss": 0.5544, "lr": 0.00026936914417407756, "epoch": 13.747379454926625, "percentage": 68.74, "elapsed_time": "1:07:04", "remaining_time": "0:30:30", "throughput": 4253.12, "total_tokens": 17116808} {"current_steps": 26235, "total_steps": 38160, "loss": 0.4384, "lr": 0.0002691662636867687, "epoch": 13.75, "percentage": 68.75, "elapsed_time": "1:07:05", "remaining_time": "0:30:29", "throughput": 4253.05, "total_tokens": 17119144} {"current_steps": 26240, "total_steps": 38160, "loss": 0.3803, "lr": 0.000268963431487244, "epoch": 13.752620545073375, "percentage": 68.76, "elapsed_time": "1:07:05", "remaining_time": "0:30:28", "throughput": 4253.06, "total_tokens": 17122056} {"current_steps": 26245, "total_steps": 38160, "loss": 0.3674, "lr": 0.0002687606476179336, "epoch": 13.75524109014675, "percentage": 68.78, "elapsed_time": "1:07:06", "remaining_time": "0:30:28", "throughput": 4253.11, "total_tokens": 17125352} {"current_steps": 26250, "total_steps": 38160, "loss": 0.3969, "lr": 0.0002685579121212578, "epoch": 13.757861635220126, "percentage": 68.79, "elapsed_time": "1:07:07", "remaining_time": "0:30:27", "throughput": 4253.13, "total_tokens": 17128456} {"current_steps": 26255, "total_steps": 38160, "loss": 0.3178, "lr": 0.00026835522503962616, "epoch": 13.7604821802935, "percentage": 68.8, "elapsed_time": "1:07:07", "remaining_time": "0:30:26", "throughput": 4253.15, "total_tokens": 17131496} {"current_steps": 26260, "total_steps": 38160, "loss": 0.3043, "lr": 0.00026815258641543896, "epoch": 13.763102725366876, "percentage": 68.82, "elapsed_time": "1:07:08", "remaining_time": "0:30:25", "throughput": 4253.29, "total_tokens": 17135528} {"current_steps": 26265, "total_steps": 38160, "loss": 0.4483, "lr": 0.0002679499962910853, "epoch": 13.765723270440251, "percentage": 68.83, "elapsed_time": "1:07:09", "remaining_time": "0:30:24", "throughput": 4253.32, "total_tokens": 17138728} {"current_steps": 26270, "total_steps": 38160, "loss": 0.4558, "lr": 0.0002677474547089451, "epoch": 13.768343815513626, "percentage": 68.84, "elapsed_time": "1:07:10", "remaining_time": "0:30:24", "throughput": 4253.44, "total_tokens": 17142600} {"current_steps": 26275, "total_steps": 38160, "loss": 0.4988, "lr": 0.000267544961711388, "epoch": 13.770964360587001, "percentage": 68.85, "elapsed_time": "1:07:10", "remaining_time": "0:30:23", "throughput": 4253.44, "total_tokens": 17145448} {"current_steps": 26280, "total_steps": 38160, "loss": 0.336, "lr": 0.0002673425173407726, "epoch": 13.773584905660378, "percentage": 68.87, "elapsed_time": "1:07:11", "remaining_time": "0:30:22", "throughput": 4253.48, "total_tokens": 17148712} {"current_steps": 26285, "total_steps": 38160, "loss": 0.3821, "lr": 0.00026714012163944826, "epoch": 13.776205450733752, "percentage": 68.88, "elapsed_time": "1:07:12", "remaining_time": "0:30:21", "throughput": 4253.44, "total_tokens": 17151144} {"current_steps": 26290, "total_steps": 38160, "loss": 0.3646, "lr": 0.0002669377746497541, "epoch": 13.778825995807129, "percentage": 68.89, "elapsed_time": "1:07:12", "remaining_time": "0:30:20", "throughput": 4253.42, "total_tokens": 17153864} {"current_steps": 26295, "total_steps": 38160, "loss": 0.4495, "lr": 0.0002667354764140184, "epoch": 13.781446540880504, "percentage": 68.91, "elapsed_time": "1:07:13", "remaining_time": "0:30:20", "throughput": 4253.45, "total_tokens": 17156968} {"current_steps": 26300, "total_steps": 38160, "loss": 0.4992, "lr": 0.00026653322697455987, "epoch": 13.784067085953879, "percentage": 68.92, "elapsed_time": "1:07:14", "remaining_time": "0:30:19", "throughput": 4253.53, "total_tokens": 17160520} {"current_steps": 26305, "total_steps": 38160, "loss": 0.3798, "lr": 0.00026633102637368684, "epoch": 13.786687631027254, "percentage": 68.93, "elapsed_time": "1:07:15", "remaining_time": "0:30:18", "throughput": 4253.53, "total_tokens": 17163368} {"current_steps": 26310, "total_steps": 38160, "loss": 0.5994, "lr": 0.00026612887465369704, "epoch": 13.78930817610063, "percentage": 68.95, "elapsed_time": "1:07:15", "remaining_time": "0:30:17", "throughput": 4253.56, "total_tokens": 17166472} {"current_steps": 26315, "total_steps": 38160, "loss": 0.54, "lr": 0.0002659267718568786, "epoch": 13.791928721174004, "percentage": 68.96, "elapsed_time": "1:07:16", "remaining_time": "0:30:16", "throughput": 4253.64, "total_tokens": 17170088} {"current_steps": 26320, "total_steps": 38160, "loss": 0.4276, "lr": 0.0002657247180255091, "epoch": 13.79454926624738, "percentage": 68.97, "elapsed_time": "1:07:17", "remaining_time": "0:30:16", "throughput": 4253.62, "total_tokens": 17172840} {"current_steps": 26325, "total_steps": 38160, "loss": 0.381, "lr": 0.0002655227132018558, "epoch": 13.797169811320755, "percentage": 68.99, "elapsed_time": "1:07:17", "remaining_time": "0:30:15", "throughput": 4253.62, "total_tokens": 17175752} {"current_steps": 26330, "total_steps": 38160, "loss": 0.4879, "lr": 0.00026532075742817594, "epoch": 13.79979035639413, "percentage": 69.0, "elapsed_time": "1:07:18", "remaining_time": "0:30:14", "throughput": 4253.61, "total_tokens": 17178504} {"current_steps": 26335, "total_steps": 38160, "loss": 0.467, "lr": 0.0002651188507467161, "epoch": 13.802410901467505, "percentage": 69.01, "elapsed_time": "1:07:19", "remaining_time": "0:30:13", "throughput": 4253.52, "total_tokens": 17180648} {"current_steps": 26340, "total_steps": 38160, "loss": 0.5361, "lr": 0.00026491699319971303, "epoch": 13.80503144654088, "percentage": 69.03, "elapsed_time": "1:07:19", "remaining_time": "0:30:12", "throughput": 4253.63, "total_tokens": 17184648} {"current_steps": 26345, "total_steps": 38160, "loss": 0.5441, "lr": 0.00026471518482939317, "epoch": 13.807651991614255, "percentage": 69.04, "elapsed_time": "1:07:20", "remaining_time": "0:30:12", "throughput": 4253.71, "total_tokens": 17188264} {"current_steps": 26350, "total_steps": 38160, "loss": 0.3345, "lr": 0.0002645134256779722, "epoch": 13.81027253668763, "percentage": 69.05, "elapsed_time": "1:07:21", "remaining_time": "0:30:11", "throughput": 4253.76, "total_tokens": 17191464} {"current_steps": 26355, "total_steps": 38160, "loss": 0.4181, "lr": 0.00026431171578765624, "epoch": 13.812893081761006, "percentage": 69.06, "elapsed_time": "1:07:22", "remaining_time": "0:30:10", "throughput": 4253.81, "total_tokens": 17194792} {"current_steps": 26360, "total_steps": 38160, "loss": 0.4172, "lr": 0.0002641100552006402, "epoch": 13.815513626834381, "percentage": 69.08, "elapsed_time": "1:07:22", "remaining_time": "0:30:09", "throughput": 4253.83, "total_tokens": 17197864} {"current_steps": 26365, "total_steps": 38160, "loss": 0.4742, "lr": 0.0002639084439591095, "epoch": 13.818134171907756, "percentage": 69.09, "elapsed_time": "1:07:23", "remaining_time": "0:30:08", "throughput": 4253.84, "total_tokens": 17200840} {"current_steps": 26370, "total_steps": 38160, "loss": 0.3871, "lr": 0.00026370688210523873, "epoch": 13.820754716981131, "percentage": 69.1, "elapsed_time": "1:07:24", "remaining_time": "0:30:08", "throughput": 4253.91, "total_tokens": 17204296} {"current_steps": 26375, "total_steps": 38160, "loss": 0.4273, "lr": 0.00026350536968119275, "epoch": 13.823375262054507, "percentage": 69.12, "elapsed_time": "1:07:24", "remaining_time": "0:30:07", "throughput": 4253.88, "total_tokens": 17206920} {"current_steps": 26380, "total_steps": 38160, "loss": 0.4938, "lr": 0.0002633039067291252, "epoch": 13.825995807127882, "percentage": 69.13, "elapsed_time": "1:07:25", "remaining_time": "0:30:06", "throughput": 4253.86, "total_tokens": 17209672} {"current_steps": 26385, "total_steps": 38160, "loss": 0.605, "lr": 0.00026310249329118007, "epoch": 13.828616352201259, "percentage": 69.14, "elapsed_time": "1:07:26", "remaining_time": "0:30:05", "throughput": 4253.83, "total_tokens": 17212296} {"current_steps": 26390, "total_steps": 38160, "loss": 0.5555, "lr": 0.0002629011294094905, "epoch": 13.831236897274634, "percentage": 69.16, "elapsed_time": "1:07:27", "remaining_time": "0:30:05", "throughput": 4253.91, "total_tokens": 17215880} {"current_steps": 26395, "total_steps": 38160, "loss": 0.4642, "lr": 0.0002626998151261798, "epoch": 13.833857442348009, "percentage": 69.17, "elapsed_time": "1:07:27", "remaining_time": "0:30:04", "throughput": 4253.92, "total_tokens": 17218760} {"current_steps": 26400, "total_steps": 38160, "loss": 0.5778, "lr": 0.0002624985504833604, "epoch": 13.836477987421384, "percentage": 69.18, "elapsed_time": "1:07:28", "remaining_time": "0:30:03", "throughput": 4254.01, "total_tokens": 17222408} {"current_steps": 26405, "total_steps": 38160, "loss": 0.5037, "lr": 0.0002622973355231349, "epoch": 13.83909853249476, "percentage": 69.2, "elapsed_time": "1:07:29", "remaining_time": "0:30:02", "throughput": 4254.07, "total_tokens": 17225800} {"current_steps": 26410, "total_steps": 38160, "loss": 0.3418, "lr": 0.00026209617028759497, "epoch": 13.841719077568134, "percentage": 69.21, "elapsed_time": "1:07:30", "remaining_time": "0:30:01", "throughput": 4254.13, "total_tokens": 17229256} {"current_steps": 26415, "total_steps": 38160, "loss": 0.5377, "lr": 0.00026189505481882184, "epoch": 13.84433962264151, "percentage": 69.22, "elapsed_time": "1:07:30", "remaining_time": "0:30:01", "throughput": 4254.12, "total_tokens": 17232104} {"current_steps": 26420, "total_steps": 38160, "loss": 0.6781, "lr": 0.00026169398915888687, "epoch": 13.846960167714885, "percentage": 69.23, "elapsed_time": "1:07:31", "remaining_time": "0:30:00", "throughput": 4254.19, "total_tokens": 17235528} {"current_steps": 26425, "total_steps": 38160, "loss": 0.3971, "lr": 0.0002614929733498506, "epoch": 13.84958071278826, "percentage": 69.25, "elapsed_time": "1:07:32", "remaining_time": "0:29:59", "throughput": 4254.15, "total_tokens": 17238088} {"current_steps": 26430, "total_steps": 38160, "loss": 0.4537, "lr": 0.0002612920074337634, "epoch": 13.852201257861635, "percentage": 69.26, "elapsed_time": "1:07:32", "remaining_time": "0:29:58", "throughput": 4254.18, "total_tokens": 17241288} {"current_steps": 26435, "total_steps": 38160, "loss": 0.3835, "lr": 0.00026109109145266496, "epoch": 13.85482180293501, "percentage": 69.27, "elapsed_time": "1:07:33", "remaining_time": "0:29:57", "throughput": 4254.25, "total_tokens": 17244840} {"current_steps": 26440, "total_steps": 38160, "loss": 0.4609, "lr": 0.00026089022544858445, "epoch": 13.857442348008385, "percentage": 69.29, "elapsed_time": "1:07:34", "remaining_time": "0:29:57", "throughput": 4254.24, "total_tokens": 17247688} {"current_steps": 26445, "total_steps": 38160, "loss": 0.5057, "lr": 0.00026068940946354075, "epoch": 13.86006289308176, "percentage": 69.3, "elapsed_time": "1:07:35", "remaining_time": "0:29:56", "throughput": 4254.45, "total_tokens": 17252360} {"current_steps": 26450, "total_steps": 38160, "loss": 0.5158, "lr": 0.0002604886435395425, "epoch": 13.862683438155136, "percentage": 69.31, "elapsed_time": "1:07:35", "remaining_time": "0:29:55", "throughput": 4254.46, "total_tokens": 17255368} {"current_steps": 26455, "total_steps": 38160, "loss": 0.4853, "lr": 0.00026028792771858744, "epoch": 13.865303983228511, "percentage": 69.33, "elapsed_time": "1:07:36", "remaining_time": "0:29:54", "throughput": 4254.41, "total_tokens": 17257832} {"current_steps": 26460, "total_steps": 38160, "loss": 0.3186, "lr": 0.00026008726204266333, "epoch": 13.867924528301886, "percentage": 69.34, "elapsed_time": "1:07:37", "remaining_time": "0:29:54", "throughput": 4254.5, "total_tokens": 17261480} {"current_steps": 26465, "total_steps": 38160, "loss": 0.5021, "lr": 0.00025988664655374693, "epoch": 13.870545073375261, "percentage": 69.35, "elapsed_time": "1:07:37", "remaining_time": "0:29:53", "throughput": 4254.51, "total_tokens": 17264360} {"current_steps": 26470, "total_steps": 38160, "loss": 0.3804, "lr": 0.00025968608129380455, "epoch": 13.873165618448636, "percentage": 69.37, "elapsed_time": "1:07:38", "remaining_time": "0:29:52", "throughput": 4254.6, "total_tokens": 17268104} {"current_steps": 26475, "total_steps": 38160, "loss": 0.4037, "lr": 0.00025948556630479234, "epoch": 13.875786163522012, "percentage": 69.38, "elapsed_time": "1:07:39", "remaining_time": "0:29:51", "throughput": 4254.6, "total_tokens": 17271048} {"current_steps": 26480, "total_steps": 38160, "loss": 0.4066, "lr": 0.0002592851016286557, "epoch": 13.878406708595389, "percentage": 69.39, "elapsed_time": "1:07:40", "remaining_time": "0:29:50", "throughput": 4254.62, "total_tokens": 17274056} {"current_steps": 26485, "total_steps": 38160, "loss": 0.4393, "lr": 0.0002590846873073298, "epoch": 13.881027253668764, "percentage": 69.41, "elapsed_time": "1:07:40", "remaining_time": "0:29:50", "throughput": 4254.65, "total_tokens": 17277192} {"current_steps": 26490, "total_steps": 38160, "loss": 0.4274, "lr": 0.0002588843233827387, "epoch": 13.883647798742139, "percentage": 69.42, "elapsed_time": "1:07:41", "remaining_time": "0:29:49", "throughput": 4254.76, "total_tokens": 17281128} {"current_steps": 26495, "total_steps": 38160, "loss": 0.3752, "lr": 0.0002586840098967963, "epoch": 13.886268343815514, "percentage": 69.43, "elapsed_time": "1:07:42", "remaining_time": "0:29:48", "throughput": 4254.74, "total_tokens": 17283848} {"current_steps": 26500, "total_steps": 38160, "loss": 0.3575, "lr": 0.00025848374689140587, "epoch": 13.88888888888889, "percentage": 69.44, "elapsed_time": "1:07:42", "remaining_time": "0:29:47", "throughput": 4254.8, "total_tokens": 17287208} {"current_steps": 26505, "total_steps": 38160, "loss": 0.374, "lr": 0.0002582835344084602, "epoch": 13.891509433962264, "percentage": 69.46, "elapsed_time": "1:07:43", "remaining_time": "0:29:46", "throughput": 4254.87, "total_tokens": 17290696} {"current_steps": 26510, "total_steps": 38160, "loss": 0.4262, "lr": 0.00025808337248984175, "epoch": 13.89412997903564, "percentage": 69.47, "elapsed_time": "1:07:44", "remaining_time": "0:29:46", "throughput": 4254.98, "total_tokens": 17294600} {"current_steps": 26515, "total_steps": 38160, "loss": 0.4677, "lr": 0.00025788326117742185, "epoch": 13.896750524109015, "percentage": 69.48, "elapsed_time": "1:07:45", "remaining_time": "0:29:45", "throughput": 4255.01, "total_tokens": 17297768} {"current_steps": 26520, "total_steps": 38160, "loss": 0.4232, "lr": 0.00025768320051306127, "epoch": 13.89937106918239, "percentage": 69.5, "elapsed_time": "1:07:45", "remaining_time": "0:29:44", "throughput": 4255.02, "total_tokens": 17300808} {"current_steps": 26525, "total_steps": 38160, "loss": 0.4454, "lr": 0.00025748319053861063, "epoch": 13.901991614255765, "percentage": 69.51, "elapsed_time": "1:07:46", "remaining_time": "0:29:43", "throughput": 4254.99, "total_tokens": 17303432} {"current_steps": 26530, "total_steps": 38160, "loss": 0.3939, "lr": 0.0002572832312959098, "epoch": 13.90461215932914, "percentage": 69.52, "elapsed_time": "1:07:47", "remaining_time": "0:29:42", "throughput": 4254.97, "total_tokens": 17306152} {"current_steps": 26535, "total_steps": 38160, "loss": 0.4091, "lr": 0.0002570833228267879, "epoch": 13.907232704402515, "percentage": 69.54, "elapsed_time": "1:07:47", "remaining_time": "0:29:42", "throughput": 4254.94, "total_tokens": 17308840} {"current_steps": 26540, "total_steps": 38160, "loss": 0.5132, "lr": 0.00025688346517306366, "epoch": 13.90985324947589, "percentage": 69.55, "elapsed_time": "1:07:48", "remaining_time": "0:29:41", "throughput": 4254.97, "total_tokens": 17311944} {"current_steps": 26545, "total_steps": 38160, "loss": 0.4254, "lr": 0.00025668365837654497, "epoch": 13.912473794549266, "percentage": 69.56, "elapsed_time": "1:07:49", "remaining_time": "0:29:40", "throughput": 4254.97, "total_tokens": 17314888} {"current_steps": 26550, "total_steps": 38160, "loss": 0.506, "lr": 0.0002564839024790288, "epoch": 13.915094339622641, "percentage": 69.58, "elapsed_time": "1:07:50", "remaining_time": "0:29:39", "throughput": 4255.03, "total_tokens": 17318248} {"current_steps": 26555, "total_steps": 38160, "loss": 0.4366, "lr": 0.000256284197522302, "epoch": 13.917714884696016, "percentage": 69.59, "elapsed_time": "1:07:50", "remaining_time": "0:29:38", "throughput": 4255.05, "total_tokens": 17321320} {"current_steps": 26560, "total_steps": 38160, "loss": 0.4063, "lr": 0.00025608454354814075, "epoch": 13.920335429769391, "percentage": 69.6, "elapsed_time": "1:07:51", "remaining_time": "0:29:38", "throughput": 4255.1, "total_tokens": 17324680} {"current_steps": 26565, "total_steps": 38160, "loss": 0.405, "lr": 0.0002558849405983104, "epoch": 13.922955974842766, "percentage": 69.61, "elapsed_time": "1:07:52", "remaining_time": "0:29:37", "throughput": 4255.17, "total_tokens": 17328072} {"current_steps": 26570, "total_steps": 38160, "loss": 0.4629, "lr": 0.00025568538871456527, "epoch": 13.925576519916142, "percentage": 69.63, "elapsed_time": "1:07:52", "remaining_time": "0:29:36", "throughput": 4255.2, "total_tokens": 17331272} {"current_steps": 26575, "total_steps": 38160, "loss": 0.3954, "lr": 0.00025548588793864976, "epoch": 13.928197064989519, "percentage": 69.64, "elapsed_time": "1:07:53", "remaining_time": "0:29:35", "throughput": 4255.28, "total_tokens": 17334920} {"current_steps": 26580, "total_steps": 38160, "loss": 0.4863, "lr": 0.0002552864383122967, "epoch": 13.930817610062894, "percentage": 69.65, "elapsed_time": "1:07:54", "remaining_time": "0:29:35", "throughput": 4255.38, "total_tokens": 17338664} {"current_steps": 26585, "total_steps": 38160, "loss": 0.5157, "lr": 0.0002550870398772289, "epoch": 13.933438155136269, "percentage": 69.67, "elapsed_time": "1:07:55", "remaining_time": "0:29:34", "throughput": 4255.31, "total_tokens": 17341000} {"current_steps": 26590, "total_steps": 38160, "loss": 0.3602, "lr": 0.0002548876926751584, "epoch": 13.936058700209644, "percentage": 69.68, "elapsed_time": "1:07:55", "remaining_time": "0:29:33", "throughput": 4255.38, "total_tokens": 17344456} {"current_steps": 26595, "total_steps": 38160, "loss": 0.537, "lr": 0.0002546883967477861, "epoch": 13.93867924528302, "percentage": 69.69, "elapsed_time": "1:07:56", "remaining_time": "0:29:32", "throughput": 4255.43, "total_tokens": 17347976} {"current_steps": 26600, "total_steps": 38160, "loss": 0.4811, "lr": 0.00025448915213680245, "epoch": 13.941299790356394, "percentage": 69.71, "elapsed_time": "1:07:57", "remaining_time": "0:29:31", "throughput": 4255.5, "total_tokens": 17351336} {"current_steps": 26605, "total_steps": 38160, "loss": 0.3862, "lr": 0.0002542899588838875, "epoch": 13.94392033542977, "percentage": 69.72, "elapsed_time": "1:07:58", "remaining_time": "0:29:31", "throughput": 4255.79, "total_tokens": 17356744} {"current_steps": 26610, "total_steps": 38160, "loss": 0.4415, "lr": 0.0002540908170307097, "epoch": 13.946540880503145, "percentage": 69.73, "elapsed_time": "1:07:59", "remaining_time": "0:29:30", "throughput": 4255.74, "total_tokens": 17359240} {"current_steps": 26615, "total_steps": 38160, "loss": 0.4592, "lr": 0.00025389172661892753, "epoch": 13.94916142557652, "percentage": 69.75, "elapsed_time": "1:07:59", "remaining_time": "0:29:29", "throughput": 4255.91, "total_tokens": 17363592} {"current_steps": 26620, "total_steps": 38160, "loss": 0.6062, "lr": 0.00025369268769018856, "epoch": 13.951781970649895, "percentage": 69.76, "elapsed_time": "1:08:00", "remaining_time": "0:29:28", "throughput": 4255.86, "total_tokens": 17365992} {"current_steps": 26625, "total_steps": 38160, "loss": 0.4416, "lr": 0.00025349370028612914, "epoch": 13.95440251572327, "percentage": 69.77, "elapsed_time": "1:08:01", "remaining_time": "0:29:28", "throughput": 4255.82, "total_tokens": 17368520} {"current_steps": 26630, "total_steps": 38160, "loss": 0.3878, "lr": 0.0002532947644483755, "epoch": 13.957023060796645, "percentage": 69.79, "elapsed_time": "1:08:01", "remaining_time": "0:29:27", "throughput": 4255.88, "total_tokens": 17371880} {"current_steps": 26635, "total_steps": 38160, "loss": 0.3673, "lr": 0.00025309588021854237, "epoch": 13.95964360587002, "percentage": 69.8, "elapsed_time": "1:08:02", "remaining_time": "0:29:26", "throughput": 4255.86, "total_tokens": 17374600} {"current_steps": 26640, "total_steps": 38160, "loss": 0.3481, "lr": 0.0002528970476382343, "epoch": 13.962264150943396, "percentage": 69.81, "elapsed_time": "1:08:03", "remaining_time": "0:29:25", "throughput": 4256.0, "total_tokens": 17378600} {"current_steps": 26645, "total_steps": 38160, "loss": 0.4077, "lr": 0.00025269826674904493, "epoch": 13.964884696016771, "percentage": 69.82, "elapsed_time": "1:08:03", "remaining_time": "0:29:24", "throughput": 4256.0, "total_tokens": 17381416} {"current_steps": 26650, "total_steps": 38160, "loss": 0.416, "lr": 0.0002524995375925566, "epoch": 13.967505241090146, "percentage": 69.84, "elapsed_time": "1:08:04", "remaining_time": "0:29:24", "throughput": 4256.0, "total_tokens": 17384264} {"current_steps": 26655, "total_steps": 38160, "loss": 0.5194, "lr": 0.0002523008602103414, "epoch": 13.970125786163521, "percentage": 69.85, "elapsed_time": "1:08:05", "remaining_time": "0:29:23", "throughput": 4256.08, "total_tokens": 17387912} {"current_steps": 26660, "total_steps": 38160, "loss": 0.3366, "lr": 0.00025210223464396055, "epoch": 13.972746331236896, "percentage": 69.86, "elapsed_time": "1:08:06", "remaining_time": "0:29:22", "throughput": 4256.05, "total_tokens": 17390600} {"current_steps": 26665, "total_steps": 38160, "loss": 0.4129, "lr": 0.00025190366093496376, "epoch": 13.975366876310272, "percentage": 69.88, "elapsed_time": "1:08:06", "remaining_time": "0:29:21", "throughput": 4256.08, "total_tokens": 17393704} {"current_steps": 26670, "total_steps": 38160, "loss": 0.5076, "lr": 0.0002517051391248909, "epoch": 13.977987421383649, "percentage": 69.89, "elapsed_time": "1:08:07", "remaining_time": "0:29:20", "throughput": 4256.11, "total_tokens": 17396808} {"current_steps": 26675, "total_steps": 38160, "loss": 0.4579, "lr": 0.0002515066692552701, "epoch": 13.980607966457024, "percentage": 69.9, "elapsed_time": "1:08:08", "remaining_time": "0:29:20", "throughput": 4256.16, "total_tokens": 17400040} {"current_steps": 26680, "total_steps": 38160, "loss": 0.3365, "lr": 0.00025130825136761916, "epoch": 13.983228511530399, "percentage": 69.92, "elapsed_time": "1:08:08", "remaining_time": "0:29:19", "throughput": 4256.24, "total_tokens": 17403624} {"current_steps": 26685, "total_steps": 38160, "loss": 0.6446, "lr": 0.0002511098855034447, "epoch": 13.985849056603774, "percentage": 69.93, "elapsed_time": "1:08:09", "remaining_time": "0:29:18", "throughput": 4256.27, "total_tokens": 17406760} {"current_steps": 26690, "total_steps": 38160, "loss": 0.4397, "lr": 0.00025091157170424296, "epoch": 13.98846960167715, "percentage": 69.94, "elapsed_time": "1:08:10", "remaining_time": "0:29:17", "throughput": 4256.28, "total_tokens": 17409832} {"current_steps": 26695, "total_steps": 38160, "loss": 0.4179, "lr": 0.0002507133100114984, "epoch": 13.991090146750524, "percentage": 69.96, "elapsed_time": "1:08:11", "remaining_time": "0:29:17", "throughput": 4256.38, "total_tokens": 17413672} {"current_steps": 26700, "total_steps": 38160, "loss": 0.5487, "lr": 0.0002505151004666857, "epoch": 13.9937106918239, "percentage": 69.97, "elapsed_time": "1:08:11", "remaining_time": "0:29:16", "throughput": 4256.43, "total_tokens": 17416936} {"current_steps": 26705, "total_steps": 38160, "loss": 0.4638, "lr": 0.0002503169431112674, "epoch": 13.996331236897275, "percentage": 69.98, "elapsed_time": "1:08:12", "remaining_time": "0:29:15", "throughput": 4256.51, "total_tokens": 17420520} {"current_steps": 26710, "total_steps": 38160, "loss": 0.3804, "lr": 0.0002501188379866961, "epoch": 13.99895178197065, "percentage": 69.99, "elapsed_time": "1:08:13", "remaining_time": "0:29:14", "throughput": 4256.65, "total_tokens": 17424840} {"current_steps": 26712, "total_steps": 38160, "eval_loss": 0.4591861665248871, "epoch": 14.0, "percentage": 70.0, "elapsed_time": "1:08:27", "remaining_time": "0:29:20", "throughput": 4242.37, "total_tokens": 17425368} {"current_steps": 26715, "total_steps": 38160, "loss": 0.3925, "lr": 0.0002499207851344133, "epoch": 14.001572327044025, "percentage": 70.01, "elapsed_time": "1:08:29", "remaining_time": "0:29:20", "throughput": 4240.33, "total_tokens": 17427448} {"current_steps": 26720, "total_steps": 38160, "loss": 0.4476, "lr": 0.00024972278459584903, "epoch": 14.0041928721174, "percentage": 70.02, "elapsed_time": "1:08:30", "remaining_time": "0:29:19", "throughput": 4240.29, "total_tokens": 17430008} {"current_steps": 26725, "total_steps": 38160, "loss": 0.5064, "lr": 0.00024952483641242304, "epoch": 14.006813417190775, "percentage": 70.03, "elapsed_time": "1:08:31", "remaining_time": "0:29:19", "throughput": 4240.31, "total_tokens": 17433080} {"current_steps": 26730, "total_steps": 38160, "loss": 0.4679, "lr": 0.0002493269406255435, "epoch": 14.00943396226415, "percentage": 70.05, "elapsed_time": "1:08:31", "remaining_time": "0:29:18", "throughput": 4240.3, "total_tokens": 17436088} {"current_steps": 26735, "total_steps": 38160, "loss": 0.3463, "lr": 0.0002491290972766082, "epoch": 14.012054507337526, "percentage": 70.06, "elapsed_time": "1:08:32", "remaining_time": "0:29:17", "throughput": 4240.24, "total_tokens": 17438680} {"current_steps": 26740, "total_steps": 38160, "loss": 0.4037, "lr": 0.0002489313064070037, "epoch": 14.014675052410901, "percentage": 70.07, "elapsed_time": "1:08:33", "remaining_time": "0:29:16", "throughput": 4240.34, "total_tokens": 17442424} {"current_steps": 26745, "total_steps": 38160, "loss": 0.4141, "lr": 0.00024873356805810566, "epoch": 14.017295597484276, "percentage": 70.09, "elapsed_time": "1:08:34", "remaining_time": "0:29:15", "throughput": 4240.39, "total_tokens": 17445784} {"current_steps": 26750, "total_steps": 38160, "loss": 0.3221, "lr": 0.00024853588227127864, "epoch": 14.019916142557651, "percentage": 70.1, "elapsed_time": "1:08:34", "remaining_time": "0:29:15", "throughput": 4240.34, "total_tokens": 17448280} {"current_steps": 26755, "total_steps": 38160, "loss": 0.4558, "lr": 0.000248338249087876, "epoch": 14.022536687631026, "percentage": 70.11, "elapsed_time": "1:08:35", "remaining_time": "0:29:14", "throughput": 4240.45, "total_tokens": 17452248} {"current_steps": 26760, "total_steps": 38160, "loss": 0.3421, "lr": 0.0002481406685492405, "epoch": 14.025157232704403, "percentage": 70.13, "elapsed_time": "1:08:36", "remaining_time": "0:29:13", "throughput": 4240.51, "total_tokens": 17455672} {"current_steps": 26765, "total_steps": 38160, "loss": 0.3263, "lr": 0.00024794314069670383, "epoch": 14.027777777777779, "percentage": 70.14, "elapsed_time": "1:08:37", "remaining_time": "0:29:12", "throughput": 4240.49, "total_tokens": 17458328} {"current_steps": 26770, "total_steps": 38160, "loss": 0.474, "lr": 0.0002477456655715865, "epoch": 14.030398322851154, "percentage": 70.15, "elapsed_time": "1:08:37", "remaining_time": "0:29:11", "throughput": 4240.45, "total_tokens": 17460856} {"current_steps": 26775, "total_steps": 38160, "loss": 0.3763, "lr": 0.0002475482432151982, "epoch": 14.033018867924529, "percentage": 70.17, "elapsed_time": "1:08:38", "remaining_time": "0:29:11", "throughput": 4240.54, "total_tokens": 17464440} {"current_steps": 26780, "total_steps": 38160, "loss": 0.48, "lr": 0.00024735087366883733, "epoch": 14.035639412997904, "percentage": 70.18, "elapsed_time": "1:08:39", "remaining_time": "0:29:10", "throughput": 4240.56, "total_tokens": 17467512} {"current_steps": 26785, "total_steps": 38160, "loss": 0.4154, "lr": 0.00024715355697379115, "epoch": 14.03825995807128, "percentage": 70.19, "elapsed_time": "1:08:39", "remaining_time": "0:29:09", "throughput": 4240.66, "total_tokens": 17471224} {"current_steps": 26790, "total_steps": 38160, "loss": 0.3371, "lr": 0.0002469562931713362, "epoch": 14.040880503144654, "percentage": 70.2, "elapsed_time": "1:08:40", "remaining_time": "0:29:08", "throughput": 4240.71, "total_tokens": 17474616} {"current_steps": 26795, "total_steps": 38160, "loss": 0.3785, "lr": 0.00024675908230273785, "epoch": 14.04350104821803, "percentage": 70.22, "elapsed_time": "1:08:41", "remaining_time": "0:29:08", "throughput": 4240.75, "total_tokens": 17477880} {"current_steps": 26800, "total_steps": 38160, "loss": 0.5621, "lr": 0.00024656192440925055, "epoch": 14.046121593291405, "percentage": 70.23, "elapsed_time": "1:08:42", "remaining_time": "0:29:07", "throughput": 4240.77, "total_tokens": 17481016} {"current_steps": 26805, "total_steps": 38160, "loss": 0.358, "lr": 0.0002463648195321173, "epoch": 14.04874213836478, "percentage": 70.24, "elapsed_time": "1:08:42", "remaining_time": "0:29:06", "throughput": 4240.84, "total_tokens": 17484568} {"current_steps": 26810, "total_steps": 38160, "loss": 0.3875, "lr": 0.00024616776771257, "epoch": 14.051362683438155, "percentage": 70.26, "elapsed_time": "1:08:44", "remaining_time": "0:29:05", "throughput": 4241.2, "total_tokens": 17491032} {"current_steps": 26815, "total_steps": 38160, "loss": 0.3318, "lr": 0.00024597076899182977, "epoch": 14.05398322851153, "percentage": 70.27, "elapsed_time": "1:08:44", "remaining_time": "0:29:05", "throughput": 4241.21, "total_tokens": 17494136} {"current_steps": 26820, "total_steps": 38160, "loss": 0.5217, "lr": 0.0002457738234111066, "epoch": 14.056603773584905, "percentage": 70.28, "elapsed_time": "1:08:45", "remaining_time": "0:29:04", "throughput": 4241.19, "total_tokens": 17496920} {"current_steps": 26825, "total_steps": 38160, "loss": 0.3004, "lr": 0.00024557693101159937, "epoch": 14.05922431865828, "percentage": 70.3, "elapsed_time": "1:08:46", "remaining_time": "0:29:03", "throughput": 4241.21, "total_tokens": 17500024} {"current_steps": 26830, "total_steps": 38160, "loss": 0.4132, "lr": 0.00024538009183449553, "epoch": 14.061844863731656, "percentage": 70.31, "elapsed_time": "1:08:46", "remaining_time": "0:29:02", "throughput": 4241.26, "total_tokens": 17503416} {"current_steps": 26835, "total_steps": 38160, "loss": 0.3423, "lr": 0.0002451833059209715, "epoch": 14.064465408805031, "percentage": 70.32, "elapsed_time": "1:08:47", "remaining_time": "0:29:01", "throughput": 4241.29, "total_tokens": 17506648} {"current_steps": 26840, "total_steps": 38160, "loss": 0.3787, "lr": 0.00024498657331219274, "epoch": 14.067085953878406, "percentage": 70.34, "elapsed_time": "1:08:48", "remaining_time": "0:29:01", "throughput": 4241.29, "total_tokens": 17509496} {"current_steps": 26845, "total_steps": 38160, "loss": 0.4157, "lr": 0.0002447898940493135, "epoch": 14.069706498951781, "percentage": 70.35, "elapsed_time": "1:08:49", "remaining_time": "0:29:00", "throughput": 4241.42, "total_tokens": 17513464} {"current_steps": 26850, "total_steps": 38160, "loss": 0.2986, "lr": 0.00024459326817347684, "epoch": 14.072327044025156, "percentage": 70.36, "elapsed_time": "1:08:49", "remaining_time": "0:28:59", "throughput": 4241.43, "total_tokens": 17516568} {"current_steps": 26855, "total_steps": 38160, "loss": 0.5198, "lr": 0.0002443966957258148, "epoch": 14.074947589098532, "percentage": 70.37, "elapsed_time": "1:08:50", "remaining_time": "0:28:58", "throughput": 4241.54, "total_tokens": 17520440} {"current_steps": 26860, "total_steps": 38160, "loss": 0.4157, "lr": 0.000244200176747448, "epoch": 14.077568134171909, "percentage": 70.39, "elapsed_time": "1:08:51", "remaining_time": "0:28:58", "throughput": 4241.53, "total_tokens": 17523224} {"current_steps": 26865, "total_steps": 38160, "loss": 0.4103, "lr": 0.00024400371127948568, "epoch": 14.080188679245284, "percentage": 70.4, "elapsed_time": "1:08:52", "remaining_time": "0:28:57", "throughput": 4241.89, "total_tokens": 17530008} {"current_steps": 26870, "total_steps": 38160, "loss": 0.4075, "lr": 0.00024380729936302636, "epoch": 14.082809224318659, "percentage": 70.41, "elapsed_time": "1:08:53", "remaining_time": "0:28:56", "throughput": 4241.9, "total_tokens": 17533048} {"current_steps": 26875, "total_steps": 38160, "loss": 0.3429, "lr": 0.00024361094103915725, "epoch": 14.085429769392034, "percentage": 70.43, "elapsed_time": "1:08:53", "remaining_time": "0:28:55", "throughput": 4241.86, "total_tokens": 17535608} {"current_steps": 26880, "total_steps": 38160, "loss": 0.3687, "lr": 0.00024341463634895444, "epoch": 14.08805031446541, "percentage": 70.44, "elapsed_time": "1:08:54", "remaining_time": "0:28:55", "throughput": 4241.94, "total_tokens": 17539096} {"current_steps": 26885, "total_steps": 38160, "loss": 0.5294, "lr": 0.0002432183853334824, "epoch": 14.090670859538784, "percentage": 70.45, "elapsed_time": "1:08:55", "remaining_time": "0:28:54", "throughput": 4242.04, "total_tokens": 17542936} {"current_steps": 26890, "total_steps": 38160, "loss": 0.5257, "lr": 0.00024302218803379445, "epoch": 14.09329140461216, "percentage": 70.47, "elapsed_time": "1:08:56", "remaining_time": "0:28:53", "throughput": 4242.03, "total_tokens": 17545688} {"current_steps": 26895, "total_steps": 38160, "loss": 0.4288, "lr": 0.000242826044490933, "epoch": 14.095911949685535, "percentage": 70.48, "elapsed_time": "1:08:56", "remaining_time": "0:28:52", "throughput": 4242.02, "total_tokens": 17548536} {"current_steps": 26900, "total_steps": 38160, "loss": 0.3789, "lr": 0.00024262995474592903, "epoch": 14.09853249475891, "percentage": 70.49, "elapsed_time": "1:08:57", "remaining_time": "0:28:51", "throughput": 4242.1, "total_tokens": 17552056} {"current_steps": 26905, "total_steps": 38160, "loss": 0.3553, "lr": 0.0002424339188398025, "epoch": 14.101153039832285, "percentage": 70.51, "elapsed_time": "1:08:58", "remaining_time": "0:28:51", "throughput": 4242.17, "total_tokens": 17555512} {"current_steps": 26910, "total_steps": 38160, "loss": 0.3996, "lr": 0.00024223793681356148, "epoch": 14.10377358490566, "percentage": 70.52, "elapsed_time": "1:08:59", "remaining_time": "0:28:50", "throughput": 4242.28, "total_tokens": 17559320} {"current_steps": 26915, "total_steps": 38160, "loss": 0.3149, "lr": 0.00024204200870820358, "epoch": 14.106394129979035, "percentage": 70.53, "elapsed_time": "1:08:59", "remaining_time": "0:28:49", "throughput": 4242.34, "total_tokens": 17562616} {"current_steps": 26920, "total_steps": 38160, "loss": 0.4558, "lr": 0.0002418461345647143, "epoch": 14.10901467505241, "percentage": 70.55, "elapsed_time": "1:09:00", "remaining_time": "0:28:48", "throughput": 4242.41, "total_tokens": 17566200} {"current_steps": 26925, "total_steps": 38160, "loss": 0.3815, "lr": 0.00024165031442406853, "epoch": 14.111635220125786, "percentage": 70.56, "elapsed_time": "1:09:01", "remaining_time": "0:28:48", "throughput": 4242.46, "total_tokens": 17569496} {"current_steps": 26930, "total_steps": 38160, "loss": 0.4644, "lr": 0.00024145454832722956, "epoch": 14.114255765199161, "percentage": 70.57, "elapsed_time": "1:09:01", "remaining_time": "0:28:47", "throughput": 4242.39, "total_tokens": 17571832} {"current_steps": 26935, "total_steps": 38160, "loss": 0.4277, "lr": 0.00024125883631514967, "epoch": 14.116876310272536, "percentage": 70.58, "elapsed_time": "1:09:02", "remaining_time": "0:28:46", "throughput": 4242.39, "total_tokens": 17574744} {"current_steps": 26940, "total_steps": 38160, "loss": 0.4537, "lr": 0.00024106317842876907, "epoch": 14.119496855345911, "percentage": 70.6, "elapsed_time": "1:09:03", "remaining_time": "0:28:45", "throughput": 4242.46, "total_tokens": 17578232} {"current_steps": 26945, "total_steps": 38160, "loss": 0.4758, "lr": 0.0002408675747090177, "epoch": 14.122117400419286, "percentage": 70.61, "elapsed_time": "1:09:04", "remaining_time": "0:28:44", "throughput": 4242.52, "total_tokens": 17581688} {"current_steps": 26950, "total_steps": 38160, "loss": 0.4128, "lr": 0.00024067202519681313, "epoch": 14.124737945492662, "percentage": 70.62, "elapsed_time": "1:09:04", "remaining_time": "0:28:44", "throughput": 4242.61, "total_tokens": 17585336} {"current_steps": 26955, "total_steps": 38160, "loss": 0.4044, "lr": 0.00024047652993306235, "epoch": 14.127358490566039, "percentage": 70.64, "elapsed_time": "1:09:05", "remaining_time": "0:28:43", "throughput": 4242.59, "total_tokens": 17588120} {"current_steps": 26960, "total_steps": 38160, "loss": 0.421, "lr": 0.00024028108895866084, "epoch": 14.129979035639414, "percentage": 70.65, "elapsed_time": "1:09:06", "remaining_time": "0:28:42", "throughput": 4242.7, "total_tokens": 17591928} {"current_steps": 26965, "total_steps": 38160, "loss": 0.3263, "lr": 0.00024008570231449239, "epoch": 14.132599580712789, "percentage": 70.66, "elapsed_time": "1:09:07", "remaining_time": "0:28:41", "throughput": 4242.83, "total_tokens": 17596120} {"current_steps": 26970, "total_steps": 38160, "loss": 0.5023, "lr": 0.00023989037004142966, "epoch": 14.135220125786164, "percentage": 70.68, "elapsed_time": "1:09:07", "remaining_time": "0:28:41", "throughput": 4242.87, "total_tokens": 17599416} {"current_steps": 26975, "total_steps": 38160, "loss": 0.4866, "lr": 0.0002396950921803343, "epoch": 14.13784067085954, "percentage": 70.69, "elapsed_time": "1:09:08", "remaining_time": "0:28:40", "throughput": 4242.98, "total_tokens": 17603192} {"current_steps": 26980, "total_steps": 38160, "loss": 0.4279, "lr": 0.0002394998687720557, "epoch": 14.140461215932914, "percentage": 70.7, "elapsed_time": "1:09:09", "remaining_time": "0:28:39", "throughput": 4243.01, "total_tokens": 17606520} {"current_steps": 26985, "total_steps": 38160, "loss": 0.3894, "lr": 0.0002393046998574328, "epoch": 14.14308176100629, "percentage": 70.72, "elapsed_time": "1:09:10", "remaining_time": "0:28:38", "throughput": 4242.98, "total_tokens": 17609112} {"current_steps": 26990, "total_steps": 38160, "loss": 0.4584, "lr": 0.0002391095854772924, "epoch": 14.145702306079665, "percentage": 70.73, "elapsed_time": "1:09:10", "remaining_time": "0:28:37", "throughput": 4243.03, "total_tokens": 17612440} {"current_steps": 26995, "total_steps": 38160, "loss": 0.3622, "lr": 0.00023891452567245027, "epoch": 14.14832285115304, "percentage": 70.74, "elapsed_time": "1:09:11", "remaining_time": "0:28:37", "throughput": 4243.04, "total_tokens": 17615384} {"current_steps": 27000, "total_steps": 38160, "loss": 0.3356, "lr": 0.00023871952048371093, "epoch": 14.150943396226415, "percentage": 70.75, "elapsed_time": "1:09:12", "remaining_time": "0:28:36", "throughput": 4243.06, "total_tokens": 17618456} {"current_steps": 27005, "total_steps": 38160, "loss": 0.7076, "lr": 0.00023852456995186684, "epoch": 14.15356394129979, "percentage": 70.77, "elapsed_time": "1:09:13", "remaining_time": "0:28:35", "throughput": 4243.1, "total_tokens": 17621720} {"current_steps": 27010, "total_steps": 38160, "loss": 0.4553, "lr": 0.0002383296741176997, "epoch": 14.156184486373165, "percentage": 70.78, "elapsed_time": "1:09:13", "remaining_time": "0:28:34", "throughput": 4243.14, "total_tokens": 17625112} {"current_steps": 27015, "total_steps": 38160, "loss": 0.5749, "lr": 0.00023813483302197964, "epoch": 14.15880503144654, "percentage": 70.79, "elapsed_time": "1:09:14", "remaining_time": "0:28:33", "throughput": 4243.24, "total_tokens": 17628824} {"current_steps": 27020, "total_steps": 38160, "loss": 0.3204, "lr": 0.00023794004670546476, "epoch": 14.161425576519916, "percentage": 70.81, "elapsed_time": "1:09:15", "remaining_time": "0:28:33", "throughput": 4243.33, "total_tokens": 17632568} {"current_steps": 27025, "total_steps": 38160, "loss": 0.3653, "lr": 0.00023774531520890242, "epoch": 14.164046121593291, "percentage": 70.82, "elapsed_time": "1:09:16", "remaining_time": "0:28:32", "throughput": 4243.39, "total_tokens": 17635928} {"current_steps": 27030, "total_steps": 38160, "loss": 0.4855, "lr": 0.00023755063857302833, "epoch": 14.166666666666666, "percentage": 70.83, "elapsed_time": "1:09:16", "remaining_time": "0:28:31", "throughput": 4243.48, "total_tokens": 17639832} {"current_steps": 27035, "total_steps": 38160, "loss": 0.396, "lr": 0.00023735601683856628, "epoch": 14.169287211740041, "percentage": 70.85, "elapsed_time": "1:09:17", "remaining_time": "0:28:30", "throughput": 4243.53, "total_tokens": 17643160} {"current_steps": 27040, "total_steps": 38160, "loss": 0.5298, "lr": 0.0002371614500462293, "epoch": 14.171907756813416, "percentage": 70.86, "elapsed_time": "1:09:18", "remaining_time": "0:28:30", "throughput": 4243.53, "total_tokens": 17646040} {"current_steps": 27045, "total_steps": 38160, "loss": 0.392, "lr": 0.00023696693823671816, "epoch": 14.174528301886792, "percentage": 70.87, "elapsed_time": "1:09:18", "remaining_time": "0:28:29", "throughput": 4243.49, "total_tokens": 17648600} {"current_steps": 27050, "total_steps": 38160, "loss": 0.4408, "lr": 0.00023677248145072272, "epoch": 14.177148846960169, "percentage": 70.89, "elapsed_time": "1:09:19", "remaining_time": "0:28:28", "throughput": 4243.54, "total_tokens": 17652024} {"current_steps": 27055, "total_steps": 38160, "loss": 0.3969, "lr": 0.0002365780797289211, "epoch": 14.179769392033544, "percentage": 70.9, "elapsed_time": "1:09:20", "remaining_time": "0:28:27", "throughput": 4243.57, "total_tokens": 17655160} {"current_steps": 27060, "total_steps": 38160, "loss": 0.4465, "lr": 0.00023638373311198014, "epoch": 14.182389937106919, "percentage": 70.91, "elapsed_time": "1:09:21", "remaining_time": "0:28:26", "throughput": 4243.64, "total_tokens": 17658712} {"current_steps": 27065, "total_steps": 38160, "loss": 0.3525, "lr": 0.00023618944164055468, "epoch": 14.185010482180294, "percentage": 70.93, "elapsed_time": "1:09:21", "remaining_time": "0:28:26", "throughput": 4243.62, "total_tokens": 17661432} {"current_steps": 27070, "total_steps": 38160, "loss": 0.5085, "lr": 0.00023599520535528813, "epoch": 14.18763102725367, "percentage": 70.94, "elapsed_time": "1:09:22", "remaining_time": "0:28:25", "throughput": 4243.62, "total_tokens": 17664408} {"current_steps": 27075, "total_steps": 38160, "loss": 0.3629, "lr": 0.00023580102429681266, "epoch": 14.190251572327044, "percentage": 70.95, "elapsed_time": "1:09:23", "remaining_time": "0:28:24", "throughput": 4243.65, "total_tokens": 17667608} {"current_steps": 27080, "total_steps": 38160, "loss": 0.4342, "lr": 0.00023560689850574885, "epoch": 14.19287211740042, "percentage": 70.96, "elapsed_time": "1:09:24", "remaining_time": "0:28:23", "throughput": 4243.7, "total_tokens": 17670872} {"current_steps": 27085, "total_steps": 38160, "loss": 0.4748, "lr": 0.00023541282802270563, "epoch": 14.195492662473795, "percentage": 70.98, "elapsed_time": "1:09:24", "remaining_time": "0:28:22", "throughput": 4243.64, "total_tokens": 17673368} {"current_steps": 27090, "total_steps": 38160, "loss": 0.4059, "lr": 0.00023521881288828005, "epoch": 14.19811320754717, "percentage": 70.99, "elapsed_time": "1:09:25", "remaining_time": "0:28:22", "throughput": 4243.58, "total_tokens": 17675800} {"current_steps": 27095, "total_steps": 38160, "loss": 0.355, "lr": 0.00023502485314305828, "epoch": 14.200733752620545, "percentage": 71.0, "elapsed_time": "1:09:26", "remaining_time": "0:28:21", "throughput": 4243.64, "total_tokens": 17679288} {"current_steps": 27100, "total_steps": 38160, "loss": 0.4886, "lr": 0.00023483094882761397, "epoch": 14.20335429769392, "percentage": 71.02, "elapsed_time": "1:09:26", "remaining_time": "0:28:20", "throughput": 4243.66, "total_tokens": 17682392} {"current_steps": 27105, "total_steps": 38160, "loss": 0.4809, "lr": 0.00023463709998250998, "epoch": 14.205974842767295, "percentage": 71.03, "elapsed_time": "1:09:27", "remaining_time": "0:28:19", "throughput": 4243.63, "total_tokens": 17685176} {"current_steps": 27110, "total_steps": 38160, "loss": 0.3818, "lr": 0.00023444330664829728, "epoch": 14.20859538784067, "percentage": 71.04, "elapsed_time": "1:09:28", "remaining_time": "0:28:18", "throughput": 4243.59, "total_tokens": 17687768} {"current_steps": 27115, "total_steps": 38160, "loss": 0.3166, "lr": 0.00023424956886551536, "epoch": 14.211215932914046, "percentage": 71.06, "elapsed_time": "1:09:28", "remaining_time": "0:28:18", "throughput": 4243.59, "total_tokens": 17690712} {"current_steps": 27120, "total_steps": 38160, "loss": 0.6865, "lr": 0.0002340558866746918, "epoch": 14.213836477987421, "percentage": 71.07, "elapsed_time": "1:09:29", "remaining_time": "0:28:17", "throughput": 4243.63, "total_tokens": 17693944} {"current_steps": 27125, "total_steps": 38160, "loss": 0.379, "lr": 0.0002338622601163425, "epoch": 14.216457023060796, "percentage": 71.08, "elapsed_time": "1:09:30", "remaining_time": "0:28:16", "throughput": 4243.7, "total_tokens": 17697528} {"current_steps": 27130, "total_steps": 38160, "loss": 0.4568, "lr": 0.00023366868923097213, "epoch": 14.219077568134171, "percentage": 71.1, "elapsed_time": "1:09:30", "remaining_time": "0:28:15", "throughput": 4243.71, "total_tokens": 17700472} {"current_steps": 27135, "total_steps": 38160, "loss": 0.3836, "lr": 0.0002334751740590735, "epoch": 14.221698113207546, "percentage": 71.11, "elapsed_time": "1:09:31", "remaining_time": "0:28:14", "throughput": 4243.78, "total_tokens": 17704024} {"current_steps": 27140, "total_steps": 38160, "loss": 0.3723, "lr": 0.00023328171464112796, "epoch": 14.224318658280922, "percentage": 71.12, "elapsed_time": "1:09:32", "remaining_time": "0:28:14", "throughput": 4243.76, "total_tokens": 17706840} {"current_steps": 27145, "total_steps": 38160, "loss": 0.565, "lr": 0.00023308831101760485, "epoch": 14.226939203354299, "percentage": 71.13, "elapsed_time": "1:09:33", "remaining_time": "0:28:13", "throughput": 4243.74, "total_tokens": 17709592} {"current_steps": 27150, "total_steps": 38160, "loss": 0.4555, "lr": 0.00023289496322896174, "epoch": 14.229559748427674, "percentage": 71.15, "elapsed_time": "1:09:33", "remaining_time": "0:28:12", "throughput": 4243.81, "total_tokens": 17713112} {"current_steps": 27155, "total_steps": 38160, "loss": 0.5168, "lr": 0.00023270167131564512, "epoch": 14.232180293501049, "percentage": 71.16, "elapsed_time": "1:09:34", "remaining_time": "0:28:11", "throughput": 4243.82, "total_tokens": 17716056} {"current_steps": 27160, "total_steps": 38160, "loss": 0.4273, "lr": 0.0002325084353180893, "epoch": 14.234800838574424, "percentage": 71.17, "elapsed_time": "1:09:35", "remaining_time": "0:28:11", "throughput": 4243.91, "total_tokens": 17719704} {"current_steps": 27165, "total_steps": 38160, "loss": 0.418, "lr": 0.00023231525527671716, "epoch": 14.2374213836478, "percentage": 71.19, "elapsed_time": "1:09:35", "remaining_time": "0:28:10", "throughput": 4243.89, "total_tokens": 17722456} {"current_steps": 27170, "total_steps": 38160, "loss": 0.3973, "lr": 0.00023212213123193986, "epoch": 14.240041928721174, "percentage": 71.2, "elapsed_time": "1:09:36", "remaining_time": "0:28:09", "throughput": 4243.9, "total_tokens": 17725400} {"current_steps": 27175, "total_steps": 38160, "loss": 0.5558, "lr": 0.0002319290632241566, "epoch": 14.24266247379455, "percentage": 71.21, "elapsed_time": "1:09:37", "remaining_time": "0:28:08", "throughput": 4243.91, "total_tokens": 17728440} {"current_steps": 27180, "total_steps": 38160, "loss": 0.3618, "lr": 0.0002317360512937548, "epoch": 14.245283018867925, "percentage": 71.23, "elapsed_time": "1:09:38", "remaining_time": "0:28:07", "throughput": 4243.9, "total_tokens": 17731192} {"current_steps": 27185, "total_steps": 38160, "loss": 0.3425, "lr": 0.00023154309548111058, "epoch": 14.2479035639413, "percentage": 71.24, "elapsed_time": "1:09:38", "remaining_time": "0:28:07", "throughput": 4244.0, "total_tokens": 17735096} {"current_steps": 27190, "total_steps": 38160, "loss": 0.4678, "lr": 0.000231350195826588, "epoch": 14.250524109014675, "percentage": 71.25, "elapsed_time": "1:09:39", "remaining_time": "0:28:06", "throughput": 4244.1, "total_tokens": 17739000} {"current_steps": 27195, "total_steps": 38160, "loss": 0.3757, "lr": 0.00023115735237053982, "epoch": 14.25314465408805, "percentage": 71.27, "elapsed_time": "1:09:40", "remaining_time": "0:28:05", "throughput": 4244.08, "total_tokens": 17741784} {"current_steps": 27200, "total_steps": 38160, "loss": 0.5084, "lr": 0.00023096456515330632, "epoch": 14.255765199161425, "percentage": 71.28, "elapsed_time": "1:09:41", "remaining_time": "0:28:04", "throughput": 4244.04, "total_tokens": 17744440} {"current_steps": 27205, "total_steps": 38160, "loss": 0.6026, "lr": 0.0002307718342152163, "epoch": 14.2583857442348, "percentage": 71.29, "elapsed_time": "1:09:41", "remaining_time": "0:28:03", "throughput": 4244.03, "total_tokens": 17747352} {"current_steps": 27210, "total_steps": 38160, "loss": 0.4028, "lr": 0.0002305791595965871, "epoch": 14.261006289308176, "percentage": 71.31, "elapsed_time": "1:09:42", "remaining_time": "0:28:03", "throughput": 4244.01, "total_tokens": 17750104} {"current_steps": 27215, "total_steps": 38160, "loss": 0.3945, "lr": 0.00023038654133772395, "epoch": 14.26362683438155, "percentage": 71.32, "elapsed_time": "1:09:43", "remaining_time": "0:28:02", "throughput": 4243.97, "total_tokens": 17752728} {"current_steps": 27220, "total_steps": 38160, "loss": 0.3533, "lr": 0.00023019397947892062, "epoch": 14.266247379454926, "percentage": 71.33, "elapsed_time": "1:09:43", "remaining_time": "0:28:01", "throughput": 4244.03, "total_tokens": 17756248} {"current_steps": 27225, "total_steps": 38160, "loss": 0.3934, "lr": 0.00023000147406045853, "epoch": 14.268867924528301, "percentage": 71.34, "elapsed_time": "1:09:44", "remaining_time": "0:28:00", "throughput": 4244.08, "total_tokens": 17759704} {"current_steps": 27230, "total_steps": 38160, "loss": 0.4363, "lr": 0.00022980902512260786, "epoch": 14.271488469601676, "percentage": 71.36, "elapsed_time": "1:09:45", "remaining_time": "0:27:59", "throughput": 4244.13, "total_tokens": 17763064} {"current_steps": 27235, "total_steps": 38160, "loss": 0.4902, "lr": 0.00022961663270562656, "epoch": 14.274109014675052, "percentage": 71.37, "elapsed_time": "1:09:46", "remaining_time": "0:27:59", "throughput": 4244.28, "total_tokens": 17767384} {"current_steps": 27240, "total_steps": 38160, "loss": 0.4956, "lr": 0.0002294242968497609, "epoch": 14.276729559748428, "percentage": 71.38, "elapsed_time": "1:09:46", "remaining_time": "0:27:58", "throughput": 4244.28, "total_tokens": 17770328} {"current_steps": 27245, "total_steps": 38160, "loss": 0.401, "lr": 0.00022923201759524552, "epoch": 14.279350104821804, "percentage": 71.4, "elapsed_time": "1:09:47", "remaining_time": "0:27:57", "throughput": 4244.36, "total_tokens": 17774072} {"current_steps": 27250, "total_steps": 38160, "loss": 0.2827, "lr": 0.00022903979498230316, "epoch": 14.281970649895179, "percentage": 71.41, "elapsed_time": "1:09:48", "remaining_time": "0:27:56", "throughput": 4244.29, "total_tokens": 17776344} {"current_steps": 27255, "total_steps": 38160, "loss": 0.4809, "lr": 0.00022884762905114436, "epoch": 14.284591194968554, "percentage": 71.42, "elapsed_time": "1:09:49", "remaining_time": "0:27:56", "throughput": 4244.44, "total_tokens": 17780536} {"current_steps": 27260, "total_steps": 38160, "loss": 0.4658, "lr": 0.00022865551984196792, "epoch": 14.28721174004193, "percentage": 71.44, "elapsed_time": "1:09:49", "remaining_time": "0:27:55", "throughput": 4244.49, "total_tokens": 17784024} {"current_steps": 27265, "total_steps": 38160, "loss": 0.5698, "lr": 0.0002284634673949611, "epoch": 14.289832285115304, "percentage": 71.45, "elapsed_time": "1:09:50", "remaining_time": "0:27:54", "throughput": 4244.62, "total_tokens": 17788248} {"current_steps": 27270, "total_steps": 38160, "loss": 0.4158, "lr": 0.00022827147175029906, "epoch": 14.29245283018868, "percentage": 71.46, "elapsed_time": "1:09:51", "remaining_time": "0:27:53", "throughput": 4244.59, "total_tokens": 17790872} {"current_steps": 27275, "total_steps": 38160, "loss": 0.4105, "lr": 0.0002280795329481452, "epoch": 14.295073375262055, "percentage": 71.48, "elapsed_time": "1:09:52", "remaining_time": "0:27:53", "throughput": 4244.61, "total_tokens": 17793912} {"current_steps": 27280, "total_steps": 38160, "loss": 0.4106, "lr": 0.00022788765102865066, "epoch": 14.29769392033543, "percentage": 71.49, "elapsed_time": "1:09:52", "remaining_time": "0:27:52", "throughput": 4244.66, "total_tokens": 17797336} {"current_steps": 27285, "total_steps": 38160, "loss": 0.499, "lr": 0.00022769582603195533, "epoch": 14.300314465408805, "percentage": 71.5, "elapsed_time": "1:09:53", "remaining_time": "0:27:51", "throughput": 4244.72, "total_tokens": 17800728} {"current_steps": 27290, "total_steps": 38160, "loss": 0.6324, "lr": 0.00022750405799818634, "epoch": 14.30293501048218, "percentage": 71.51, "elapsed_time": "1:09:54", "remaining_time": "0:27:50", "throughput": 4244.7, "total_tokens": 17803448} {"current_steps": 27295, "total_steps": 38160, "loss": 0.3636, "lr": 0.00022731234696745967, "epoch": 14.305555555555555, "percentage": 71.53, "elapsed_time": "1:09:55", "remaining_time": "0:27:49", "throughput": 4244.87, "total_tokens": 17807896} {"current_steps": 27300, "total_steps": 38160, "loss": 0.4193, "lr": 0.0002271206929798792, "epoch": 14.30817610062893, "percentage": 71.54, "elapsed_time": "1:09:55", "remaining_time": "0:27:49", "throughput": 4244.89, "total_tokens": 17811032} {"current_steps": 27305, "total_steps": 38160, "loss": 0.4644, "lr": 0.00022692909607553642, "epoch": 14.310796645702306, "percentage": 71.55, "elapsed_time": "1:09:56", "remaining_time": "0:27:48", "throughput": 4245.06, "total_tokens": 17815640} {"current_steps": 27310, "total_steps": 38160, "loss": 0.3895, "lr": 0.00022673755629451132, "epoch": 14.31341719077568, "percentage": 71.57, "elapsed_time": "1:09:57", "remaining_time": "0:27:47", "throughput": 4245.08, "total_tokens": 17818744} {"current_steps": 27315, "total_steps": 38160, "loss": 0.3785, "lr": 0.00022654607367687213, "epoch": 14.316037735849056, "percentage": 71.58, "elapsed_time": "1:09:58", "remaining_time": "0:27:46", "throughput": 4245.06, "total_tokens": 17821432} {"current_steps": 27320, "total_steps": 38160, "loss": 0.45, "lr": 0.00022635464826267442, "epoch": 14.318658280922431, "percentage": 71.59, "elapsed_time": "1:09:58", "remaining_time": "0:27:46", "throughput": 4245.05, "total_tokens": 17824312} {"current_steps": 27325, "total_steps": 38160, "loss": 0.315, "lr": 0.00022616328009196236, "epoch": 14.321278825995806, "percentage": 71.61, "elapsed_time": "1:09:59", "remaining_time": "0:27:45", "throughput": 4245.06, "total_tokens": 17827288} {"current_steps": 27330, "total_steps": 38160, "loss": 0.3779, "lr": 0.0002259719692047682, "epoch": 14.323899371069182, "percentage": 71.62, "elapsed_time": "1:10:00", "remaining_time": "0:27:44", "throughput": 4245.07, "total_tokens": 17830392} {"current_steps": 27335, "total_steps": 38160, "loss": 0.4083, "lr": 0.00022578071564111163, "epoch": 14.326519916142558, "percentage": 71.63, "elapsed_time": "1:10:00", "remaining_time": "0:27:43", "throughput": 4245.09, "total_tokens": 17833432} {"current_steps": 27340, "total_steps": 38160, "loss": 0.4311, "lr": 0.00022558951944100087, "epoch": 14.329140461215934, "percentage": 71.65, "elapsed_time": "1:10:01", "remaining_time": "0:27:42", "throughput": 4245.18, "total_tokens": 17837112} {"current_steps": 27345, "total_steps": 38160, "loss": 0.3599, "lr": 0.00022539838064443223, "epoch": 14.331761006289309, "percentage": 71.66, "elapsed_time": "1:10:02", "remaining_time": "0:27:42", "throughput": 4245.19, "total_tokens": 17840088} {"current_steps": 27350, "total_steps": 38160, "loss": 0.3837, "lr": 0.00022520729929138933, "epoch": 14.334381551362684, "percentage": 71.67, "elapsed_time": "1:10:03", "remaining_time": "0:27:41", "throughput": 4245.19, "total_tokens": 17843000} {"current_steps": 27355, "total_steps": 38160, "loss": 0.447, "lr": 0.0002250162754218446, "epoch": 14.33700209643606, "percentage": 71.69, "elapsed_time": "1:10:03", "remaining_time": "0:27:40", "throughput": 4245.29, "total_tokens": 17846872} {"current_steps": 27360, "total_steps": 38160, "loss": 0.4453, "lr": 0.00022482530907575767, "epoch": 14.339622641509434, "percentage": 71.7, "elapsed_time": "1:10:04", "remaining_time": "0:27:39", "throughput": 4245.35, "total_tokens": 17850232} {"current_steps": 27365, "total_steps": 38160, "loss": 0.6233, "lr": 0.00022463440029307674, "epoch": 14.34224318658281, "percentage": 71.71, "elapsed_time": "1:10:05", "remaining_time": "0:27:38", "throughput": 4245.47, "total_tokens": 17854360} {"current_steps": 27370, "total_steps": 38160, "loss": 0.4312, "lr": 0.00022444354911373794, "epoch": 14.344863731656185, "percentage": 71.72, "elapsed_time": "1:10:06", "remaining_time": "0:27:38", "throughput": 4245.55, "total_tokens": 17858040} {"current_steps": 27375, "total_steps": 38160, "loss": 0.5198, "lr": 0.00022425275557766473, "epoch": 14.34748427672956, "percentage": 71.74, "elapsed_time": "1:10:07", "remaining_time": "0:27:37", "throughput": 4245.61, "total_tokens": 17861400} {"current_steps": 27380, "total_steps": 38160, "loss": 0.6471, "lr": 0.00022406201972476937, "epoch": 14.350104821802935, "percentage": 71.75, "elapsed_time": "1:10:07", "remaining_time": "0:27:36", "throughput": 4245.71, "total_tokens": 17865176} {"current_steps": 27385, "total_steps": 38160, "loss": 0.5096, "lr": 0.00022387134159495122, "epoch": 14.35272536687631, "percentage": 71.76, "elapsed_time": "1:10:08", "remaining_time": "0:27:35", "throughput": 4245.65, "total_tokens": 17867544} {"current_steps": 27390, "total_steps": 38160, "loss": 0.3584, "lr": 0.00022368072122809813, "epoch": 14.355345911949685, "percentage": 71.78, "elapsed_time": "1:10:09", "remaining_time": "0:27:35", "throughput": 4245.67, "total_tokens": 17870584} {"current_steps": 27395, "total_steps": 38160, "loss": 0.4, "lr": 0.0002234901586640858, "epoch": 14.35796645702306, "percentage": 71.79, "elapsed_time": "1:10:09", "remaining_time": "0:27:34", "throughput": 4245.68, "total_tokens": 17873560} {"current_steps": 27400, "total_steps": 38160, "loss": 0.5054, "lr": 0.00022329965394277785, "epoch": 14.360587002096436, "percentage": 71.8, "elapsed_time": "1:10:10", "remaining_time": "0:27:33", "throughput": 4245.7, "total_tokens": 17876824} {"current_steps": 27405, "total_steps": 38160, "loss": 0.458, "lr": 0.00022310920710402532, "epoch": 14.36320754716981, "percentage": 71.82, "elapsed_time": "1:10:11", "remaining_time": "0:27:32", "throughput": 4245.73, "total_tokens": 17879928} {"current_steps": 27410, "total_steps": 38160, "loss": 0.5034, "lr": 0.00022291881818766796, "epoch": 14.365828092243186, "percentage": 71.83, "elapsed_time": "1:10:12", "remaining_time": "0:27:31", "throughput": 4245.82, "total_tokens": 17883672} {"current_steps": 27415, "total_steps": 38160, "loss": 0.3752, "lr": 0.00022272848723353252, "epoch": 14.368448637316561, "percentage": 71.84, "elapsed_time": "1:10:12", "remaining_time": "0:27:31", "throughput": 4245.86, "total_tokens": 17887032} {"current_steps": 27420, "total_steps": 38160, "loss": 0.4214, "lr": 0.00022253821428143422, "epoch": 14.371069182389936, "percentage": 71.86, "elapsed_time": "1:10:13", "remaining_time": "0:27:30", "throughput": 4245.85, "total_tokens": 17889816} {"current_steps": 27425, "total_steps": 38160, "loss": 0.4439, "lr": 0.0002223479993711761, "epoch": 14.373689727463312, "percentage": 71.87, "elapsed_time": "1:10:14", "remaining_time": "0:27:29", "throughput": 4245.87, "total_tokens": 17893016} {"current_steps": 27430, "total_steps": 38160, "loss": 0.3837, "lr": 0.00022215784254254906, "epoch": 14.376310272536688, "percentage": 71.88, "elapsed_time": "1:10:14", "remaining_time": "0:27:28", "throughput": 4245.89, "total_tokens": 17896056} {"current_steps": 27435, "total_steps": 38160, "loss": 0.5243, "lr": 0.00022196774383533157, "epoch": 14.378930817610064, "percentage": 71.89, "elapsed_time": "1:10:15", "remaining_time": "0:27:27", "throughput": 4245.91, "total_tokens": 17899224} {"current_steps": 27440, "total_steps": 38160, "loss": 0.5312, "lr": 0.0002217777032892899, "epoch": 14.381551362683439, "percentage": 71.91, "elapsed_time": "1:10:16", "remaining_time": "0:27:27", "throughput": 4245.98, "total_tokens": 17902840} {"current_steps": 27445, "total_steps": 38160, "loss": 0.5216, "lr": 0.00022158772094417863, "epoch": 14.384171907756814, "percentage": 71.92, "elapsed_time": "1:10:17", "remaining_time": "0:27:26", "throughput": 4245.93, "total_tokens": 17905272} {"current_steps": 27450, "total_steps": 38160, "loss": 0.4644, "lr": 0.00022139779683973983, "epoch": 14.38679245283019, "percentage": 71.93, "elapsed_time": "1:10:17", "remaining_time": "0:27:25", "throughput": 4245.92, "total_tokens": 17907992} {"current_steps": 27455, "total_steps": 38160, "loss": 0.3629, "lr": 0.00022120793101570364, "epoch": 14.389412997903564, "percentage": 71.95, "elapsed_time": "1:10:18", "remaining_time": "0:27:24", "throughput": 4245.91, "total_tokens": 17910904} {"current_steps": 27460, "total_steps": 38160, "loss": 0.3779, "lr": 0.00022101812351178762, "epoch": 14.39203354297694, "percentage": 71.96, "elapsed_time": "1:10:19", "remaining_time": "0:27:24", "throughput": 4246.03, "total_tokens": 17914904} {"current_steps": 27465, "total_steps": 38160, "loss": 0.4284, "lr": 0.00022082837436769725, "epoch": 14.394654088050315, "percentage": 71.97, "elapsed_time": "1:10:19", "remaining_time": "0:27:23", "throughput": 4246.06, "total_tokens": 17918104} {"current_steps": 27470, "total_steps": 38160, "loss": 0.4381, "lr": 0.00022063868362312596, "epoch": 14.39727463312369, "percentage": 71.99, "elapsed_time": "1:10:20", "remaining_time": "0:27:22", "throughput": 4246.13, "total_tokens": 17921720} {"current_steps": 27475, "total_steps": 38160, "loss": 0.4691, "lr": 0.00022044905131775495, "epoch": 14.399895178197065, "percentage": 72.0, "elapsed_time": "1:10:21", "remaining_time": "0:27:21", "throughput": 4246.17, "total_tokens": 17924984} {"current_steps": 27480, "total_steps": 38160, "loss": 0.4297, "lr": 0.00022025947749125313, "epoch": 14.40251572327044, "percentage": 72.01, "elapsed_time": "1:10:22", "remaining_time": "0:27:20", "throughput": 4246.15, "total_tokens": 17927672} {"current_steps": 27485, "total_steps": 38160, "loss": 0.5454, "lr": 0.0002200699621832773, "epoch": 14.405136268343815, "percentage": 72.03, "elapsed_time": "1:10:22", "remaining_time": "0:27:20", "throughput": 4246.19, "total_tokens": 17931128} {"current_steps": 27490, "total_steps": 38160, "loss": 0.4346, "lr": 0.0002198805054334718, "epoch": 14.40775681341719, "percentage": 72.04, "elapsed_time": "1:10:23", "remaining_time": "0:27:19", "throughput": 4246.29, "total_tokens": 17934936} {"current_steps": 27495, "total_steps": 38160, "loss": 0.3197, "lr": 0.00021969110728146862, "epoch": 14.410377358490566, "percentage": 72.05, "elapsed_time": "1:10:24", "remaining_time": "0:27:18", "throughput": 4246.24, "total_tokens": 17937432} {"current_steps": 27500, "total_steps": 38160, "loss": 0.4141, "lr": 0.00021950176776688784, "epoch": 14.41299790356394, "percentage": 72.06, "elapsed_time": "1:10:24", "remaining_time": "0:27:17", "throughput": 4246.18, "total_tokens": 17939800} {"current_steps": 27505, "total_steps": 38160, "loss": 0.4581, "lr": 0.0002193124869293372, "epoch": 14.415618448637316, "percentage": 72.08, "elapsed_time": "1:10:25", "remaining_time": "0:27:16", "throughput": 4246.2, "total_tokens": 17942808} {"current_steps": 27510, "total_steps": 38160, "loss": 0.4366, "lr": 0.00021912326480841223, "epoch": 14.418238993710691, "percentage": 72.09, "elapsed_time": "1:10:26", "remaining_time": "0:27:16", "throughput": 4246.18, "total_tokens": 17945592} {"current_steps": 27515, "total_steps": 38160, "loss": 0.5102, "lr": 0.0002189341014436958, "epoch": 14.420859538784066, "percentage": 72.1, "elapsed_time": "1:10:26", "remaining_time": "0:27:15", "throughput": 4246.18, "total_tokens": 17948536} {"current_steps": 27520, "total_steps": 38160, "loss": 0.4377, "lr": 0.00021874499687475857, "epoch": 14.423480083857442, "percentage": 72.12, "elapsed_time": "1:10:27", "remaining_time": "0:27:14", "throughput": 4246.28, "total_tokens": 17952408} {"current_steps": 27525, "total_steps": 38160, "loss": 0.4317, "lr": 0.00021855595114115935, "epoch": 14.426100628930818, "percentage": 72.13, "elapsed_time": "1:10:28", "remaining_time": "0:27:13", "throughput": 4246.35, "total_tokens": 17955896} {"current_steps": 27530, "total_steps": 38160, "loss": 0.4883, "lr": 0.00021836696428244418, "epoch": 14.428721174004194, "percentage": 72.14, "elapsed_time": "1:10:29", "remaining_time": "0:27:13", "throughput": 4246.76, "total_tokens": 17963128} {"current_steps": 27535, "total_steps": 38160, "loss": 0.4481, "lr": 0.0002181780363381473, "epoch": 14.431341719077569, "percentage": 72.16, "elapsed_time": "1:10:30", "remaining_time": "0:27:12", "throughput": 4246.71, "total_tokens": 17965688} {"current_steps": 27540, "total_steps": 38160, "loss": 0.3266, "lr": 0.00021798916734779, "epoch": 14.433962264150944, "percentage": 72.17, "elapsed_time": "1:10:31", "remaining_time": "0:27:11", "throughput": 4246.73, "total_tokens": 17968888} {"current_steps": 27545, "total_steps": 38160, "loss": 0.3941, "lr": 0.00021780035735088132, "epoch": 14.43658280922432, "percentage": 72.18, "elapsed_time": "1:10:31", "remaining_time": "0:27:10", "throughput": 4246.76, "total_tokens": 17972120} {"current_steps": 27550, "total_steps": 38160, "loss": 0.3652, "lr": 0.0002176116063869184, "epoch": 14.439203354297694, "percentage": 72.2, "elapsed_time": "1:10:32", "remaining_time": "0:27:10", "throughput": 4246.82, "total_tokens": 17975608} {"current_steps": 27555, "total_steps": 38160, "loss": 0.5321, "lr": 0.00021742291449538582, "epoch": 14.44182389937107, "percentage": 72.21, "elapsed_time": "1:10:33", "remaining_time": "0:27:09", "throughput": 4246.89, "total_tokens": 17979128} {"current_steps": 27560, "total_steps": 38160, "loss": 0.4673, "lr": 0.00021723428171575566, "epoch": 14.444444444444445, "percentage": 72.22, "elapsed_time": "1:10:34", "remaining_time": "0:27:08", "throughput": 4246.92, "total_tokens": 17982456} {"current_steps": 27565, "total_steps": 38160, "loss": 0.4984, "lr": 0.00021704570808748802, "epoch": 14.44706498951782, "percentage": 72.24, "elapsed_time": "1:10:34", "remaining_time": "0:27:07", "throughput": 4246.96, "total_tokens": 17985720} {"current_steps": 27570, "total_steps": 38160, "loss": 0.4086, "lr": 0.00021685719365003008, "epoch": 14.449685534591195, "percentage": 72.25, "elapsed_time": "1:10:35", "remaining_time": "0:27:06", "throughput": 4247.03, "total_tokens": 17989272} {"current_steps": 27575, "total_steps": 38160, "loss": 0.5114, "lr": 0.00021666873844281682, "epoch": 14.45230607966457, "percentage": 72.26, "elapsed_time": "1:10:36", "remaining_time": "0:27:06", "throughput": 4247.06, "total_tokens": 17992408} {"current_steps": 27580, "total_steps": 38160, "loss": 0.4045, "lr": 0.0002164803425052711, "epoch": 14.454926624737945, "percentage": 72.27, "elapsed_time": "1:10:37", "remaining_time": "0:27:05", "throughput": 4247.19, "total_tokens": 17996568} {"current_steps": 27585, "total_steps": 38160, "loss": 0.3825, "lr": 0.0002162920058768031, "epoch": 14.45754716981132, "percentage": 72.29, "elapsed_time": "1:10:38", "remaining_time": "0:27:04", "throughput": 4247.23, "total_tokens": 17999832} {"current_steps": 27590, "total_steps": 38160, "loss": 0.5266, "lr": 0.000216103728596811, "epoch": 14.460167714884696, "percentage": 72.3, "elapsed_time": "1:10:38", "remaining_time": "0:27:03", "throughput": 4247.35, "total_tokens": 18003704} {"current_steps": 27595, "total_steps": 38160, "loss": 0.3689, "lr": 0.00021591551070467975, "epoch": 14.46278825995807, "percentage": 72.31, "elapsed_time": "1:10:39", "remaining_time": "0:27:03", "throughput": 4247.31, "total_tokens": 18006328} {"current_steps": 27600, "total_steps": 38160, "loss": 0.4523, "lr": 0.0002157273522397829, "epoch": 14.465408805031446, "percentage": 72.33, "elapsed_time": "1:10:40", "remaining_time": "0:27:02", "throughput": 4247.39, "total_tokens": 18010008} {"current_steps": 27605, "total_steps": 38160, "loss": 0.4956, "lr": 0.0002155392532414806, "epoch": 14.468029350104821, "percentage": 72.34, "elapsed_time": "1:10:41", "remaining_time": "0:27:01", "throughput": 4247.5, "total_tokens": 18013880} {"current_steps": 27610, "total_steps": 38160, "loss": 0.4188, "lr": 0.00021535121374912126, "epoch": 14.470649895178196, "percentage": 72.35, "elapsed_time": "1:10:41", "remaining_time": "0:27:00", "throughput": 4247.5, "total_tokens": 18016824} {"current_steps": 27615, "total_steps": 38160, "loss": 0.4129, "lr": 0.00021516323380204073, "epoch": 14.473270440251572, "percentage": 72.37, "elapsed_time": "1:10:42", "remaining_time": "0:27:00", "throughput": 4247.58, "total_tokens": 18020472} {"current_steps": 27620, "total_steps": 38160, "loss": 0.3598, "lr": 0.00021497531343956188, "epoch": 14.475890985324948, "percentage": 72.38, "elapsed_time": "1:10:43", "remaining_time": "0:26:59", "throughput": 4247.55, "total_tokens": 18023128} {"current_steps": 27625, "total_steps": 38160, "loss": 0.47, "lr": 0.00021478745270099591, "epoch": 14.478511530398324, "percentage": 72.39, "elapsed_time": "1:10:43", "remaining_time": "0:26:58", "throughput": 4247.64, "total_tokens": 18026872} {"current_steps": 27630, "total_steps": 38160, "loss": 0.5318, "lr": 0.0002145996516256408, "epoch": 14.481132075471699, "percentage": 72.41, "elapsed_time": "1:10:44", "remaining_time": "0:26:57", "throughput": 4247.69, "total_tokens": 18030200} {"current_steps": 27635, "total_steps": 38160, "loss": 0.325, "lr": 0.00021441191025278256, "epoch": 14.483752620545074, "percentage": 72.42, "elapsed_time": "1:10:45", "remaining_time": "0:26:56", "throughput": 4247.73, "total_tokens": 18033528} {"current_steps": 27640, "total_steps": 38160, "loss": 0.4335, "lr": 0.00021422422862169455, "epoch": 14.48637316561845, "percentage": 72.43, "elapsed_time": "1:10:46", "remaining_time": "0:26:56", "throughput": 4247.69, "total_tokens": 18036088} {"current_steps": 27645, "total_steps": 38160, "loss": 0.4405, "lr": 0.00021403660677163773, "epoch": 14.488993710691824, "percentage": 72.44, "elapsed_time": "1:10:46", "remaining_time": "0:26:55", "throughput": 4247.83, "total_tokens": 18040408} {"current_steps": 27650, "total_steps": 38160, "loss": 0.3386, "lr": 0.00021384904474186018, "epoch": 14.4916142557652, "percentage": 72.46, "elapsed_time": "1:10:47", "remaining_time": "0:26:54", "throughput": 4247.81, "total_tokens": 18043096} {"current_steps": 27655, "total_steps": 38160, "loss": 0.4441, "lr": 0.00021366154257159808, "epoch": 14.494234800838575, "percentage": 72.47, "elapsed_time": "1:10:48", "remaining_time": "0:26:53", "throughput": 4247.82, "total_tokens": 18046232} {"current_steps": 27660, "total_steps": 38160, "loss": 0.4572, "lr": 0.00021347410030007435, "epoch": 14.49685534591195, "percentage": 72.48, "elapsed_time": "1:10:49", "remaining_time": "0:26:52", "throughput": 4247.76, "total_tokens": 18048792} {"current_steps": 27665, "total_steps": 38160, "loss": 0.4399, "lr": 0.0002132867179665, "epoch": 14.499475890985325, "percentage": 72.5, "elapsed_time": "1:10:49", "remaining_time": "0:26:52", "throughput": 4247.85, "total_tokens": 18052696} {"current_steps": 27670, "total_steps": 38160, "loss": 0.3349, "lr": 0.00021309939561007341, "epoch": 14.5020964360587, "percentage": 72.51, "elapsed_time": "1:10:50", "remaining_time": "0:26:51", "throughput": 4247.82, "total_tokens": 18055256} {"current_steps": 27675, "total_steps": 38160, "loss": 0.4181, "lr": 0.00021291213326997998, "epoch": 14.504716981132075, "percentage": 72.52, "elapsed_time": "1:10:51", "remaining_time": "0:26:50", "throughput": 4247.77, "total_tokens": 18057784} {"current_steps": 27680, "total_steps": 38160, "loss": 0.5568, "lr": 0.00021272493098539296, "epoch": 14.50733752620545, "percentage": 72.54, "elapsed_time": "1:10:51", "remaining_time": "0:26:49", "throughput": 4247.78, "total_tokens": 18060920} {"current_steps": 27685, "total_steps": 38160, "loss": 0.4279, "lr": 0.0002125377887954732, "epoch": 14.509958071278826, "percentage": 72.55, "elapsed_time": "1:10:52", "remaining_time": "0:26:49", "throughput": 4247.83, "total_tokens": 18064184} {"current_steps": 27690, "total_steps": 38160, "loss": 0.5101, "lr": 0.00021235070673936824, "epoch": 14.5125786163522, "percentage": 72.56, "elapsed_time": "1:10:53", "remaining_time": "0:26:48", "throughput": 4247.88, "total_tokens": 18067672} {"current_steps": 27695, "total_steps": 38160, "loss": 0.4108, "lr": 0.00021216368485621394, "epoch": 14.515199161425576, "percentage": 72.58, "elapsed_time": "1:10:54", "remaining_time": "0:26:47", "throughput": 4247.93, "total_tokens": 18071032} {"current_steps": 27700, "total_steps": 38160, "loss": 0.671, "lr": 0.00021197672318513282, "epoch": 14.517819706498951, "percentage": 72.59, "elapsed_time": "1:10:54", "remaining_time": "0:26:46", "throughput": 4247.95, "total_tokens": 18074200} {"current_steps": 27705, "total_steps": 38160, "loss": 0.4102, "lr": 0.00021178982176523525, "epoch": 14.520440251572326, "percentage": 72.6, "elapsed_time": "1:10:55", "remaining_time": "0:26:45", "throughput": 4247.92, "total_tokens": 18076824} {"current_steps": 27710, "total_steps": 38160, "loss": 0.458, "lr": 0.0002116029806356189, "epoch": 14.523060796645701, "percentage": 72.62, "elapsed_time": "1:10:56", "remaining_time": "0:26:45", "throughput": 4247.88, "total_tokens": 18079512} {"current_steps": 27715, "total_steps": 38160, "loss": 0.4078, "lr": 0.00021141619983536893, "epoch": 14.525681341719078, "percentage": 72.63, "elapsed_time": "1:10:56", "remaining_time": "0:26:44", "throughput": 4247.88, "total_tokens": 18082424} {"current_steps": 27720, "total_steps": 38160, "loss": 0.3927, "lr": 0.00021122947940355747, "epoch": 14.528301886792454, "percentage": 72.64, "elapsed_time": "1:10:57", "remaining_time": "0:26:43", "throughput": 4247.9, "total_tokens": 18085400} {"current_steps": 27725, "total_steps": 38160, "loss": 0.5814, "lr": 0.00021104281937924462, "epoch": 14.530922431865829, "percentage": 72.65, "elapsed_time": "1:10:58", "remaining_time": "0:26:42", "throughput": 4247.92, "total_tokens": 18088664} {"current_steps": 27730, "total_steps": 38160, "loss": 0.4301, "lr": 0.00021085621980147716, "epoch": 14.533542976939204, "percentage": 72.67, "elapsed_time": "1:10:58", "remaining_time": "0:26:41", "throughput": 4247.91, "total_tokens": 18091512} {"current_steps": 27735, "total_steps": 38160, "loss": 0.6106, "lr": 0.00021066968070928982, "epoch": 14.536163522012579, "percentage": 72.68, "elapsed_time": "1:10:59", "remaining_time": "0:26:41", "throughput": 4247.83, "total_tokens": 18093752} {"current_steps": 27740, "total_steps": 38160, "loss": 0.4995, "lr": 0.00021048320214170463, "epoch": 14.538784067085954, "percentage": 72.69, "elapsed_time": "1:11:00", "remaining_time": "0:26:40", "throughput": 4247.81, "total_tokens": 18096440} {"current_steps": 27745, "total_steps": 38160, "loss": 0.3567, "lr": 0.00021029678413773034, "epoch": 14.54140461215933, "percentage": 72.71, "elapsed_time": "1:11:00", "remaining_time": "0:26:39", "throughput": 4247.82, "total_tokens": 18099384} {"current_steps": 27750, "total_steps": 38160, "loss": 0.4003, "lr": 0.0002101104267363639, "epoch": 14.544025157232705, "percentage": 72.72, "elapsed_time": "1:11:01", "remaining_time": "0:26:38", "throughput": 4247.87, "total_tokens": 18102744} {"current_steps": 27755, "total_steps": 38160, "loss": 0.4727, "lr": 0.00020992412997658877, "epoch": 14.54664570230608, "percentage": 72.73, "elapsed_time": "1:11:02", "remaining_time": "0:26:37", "throughput": 4247.87, "total_tokens": 18105720} {"current_steps": 27760, "total_steps": 38160, "loss": 0.348, "lr": 0.0002097378938973763, "epoch": 14.549266247379455, "percentage": 72.75, "elapsed_time": "1:11:02", "remaining_time": "0:26:37", "throughput": 4247.86, "total_tokens": 18108536} {"current_steps": 27765, "total_steps": 38160, "loss": 0.4787, "lr": 0.0002095517185376849, "epoch": 14.55188679245283, "percentage": 72.76, "elapsed_time": "1:11:03", "remaining_time": "0:26:36", "throughput": 4247.8, "total_tokens": 18110904} {"current_steps": 27770, "total_steps": 38160, "loss": 0.3921, "lr": 0.0002093656039364606, "epoch": 14.554507337526205, "percentage": 72.77, "elapsed_time": "1:11:04", "remaining_time": "0:26:35", "throughput": 4247.81, "total_tokens": 18113944} {"current_steps": 27775, "total_steps": 38160, "loss": 0.469, "lr": 0.00020917955013263618, "epoch": 14.55712788259958, "percentage": 72.79, "elapsed_time": "1:11:05", "remaining_time": "0:26:34", "throughput": 4247.85, "total_tokens": 18117304} {"current_steps": 27780, "total_steps": 38160, "loss": 0.4926, "lr": 0.00020899355716513186, "epoch": 14.559748427672956, "percentage": 72.8, "elapsed_time": "1:11:05", "remaining_time": "0:26:33", "throughput": 4247.8, "total_tokens": 18119704} {"current_steps": 27785, "total_steps": 38160, "loss": 0.5208, "lr": 0.00020880762507285544, "epoch": 14.56236897274633, "percentage": 72.81, "elapsed_time": "1:11:06", "remaining_time": "0:26:33", "throughput": 4247.97, "total_tokens": 18124312} {"current_steps": 27790, "total_steps": 38160, "loss": 0.3929, "lr": 0.00020862175389470172, "epoch": 14.564989517819706, "percentage": 72.82, "elapsed_time": "1:11:07", "remaining_time": "0:26:32", "throughput": 4248.1, "total_tokens": 18128408} {"current_steps": 27795, "total_steps": 38160, "loss": 0.3652, "lr": 0.00020843594366955288, "epoch": 14.567610062893081, "percentage": 72.84, "elapsed_time": "1:11:08", "remaining_time": "0:26:31", "throughput": 4248.11, "total_tokens": 18131416} {"current_steps": 27800, "total_steps": 38160, "loss": 0.4895, "lr": 0.0002082501944362784, "epoch": 14.570230607966456, "percentage": 72.85, "elapsed_time": "1:11:08", "remaining_time": "0:26:30", "throughput": 4248.17, "total_tokens": 18134872} {"current_steps": 27805, "total_steps": 38160, "loss": 0.3076, "lr": 0.00020806450623373486, "epoch": 14.572851153039831, "percentage": 72.86, "elapsed_time": "1:11:09", "remaining_time": "0:26:30", "throughput": 4248.28, "total_tokens": 18138776} {"current_steps": 27810, "total_steps": 38160, "loss": 0.4591, "lr": 0.00020787887910076586, "epoch": 14.575471698113208, "percentage": 72.88, "elapsed_time": "1:11:10", "remaining_time": "0:26:29", "throughput": 4248.29, "total_tokens": 18141752} {"current_steps": 27815, "total_steps": 38160, "loss": 0.3184, "lr": 0.00020769331307620258, "epoch": 14.578092243186584, "percentage": 72.89, "elapsed_time": "1:11:10", "remaining_time": "0:26:28", "throughput": 4248.23, "total_tokens": 18144152} {"current_steps": 27820, "total_steps": 38160, "loss": 0.4383, "lr": 0.0002075078081988635, "epoch": 14.580712788259959, "percentage": 72.9, "elapsed_time": "1:11:11", "remaining_time": "0:26:27", "throughput": 4248.24, "total_tokens": 18147192} {"current_steps": 27825, "total_steps": 38160, "loss": 0.3873, "lr": 0.00020732236450755415, "epoch": 14.583333333333334, "percentage": 72.92, "elapsed_time": "1:11:12", "remaining_time": "0:26:26", "throughput": 4248.27, "total_tokens": 18150456} {"current_steps": 27830, "total_steps": 38160, "loss": 0.4103, "lr": 0.00020713698204106708, "epoch": 14.585953878406709, "percentage": 72.93, "elapsed_time": "1:11:13", "remaining_time": "0:26:26", "throughput": 4248.27, "total_tokens": 18153464} {"current_steps": 27835, "total_steps": 38160, "loss": 0.5051, "lr": 0.00020695166083818206, "epoch": 14.588574423480084, "percentage": 72.94, "elapsed_time": "1:11:13", "remaining_time": "0:26:25", "throughput": 4248.36, "total_tokens": 18157336} {"current_steps": 27840, "total_steps": 38160, "loss": 0.3511, "lr": 0.0002067664009376663, "epoch": 14.59119496855346, "percentage": 72.96, "elapsed_time": "1:11:14", "remaining_time": "0:26:24", "throughput": 4248.43, "total_tokens": 18161016} {"current_steps": 27845, "total_steps": 38160, "loss": 0.4972, "lr": 0.0002065812023782741, "epoch": 14.593815513626835, "percentage": 72.97, "elapsed_time": "1:11:15", "remaining_time": "0:26:23", "throughput": 4248.38, "total_tokens": 18163480} {"current_steps": 27850, "total_steps": 38160, "loss": 0.4087, "lr": 0.00020639606519874703, "epoch": 14.59643605870021, "percentage": 72.98, "elapsed_time": "1:11:16", "remaining_time": "0:26:23", "throughput": 4248.4, "total_tokens": 18166584} {"current_steps": 27855, "total_steps": 38160, "loss": 0.371, "lr": 0.00020621098943781352, "epoch": 14.599056603773585, "percentage": 73.0, "elapsed_time": "1:11:16", "remaining_time": "0:26:22", "throughput": 4248.36, "total_tokens": 18169144} {"current_steps": 27860, "total_steps": 38160, "loss": 0.4787, "lr": 0.0002060259751341891, "epoch": 14.60167714884696, "percentage": 73.01, "elapsed_time": "1:11:17", "remaining_time": "0:26:21", "throughput": 4248.38, "total_tokens": 18172184} {"current_steps": 27865, "total_steps": 38160, "loss": 0.4043, "lr": 0.00020584102232657688, "epoch": 14.604297693920335, "percentage": 73.02, "elapsed_time": "1:11:18", "remaining_time": "0:26:20", "throughput": 4248.35, "total_tokens": 18174840} {"current_steps": 27870, "total_steps": 38160, "loss": 0.353, "lr": 0.0002056561310536668, "epoch": 14.60691823899371, "percentage": 73.03, "elapsed_time": "1:11:18", "remaining_time": "0:26:19", "throughput": 4248.45, "total_tokens": 18178584} {"current_steps": 27875, "total_steps": 38160, "loss": 0.423, "lr": 0.0002054713013541361, "epoch": 14.609538784067086, "percentage": 73.05, "elapsed_time": "1:11:20", "remaining_time": "0:26:19", "throughput": 4248.74, "total_tokens": 18184792} {"current_steps": 27880, "total_steps": 38160, "loss": 0.4417, "lr": 0.00020528653326664915, "epoch": 14.61215932914046, "percentage": 73.06, "elapsed_time": "1:11:20", "remaining_time": "0:26:18", "throughput": 4248.81, "total_tokens": 18188248} {"current_steps": 27885, "total_steps": 38160, "loss": 0.3315, "lr": 0.00020510182682985717, "epoch": 14.614779874213836, "percentage": 73.07, "elapsed_time": "1:11:21", "remaining_time": "0:26:17", "throughput": 4248.81, "total_tokens": 18191160} {"current_steps": 27890, "total_steps": 38160, "loss": 0.346, "lr": 0.00020491718208239847, "epoch": 14.617400419287211, "percentage": 73.09, "elapsed_time": "1:11:22", "remaining_time": "0:26:16", "throughput": 4248.9, "total_tokens": 18195000} {"current_steps": 27895, "total_steps": 38160, "loss": 0.3484, "lr": 0.00020473259906289877, "epoch": 14.620020964360586, "percentage": 73.1, "elapsed_time": "1:11:22", "remaining_time": "0:26:16", "throughput": 4248.95, "total_tokens": 18198232} {"current_steps": 27900, "total_steps": 38160, "loss": 0.5374, "lr": 0.00020454807780997077, "epoch": 14.622641509433961, "percentage": 73.11, "elapsed_time": "1:11:23", "remaining_time": "0:26:15", "throughput": 4248.92, "total_tokens": 18200856} {"current_steps": 27905, "total_steps": 38160, "loss": 0.4136, "lr": 0.0002043636183622144, "epoch": 14.625262054507338, "percentage": 73.13, "elapsed_time": "1:11:24", "remaining_time": "0:26:14", "throughput": 4248.86, "total_tokens": 18203256} {"current_steps": 27910, "total_steps": 38160, "loss": 0.526, "lr": 0.00020417922075821626, "epoch": 14.627882599580714, "percentage": 73.14, "elapsed_time": "1:11:24", "remaining_time": "0:26:13", "throughput": 4248.85, "total_tokens": 18206008} {"current_steps": 27915, "total_steps": 38160, "loss": 0.4936, "lr": 0.00020399488503655005, "epoch": 14.630503144654089, "percentage": 73.15, "elapsed_time": "1:11:25", "remaining_time": "0:26:12", "throughput": 4248.85, "total_tokens": 18208984} {"current_steps": 27920, "total_steps": 38160, "loss": 0.3058, "lr": 0.00020381061123577688, "epoch": 14.633123689727464, "percentage": 73.17, "elapsed_time": "1:11:26", "remaining_time": "0:26:12", "throughput": 4249.04, "total_tokens": 18213848} {"current_steps": 27925, "total_steps": 38160, "loss": 0.4368, "lr": 0.00020362639939444473, "epoch": 14.635744234800839, "percentage": 73.18, "elapsed_time": "1:11:27", "remaining_time": "0:26:11", "throughput": 4249.11, "total_tokens": 18217496} {"current_steps": 27930, "total_steps": 38160, "loss": 0.4145, "lr": 0.0002034422495510888, "epoch": 14.638364779874214, "percentage": 73.19, "elapsed_time": "1:11:28", "remaining_time": "0:26:10", "throughput": 4249.13, "total_tokens": 18220536} {"current_steps": 27935, "total_steps": 38160, "loss": 0.5382, "lr": 0.00020325816174423077, "epoch": 14.64098532494759, "percentage": 73.2, "elapsed_time": "1:11:28", "remaining_time": "0:26:09", "throughput": 4249.28, "total_tokens": 18224888} {"current_steps": 27940, "total_steps": 38160, "loss": 0.3083, "lr": 0.00020307413601238012, "epoch": 14.643605870020965, "percentage": 73.22, "elapsed_time": "1:11:29", "remaining_time": "0:26:09", "throughput": 4249.46, "total_tokens": 18229368} {"current_steps": 27945, "total_steps": 38160, "loss": 0.4429, "lr": 0.00020289017239403246, "epoch": 14.64622641509434, "percentage": 73.23, "elapsed_time": "1:11:30", "remaining_time": "0:26:08", "throughput": 4249.51, "total_tokens": 18232760} {"current_steps": 27950, "total_steps": 38160, "loss": 0.4543, "lr": 0.0002027062709276712, "epoch": 14.648846960167715, "percentage": 73.24, "elapsed_time": "1:11:31", "remaining_time": "0:26:07", "throughput": 4249.51, "total_tokens": 18235576} {"current_steps": 27955, "total_steps": 38160, "loss": 0.4403, "lr": 0.00020252243165176632, "epoch": 14.65146750524109, "percentage": 73.26, "elapsed_time": "1:11:31", "remaining_time": "0:26:06", "throughput": 4249.59, "total_tokens": 18239224} {"current_steps": 27960, "total_steps": 38160, "loss": 0.4001, "lr": 0.00020233865460477508, "epoch": 14.654088050314465, "percentage": 73.27, "elapsed_time": "1:11:32", "remaining_time": "0:26:05", "throughput": 4249.56, "total_tokens": 18241912} {"current_steps": 27965, "total_steps": 38160, "loss": 0.365, "lr": 0.00020215493982514128, "epoch": 14.65670859538784, "percentage": 73.28, "elapsed_time": "1:11:33", "remaining_time": "0:26:05", "throughput": 4249.54, "total_tokens": 18244632} {"current_steps": 27970, "total_steps": 38160, "loss": 0.4279, "lr": 0.00020197128735129622, "epoch": 14.659329140461216, "percentage": 73.3, "elapsed_time": "1:11:34", "remaining_time": "0:26:04", "throughput": 4249.56, "total_tokens": 18247768} {"current_steps": 27975, "total_steps": 38160, "loss": 0.3793, "lr": 0.0002017876972216575, "epoch": 14.66194968553459, "percentage": 73.31, "elapsed_time": "1:11:34", "remaining_time": "0:26:03", "throughput": 4249.55, "total_tokens": 18250456} {"current_steps": 27980, "total_steps": 38160, "loss": 0.4435, "lr": 0.00020160416947463046, "epoch": 14.664570230607966, "percentage": 73.32, "elapsed_time": "1:11:35", "remaining_time": "0:26:02", "throughput": 4249.59, "total_tokens": 18253688} {"current_steps": 27985, "total_steps": 38160, "loss": 0.3702, "lr": 0.00020142070414860702, "epoch": 14.667190775681341, "percentage": 73.34, "elapsed_time": "1:11:36", "remaining_time": "0:26:02", "throughput": 4249.64, "total_tokens": 18256952} {"current_steps": 27990, "total_steps": 38160, "loss": 0.3632, "lr": 0.0002012373012819657, "epoch": 14.669811320754716, "percentage": 73.35, "elapsed_time": "1:11:37", "remaining_time": "0:26:01", "throughput": 4249.94, "total_tokens": 18263064} {"current_steps": 27995, "total_steps": 38160, "loss": 0.3704, "lr": 0.00020105396091307247, "epoch": 14.672431865828091, "percentage": 73.36, "elapsed_time": "1:11:37", "remaining_time": "0:26:00", "throughput": 4249.93, "total_tokens": 18265848} {"current_steps": 28000, "total_steps": 38160, "loss": 0.5836, "lr": 0.0002008706830802803, "epoch": 14.675052410901468, "percentage": 73.38, "elapsed_time": "1:11:38", "remaining_time": "0:25:59", "throughput": 4249.98, "total_tokens": 18269208} {"current_steps": 28005, "total_steps": 38160, "loss": 0.402, "lr": 0.00020068746782192837, "epoch": 14.677672955974844, "percentage": 73.39, "elapsed_time": "1:11:39", "remaining_time": "0:25:59", "throughput": 4250.2, "total_tokens": 18274136} {"current_steps": 28010, "total_steps": 38160, "loss": 0.3425, "lr": 0.00020050431517634366, "epoch": 14.680293501048219, "percentage": 73.4, "elapsed_time": "1:11:40", "remaining_time": "0:25:58", "throughput": 4250.19, "total_tokens": 18277016} {"current_steps": 28015, "total_steps": 38160, "loss": 0.3709, "lr": 0.00020032122518183915, "epoch": 14.682914046121594, "percentage": 73.41, "elapsed_time": "1:11:40", "remaining_time": "0:25:57", "throughput": 4250.16, "total_tokens": 18279640} {"current_steps": 28020, "total_steps": 38160, "loss": 0.3969, "lr": 0.00020013819787671538, "epoch": 14.685534591194969, "percentage": 73.43, "elapsed_time": "1:11:41", "remaining_time": "0:25:56", "throughput": 4250.07, "total_tokens": 18281816} {"current_steps": 28025, "total_steps": 38160, "loss": 0.5475, "lr": 0.00019995523329925985, "epoch": 14.688155136268344, "percentage": 73.44, "elapsed_time": "1:11:42", "remaining_time": "0:25:55", "throughput": 4250.06, "total_tokens": 18284568} {"current_steps": 28030, "total_steps": 38160, "loss": 0.4128, "lr": 0.00019977233148774627, "epoch": 14.69077568134172, "percentage": 73.45, "elapsed_time": "1:11:43", "remaining_time": "0:25:55", "throughput": 4250.2, "total_tokens": 18288792} {"current_steps": 28035, "total_steps": 38160, "loss": 0.4173, "lr": 0.00019958949248043573, "epoch": 14.693396226415095, "percentage": 73.47, "elapsed_time": "1:11:43", "remaining_time": "0:25:54", "throughput": 4250.26, "total_tokens": 18292344} {"current_steps": 28040, "total_steps": 38160, "loss": 0.4024, "lr": 0.00019940671631557628, "epoch": 14.69601677148847, "percentage": 73.48, "elapsed_time": "1:11:44", "remaining_time": "0:25:53", "throughput": 4250.35, "total_tokens": 18296184} {"current_steps": 28045, "total_steps": 38160, "loss": 0.4967, "lr": 0.0001992240030314022, "epoch": 14.698637316561845, "percentage": 73.49, "elapsed_time": "1:11:45", "remaining_time": "0:25:52", "throughput": 4250.45, "total_tokens": 18299960} {"current_steps": 28050, "total_steps": 38160, "loss": 0.4293, "lr": 0.00019904135266613532, "epoch": 14.70125786163522, "percentage": 73.51, "elapsed_time": "1:11:46", "remaining_time": "0:25:52", "throughput": 4250.56, "total_tokens": 18304024} {"current_steps": 28055, "total_steps": 38160, "loss": 0.4687, "lr": 0.00019885876525798407, "epoch": 14.703878406708595, "percentage": 73.52, "elapsed_time": "1:11:46", "remaining_time": "0:25:51", "throughput": 4250.55, "total_tokens": 18306808} {"current_steps": 28060, "total_steps": 38160, "loss": 0.3956, "lr": 0.0001986762408451434, "epoch": 14.70649895178197, "percentage": 73.53, "elapsed_time": "1:11:47", "remaining_time": "0:25:50", "throughput": 4250.47, "total_tokens": 18308984} {"current_steps": 28065, "total_steps": 38160, "loss": 0.4069, "lr": 0.00019849377946579562, "epoch": 14.709119496855346, "percentage": 73.55, "elapsed_time": "1:11:48", "remaining_time": "0:25:49", "throughput": 4250.42, "total_tokens": 18311416} {"current_steps": 28070, "total_steps": 38160, "loss": 0.5485, "lr": 0.00019831138115810926, "epoch": 14.71174004192872, "percentage": 73.56, "elapsed_time": "1:11:48", "remaining_time": "0:25:48", "throughput": 4250.45, "total_tokens": 18314552} {"current_steps": 28075, "total_steps": 38160, "loss": 0.355, "lr": 0.00019812904596024005, "epoch": 14.714360587002096, "percentage": 73.57, "elapsed_time": "1:11:49", "remaining_time": "0:25:48", "throughput": 4250.48, "total_tokens": 18317752} {"current_steps": 28080, "total_steps": 38160, "loss": 0.4653, "lr": 0.00019794677391033055, "epoch": 14.716981132075471, "percentage": 73.58, "elapsed_time": "1:11:50", "remaining_time": "0:25:47", "throughput": 4250.51, "total_tokens": 18320888} {"current_steps": 28085, "total_steps": 38160, "loss": 0.585, "lr": 0.00019776456504651014, "epoch": 14.719601677148846, "percentage": 73.6, "elapsed_time": "1:11:51", "remaining_time": "0:25:46", "throughput": 4250.61, "total_tokens": 18324600} {"current_steps": 28090, "total_steps": 38160, "loss": 0.3826, "lr": 0.0001975824194068946, "epoch": 14.722222222222221, "percentage": 73.61, "elapsed_time": "1:11:51", "remaining_time": "0:25:45", "throughput": 4250.67, "total_tokens": 18328184} {"current_steps": 28095, "total_steps": 38160, "loss": 0.3754, "lr": 0.00019740033702958653, "epoch": 14.724842767295598, "percentage": 73.62, "elapsed_time": "1:11:52", "remaining_time": "0:25:44", "throughput": 4250.63, "total_tokens": 18330680} {"current_steps": 28100, "total_steps": 38160, "loss": 0.4737, "lr": 0.0001972183179526758, "epoch": 14.727463312368974, "percentage": 73.64, "elapsed_time": "1:11:53", "remaining_time": "0:25:44", "throughput": 4250.73, "total_tokens": 18334552} {"current_steps": 28105, "total_steps": 38160, "loss": 0.4519, "lr": 0.0001970363622142386, "epoch": 14.730083857442349, "percentage": 73.65, "elapsed_time": "1:11:54", "remaining_time": "0:25:43", "throughput": 4250.81, "total_tokens": 18338168} {"current_steps": 28110, "total_steps": 38160, "loss": 0.3977, "lr": 0.00019685446985233824, "epoch": 14.732704402515724, "percentage": 73.66, "elapsed_time": "1:11:54", "remaining_time": "0:25:42", "throughput": 4250.85, "total_tokens": 18341528} {"current_steps": 28115, "total_steps": 38160, "loss": 0.4254, "lr": 0.00019667264090502412, "epoch": 14.735324947589099, "percentage": 73.68, "elapsed_time": "1:11:55", "remaining_time": "0:25:41", "throughput": 4250.91, "total_tokens": 18344920} {"current_steps": 28120, "total_steps": 38160, "loss": 0.337, "lr": 0.0001964908754103331, "epoch": 14.737945492662474, "percentage": 73.69, "elapsed_time": "1:11:56", "remaining_time": "0:25:41", "throughput": 4250.96, "total_tokens": 18348312} {"current_steps": 28125, "total_steps": 38160, "loss": 0.3855, "lr": 0.00019630917340628822, "epoch": 14.74056603773585, "percentage": 73.7, "elapsed_time": "1:11:56", "remaining_time": "0:25:40", "throughput": 4250.96, "total_tokens": 18351160} {"current_steps": 28130, "total_steps": 38160, "loss": 0.5121, "lr": 0.00019612753493089959, "epoch": 14.743186582809225, "percentage": 73.72, "elapsed_time": "1:11:57", "remaining_time": "0:25:39", "throughput": 4250.97, "total_tokens": 18354104} {"current_steps": 28135, "total_steps": 38160, "loss": 0.42, "lr": 0.00019594596002216387, "epoch": 14.7458071278826, "percentage": 73.73, "elapsed_time": "1:11:58", "remaining_time": "0:25:38", "throughput": 4251.05, "total_tokens": 18357784} {"current_steps": 28140, "total_steps": 38160, "loss": 0.5088, "lr": 0.00019576444871806465, "epoch": 14.748427672955975, "percentage": 73.74, "elapsed_time": "1:11:59", "remaining_time": "0:25:37", "throughput": 4251.08, "total_tokens": 18360984} {"current_steps": 28145, "total_steps": 38160, "loss": 0.4218, "lr": 0.0001955830010565719, "epoch": 14.75104821802935, "percentage": 73.76, "elapsed_time": "1:11:59", "remaining_time": "0:25:37", "throughput": 4251.21, "total_tokens": 18365080} {"current_steps": 28150, "total_steps": 38160, "loss": 0.4746, "lr": 0.00019540161707564213, "epoch": 14.753668763102725, "percentage": 73.77, "elapsed_time": "1:12:00", "remaining_time": "0:25:36", "throughput": 4251.18, "total_tokens": 18367800} {"current_steps": 28155, "total_steps": 38160, "loss": 0.6041, "lr": 0.000195220296813219, "epoch": 14.7562893081761, "percentage": 73.78, "elapsed_time": "1:12:01", "remaining_time": "0:25:35", "throughput": 4251.15, "total_tokens": 18370392} {"current_steps": 28160, "total_steps": 38160, "loss": 0.4578, "lr": 0.00019503904030723274, "epoch": 14.758909853249476, "percentage": 73.79, "elapsed_time": "1:12:01", "remaining_time": "0:25:34", "throughput": 4251.18, "total_tokens": 18373560} {"current_steps": 28165, "total_steps": 38160, "loss": 0.3485, "lr": 0.00019485784759560004, "epoch": 14.76153039832285, "percentage": 73.81, "elapsed_time": "1:12:02", "remaining_time": "0:25:34", "throughput": 4251.38, "total_tokens": 18378296} {"current_steps": 28170, "total_steps": 38160, "loss": 0.441, "lr": 0.0001946767187162247, "epoch": 14.764150943396226, "percentage": 73.82, "elapsed_time": "1:12:03", "remaining_time": "0:25:33", "throughput": 4251.35, "total_tokens": 18381016} {"current_steps": 28175, "total_steps": 38160, "loss": 0.4791, "lr": 0.00019449565370699618, "epoch": 14.766771488469601, "percentage": 73.83, "elapsed_time": "1:12:04", "remaining_time": "0:25:32", "throughput": 4251.38, "total_tokens": 18384248} {"current_steps": 28180, "total_steps": 38160, "loss": 0.5008, "lr": 0.00019431465260579152, "epoch": 14.769392033542976, "percentage": 73.85, "elapsed_time": "1:12:04", "remaining_time": "0:25:31", "throughput": 4251.32, "total_tokens": 18386648} {"current_steps": 28185, "total_steps": 38160, "loss": 0.3914, "lr": 0.00019413371545047404, "epoch": 14.772012578616351, "percentage": 73.86, "elapsed_time": "1:12:05", "remaining_time": "0:25:30", "throughput": 4251.39, "total_tokens": 18390232} {"current_steps": 28190, "total_steps": 38160, "loss": 0.4522, "lr": 0.00019395284227889382, "epoch": 14.774633123689728, "percentage": 73.87, "elapsed_time": "1:12:06", "remaining_time": "0:25:30", "throughput": 4251.45, "total_tokens": 18393624} {"current_steps": 28195, "total_steps": 38160, "loss": 0.3622, "lr": 0.00019377203312888764, "epoch": 14.777253668763104, "percentage": 73.89, "elapsed_time": "1:12:07", "remaining_time": "0:25:29", "throughput": 4251.53, "total_tokens": 18397176} {"current_steps": 28200, "total_steps": 38160, "loss": 0.4624, "lr": 0.0001935912880382784, "epoch": 14.779874213836479, "percentage": 73.9, "elapsed_time": "1:12:07", "remaining_time": "0:25:28", "throughput": 4251.56, "total_tokens": 18400472} {"current_steps": 28205, "total_steps": 38160, "loss": 0.4039, "lr": 0.00019341060704487596, "epoch": 14.782494758909854, "percentage": 73.91, "elapsed_time": "1:12:08", "remaining_time": "0:25:27", "throughput": 4251.54, "total_tokens": 18403224} {"current_steps": 28210, "total_steps": 38160, "loss": 0.311, "lr": 0.00019322999018647668, "epoch": 14.785115303983229, "percentage": 73.93, "elapsed_time": "1:12:09", "remaining_time": "0:25:26", "throughput": 4251.56, "total_tokens": 18406200} {"current_steps": 28215, "total_steps": 38160, "loss": 0.4322, "lr": 0.00019304943750086362, "epoch": 14.787735849056604, "percentage": 73.94, "elapsed_time": "1:12:10", "remaining_time": "0:25:26", "throughput": 4251.58, "total_tokens": 18409432} {"current_steps": 28220, "total_steps": 38160, "loss": 0.3906, "lr": 0.0001928689490258066, "epoch": 14.79035639412998, "percentage": 73.95, "elapsed_time": "1:12:10", "remaining_time": "0:25:25", "throughput": 4251.52, "total_tokens": 18411736} {"current_steps": 28225, "total_steps": 38160, "loss": 0.4403, "lr": 0.00019268852479906146, "epoch": 14.792976939203355, "percentage": 73.96, "elapsed_time": "1:12:11", "remaining_time": "0:25:24", "throughput": 4251.61, "total_tokens": 18415448} {"current_steps": 28230, "total_steps": 38160, "loss": 0.5206, "lr": 0.0001925081648583708, "epoch": 14.79559748427673, "percentage": 73.98, "elapsed_time": "1:12:12", "remaining_time": "0:25:23", "throughput": 4251.67, "total_tokens": 18419032} {"current_steps": 28235, "total_steps": 38160, "loss": 0.4659, "lr": 0.00019232786924146394, "epoch": 14.798218029350105, "percentage": 73.99, "elapsed_time": "1:12:12", "remaining_time": "0:25:23", "throughput": 4251.69, "total_tokens": 18422136} {"current_steps": 28240, "total_steps": 38160, "loss": 0.5776, "lr": 0.00019214763798605677, "epoch": 14.80083857442348, "percentage": 74.0, "elapsed_time": "1:12:13", "remaining_time": "0:25:22", "throughput": 4251.66, "total_tokens": 18424696} {"current_steps": 28245, "total_steps": 38160, "loss": 0.5047, "lr": 0.00019196747112985158, "epoch": 14.803459119496855, "percentage": 74.02, "elapsed_time": "1:12:14", "remaining_time": "0:25:21", "throughput": 4251.67, "total_tokens": 18427704} {"current_steps": 28250, "total_steps": 38160, "loss": 0.3606, "lr": 0.00019178736871053737, "epoch": 14.80607966457023, "percentage": 74.03, "elapsed_time": "1:12:14", "remaining_time": "0:25:20", "throughput": 4251.63, "total_tokens": 18430328} {"current_steps": 28255, "total_steps": 38160, "loss": 0.513, "lr": 0.00019160733076578935, "epoch": 14.808700209643606, "percentage": 74.04, "elapsed_time": "1:12:15", "remaining_time": "0:25:19", "throughput": 4251.6, "total_tokens": 18432920} {"current_steps": 28260, "total_steps": 38160, "loss": 0.547, "lr": 0.0001914273573332692, "epoch": 14.81132075471698, "percentage": 74.06, "elapsed_time": "1:12:16", "remaining_time": "0:25:19", "throughput": 4251.61, "total_tokens": 18435896} {"current_steps": 28265, "total_steps": 38160, "loss": 0.4331, "lr": 0.00019124744845062553, "epoch": 14.813941299790356, "percentage": 74.07, "elapsed_time": "1:12:16", "remaining_time": "0:25:18", "throughput": 4251.6, "total_tokens": 18438712} {"current_steps": 28270, "total_steps": 38160, "loss": 0.45, "lr": 0.00019106760415549324, "epoch": 14.816561844863731, "percentage": 74.08, "elapsed_time": "1:12:17", "remaining_time": "0:25:17", "throughput": 4251.6, "total_tokens": 18441592} {"current_steps": 28275, "total_steps": 38160, "loss": 0.3922, "lr": 0.0001908878244854938, "epoch": 14.819182389937106, "percentage": 74.1, "elapsed_time": "1:12:18", "remaining_time": "0:25:16", "throughput": 4251.55, "total_tokens": 18444120} {"current_steps": 28280, "total_steps": 38160, "loss": 0.3579, "lr": 0.00019070810947823498, "epoch": 14.821802935010481, "percentage": 74.11, "elapsed_time": "1:12:18", "remaining_time": "0:25:15", "throughput": 4251.62, "total_tokens": 18447640} {"current_steps": 28285, "total_steps": 38160, "loss": 0.4888, "lr": 0.0001905284591713109, "epoch": 14.824423480083858, "percentage": 74.12, "elapsed_time": "1:12:19", "remaining_time": "0:25:15", "throughput": 4251.81, "total_tokens": 18452312} {"current_steps": 28290, "total_steps": 38160, "loss": 0.4001, "lr": 0.00019034887360230246, "epoch": 14.827044025157234, "percentage": 74.14, "elapsed_time": "1:12:20", "remaining_time": "0:25:14", "throughput": 4251.87, "total_tokens": 18455704} {"current_steps": 28295, "total_steps": 38160, "loss": 0.3922, "lr": 0.000190169352808777, "epoch": 14.829664570230609, "percentage": 74.15, "elapsed_time": "1:12:21", "remaining_time": "0:25:13", "throughput": 4251.96, "total_tokens": 18459384} {"current_steps": 28300, "total_steps": 38160, "loss": 0.5439, "lr": 0.00018998989682828844, "epoch": 14.832285115303984, "percentage": 74.16, "elapsed_time": "1:12:22", "remaining_time": "0:25:12", "throughput": 4252.1, "total_tokens": 18463512} {"current_steps": 28305, "total_steps": 38160, "loss": 0.5382, "lr": 0.00018981050569837643, "epoch": 14.834905660377359, "percentage": 74.17, "elapsed_time": "1:12:22", "remaining_time": "0:25:12", "throughput": 4252.12, "total_tokens": 18466520} {"current_steps": 28310, "total_steps": 38160, "loss": 0.3706, "lr": 0.000189631179456568, "epoch": 14.837526205450734, "percentage": 74.19, "elapsed_time": "1:12:23", "remaining_time": "0:25:11", "throughput": 4252.09, "total_tokens": 18469240} {"current_steps": 28315, "total_steps": 38160, "loss": 0.4329, "lr": 0.00018945191814037578, "epoch": 14.84014675052411, "percentage": 74.2, "elapsed_time": "1:12:24", "remaining_time": "0:25:10", "throughput": 4252.21, "total_tokens": 18473272} {"current_steps": 28320, "total_steps": 38160, "loss": 0.4565, "lr": 0.00018927272178729938, "epoch": 14.842767295597485, "percentage": 74.21, "elapsed_time": "1:12:25", "remaining_time": "0:25:09", "throughput": 4252.43, "total_tokens": 18478392} {"current_steps": 28325, "total_steps": 38160, "loss": 0.3881, "lr": 0.00018909359043482477, "epoch": 14.84538784067086, "percentage": 74.23, "elapsed_time": "1:12:26", "remaining_time": "0:25:09", "throughput": 4252.4, "total_tokens": 18481048} {"current_steps": 28330, "total_steps": 38160, "loss": 0.5028, "lr": 0.00018891452412042386, "epoch": 14.848008385744235, "percentage": 74.24, "elapsed_time": "1:12:26", "remaining_time": "0:25:08", "throughput": 4252.45, "total_tokens": 18484376} {"current_steps": 28335, "total_steps": 38160, "loss": 0.3035, "lr": 0.00018873552288155542, "epoch": 14.85062893081761, "percentage": 74.25, "elapsed_time": "1:12:27", "remaining_time": "0:25:07", "throughput": 4252.51, "total_tokens": 18487928} {"current_steps": 28340, "total_steps": 38160, "loss": 0.5628, "lr": 0.00018855658675566471, "epoch": 14.853249475890985, "percentage": 74.27, "elapsed_time": "1:12:28", "remaining_time": "0:25:06", "throughput": 4252.56, "total_tokens": 18491192} {"current_steps": 28345, "total_steps": 38160, "loss": 0.3837, "lr": 0.00018837771578018275, "epoch": 14.85587002096436, "percentage": 74.28, "elapsed_time": "1:12:29", "remaining_time": "0:25:05", "throughput": 4252.63, "total_tokens": 18494744} {"current_steps": 28350, "total_steps": 38160, "loss": 0.4937, "lr": 0.00018819890999252747, "epoch": 14.858490566037736, "percentage": 74.29, "elapsed_time": "1:12:29", "remaining_time": "0:25:05", "throughput": 4252.72, "total_tokens": 18498584} {"current_steps": 28355, "total_steps": 38160, "loss": 0.4963, "lr": 0.0001880201694301032, "epoch": 14.86111111111111, "percentage": 74.31, "elapsed_time": "1:12:30", "remaining_time": "0:25:04", "throughput": 4252.71, "total_tokens": 18501400} {"current_steps": 28360, "total_steps": 38160, "loss": 0.4233, "lr": 0.00018784149413030005, "epoch": 14.863731656184486, "percentage": 74.32, "elapsed_time": "1:12:31", "remaining_time": "0:25:03", "throughput": 4252.66, "total_tokens": 18503864} {"current_steps": 28365, "total_steps": 38160, "loss": 0.3782, "lr": 0.00018766288413049503, "epoch": 14.866352201257861, "percentage": 74.33, "elapsed_time": "1:12:31", "remaining_time": "0:25:02", "throughput": 4252.67, "total_tokens": 18506712} {"current_steps": 28370, "total_steps": 38160, "loss": 0.4684, "lr": 0.00018748433946805148, "epoch": 14.868972746331236, "percentage": 74.34, "elapsed_time": "1:12:32", "remaining_time": "0:25:01", "throughput": 4252.75, "total_tokens": 18510360} {"current_steps": 28375, "total_steps": 38160, "loss": 0.4308, "lr": 0.00018730586018031854, "epoch": 14.871593291404611, "percentage": 74.36, "elapsed_time": "1:12:33", "remaining_time": "0:25:01", "throughput": 4252.76, "total_tokens": 18513432} {"current_steps": 28380, "total_steps": 38160, "loss": 0.4509, "lr": 0.00018712744630463248, "epoch": 14.874213836477988, "percentage": 74.37, "elapsed_time": "1:12:33", "remaining_time": "0:25:00", "throughput": 4252.79, "total_tokens": 18516632} {"current_steps": 28385, "total_steps": 38160, "loss": 0.5006, "lr": 0.000186949097878315, "epoch": 14.876834381551364, "percentage": 74.38, "elapsed_time": "1:12:34", "remaining_time": "0:24:59", "throughput": 4253.02, "total_tokens": 18521624} {"current_steps": 28390, "total_steps": 38160, "loss": 0.4871, "lr": 0.0001867708149386748, "epoch": 14.879454926624739, "percentage": 74.4, "elapsed_time": "1:12:35", "remaining_time": "0:24:58", "throughput": 4253.04, "total_tokens": 18524760} {"current_steps": 28395, "total_steps": 38160, "loss": 0.3779, "lr": 0.0001865925975230068, "epoch": 14.882075471698114, "percentage": 74.41, "elapsed_time": "1:12:36", "remaining_time": "0:24:58", "throughput": 4253.01, "total_tokens": 18527416} {"current_steps": 28400, "total_steps": 38160, "loss": 0.4869, "lr": 0.0001864144456685916, "epoch": 14.884696016771489, "percentage": 74.42, "elapsed_time": "1:12:37", "remaining_time": "0:24:57", "throughput": 4253.08, "total_tokens": 18531032} {"current_steps": 28405, "total_steps": 38160, "loss": 0.4433, "lr": 0.00018623635941269706, "epoch": 14.887316561844864, "percentage": 74.44, "elapsed_time": "1:12:37", "remaining_time": "0:24:56", "throughput": 4253.16, "total_tokens": 18534744} {"current_steps": 28410, "total_steps": 38160, "loss": 0.45, "lr": 0.00018605833879257628, "epoch": 14.88993710691824, "percentage": 74.45, "elapsed_time": "1:12:38", "remaining_time": "0:24:55", "throughput": 4253.24, "total_tokens": 18538392} {"current_steps": 28415, "total_steps": 38160, "loss": 0.3744, "lr": 0.0001858803838454694, "epoch": 14.892557651991615, "percentage": 74.46, "elapsed_time": "1:12:39", "remaining_time": "0:24:55", "throughput": 4253.25, "total_tokens": 18541400} {"current_steps": 28420, "total_steps": 38160, "loss": 0.4207, "lr": 0.0001857024946086026, "epoch": 14.89517819706499, "percentage": 74.48, "elapsed_time": "1:12:40", "remaining_time": "0:24:54", "throughput": 4253.29, "total_tokens": 18544696} {"current_steps": 28425, "total_steps": 38160, "loss": 0.3215, "lr": 0.00018552467111918836, "epoch": 14.897798742138365, "percentage": 74.49, "elapsed_time": "1:12:40", "remaining_time": "0:24:53", "throughput": 4253.32, "total_tokens": 18547864} {"current_steps": 28430, "total_steps": 38160, "loss": 0.4216, "lr": 0.00018534691341442507, "epoch": 14.90041928721174, "percentage": 74.5, "elapsed_time": "1:12:41", "remaining_time": "0:24:52", "throughput": 4253.3, "total_tokens": 18550584} {"current_steps": 28435, "total_steps": 38160, "loss": 0.5193, "lr": 0.0001851692215314979, "epoch": 14.903039832285115, "percentage": 74.52, "elapsed_time": "1:12:42", "remaining_time": "0:24:51", "throughput": 4253.33, "total_tokens": 18553624} {"current_steps": 28440, "total_steps": 38160, "loss": 0.5083, "lr": 0.0001849915955075776, "epoch": 14.90566037735849, "percentage": 74.53, "elapsed_time": "1:12:42", "remaining_time": "0:24:51", "throughput": 4253.32, "total_tokens": 18556472} {"current_steps": 28445, "total_steps": 38160, "loss": 0.3134, "lr": 0.0001848140353798217, "epoch": 14.908280922431866, "percentage": 74.54, "elapsed_time": "1:12:43", "remaining_time": "0:24:50", "throughput": 4253.25, "total_tokens": 18558840} {"current_steps": 28450, "total_steps": 38160, "loss": 0.421, "lr": 0.00018463654118537382, "epoch": 14.91090146750524, "percentage": 74.55, "elapsed_time": "1:12:44", "remaining_time": "0:24:49", "throughput": 4253.28, "total_tokens": 18562008} {"current_steps": 28455, "total_steps": 38160, "loss": 0.5235, "lr": 0.00018445911296136386, "epoch": 14.913522012578616, "percentage": 74.57, "elapsed_time": "1:12:44", "remaining_time": "0:24:48", "throughput": 4253.29, "total_tokens": 18564952} {"current_steps": 28460, "total_steps": 38160, "loss": 0.4262, "lr": 0.00018428175074490754, "epoch": 14.916142557651991, "percentage": 74.58, "elapsed_time": "1:12:45", "remaining_time": "0:24:47", "throughput": 4253.28, "total_tokens": 18567800} {"current_steps": 28465, "total_steps": 38160, "loss": 0.5019, "lr": 0.00018410445457310687, "epoch": 14.918763102725366, "percentage": 74.59, "elapsed_time": "1:12:46", "remaining_time": "0:24:47", "throughput": 4253.32, "total_tokens": 18571096} {"current_steps": 28470, "total_steps": 38160, "loss": 0.3308, "lr": 0.00018392722448305044, "epoch": 14.921383647798741, "percentage": 74.61, "elapsed_time": "1:12:46", "remaining_time": "0:24:46", "throughput": 4253.34, "total_tokens": 18574136} {"current_steps": 28475, "total_steps": 38160, "loss": 0.4541, "lr": 0.00018375006051181265, "epoch": 14.924004192872118, "percentage": 74.62, "elapsed_time": "1:12:47", "remaining_time": "0:24:45", "throughput": 4253.3, "total_tokens": 18576664} {"current_steps": 28480, "total_steps": 38160, "loss": 0.4104, "lr": 0.0001835729626964544, "epoch": 14.926624737945493, "percentage": 74.63, "elapsed_time": "1:12:48", "remaining_time": "0:24:44", "throughput": 4253.43, "total_tokens": 18580824} {"current_steps": 28485, "total_steps": 38160, "loss": 0.3758, "lr": 0.00018339593107402242, "epoch": 14.929245283018869, "percentage": 74.65, "elapsed_time": "1:12:49", "remaining_time": "0:24:43", "throughput": 4253.44, "total_tokens": 18583864} {"current_steps": 28490, "total_steps": 38160, "loss": 0.419, "lr": 0.00018321896568154945, "epoch": 14.931865828092244, "percentage": 74.66, "elapsed_time": "1:12:49", "remaining_time": "0:24:43", "throughput": 4253.43, "total_tokens": 18586680} {"current_steps": 28495, "total_steps": 38160, "loss": 0.338, "lr": 0.00018304206655605476, "epoch": 14.934486373165619, "percentage": 74.67, "elapsed_time": "1:12:50", "remaining_time": "0:24:42", "throughput": 4253.57, "total_tokens": 18590776} {"current_steps": 28500, "total_steps": 38160, "loss": 0.3391, "lr": 0.00018286523373454378, "epoch": 14.937106918238994, "percentage": 74.69, "elapsed_time": "1:12:51", "remaining_time": "0:24:41", "throughput": 4253.67, "total_tokens": 18594616} {"current_steps": 28505, "total_steps": 38160, "loss": 0.5165, "lr": 0.00018268846725400783, "epoch": 14.93972746331237, "percentage": 74.7, "elapsed_time": "1:12:52", "remaining_time": "0:24:40", "throughput": 4253.67, "total_tokens": 18597528} {"current_steps": 28510, "total_steps": 38160, "loss": 0.2367, "lr": 0.00018251176715142458, "epoch": 14.942348008385745, "percentage": 74.71, "elapsed_time": "1:12:52", "remaining_time": "0:24:40", "throughput": 4253.63, "total_tokens": 18599992} {"current_steps": 28515, "total_steps": 38160, "loss": 0.3931, "lr": 0.00018233513346375756, "epoch": 14.94496855345912, "percentage": 74.72, "elapsed_time": "1:12:53", "remaining_time": "0:24:39", "throughput": 4253.63, "total_tokens": 18602872} {"current_steps": 28520, "total_steps": 38160, "loss": 0.4069, "lr": 0.00018215856622795634, "epoch": 14.947589098532495, "percentage": 74.74, "elapsed_time": "1:12:54", "remaining_time": "0:24:38", "throughput": 4253.7, "total_tokens": 18606360} {"current_steps": 28525, "total_steps": 38160, "loss": 0.3629, "lr": 0.00018198206548095697, "epoch": 14.95020964360587, "percentage": 74.75, "elapsed_time": "1:12:54", "remaining_time": "0:24:37", "throughput": 4253.65, "total_tokens": 18608824} {"current_steps": 28530, "total_steps": 38160, "loss": 0.4171, "lr": 0.00018180563125968135, "epoch": 14.952830188679245, "percentage": 74.76, "elapsed_time": "1:12:55", "remaining_time": "0:24:36", "throughput": 4253.66, "total_tokens": 18611864} {"current_steps": 28535, "total_steps": 38160, "loss": 0.5268, "lr": 0.00018162926360103766, "epoch": 14.95545073375262, "percentage": 74.78, "elapsed_time": "1:12:56", "remaining_time": "0:24:36", "throughput": 4253.74, "total_tokens": 18615480} {"current_steps": 28540, "total_steps": 38160, "loss": 0.4742, "lr": 0.0001814529625419199, "epoch": 14.958071278825996, "percentage": 74.79, "elapsed_time": "1:12:56", "remaining_time": "0:24:35", "throughput": 4253.75, "total_tokens": 18618392} {"current_steps": 28545, "total_steps": 38160, "loss": 0.5148, "lr": 0.00018127672811920798, "epoch": 14.96069182389937, "percentage": 74.8, "elapsed_time": "1:12:57", "remaining_time": "0:24:34", "throughput": 4253.84, "total_tokens": 18622200} {"current_steps": 28550, "total_steps": 38160, "loss": 0.4374, "lr": 0.00018110056036976834, "epoch": 14.963312368972746, "percentage": 74.82, "elapsed_time": "1:12:58", "remaining_time": "0:24:33", "throughput": 4253.84, "total_tokens": 18625080} {"current_steps": 28555, "total_steps": 38160, "loss": 0.4768, "lr": 0.00018092445933045332, "epoch": 14.965932914046121, "percentage": 74.83, "elapsed_time": "1:12:59", "remaining_time": "0:24:32", "throughput": 4253.84, "total_tokens": 18627992} {"current_steps": 28560, "total_steps": 38160, "loss": 0.4182, "lr": 0.00018074842503810118, "epoch": 14.968553459119496, "percentage": 74.84, "elapsed_time": "1:12:59", "remaining_time": "0:24:32", "throughput": 4253.87, "total_tokens": 18631192} {"current_steps": 28565, "total_steps": 38160, "loss": 0.3927, "lr": 0.00018057245752953666, "epoch": 14.971174004192871, "percentage": 74.86, "elapsed_time": "1:13:00", "remaining_time": "0:24:31", "throughput": 4253.96, "total_tokens": 18634904} {"current_steps": 28570, "total_steps": 38160, "loss": 0.4503, "lr": 0.00018039655684156948, "epoch": 14.973794549266248, "percentage": 74.87, "elapsed_time": "1:13:01", "remaining_time": "0:24:30", "throughput": 4253.96, "total_tokens": 18637784} {"current_steps": 28575, "total_steps": 38160, "loss": 0.4223, "lr": 0.00018022072301099635, "epoch": 14.976415094339622, "percentage": 74.88, "elapsed_time": "1:13:01", "remaining_time": "0:24:29", "throughput": 4253.9, "total_tokens": 18640120} {"current_steps": 28580, "total_steps": 38160, "loss": 0.5831, "lr": 0.00018004495607459975, "epoch": 14.979035639412999, "percentage": 74.9, "elapsed_time": "1:13:02", "remaining_time": "0:24:29", "throughput": 4253.96, "total_tokens": 18643672} {"current_steps": 28585, "total_steps": 38160, "loss": 0.5325, "lr": 0.00017986925606914805, "epoch": 14.981656184486374, "percentage": 74.91, "elapsed_time": "1:13:03", "remaining_time": "0:24:28", "throughput": 4254.0, "total_tokens": 18646872} {"current_steps": 28590, "total_steps": 38160, "loss": 0.3273, "lr": 0.00017969362303139598, "epoch": 14.984276729559749, "percentage": 74.92, "elapsed_time": "1:13:04", "remaining_time": "0:24:27", "throughput": 4254.1, "total_tokens": 18650744} {"current_steps": 28595, "total_steps": 38160, "loss": 0.437, "lr": 0.00017951805699808365, "epoch": 14.986897274633124, "percentage": 74.93, "elapsed_time": "1:13:04", "remaining_time": "0:24:26", "throughput": 4254.18, "total_tokens": 18654296} {"current_steps": 28600, "total_steps": 38160, "loss": 0.4013, "lr": 0.00017934255800593747, "epoch": 14.9895178197065, "percentage": 74.95, "elapsed_time": "1:13:05", "remaining_time": "0:24:25", "throughput": 4254.22, "total_tokens": 18657560} {"current_steps": 28605, "total_steps": 38160, "loss": 0.4373, "lr": 0.0001791671260916698, "epoch": 14.992138364779874, "percentage": 74.96, "elapsed_time": "1:13:06", "remaining_time": "0:24:25", "throughput": 4254.25, "total_tokens": 18660728} {"current_steps": 28610, "total_steps": 38160, "loss": 0.413, "lr": 0.00017899176129197914, "epoch": 14.99475890985325, "percentage": 74.97, "elapsed_time": "1:13:07", "remaining_time": "0:24:24", "throughput": 4254.21, "total_tokens": 18663352} {"current_steps": 28615, "total_steps": 38160, "loss": 0.4405, "lr": 0.00017881646364354998, "epoch": 14.997379454926625, "percentage": 74.99, "elapsed_time": "1:13:07", "remaining_time": "0:24:23", "throughput": 4254.17, "total_tokens": 18665816} {"current_steps": 28620, "total_steps": 38160, "loss": 0.3276, "lr": 0.00017864123318305213, "epoch": 15.0, "percentage": 75.0, "elapsed_time": "1:13:08", "remaining_time": "0:24:22", "throughput": 4254.01, "total_tokens": 18668536} {"current_steps": 28620, "total_steps": 38160, "eval_loss": 0.4626333713531494, "epoch": 15.0, "percentage": 75.0, "elapsed_time": "1:13:22", "remaining_time": "0:24:27", "throughput": 4240.91, "total_tokens": 18668536} {"current_steps": 28625, "total_steps": 38160, "loss": 0.6707, "lr": 0.00017846606994714222, "epoch": 15.002620545073375, "percentage": 75.01, "elapsed_time": "1:13:24", "remaining_time": "0:24:27", "throughput": 4239.17, "total_tokens": 18672024} {"current_steps": 28630, "total_steps": 38160, "loss": 0.5198, "lr": 0.0001782909739724621, "epoch": 15.00524109014675, "percentage": 75.03, "elapsed_time": "1:13:25", "remaining_time": "0:24:26", "throughput": 4239.12, "total_tokens": 18674712} {"current_steps": 28635, "total_steps": 38160, "loss": 0.4104, "lr": 0.0001781159452956399, "epoch": 15.007861635220126, "percentage": 75.04, "elapsed_time": "1:13:26", "remaining_time": "0:24:25", "throughput": 4239.58, "total_tokens": 18682488} {"current_steps": 28640, "total_steps": 38160, "loss": 0.4259, "lr": 0.00017794098395328977, "epoch": 15.0104821802935, "percentage": 75.05, "elapsed_time": "1:13:27", "remaining_time": "0:24:25", "throughput": 4239.62, "total_tokens": 18685816} {"current_steps": 28645, "total_steps": 38160, "loss": 0.4407, "lr": 0.00017776608998201172, "epoch": 15.013102725366876, "percentage": 75.07, "elapsed_time": "1:13:28", "remaining_time": "0:24:24", "throughput": 4239.62, "total_tokens": 18688760} {"current_steps": 28650, "total_steps": 38160, "loss": 0.3249, "lr": 0.00017759126341839132, "epoch": 15.015723270440251, "percentage": 75.08, "elapsed_time": "1:13:28", "remaining_time": "0:24:23", "throughput": 4239.55, "total_tokens": 18691160} {"current_steps": 28655, "total_steps": 38160, "loss": 0.4684, "lr": 0.0001774165042990003, "epoch": 15.018343815513626, "percentage": 75.09, "elapsed_time": "1:13:29", "remaining_time": "0:24:22", "throughput": 4239.62, "total_tokens": 18694616} {"current_steps": 28660, "total_steps": 38160, "loss": 0.3643, "lr": 0.00017724181266039635, "epoch": 15.020964360587001, "percentage": 75.1, "elapsed_time": "1:13:30", "remaining_time": "0:24:21", "throughput": 4239.62, "total_tokens": 18697656} {"current_steps": 28665, "total_steps": 38160, "loss": 0.3651, "lr": 0.00017706718853912292, "epoch": 15.023584905660377, "percentage": 75.12, "elapsed_time": "1:13:30", "remaining_time": "0:24:21", "throughput": 4239.63, "total_tokens": 18700536} {"current_steps": 28670, "total_steps": 38160, "loss": 0.5224, "lr": 0.00017689263197170964, "epoch": 15.026205450733753, "percentage": 75.13, "elapsed_time": "1:13:31", "remaining_time": "0:24:20", "throughput": 4239.68, "total_tokens": 18703960} {"current_steps": 28675, "total_steps": 38160, "loss": 0.3571, "lr": 0.00017671814299467136, "epoch": 15.028825995807129, "percentage": 75.14, "elapsed_time": "1:13:32", "remaining_time": "0:24:19", "throughput": 4239.68, "total_tokens": 18706744} {"current_steps": 28680, "total_steps": 38160, "loss": 0.4294, "lr": 0.00017654372164450954, "epoch": 15.031446540880504, "percentage": 75.16, "elapsed_time": "1:13:33", "remaining_time": "0:24:18", "throughput": 4239.77, "total_tokens": 18710424} {"current_steps": 28685, "total_steps": 38160, "loss": 0.5382, "lr": 0.0001763693679577108, "epoch": 15.034067085953879, "percentage": 75.17, "elapsed_time": "1:13:34", "remaining_time": "0:24:18", "throughput": 4240.0, "total_tokens": 18715640} {"current_steps": 28690, "total_steps": 38160, "loss": 0.5208, "lr": 0.00017619508197074812, "epoch": 15.036687631027254, "percentage": 75.18, "elapsed_time": "1:13:34", "remaining_time": "0:24:17", "throughput": 4240.03, "total_tokens": 18718680} {"current_steps": 28695, "total_steps": 38160, "loss": 0.4411, "lr": 0.0001760208637200803, "epoch": 15.03930817610063, "percentage": 75.2, "elapsed_time": "1:13:35", "remaining_time": "0:24:16", "throughput": 4240.04, "total_tokens": 18721688} {"current_steps": 28700, "total_steps": 38160, "loss": 0.3974, "lr": 0.00017584671324215152, "epoch": 15.041928721174004, "percentage": 75.21, "elapsed_time": "1:13:36", "remaining_time": "0:24:15", "throughput": 4240.08, "total_tokens": 18724920} {"current_steps": 28705, "total_steps": 38160, "loss": 0.566, "lr": 0.00017567263057339212, "epoch": 15.04454926624738, "percentage": 75.22, "elapsed_time": "1:13:36", "remaining_time": "0:24:14", "throughput": 4240.14, "total_tokens": 18728376} {"current_steps": 28710, "total_steps": 38160, "loss": 0.3245, "lr": 0.00017549861575021848, "epoch": 15.047169811320755, "percentage": 75.24, "elapsed_time": "1:13:37", "remaining_time": "0:24:14", "throughput": 4240.18, "total_tokens": 18731704} {"current_steps": 28715, "total_steps": 38160, "loss": 0.4922, "lr": 0.00017532466880903214, "epoch": 15.04979035639413, "percentage": 75.25, "elapsed_time": "1:13:38", "remaining_time": "0:24:13", "throughput": 4240.22, "total_tokens": 18734968} {"current_steps": 28720, "total_steps": 38160, "loss": 0.4778, "lr": 0.00017515078978622102, "epoch": 15.052410901467505, "percentage": 75.26, "elapsed_time": "1:13:39", "remaining_time": "0:24:12", "throughput": 4240.32, "total_tokens": 18738680} {"current_steps": 28725, "total_steps": 38160, "loss": 0.3965, "lr": 0.0001749769787181587, "epoch": 15.05503144654088, "percentage": 75.28, "elapsed_time": "1:13:39", "remaining_time": "0:24:11", "throughput": 4240.38, "total_tokens": 18742136} {"current_steps": 28730, "total_steps": 38160, "loss": 0.3345, "lr": 0.00017480323564120426, "epoch": 15.057651991614255, "percentage": 75.29, "elapsed_time": "1:13:40", "remaining_time": "0:24:10", "throughput": 4240.38, "total_tokens": 18745016} {"current_steps": 28735, "total_steps": 38160, "loss": 0.4448, "lr": 0.00017462956059170287, "epoch": 15.06027253668763, "percentage": 75.3, "elapsed_time": "1:13:41", "remaining_time": "0:24:10", "throughput": 4240.49, "total_tokens": 18748920} {"current_steps": 28740, "total_steps": 38160, "loss": 0.4326, "lr": 0.00017445595360598553, "epoch": 15.062893081761006, "percentage": 75.31, "elapsed_time": "1:13:42", "remaining_time": "0:24:09", "throughput": 4240.68, "total_tokens": 18753560} {"current_steps": 28745, "total_steps": 38160, "loss": 0.5243, "lr": 0.0001742824147203686, "epoch": 15.065513626834381, "percentage": 75.33, "elapsed_time": "1:13:43", "remaining_time": "0:24:08", "throughput": 4240.74, "total_tokens": 18756952} {"current_steps": 28750, "total_steps": 38160, "loss": 0.4811, "lr": 0.00017410894397115463, "epoch": 15.068134171907756, "percentage": 75.34, "elapsed_time": "1:13:43", "remaining_time": "0:24:07", "throughput": 4240.81, "total_tokens": 18760472} {"current_steps": 28755, "total_steps": 38160, "loss": 0.4364, "lr": 0.00017393554139463147, "epoch": 15.070754716981131, "percentage": 75.35, "elapsed_time": "1:13:44", "remaining_time": "0:24:07", "throughput": 4240.87, "total_tokens": 18763928} {"current_steps": 28760, "total_steps": 38160, "loss": 0.4327, "lr": 0.00017376220702707308, "epoch": 15.073375262054507, "percentage": 75.37, "elapsed_time": "1:13:45", "remaining_time": "0:24:06", "throughput": 4240.94, "total_tokens": 18767512} {"current_steps": 28765, "total_steps": 38160, "loss": 0.5443, "lr": 0.00017358894090473926, "epoch": 15.075995807127883, "percentage": 75.38, "elapsed_time": "1:13:46", "remaining_time": "0:24:05", "throughput": 4241.26, "total_tokens": 18774040} {"current_steps": 28770, "total_steps": 38160, "loss": 0.3806, "lr": 0.00017341574306387492, "epoch": 15.078616352201259, "percentage": 75.39, "elapsed_time": "1:13:47", "remaining_time": "0:24:04", "throughput": 4241.31, "total_tokens": 18777336} {"current_steps": 28775, "total_steps": 38160, "loss": 0.3143, "lr": 0.00017324261354071147, "epoch": 15.081236897274634, "percentage": 75.41, "elapsed_time": "1:13:47", "remaining_time": "0:24:04", "throughput": 4241.35, "total_tokens": 18780504} {"current_steps": 28780, "total_steps": 38160, "loss": 0.623, "lr": 0.00017306955237146522, "epoch": 15.083857442348009, "percentage": 75.42, "elapsed_time": "1:13:48", "remaining_time": "0:24:03", "throughput": 4241.4, "total_tokens": 18783800} {"current_steps": 28785, "total_steps": 38160, "loss": 0.4155, "lr": 0.0001728965595923388, "epoch": 15.086477987421384, "percentage": 75.43, "elapsed_time": "1:13:49", "remaining_time": "0:24:02", "throughput": 4241.44, "total_tokens": 18786968} {"current_steps": 28790, "total_steps": 38160, "loss": 0.3829, "lr": 0.00017272363523952033, "epoch": 15.08909853249476, "percentage": 75.45, "elapsed_time": "1:13:50", "remaining_time": "0:24:01", "throughput": 4241.43, "total_tokens": 18789720} {"current_steps": 28795, "total_steps": 38160, "loss": 0.3937, "lr": 0.0001725507793491838, "epoch": 15.091719077568134, "percentage": 75.46, "elapsed_time": "1:13:50", "remaining_time": "0:24:01", "throughput": 4241.48, "total_tokens": 18792952} {"current_steps": 28800, "total_steps": 38160, "loss": 0.374, "lr": 0.00017237799195748827, "epoch": 15.09433962264151, "percentage": 75.47, "elapsed_time": "1:13:51", "remaining_time": "0:24:00", "throughput": 4241.44, "total_tokens": 18795480} {"current_steps": 28805, "total_steps": 38160, "loss": 0.2897, "lr": 0.00017220527310057927, "epoch": 15.096960167714885, "percentage": 75.48, "elapsed_time": "1:13:52", "remaining_time": "0:23:59", "throughput": 4241.46, "total_tokens": 18798648} {"current_steps": 28810, "total_steps": 38160, "loss": 0.4896, "lr": 0.0001720326228145873, "epoch": 15.09958071278826, "percentage": 75.5, "elapsed_time": "1:13:52", "remaining_time": "0:23:58", "throughput": 4241.59, "total_tokens": 18802680} {"current_steps": 28815, "total_steps": 38160, "loss": 0.4537, "lr": 0.00017186004113562903, "epoch": 15.102201257861635, "percentage": 75.51, "elapsed_time": "1:13:53", "remaining_time": "0:23:57", "throughput": 4241.54, "total_tokens": 18805112} {"current_steps": 28820, "total_steps": 38160, "loss": 0.4025, "lr": 0.00017168752809980655, "epoch": 15.10482180293501, "percentage": 75.52, "elapsed_time": "1:13:54", "remaining_time": "0:23:57", "throughput": 4241.67, "total_tokens": 18809272} {"current_steps": 28825, "total_steps": 38160, "loss": 0.401, "lr": 0.00017151508374320767, "epoch": 15.107442348008385, "percentage": 75.54, "elapsed_time": "1:13:55", "remaining_time": "0:23:56", "throughput": 4241.71, "total_tokens": 18812440} {"current_steps": 28830, "total_steps": 38160, "loss": 0.5515, "lr": 0.00017134270810190583, "epoch": 15.11006289308176, "percentage": 75.55, "elapsed_time": "1:13:55", "remaining_time": "0:23:55", "throughput": 4241.7, "total_tokens": 18815288} {"current_steps": 28835, "total_steps": 38160, "loss": 0.5263, "lr": 0.0001711704012119597, "epoch": 15.112683438155136, "percentage": 75.56, "elapsed_time": "1:13:56", "remaining_time": "0:23:54", "throughput": 4241.74, "total_tokens": 18818424} {"current_steps": 28840, "total_steps": 38160, "loss": 0.4733, "lr": 0.0001709981631094142, "epoch": 15.115303983228511, "percentage": 75.58, "elapsed_time": "1:13:57", "remaining_time": "0:23:53", "throughput": 4241.72, "total_tokens": 18821144} {"current_steps": 28845, "total_steps": 38160, "loss": 0.3621, "lr": 0.00017082599383029946, "epoch": 15.117924528301886, "percentage": 75.59, "elapsed_time": "1:13:57", "remaining_time": "0:23:53", "throughput": 4241.8, "total_tokens": 18824632} {"current_steps": 28850, "total_steps": 38160, "loss": 0.4647, "lr": 0.0001706538934106316, "epoch": 15.120545073375261, "percentage": 75.6, "elapsed_time": "1:13:58", "remaining_time": "0:23:52", "throughput": 4241.77, "total_tokens": 18827224} {"current_steps": 28855, "total_steps": 38160, "loss": 0.4375, "lr": 0.00017048186188641185, "epoch": 15.123165618448636, "percentage": 75.62, "elapsed_time": "1:13:59", "remaining_time": "0:23:51", "throughput": 4241.77, "total_tokens": 18830072} {"current_steps": 28860, "total_steps": 38160, "loss": 0.5073, "lr": 0.0001703098992936271, "epoch": 15.125786163522013, "percentage": 75.63, "elapsed_time": "1:13:59", "remaining_time": "0:23:50", "throughput": 4241.76, "total_tokens": 18832856} {"current_steps": 28865, "total_steps": 38160, "loss": 0.6184, "lr": 0.00017013800566825012, "epoch": 15.128406708595389, "percentage": 75.64, "elapsed_time": "1:14:00", "remaining_time": "0:23:49", "throughput": 4241.75, "total_tokens": 18835544} {"current_steps": 28870, "total_steps": 38160, "loss": 0.4407, "lr": 0.00016996618104623905, "epoch": 15.131027253668764, "percentage": 75.66, "elapsed_time": "1:14:01", "remaining_time": "0:23:49", "throughput": 4241.74, "total_tokens": 18838360} {"current_steps": 28875, "total_steps": 38160, "loss": 0.5716, "lr": 0.00016979442546353774, "epoch": 15.133647798742139, "percentage": 75.67, "elapsed_time": "1:14:01", "remaining_time": "0:23:48", "throughput": 4241.84, "total_tokens": 18842168} {"current_steps": 28880, "total_steps": 38160, "loss": 0.4662, "lr": 0.00016962273895607555, "epoch": 15.136268343815514, "percentage": 75.68, "elapsed_time": "1:14:02", "remaining_time": "0:23:47", "throughput": 4241.89, "total_tokens": 18845496} {"current_steps": 28885, "total_steps": 38160, "loss": 0.3317, "lr": 0.00016945112155976723, "epoch": 15.13888888888889, "percentage": 75.69, "elapsed_time": "1:14:03", "remaining_time": "0:23:46", "throughput": 4242.08, "total_tokens": 18850232} {"current_steps": 28890, "total_steps": 38160, "loss": 0.4561, "lr": 0.000169279573310513, "epoch": 15.141509433962264, "percentage": 75.71, "elapsed_time": "1:14:04", "remaining_time": "0:23:46", "throughput": 4242.02, "total_tokens": 18852536} {"current_steps": 28895, "total_steps": 38160, "loss": 0.4835, "lr": 0.00016910809424419904, "epoch": 15.14412997903564, "percentage": 75.72, "elapsed_time": "1:14:04", "remaining_time": "0:23:45", "throughput": 4242.04, "total_tokens": 18855544} {"current_steps": 28900, "total_steps": 38160, "loss": 0.5213, "lr": 0.00016893668439669674, "epoch": 15.146750524109015, "percentage": 75.73, "elapsed_time": "1:14:05", "remaining_time": "0:23:44", "throughput": 4242.06, "total_tokens": 18858584} {"current_steps": 28905, "total_steps": 38160, "loss": 0.4261, "lr": 0.0001687653438038632, "epoch": 15.14937106918239, "percentage": 75.75, "elapsed_time": "1:14:06", "remaining_time": "0:23:43", "throughput": 4242.09, "total_tokens": 18861688} {"current_steps": 28910, "total_steps": 38160, "loss": 0.4456, "lr": 0.00016859407250154084, "epoch": 15.151991614255765, "percentage": 75.76, "elapsed_time": "1:14:06", "remaining_time": "0:23:42", "throughput": 4242.03, "total_tokens": 18864056} {"current_steps": 28915, "total_steps": 38160, "loss": 0.4171, "lr": 0.0001684228705255575, "epoch": 15.15461215932914, "percentage": 75.77, "elapsed_time": "1:14:07", "remaining_time": "0:23:42", "throughput": 4242.14, "total_tokens": 18867960} {"current_steps": 28920, "total_steps": 38160, "loss": 0.3193, "lr": 0.00016825173791172677, "epoch": 15.157232704402515, "percentage": 75.79, "elapsed_time": "1:14:08", "remaining_time": "0:23:41", "throughput": 4242.08, "total_tokens": 18870328} {"current_steps": 28925, "total_steps": 38160, "loss": 0.4287, "lr": 0.0001680806746958477, "epoch": 15.15985324947589, "percentage": 75.8, "elapsed_time": "1:14:09", "remaining_time": "0:23:40", "throughput": 4242.15, "total_tokens": 18873976} {"current_steps": 28930, "total_steps": 38160, "loss": 0.2876, "lr": 0.00016790968091370494, "epoch": 15.162473794549266, "percentage": 75.81, "elapsed_time": "1:14:09", "remaining_time": "0:23:39", "throughput": 4242.18, "total_tokens": 18877112} {"current_steps": 28935, "total_steps": 38160, "loss": 0.4337, "lr": 0.00016773875660106824, "epoch": 15.165094339622641, "percentage": 75.83, "elapsed_time": "1:14:10", "remaining_time": "0:23:38", "throughput": 4242.13, "total_tokens": 18879480} {"current_steps": 28940, "total_steps": 38160, "loss": 0.3511, "lr": 0.0001675679017936928, "epoch": 15.167714884696016, "percentage": 75.84, "elapsed_time": "1:14:11", "remaining_time": "0:23:38", "throughput": 4242.11, "total_tokens": 18882072} {"current_steps": 28945, "total_steps": 38160, "loss": 0.5126, "lr": 0.00016739711652731976, "epoch": 15.170335429769391, "percentage": 75.85, "elapsed_time": "1:14:11", "remaining_time": "0:23:37", "throughput": 4242.08, "total_tokens": 18884760} {"current_steps": 28950, "total_steps": 38160, "loss": 0.4085, "lr": 0.00016722640083767542, "epoch": 15.172955974842766, "percentage": 75.86, "elapsed_time": "1:14:12", "remaining_time": "0:23:36", "throughput": 4242.09, "total_tokens": 18887736} {"current_steps": 28955, "total_steps": 38160, "loss": 0.3887, "lr": 0.00016705575476047153, "epoch": 15.175576519916143, "percentage": 75.88, "elapsed_time": "1:14:13", "remaining_time": "0:23:35", "throughput": 4242.1, "total_tokens": 18890584} {"current_steps": 28960, "total_steps": 38160, "loss": 0.3876, "lr": 0.0001668851783314055, "epoch": 15.178197064989519, "percentage": 75.89, "elapsed_time": "1:14:13", "remaining_time": "0:23:34", "throughput": 4242.07, "total_tokens": 18893208} {"current_steps": 28965, "total_steps": 38160, "loss": 0.3772, "lr": 0.00016671467158615977, "epoch": 15.180817610062894, "percentage": 75.9, "elapsed_time": "1:14:14", "remaining_time": "0:23:34", "throughput": 4242.05, "total_tokens": 18895864} {"current_steps": 28970, "total_steps": 38160, "loss": 0.3856, "lr": 0.00016654423456040224, "epoch": 15.183438155136269, "percentage": 75.92, "elapsed_time": "1:14:15", "remaining_time": "0:23:33", "throughput": 4242.05, "total_tokens": 18898712} {"current_steps": 28975, "total_steps": 38160, "loss": 0.4494, "lr": 0.0001663738672897866, "epoch": 15.186058700209644, "percentage": 75.93, "elapsed_time": "1:14:15", "remaining_time": "0:23:32", "throughput": 4242.05, "total_tokens": 18901624} {"current_steps": 28980, "total_steps": 38160, "loss": 0.3284, "lr": 0.0001662035698099517, "epoch": 15.18867924528302, "percentage": 75.94, "elapsed_time": "1:14:16", "remaining_time": "0:23:31", "throughput": 4242.12, "total_tokens": 18905176} {"current_steps": 28985, "total_steps": 38160, "loss": 0.277, "lr": 0.00016603334215652206, "epoch": 15.191299790356394, "percentage": 75.96, "elapsed_time": "1:14:17", "remaining_time": "0:23:30", "throughput": 4242.11, "total_tokens": 18907864} {"current_steps": 28990, "total_steps": 38160, "loss": 0.3376, "lr": 0.0001658631843651069, "epoch": 15.19392033542977, "percentage": 75.97, "elapsed_time": "1:14:17", "remaining_time": "0:23:30", "throughput": 4242.14, "total_tokens": 18911064} {"current_steps": 28995, "total_steps": 38160, "loss": 0.5244, "lr": 0.00016569309647130177, "epoch": 15.196540880503145, "percentage": 75.98, "elapsed_time": "1:14:18", "remaining_time": "0:23:29", "throughput": 4242.16, "total_tokens": 18914136} {"current_steps": 29000, "total_steps": 38160, "loss": 0.3902, "lr": 0.00016552307851068666, "epoch": 15.19916142557652, "percentage": 76.0, "elapsed_time": "1:14:19", "remaining_time": "0:23:28", "throughput": 4242.16, "total_tokens": 18917048} {"current_steps": 29005, "total_steps": 38160, "loss": 0.5331, "lr": 0.00016535313051882765, "epoch": 15.201781970649895, "percentage": 76.01, "elapsed_time": "1:14:19", "remaining_time": "0:23:27", "throughput": 4242.16, "total_tokens": 18919864} {"current_steps": 29010, "total_steps": 38160, "loss": 0.4084, "lr": 0.00016518325253127604, "epoch": 15.20440251572327, "percentage": 76.02, "elapsed_time": "1:14:20", "remaining_time": "0:23:26", "throughput": 4242.19, "total_tokens": 18922968} {"current_steps": 29015, "total_steps": 38160, "loss": 0.3807, "lr": 0.00016501344458356803, "epoch": 15.207023060796645, "percentage": 76.04, "elapsed_time": "1:14:21", "remaining_time": "0:23:26", "throughput": 4242.25, "total_tokens": 18926328} {"current_steps": 29020, "total_steps": 38160, "loss": 0.405, "lr": 0.00016484370671122588, "epoch": 15.20964360587002, "percentage": 76.05, "elapsed_time": "1:14:22", "remaining_time": "0:23:25", "throughput": 4242.26, "total_tokens": 18929368} {"current_steps": 29025, "total_steps": 38160, "loss": 0.3928, "lr": 0.00016467403894975641, "epoch": 15.212264150943396, "percentage": 76.06, "elapsed_time": "1:14:22", "remaining_time": "0:23:24", "throughput": 4242.25, "total_tokens": 18932056} {"current_steps": 29030, "total_steps": 38160, "loss": 0.5303, "lr": 0.0001645044413346524, "epoch": 15.214884696016771, "percentage": 76.07, "elapsed_time": "1:14:23", "remaining_time": "0:23:23", "throughput": 4242.34, "total_tokens": 18935896} {"current_steps": 29035, "total_steps": 38160, "loss": 0.3798, "lr": 0.00016433491390139177, "epoch": 15.217505241090146, "percentage": 76.09, "elapsed_time": "1:14:24", "remaining_time": "0:23:23", "throughput": 4242.36, "total_tokens": 18938968} {"current_steps": 29040, "total_steps": 38160, "loss": 0.4882, "lr": 0.00016416545668543786, "epoch": 15.220125786163521, "percentage": 76.1, "elapsed_time": "1:14:25", "remaining_time": "0:23:22", "throughput": 4242.49, "total_tokens": 18943000} {"current_steps": 29045, "total_steps": 38160, "loss": 0.4827, "lr": 0.0001639960697222388, "epoch": 15.222746331236896, "percentage": 76.11, "elapsed_time": "1:14:25", "remaining_time": "0:23:21", "throughput": 4242.52, "total_tokens": 18946104} {"current_steps": 29050, "total_steps": 38160, "loss": 0.4119, "lr": 0.00016382675304722877, "epoch": 15.225366876310272, "percentage": 76.13, "elapsed_time": "1:14:26", "remaining_time": "0:23:20", "throughput": 4242.67, "total_tokens": 18950328} {"current_steps": 29055, "total_steps": 38160, "loss": 0.3502, "lr": 0.00016365750669582662, "epoch": 15.227987421383649, "percentage": 76.14, "elapsed_time": "1:14:27", "remaining_time": "0:23:19", "throughput": 4242.67, "total_tokens": 18953144} {"current_steps": 29060, "total_steps": 38160, "loss": 0.5097, "lr": 0.00016348833070343682, "epoch": 15.230607966457024, "percentage": 76.15, "elapsed_time": "1:14:28", "remaining_time": "0:23:19", "throughput": 4243.05, "total_tokens": 18960248} {"current_steps": 29065, "total_steps": 38160, "loss": 0.3738, "lr": 0.00016331922510544932, "epoch": 15.233228511530399, "percentage": 76.17, "elapsed_time": "1:14:29", "remaining_time": "0:23:18", "throughput": 4243.02, "total_tokens": 18962744} {"current_steps": 29070, "total_steps": 38160, "loss": 0.3708, "lr": 0.0001631501899372387, "epoch": 15.235849056603774, "percentage": 76.18, "elapsed_time": "1:14:29", "remaining_time": "0:23:17", "throughput": 4243.04, "total_tokens": 18965816} {"current_steps": 29075, "total_steps": 38160, "loss": 0.3965, "lr": 0.0001629812252341653, "epoch": 15.23846960167715, "percentage": 76.19, "elapsed_time": "1:14:30", "remaining_time": "0:23:16", "throughput": 4243.12, "total_tokens": 18969560} {"current_steps": 29080, "total_steps": 38160, "loss": 0.2507, "lr": 0.0001628123310315749, "epoch": 15.241090146750524, "percentage": 76.21, "elapsed_time": "1:14:31", "remaining_time": "0:23:16", "throughput": 4243.16, "total_tokens": 18972792} {"current_steps": 29085, "total_steps": 38160, "loss": 0.3178, "lr": 0.00016264350736479777, "epoch": 15.2437106918239, "percentage": 76.22, "elapsed_time": "1:14:32", "remaining_time": "0:23:15", "throughput": 4243.16, "total_tokens": 18975640} {"current_steps": 29090, "total_steps": 38160, "loss": 0.3639, "lr": 0.00016247475426915038, "epoch": 15.246331236897275, "percentage": 76.23, "elapsed_time": "1:14:32", "remaining_time": "0:23:14", "throughput": 4243.2, "total_tokens": 18978840} {"current_steps": 29095, "total_steps": 38160, "loss": 0.3854, "lr": 0.0001623060717799335, "epoch": 15.24895178197065, "percentage": 76.24, "elapsed_time": "1:14:33", "remaining_time": "0:23:13", "throughput": 4243.18, "total_tokens": 18981464} {"current_steps": 29100, "total_steps": 38160, "loss": 0.3662, "lr": 0.0001621374599324338, "epoch": 15.251572327044025, "percentage": 76.26, "elapsed_time": "1:14:34", "remaining_time": "0:23:13", "throughput": 4243.29, "total_tokens": 18985368} {"current_steps": 29105, "total_steps": 38160, "loss": 0.4752, "lr": 0.00016196891876192292, "epoch": 15.2541928721174, "percentage": 76.27, "elapsed_time": "1:14:34", "remaining_time": "0:23:12", "throughput": 4243.28, "total_tokens": 18988120} {"current_steps": 29110, "total_steps": 38160, "loss": 0.5296, "lr": 0.00016180044830365798, "epoch": 15.256813417190775, "percentage": 76.28, "elapsed_time": "1:14:35", "remaining_time": "0:23:11", "throughput": 4243.34, "total_tokens": 18991640} {"current_steps": 29115, "total_steps": 38160, "loss": 0.4803, "lr": 0.00016163204859288066, "epoch": 15.25943396226415, "percentage": 76.3, "elapsed_time": "1:14:36", "remaining_time": "0:23:10", "throughput": 4243.34, "total_tokens": 18994552} {"current_steps": 29120, "total_steps": 38160, "loss": 0.5611, "lr": 0.00016146371966481866, "epoch": 15.262054507337526, "percentage": 76.31, "elapsed_time": "1:14:37", "remaining_time": "0:23:09", "throughput": 4243.52, "total_tokens": 18999224} {"current_steps": 29125, "total_steps": 38160, "loss": 0.6806, "lr": 0.00016129546155468411, "epoch": 15.264675052410901, "percentage": 76.32, "elapsed_time": "1:14:37", "remaining_time": "0:23:09", "throughput": 4243.58, "total_tokens": 19002648} {"current_steps": 29130, "total_steps": 38160, "loss": 0.3748, "lr": 0.00016112727429767483, "epoch": 15.267295597484276, "percentage": 76.34, "elapsed_time": "1:14:38", "remaining_time": "0:23:08", "throughput": 4243.63, "total_tokens": 19005976} {"current_steps": 29135, "total_steps": 38160, "loss": 0.4514, "lr": 0.00016095915792897392, "epoch": 15.269916142557651, "percentage": 76.35, "elapsed_time": "1:14:39", "remaining_time": "0:23:07", "throughput": 4243.66, "total_tokens": 19009144} {"current_steps": 29140, "total_steps": 38160, "loss": 0.3547, "lr": 0.000160791112483749, "epoch": 15.272536687631026, "percentage": 76.36, "elapsed_time": "1:14:40", "remaining_time": "0:23:06", "throughput": 4243.66, "total_tokens": 19011896} {"current_steps": 29145, "total_steps": 38160, "loss": 0.569, "lr": 0.00016062313799715362, "epoch": 15.275157232704402, "percentage": 76.38, "elapsed_time": "1:14:40", "remaining_time": "0:23:05", "throughput": 4243.71, "total_tokens": 19015256} {"current_steps": 29150, "total_steps": 38160, "loss": 0.5013, "lr": 0.00016045523450432576, "epoch": 15.277777777777779, "percentage": 76.39, "elapsed_time": "1:14:41", "remaining_time": "0:23:05", "throughput": 4243.73, "total_tokens": 19018360} {"current_steps": 29155, "total_steps": 38160, "loss": 0.2841, "lr": 0.0001602874020403891, "epoch": 15.280398322851154, "percentage": 76.4, "elapsed_time": "1:14:42", "remaining_time": "0:23:04", "throughput": 4243.83, "total_tokens": 19022136} {"current_steps": 29160, "total_steps": 38160, "loss": 0.4597, "lr": 0.00016011964064045232, "epoch": 15.283018867924529, "percentage": 76.42, "elapsed_time": "1:14:42", "remaining_time": "0:23:03", "throughput": 4243.82, "total_tokens": 19024920} {"current_steps": 29165, "total_steps": 38160, "loss": 0.3531, "lr": 0.00015995195033960936, "epoch": 15.285639412997904, "percentage": 76.43, "elapsed_time": "1:14:43", "remaining_time": "0:23:02", "throughput": 4244.0, "total_tokens": 19029464} {"current_steps": 29170, "total_steps": 38160, "loss": 0.4728, "lr": 0.00015978433117293884, "epoch": 15.28825995807128, "percentage": 76.44, "elapsed_time": "1:14:44", "remaining_time": "0:23:02", "throughput": 4244.1, "total_tokens": 19033272} {"current_steps": 29175, "total_steps": 38160, "loss": 0.4482, "lr": 0.0001596167831755047, "epoch": 15.290880503144654, "percentage": 76.45, "elapsed_time": "1:14:45", "remaining_time": "0:23:01", "throughput": 4244.06, "total_tokens": 19035736} {"current_steps": 29180, "total_steps": 38160, "loss": 0.4761, "lr": 0.00015944930638235626, "epoch": 15.29350104821803, "percentage": 76.47, "elapsed_time": "1:14:45", "remaining_time": "0:23:00", "throughput": 4244.1, "total_tokens": 19038904} {"current_steps": 29185, "total_steps": 38160, "loss": 0.3973, "lr": 0.00015928190082852773, "epoch": 15.296121593291405, "percentage": 76.48, "elapsed_time": "1:14:46", "remaining_time": "0:22:59", "throughput": 4244.16, "total_tokens": 19042424} {"current_steps": 29190, "total_steps": 38160, "loss": 0.2993, "lr": 0.0001591145665490384, "epoch": 15.29874213836478, "percentage": 76.49, "elapsed_time": "1:14:47", "remaining_time": "0:22:58", "throughput": 4244.21, "total_tokens": 19045784} {"current_steps": 29195, "total_steps": 38160, "loss": 0.4085, "lr": 0.00015894730357889287, "epoch": 15.301362683438155, "percentage": 76.51, "elapsed_time": "1:14:48", "remaining_time": "0:22:58", "throughput": 4244.26, "total_tokens": 19049016} {"current_steps": 29200, "total_steps": 38160, "loss": 0.3686, "lr": 0.0001587801119530805, "epoch": 15.30398322851153, "percentage": 76.52, "elapsed_time": "1:14:48", "remaining_time": "0:22:57", "throughput": 4244.34, "total_tokens": 19052536} {"current_steps": 29205, "total_steps": 38160, "loss": 0.3254, "lr": 0.00015861299170657572, "epoch": 15.306603773584905, "percentage": 76.53, "elapsed_time": "1:14:49", "remaining_time": "0:22:56", "throughput": 4244.34, "total_tokens": 19055480} {"current_steps": 29210, "total_steps": 38160, "loss": 0.4599, "lr": 0.00015844594287433834, "epoch": 15.30922431865828, "percentage": 76.55, "elapsed_time": "1:14:50", "remaining_time": "0:22:55", "throughput": 4244.45, "total_tokens": 19059416} {"current_steps": 29215, "total_steps": 38160, "loss": 0.3451, "lr": 0.00015827896549131304, "epoch": 15.311844863731656, "percentage": 76.56, "elapsed_time": "1:14:51", "remaining_time": "0:22:55", "throughput": 4244.46, "total_tokens": 19062360} {"current_steps": 29220, "total_steps": 38160, "loss": 0.3943, "lr": 0.0001581120595924298, "epoch": 15.314465408805031, "percentage": 76.57, "elapsed_time": "1:14:51", "remaining_time": "0:22:54", "throughput": 4244.47, "total_tokens": 19065400} {"current_steps": 29225, "total_steps": 38160, "loss": 0.435, "lr": 0.00015794522521260317, "epoch": 15.317085953878406, "percentage": 76.59, "elapsed_time": "1:14:52", "remaining_time": "0:22:53", "throughput": 4244.47, "total_tokens": 19068376} {"current_steps": 29230, "total_steps": 38160, "loss": 0.312, "lr": 0.00015777846238673293, "epoch": 15.319706498951781, "percentage": 76.6, "elapsed_time": "1:14:53", "remaining_time": "0:22:52", "throughput": 4244.45, "total_tokens": 19071032} {"current_steps": 29235, "total_steps": 38160, "loss": 0.4379, "lr": 0.00015761177114970404, "epoch": 15.322327044025156, "percentage": 76.61, "elapsed_time": "1:14:53", "remaining_time": "0:22:51", "throughput": 4244.45, "total_tokens": 19073944} {"current_steps": 29240, "total_steps": 38160, "loss": 0.408, "lr": 0.0001574451515363865, "epoch": 15.324947589098532, "percentage": 76.62, "elapsed_time": "1:14:54", "remaining_time": "0:22:51", "throughput": 4244.44, "total_tokens": 19076760} {"current_steps": 29245, "total_steps": 38160, "loss": 0.5459, "lr": 0.00015727860358163536, "epoch": 15.327568134171909, "percentage": 76.64, "elapsed_time": "1:14:55", "remaining_time": "0:22:50", "throughput": 4244.43, "total_tokens": 19079480} {"current_steps": 29250, "total_steps": 38160, "loss": 0.5369, "lr": 0.00015711212732029035, "epoch": 15.330188679245284, "percentage": 76.65, "elapsed_time": "1:14:55", "remaining_time": "0:22:49", "throughput": 4244.39, "total_tokens": 19081944} {"current_steps": 29255, "total_steps": 38160, "loss": 0.4147, "lr": 0.00015694572278717627, "epoch": 15.332809224318659, "percentage": 76.66, "elapsed_time": "1:14:56", "remaining_time": "0:22:48", "throughput": 4244.43, "total_tokens": 19085272} {"current_steps": 29260, "total_steps": 38160, "loss": 0.4487, "lr": 0.00015677939001710323, "epoch": 15.335429769392034, "percentage": 76.68, "elapsed_time": "1:14:57", "remaining_time": "0:22:47", "throughput": 4244.44, "total_tokens": 19088152} {"current_steps": 29265, "total_steps": 38160, "loss": 0.5447, "lr": 0.00015661312904486613, "epoch": 15.33805031446541, "percentage": 76.69, "elapsed_time": "1:14:57", "remaining_time": "0:22:47", "throughput": 4244.49, "total_tokens": 19091576} {"current_steps": 29270, "total_steps": 38160, "loss": 0.5069, "lr": 0.00015644693990524483, "epoch": 15.340670859538784, "percentage": 76.7, "elapsed_time": "1:14:58", "remaining_time": "0:22:46", "throughput": 4244.62, "total_tokens": 19095672} {"current_steps": 29275, "total_steps": 38160, "loss": 0.4931, "lr": 0.00015628082263300448, "epoch": 15.34329140461216, "percentage": 76.72, "elapsed_time": "1:14:59", "remaining_time": "0:22:45", "throughput": 4244.71, "total_tokens": 19099416} {"current_steps": 29280, "total_steps": 38160, "loss": 0.41, "lr": 0.00015611477726289465, "epoch": 15.345911949685535, "percentage": 76.73, "elapsed_time": "1:15:00", "remaining_time": "0:22:44", "throughput": 4244.7, "total_tokens": 19102296} {"current_steps": 29285, "total_steps": 38160, "loss": 0.3951, "lr": 0.00015594880382964994, "epoch": 15.34853249475891, "percentage": 76.74, "elapsed_time": "1:15:00", "remaining_time": "0:22:44", "throughput": 4244.73, "total_tokens": 19105432} {"current_steps": 29290, "total_steps": 38160, "loss": 0.327, "lr": 0.00015578290236799037, "epoch": 15.351153039832285, "percentage": 76.76, "elapsed_time": "1:15:01", "remaining_time": "0:22:43", "throughput": 4244.77, "total_tokens": 19108632} {"current_steps": 29295, "total_steps": 38160, "loss": 0.5696, "lr": 0.00015561707291262061, "epoch": 15.35377358490566, "percentage": 76.77, "elapsed_time": "1:15:02", "remaining_time": "0:22:42", "throughput": 4244.82, "total_tokens": 19111832} {"current_steps": 29300, "total_steps": 38160, "loss": 0.3717, "lr": 0.00015545131549823043, "epoch": 15.356394129979035, "percentage": 76.78, "elapsed_time": "1:15:03", "remaining_time": "0:22:41", "throughput": 4244.88, "total_tokens": 19115288} {"current_steps": 29305, "total_steps": 38160, "loss": 0.3701, "lr": 0.0001552856301594942, "epoch": 15.35901467505241, "percentage": 76.8, "elapsed_time": "1:15:03", "remaining_time": "0:22:40", "throughput": 4244.91, "total_tokens": 19118456} {"current_steps": 29310, "total_steps": 38160, "loss": 0.3763, "lr": 0.00015512001693107126, "epoch": 15.361635220125786, "percentage": 76.81, "elapsed_time": "1:15:04", "remaining_time": "0:22:40", "throughput": 4244.91, "total_tokens": 19121272} {"current_steps": 29315, "total_steps": 38160, "loss": 0.347, "lr": 0.0001549544758476062, "epoch": 15.364255765199161, "percentage": 76.82, "elapsed_time": "1:15:05", "remaining_time": "0:22:39", "throughput": 4244.94, "total_tokens": 19124440} {"current_steps": 29320, "total_steps": 38160, "loss": 0.4427, "lr": 0.00015478900694372832, "epoch": 15.366876310272536, "percentage": 76.83, "elapsed_time": "1:15:05", "remaining_time": "0:22:38", "throughput": 4244.99, "total_tokens": 19127672} {"current_steps": 29325, "total_steps": 38160, "loss": 0.4926, "lr": 0.00015462361025405196, "epoch": 15.369496855345911, "percentage": 76.85, "elapsed_time": "1:15:06", "remaining_time": "0:22:37", "throughput": 4245.01, "total_tokens": 19130776} {"current_steps": 29330, "total_steps": 38160, "loss": 0.4259, "lr": 0.0001544582858131759, "epoch": 15.372117400419286, "percentage": 76.86, "elapsed_time": "1:15:07", "remaining_time": "0:22:36", "throughput": 4245.03, "total_tokens": 19133720} {"current_steps": 29335, "total_steps": 38160, "loss": 0.4652, "lr": 0.00015429303365568448, "epoch": 15.374737945492662, "percentage": 76.87, "elapsed_time": "1:15:08", "remaining_time": "0:22:36", "throughput": 4245.08, "total_tokens": 19137112} {"current_steps": 29340, "total_steps": 38160, "loss": 0.4168, "lr": 0.00015412785381614625, "epoch": 15.377358490566039, "percentage": 76.89, "elapsed_time": "1:15:08", "remaining_time": "0:22:35", "throughput": 4245.12, "total_tokens": 19140408} {"current_steps": 29345, "total_steps": 38160, "loss": 0.4216, "lr": 0.000153962746329115, "epoch": 15.379979035639414, "percentage": 76.9, "elapsed_time": "1:15:09", "remaining_time": "0:22:34", "throughput": 4245.17, "total_tokens": 19143672} {"current_steps": 29350, "total_steps": 38160, "loss": 0.3544, "lr": 0.0001537977112291295, "epoch": 15.382599580712789, "percentage": 76.91, "elapsed_time": "1:15:10", "remaining_time": "0:22:33", "throughput": 4245.25, "total_tokens": 19147288} {"current_steps": 29355, "total_steps": 38160, "loss": 0.5045, "lr": 0.00015363274855071323, "epoch": 15.385220125786164, "percentage": 76.93, "elapsed_time": "1:15:10", "remaining_time": "0:22:33", "throughput": 4245.2, "total_tokens": 19149688} {"current_steps": 29360, "total_steps": 38160, "loss": 0.4403, "lr": 0.0001534678583283743, "epoch": 15.38784067085954, "percentage": 76.94, "elapsed_time": "1:15:11", "remaining_time": "0:22:32", "throughput": 4245.33, "total_tokens": 19153752} {"current_steps": 29365, "total_steps": 38160, "loss": 0.5249, "lr": 0.00015330304059660605, "epoch": 15.390461215932914, "percentage": 76.95, "elapsed_time": "1:15:12", "remaining_time": "0:22:31", "throughput": 4245.4, "total_tokens": 19157208} {"current_steps": 29370, "total_steps": 38160, "loss": 0.506, "lr": 0.00015313829538988628, "epoch": 15.39308176100629, "percentage": 76.97, "elapsed_time": "1:15:13", "remaining_time": "0:22:30", "throughput": 4245.56, "total_tokens": 19161656} {"current_steps": 29375, "total_steps": 38160, "loss": 0.4393, "lr": 0.00015297362274267783, "epoch": 15.395702306079665, "percentage": 76.98, "elapsed_time": "1:15:14", "remaining_time": "0:22:29", "throughput": 4245.6, "total_tokens": 19164824} {"current_steps": 29380, "total_steps": 38160, "loss": 0.424, "lr": 0.00015280902268942866, "epoch": 15.39832285115304, "percentage": 76.99, "elapsed_time": "1:15:14", "remaining_time": "0:22:29", "throughput": 4245.58, "total_tokens": 19167480} {"current_steps": 29385, "total_steps": 38160, "loss": 0.3932, "lr": 0.00015264449526457074, "epoch": 15.400943396226415, "percentage": 77.0, "elapsed_time": "1:15:15", "remaining_time": "0:22:28", "throughput": 4245.5, "total_tokens": 19169752} {"current_steps": 29390, "total_steps": 38160, "loss": 0.5358, "lr": 0.00015248004050252178, "epoch": 15.40356394129979, "percentage": 77.02, "elapsed_time": "1:15:15", "remaining_time": "0:22:27", "throughput": 4245.52, "total_tokens": 19172696} {"current_steps": 29395, "total_steps": 38160, "loss": 0.4283, "lr": 0.00015231565843768348, "epoch": 15.406184486373165, "percentage": 77.03, "elapsed_time": "1:15:16", "remaining_time": "0:22:26", "throughput": 4245.63, "total_tokens": 19176600} {"current_steps": 29400, "total_steps": 38160, "loss": 0.3074, "lr": 0.00015215134910444284, "epoch": 15.40880503144654, "percentage": 77.04, "elapsed_time": "1:15:17", "remaining_time": "0:22:26", "throughput": 4245.58, "total_tokens": 19179000} {"current_steps": 29405, "total_steps": 38160, "loss": 0.4889, "lr": 0.00015198711253717163, "epoch": 15.411425576519916, "percentage": 77.06, "elapsed_time": "1:15:18", "remaining_time": "0:22:25", "throughput": 4245.63, "total_tokens": 19182264} {"current_steps": 29410, "total_steps": 38160, "loss": 0.4093, "lr": 0.00015182294877022596, "epoch": 15.414046121593291, "percentage": 77.07, "elapsed_time": "1:15:18", "remaining_time": "0:22:24", "throughput": 4245.64, "total_tokens": 19185240} {"current_steps": 29415, "total_steps": 38160, "loss": 0.3703, "lr": 0.00015165885783794726, "epoch": 15.416666666666666, "percentage": 77.08, "elapsed_time": "1:15:19", "remaining_time": "0:22:23", "throughput": 4245.73, "total_tokens": 19188920} {"current_steps": 29420, "total_steps": 38160, "loss": 0.4462, "lr": 0.0001514948397746615, "epoch": 15.419287211740041, "percentage": 77.1, "elapsed_time": "1:15:20", "remaining_time": "0:22:22", "throughput": 4245.72, "total_tokens": 19191672} {"current_steps": 29425, "total_steps": 38160, "loss": 0.3886, "lr": 0.0001513308946146792, "epoch": 15.421907756813416, "percentage": 77.11, "elapsed_time": "1:15:20", "remaining_time": "0:22:22", "throughput": 4245.73, "total_tokens": 19194744} {"current_steps": 29430, "total_steps": 38160, "loss": 0.5069, "lr": 0.0001511670223922959, "epoch": 15.424528301886792, "percentage": 77.12, "elapsed_time": "1:15:21", "remaining_time": "0:22:21", "throughput": 4245.75, "total_tokens": 19197848} {"current_steps": 29435, "total_steps": 38160, "loss": 0.3027, "lr": 0.000151003223141792, "epoch": 15.427148846960169, "percentage": 77.14, "elapsed_time": "1:15:22", "remaining_time": "0:22:20", "throughput": 4245.83, "total_tokens": 19201432} {"current_steps": 29440, "total_steps": 38160, "loss": 0.3631, "lr": 0.00015083949689743202, "epoch": 15.429769392033544, "percentage": 77.15, "elapsed_time": "1:15:23", "remaining_time": "0:22:19", "throughput": 4245.94, "total_tokens": 19205304} {"current_steps": 29445, "total_steps": 38160, "loss": 0.4936, "lr": 0.00015067584369346594, "epoch": 15.432389937106919, "percentage": 77.16, "elapsed_time": "1:15:23", "remaining_time": "0:22:18", "throughput": 4246.02, "total_tokens": 19208888} {"current_steps": 29450, "total_steps": 38160, "loss": 0.4229, "lr": 0.00015051226356412818, "epoch": 15.435010482180294, "percentage": 77.18, "elapsed_time": "1:15:24", "remaining_time": "0:22:18", "throughput": 4246.07, "total_tokens": 19212216} {"current_steps": 29455, "total_steps": 38160, "loss": 0.5184, "lr": 0.00015034875654363754, "epoch": 15.43763102725367, "percentage": 77.19, "elapsed_time": "1:15:25", "remaining_time": "0:22:17", "throughput": 4246.14, "total_tokens": 19215736} {"current_steps": 29460, "total_steps": 38160, "loss": 0.4074, "lr": 0.00015018532266619818, "epoch": 15.440251572327044, "percentage": 77.2, "elapsed_time": "1:15:26", "remaining_time": "0:22:16", "throughput": 4246.22, "total_tokens": 19219224} {"current_steps": 29465, "total_steps": 38160, "loss": 0.4812, "lr": 0.00015002196196599828, "epoch": 15.44287211740042, "percentage": 77.21, "elapsed_time": "1:15:26", "remaining_time": "0:22:15", "throughput": 4246.26, "total_tokens": 19222424} {"current_steps": 29470, "total_steps": 38160, "loss": 0.4863, "lr": 0.00014985867447721114, "epoch": 15.445492662473795, "percentage": 77.23, "elapsed_time": "1:15:27", "remaining_time": "0:22:15", "throughput": 4246.31, "total_tokens": 19225784} {"current_steps": 29475, "total_steps": 38160, "loss": 0.3264, "lr": 0.00014969546023399467, "epoch": 15.44811320754717, "percentage": 77.24, "elapsed_time": "1:15:28", "remaining_time": "0:22:14", "throughput": 4246.31, "total_tokens": 19228600} {"current_steps": 29480, "total_steps": 38160, "loss": 0.4071, "lr": 0.00014953231927049165, "epoch": 15.450733752620545, "percentage": 77.25, "elapsed_time": "1:15:29", "remaining_time": "0:22:13", "throughput": 4246.35, "total_tokens": 19231864} {"current_steps": 29485, "total_steps": 38160, "loss": 0.4995, "lr": 0.00014936925162082904, "epoch": 15.45335429769392, "percentage": 77.27, "elapsed_time": "1:15:29", "remaining_time": "0:22:12", "throughput": 4246.44, "total_tokens": 19235480} {"current_steps": 29490, "total_steps": 38160, "loss": 0.5062, "lr": 0.00014920625731911863, "epoch": 15.455974842767295, "percentage": 77.28, "elapsed_time": "1:15:30", "remaining_time": "0:22:11", "throughput": 4246.5, "total_tokens": 19238904} {"current_steps": 29495, "total_steps": 38160, "loss": 0.3622, "lr": 0.00014904333639945716, "epoch": 15.45859538784067, "percentage": 77.29, "elapsed_time": "1:15:31", "remaining_time": "0:22:11", "throughput": 4246.53, "total_tokens": 19242040} {"current_steps": 29500, "total_steps": 38160, "loss": 0.4051, "lr": 0.00014888048889592575, "epoch": 15.461215932914046, "percentage": 77.31, "elapsed_time": "1:15:31", "remaining_time": "0:22:10", "throughput": 4246.57, "total_tokens": 19245336} {"current_steps": 29505, "total_steps": 38160, "loss": 0.4213, "lr": 0.00014871771484259046, "epoch": 15.463836477987421, "percentage": 77.32, "elapsed_time": "1:15:32", "remaining_time": "0:22:09", "throughput": 4246.79, "total_tokens": 19250264} {"current_steps": 29510, "total_steps": 38160, "loss": 0.7696, "lr": 0.00014855501427350144, "epoch": 15.466457023060796, "percentage": 77.33, "elapsed_time": "1:15:33", "remaining_time": "0:22:08", "throughput": 4246.83, "total_tokens": 19253592} {"current_steps": 29515, "total_steps": 38160, "loss": 0.375, "lr": 0.00014839238722269405, "epoch": 15.469077568134171, "percentage": 77.35, "elapsed_time": "1:15:34", "remaining_time": "0:22:08", "throughput": 4246.86, "total_tokens": 19256728} {"current_steps": 29520, "total_steps": 38160, "loss": 0.4203, "lr": 0.00014822983372418774, "epoch": 15.471698113207546, "percentage": 77.36, "elapsed_time": "1:15:35", "remaining_time": "0:22:07", "throughput": 4246.86, "total_tokens": 19259640} {"current_steps": 29525, "total_steps": 38160, "loss": 0.3626, "lr": 0.00014806735381198705, "epoch": 15.474318658280922, "percentage": 77.37, "elapsed_time": "1:15:35", "remaining_time": "0:22:06", "throughput": 4246.92, "total_tokens": 19263128} {"current_steps": 29530, "total_steps": 38160, "loss": 0.3694, "lr": 0.00014790494752008087, "epoch": 15.476939203354299, "percentage": 77.38, "elapsed_time": "1:15:36", "remaining_time": "0:22:05", "throughput": 4247.1, "total_tokens": 19267928} {"current_steps": 29535, "total_steps": 38160, "loss": 0.4243, "lr": 0.00014774261488244295, "epoch": 15.479559748427674, "percentage": 77.4, "elapsed_time": "1:15:37", "remaining_time": "0:22:05", "throughput": 4247.08, "total_tokens": 19270552} {"current_steps": 29540, "total_steps": 38160, "loss": 0.3924, "lr": 0.00014758035593303114, "epoch": 15.482180293501049, "percentage": 77.41, "elapsed_time": "1:15:38", "remaining_time": "0:22:04", "throughput": 4247.14, "total_tokens": 19274072} {"current_steps": 29545, "total_steps": 38160, "loss": 0.3936, "lr": 0.00014741817070578817, "epoch": 15.484800838574424, "percentage": 77.42, "elapsed_time": "1:15:38", "remaining_time": "0:22:03", "throughput": 4247.15, "total_tokens": 19277048} {"current_steps": 29550, "total_steps": 38160, "loss": 0.419, "lr": 0.0001472560592346414, "epoch": 15.4874213836478, "percentage": 77.44, "elapsed_time": "1:15:39", "remaining_time": "0:22:02", "throughput": 4247.12, "total_tokens": 19279576} {"current_steps": 29555, "total_steps": 38160, "loss": 0.4058, "lr": 0.0001470940215535027, "epoch": 15.490041928721174, "percentage": 77.45, "elapsed_time": "1:15:40", "remaining_time": "0:22:01", "throughput": 4247.1, "total_tokens": 19282200} {"current_steps": 29560, "total_steps": 38160, "loss": 0.51, "lr": 0.00014693205769626878, "epoch": 15.49266247379455, "percentage": 77.46, "elapsed_time": "1:15:40", "remaining_time": "0:22:01", "throughput": 4247.12, "total_tokens": 19285336} {"current_steps": 29565, "total_steps": 38160, "loss": 0.4565, "lr": 0.00014677016769682028, "epoch": 15.495283018867925, "percentage": 77.48, "elapsed_time": "1:15:41", "remaining_time": "0:22:00", "throughput": 4247.14, "total_tokens": 19288344} {"current_steps": 29570, "total_steps": 38160, "loss": 0.366, "lr": 0.00014660835158902268, "epoch": 15.4979035639413, "percentage": 77.49, "elapsed_time": "1:15:42", "remaining_time": "0:21:59", "throughput": 4247.21, "total_tokens": 19291928} {"current_steps": 29575, "total_steps": 38160, "loss": 0.3503, "lr": 0.00014644660940672628, "epoch": 15.500524109014675, "percentage": 77.5, "elapsed_time": "1:15:43", "remaining_time": "0:21:58", "throughput": 4247.31, "total_tokens": 19295736} {"current_steps": 29580, "total_steps": 38160, "loss": 0.4004, "lr": 0.0001462849411837656, "epoch": 15.50314465408805, "percentage": 77.52, "elapsed_time": "1:15:43", "remaining_time": "0:21:57", "throughput": 4247.32, "total_tokens": 19298744} {"current_steps": 29585, "total_steps": 38160, "loss": 0.4137, "lr": 0.00014612334695395985, "epoch": 15.505765199161425, "percentage": 77.53, "elapsed_time": "1:15:44", "remaining_time": "0:21:57", "throughput": 4247.3, "total_tokens": 19301368} {"current_steps": 29590, "total_steps": 38160, "loss": 0.3588, "lr": 0.0001459618267511128, "epoch": 15.5083857442348, "percentage": 77.54, "elapsed_time": "1:15:45", "remaining_time": "0:21:56", "throughput": 4247.38, "total_tokens": 19304952} {"current_steps": 29595, "total_steps": 38160, "loss": 0.49, "lr": 0.00014580038060901256, "epoch": 15.511006289308176, "percentage": 77.56, "elapsed_time": "1:15:45", "remaining_time": "0:21:55", "throughput": 4247.41, "total_tokens": 19308088} {"current_steps": 29600, "total_steps": 38160, "loss": 0.4128, "lr": 0.00014563900856143157, "epoch": 15.51362683438155, "percentage": 77.57, "elapsed_time": "1:15:46", "remaining_time": "0:21:54", "throughput": 4247.4, "total_tokens": 19310840} {"current_steps": 29605, "total_steps": 38160, "loss": 0.4632, "lr": 0.0001454777106421273, "epoch": 15.516247379454926, "percentage": 77.58, "elapsed_time": "1:15:47", "remaining_time": "0:21:54", "throughput": 4247.4, "total_tokens": 19313720} {"current_steps": 29610, "total_steps": 38160, "loss": 0.5195, "lr": 0.00014531648688484127, "epoch": 15.518867924528301, "percentage": 77.59, "elapsed_time": "1:15:48", "remaining_time": "0:21:53", "throughput": 4247.58, "total_tokens": 19318424} {"current_steps": 29615, "total_steps": 38160, "loss": 0.3347, "lr": 0.0001451553373233, "epoch": 15.521488469601676, "percentage": 77.61, "elapsed_time": "1:15:48", "remaining_time": "0:21:52", "throughput": 4247.7, "total_tokens": 19322488} {"current_steps": 29620, "total_steps": 38160, "loss": 0.6154, "lr": 0.00014499426199121379, "epoch": 15.524109014675052, "percentage": 77.62, "elapsed_time": "1:15:49", "remaining_time": "0:21:51", "throughput": 4247.73, "total_tokens": 19325592} {"current_steps": 29625, "total_steps": 38160, "loss": 0.453, "lr": 0.0001448332609222777, "epoch": 15.526729559748428, "percentage": 77.63, "elapsed_time": "1:15:50", "remaining_time": "0:21:50", "throughput": 4247.72, "total_tokens": 19328408} {"current_steps": 29630, "total_steps": 38160, "loss": 0.5547, "lr": 0.0001446723341501715, "epoch": 15.529350104821804, "percentage": 77.65, "elapsed_time": "1:15:50", "remaining_time": "0:21:50", "throughput": 4247.67, "total_tokens": 19330776} {"current_steps": 29635, "total_steps": 38160, "loss": 0.4228, "lr": 0.00014451148170855922, "epoch": 15.531970649895179, "percentage": 77.66, "elapsed_time": "1:15:51", "remaining_time": "0:21:49", "throughput": 4247.75, "total_tokens": 19334360} {"current_steps": 29640, "total_steps": 38160, "loss": 0.3782, "lr": 0.0001443507036310895, "epoch": 15.534591194968554, "percentage": 77.67, "elapsed_time": "1:15:52", "remaining_time": "0:21:48", "throughput": 4247.69, "total_tokens": 19336664} {"current_steps": 29645, "total_steps": 38160, "loss": 0.3817, "lr": 0.00014418999995139493, "epoch": 15.53721174004193, "percentage": 77.69, "elapsed_time": "1:15:52", "remaining_time": "0:21:47", "throughput": 4247.69, "total_tokens": 19339608} {"current_steps": 29650, "total_steps": 38160, "loss": 0.4162, "lr": 0.00014402937070309325, "epoch": 15.539832285115304, "percentage": 77.7, "elapsed_time": "1:15:53", "remaining_time": "0:21:46", "throughput": 4247.72, "total_tokens": 19342712} {"current_steps": 29655, "total_steps": 38160, "loss": 0.3923, "lr": 0.0001438688159197859, "epoch": 15.54245283018868, "percentage": 77.71, "elapsed_time": "1:15:54", "remaining_time": "0:21:46", "throughput": 4247.78, "total_tokens": 19346296} {"current_steps": 29660, "total_steps": 38160, "loss": 0.3106, "lr": 0.0001437083356350593, "epoch": 15.545073375262055, "percentage": 77.73, "elapsed_time": "1:15:55", "remaining_time": "0:21:45", "throughput": 4247.84, "total_tokens": 19349656} {"current_steps": 29665, "total_steps": 38160, "loss": 0.4044, "lr": 0.0001435479298824841, "epoch": 15.54769392033543, "percentage": 77.74, "elapsed_time": "1:15:55", "remaining_time": "0:21:44", "throughput": 4247.82, "total_tokens": 19352280} {"current_steps": 29670, "total_steps": 38160, "loss": 0.4575, "lr": 0.00014338759869561557, "epoch": 15.550314465408805, "percentage": 77.75, "elapsed_time": "1:15:56", "remaining_time": "0:21:43", "throughput": 4247.83, "total_tokens": 19355128} {"current_steps": 29675, "total_steps": 38160, "loss": 0.5723, "lr": 0.00014322734210799287, "epoch": 15.55293501048218, "percentage": 77.76, "elapsed_time": "1:15:57", "remaining_time": "0:21:43", "throughput": 4247.94, "total_tokens": 19359096} {"current_steps": 29680, "total_steps": 38160, "loss": 0.4145, "lr": 0.0001430671601531398, "epoch": 15.555555555555555, "percentage": 77.78, "elapsed_time": "1:15:57", "remaining_time": "0:21:42", "throughput": 4247.93, "total_tokens": 19361784} {"current_steps": 29685, "total_steps": 38160, "loss": 0.3651, "lr": 0.00014290705286456473, "epoch": 15.55817610062893, "percentage": 77.79, "elapsed_time": "1:15:58", "remaining_time": "0:21:41", "throughput": 4247.94, "total_tokens": 19364824} {"current_steps": 29690, "total_steps": 38160, "loss": 0.5448, "lr": 0.00014274702027576024, "epoch": 15.560796645702306, "percentage": 77.8, "elapsed_time": "1:15:59", "remaining_time": "0:21:40", "throughput": 4247.97, "total_tokens": 19368056} {"current_steps": 29695, "total_steps": 38160, "loss": 0.3964, "lr": 0.00014258706242020354, "epoch": 15.56341719077568, "percentage": 77.82, "elapsed_time": "1:16:00", "remaining_time": "0:21:39", "throughput": 4248.02, "total_tokens": 19371448} {"current_steps": 29700, "total_steps": 38160, "loss": 0.544, "lr": 0.00014242717933135558, "epoch": 15.566037735849056, "percentage": 77.83, "elapsed_time": "1:16:00", "remaining_time": "0:21:39", "throughput": 4248.12, "total_tokens": 19375448} {"current_steps": 29705, "total_steps": 38160, "loss": 0.4148, "lr": 0.0001422673710426625, "epoch": 15.568658280922431, "percentage": 77.84, "elapsed_time": "1:16:01", "remaining_time": "0:21:38", "throughput": 4248.21, "total_tokens": 19379256} {"current_steps": 29710, "total_steps": 38160, "loss": 0.4235, "lr": 0.00014210763758755403, "epoch": 15.571278825995806, "percentage": 77.86, "elapsed_time": "1:16:02", "remaining_time": "0:21:37", "throughput": 4248.3, "total_tokens": 19383032} {"current_steps": 29715, "total_steps": 38160, "loss": 0.4117, "lr": 0.00014194797899944468, "epoch": 15.573899371069182, "percentage": 77.87, "elapsed_time": "1:16:03", "remaining_time": "0:21:36", "throughput": 4248.48, "total_tokens": 19387640} {"current_steps": 29720, "total_steps": 38160, "loss": 0.4698, "lr": 0.00014178839531173344, "epoch": 15.576519916142558, "percentage": 77.88, "elapsed_time": "1:16:04", "remaining_time": "0:21:36", "throughput": 4248.42, "total_tokens": 19389944} {"current_steps": 29725, "total_steps": 38160, "loss": 0.4523, "lr": 0.00014162888655780303, "epoch": 15.579140461215934, "percentage": 77.9, "elapsed_time": "1:16:04", "remaining_time": "0:21:35", "throughput": 4248.49, "total_tokens": 19393464} {"current_steps": 29730, "total_steps": 38160, "loss": 0.3196, "lr": 0.00014146945277102108, "epoch": 15.581761006289309, "percentage": 77.91, "elapsed_time": "1:16:05", "remaining_time": "0:21:34", "throughput": 4248.44, "total_tokens": 19395864} {"current_steps": 29735, "total_steps": 38160, "loss": 0.4547, "lr": 0.00014131009398473938, "epoch": 15.584381551362684, "percentage": 77.92, "elapsed_time": "1:16:06", "remaining_time": "0:21:33", "throughput": 4248.43, "total_tokens": 19398552} {"current_steps": 29740, "total_steps": 38160, "loss": 0.3847, "lr": 0.00014115081023229376, "epoch": 15.58700209643606, "percentage": 77.94, "elapsed_time": "1:16:06", "remaining_time": "0:21:32", "throughput": 4248.46, "total_tokens": 19401688} {"current_steps": 29745, "total_steps": 38160, "loss": 0.3791, "lr": 0.00014099160154700462, "epoch": 15.589622641509434, "percentage": 77.95, "elapsed_time": "1:16:07", "remaining_time": "0:21:32", "throughput": 4248.45, "total_tokens": 19404472} {"current_steps": 29750, "total_steps": 38160, "loss": 0.4237, "lr": 0.00014083246796217684, "epoch": 15.59224318658281, "percentage": 77.96, "elapsed_time": "1:16:08", "remaining_time": "0:21:31", "throughput": 4248.47, "total_tokens": 19407544} {"current_steps": 29755, "total_steps": 38160, "loss": 0.4341, "lr": 0.00014067340951109898, "epoch": 15.594863731656185, "percentage": 77.97, "elapsed_time": "1:16:08", "remaining_time": "0:21:30", "throughput": 4248.48, "total_tokens": 19410488} {"current_steps": 29760, "total_steps": 38160, "loss": 0.5962, "lr": 0.00014051442622704447, "epoch": 15.59748427672956, "percentage": 77.99, "elapsed_time": "1:16:09", "remaining_time": "0:21:29", "throughput": 4248.57, "total_tokens": 19414360} {"current_steps": 29765, "total_steps": 38160, "loss": 0.4197, "lr": 0.0001403555181432709, "epoch": 15.600104821802935, "percentage": 78.0, "elapsed_time": "1:16:10", "remaining_time": "0:21:29", "throughput": 4248.65, "total_tokens": 19418072} {"current_steps": 29770, "total_steps": 38160, "loss": 0.4136, "lr": 0.00014019668529301977, "epoch": 15.60272536687631, "percentage": 78.01, "elapsed_time": "1:16:11", "remaining_time": "0:21:28", "throughput": 4248.66, "total_tokens": 19421016} {"current_steps": 29775, "total_steps": 38160, "loss": 0.4794, "lr": 0.00014003792770951733, "epoch": 15.605345911949685, "percentage": 78.03, "elapsed_time": "1:16:11", "remaining_time": "0:21:27", "throughput": 4248.74, "total_tokens": 19424568} {"current_steps": 29780, "total_steps": 38160, "loss": 0.4373, "lr": 0.00013987924542597363, "epoch": 15.60796645702306, "percentage": 78.04, "elapsed_time": "1:16:12", "remaining_time": "0:21:26", "throughput": 4248.73, "total_tokens": 19427352} {"current_steps": 29785, "total_steps": 38160, "loss": 0.3717, "lr": 0.0001397206384755833, "epoch": 15.610587002096436, "percentage": 78.05, "elapsed_time": "1:16:13", "remaining_time": "0:21:25", "throughput": 4248.75, "total_tokens": 19430328} {"current_steps": 29790, "total_steps": 38160, "loss": 0.3413, "lr": 0.00013956210689152526, "epoch": 15.61320754716981, "percentage": 78.07, "elapsed_time": "1:16:13", "remaining_time": "0:21:25", "throughput": 4248.81, "total_tokens": 19433848} {"current_steps": 29795, "total_steps": 38160, "loss": 0.4863, "lr": 0.0001394036507069622, "epoch": 15.615828092243186, "percentage": 78.08, "elapsed_time": "1:16:14", "remaining_time": "0:21:24", "throughput": 4248.83, "total_tokens": 19436888} {"current_steps": 29800, "total_steps": 38160, "loss": 0.5428, "lr": 0.00013924526995504172, "epoch": 15.618448637316561, "percentage": 78.09, "elapsed_time": "1:16:15", "remaining_time": "0:21:23", "throughput": 4248.97, "total_tokens": 19441176} {"current_steps": 29805, "total_steps": 38160, "loss": 0.4256, "lr": 0.00013908696466889486, "epoch": 15.621069182389936, "percentage": 78.11, "elapsed_time": "1:16:16", "remaining_time": "0:21:22", "throughput": 4249.04, "total_tokens": 19444664} {"current_steps": 29810, "total_steps": 38160, "loss": 0.4056, "lr": 0.0001389287348816375, "epoch": 15.623689727463312, "percentage": 78.12, "elapsed_time": "1:16:16", "remaining_time": "0:21:22", "throughput": 4249.06, "total_tokens": 19447736} {"current_steps": 29815, "total_steps": 38160, "loss": 0.4536, "lr": 0.00013877058062636944, "epoch": 15.626310272536688, "percentage": 78.13, "elapsed_time": "1:16:17", "remaining_time": "0:21:21", "throughput": 4249.13, "total_tokens": 19451384} {"current_steps": 29820, "total_steps": 38160, "loss": 0.4234, "lr": 0.00013861250193617498, "epoch": 15.628930817610064, "percentage": 78.14, "elapsed_time": "1:16:18", "remaining_time": "0:21:20", "throughput": 4249.16, "total_tokens": 19454552} {"current_steps": 29825, "total_steps": 38160, "loss": 0.3785, "lr": 0.00013845449884412203, "epoch": 15.631551362683439, "percentage": 78.16, "elapsed_time": "1:16:19", "remaining_time": "0:21:19", "throughput": 4249.15, "total_tokens": 19457336} {"current_steps": 29830, "total_steps": 38160, "loss": 0.4393, "lr": 0.00013829657138326334, "epoch": 15.634171907756814, "percentage": 78.17, "elapsed_time": "1:16:19", "remaining_time": "0:21:18", "throughput": 4249.16, "total_tokens": 19460344} {"current_steps": 29835, "total_steps": 38160, "loss": 0.4828, "lr": 0.00013813871958663526, "epoch": 15.63679245283019, "percentage": 78.18, "elapsed_time": "1:16:20", "remaining_time": "0:21:18", "throughput": 4249.1, "total_tokens": 19462744} {"current_steps": 29840, "total_steps": 38160, "loss": 0.4212, "lr": 0.0001379809434872587, "epoch": 15.639412997903564, "percentage": 78.2, "elapsed_time": "1:16:21", "remaining_time": "0:21:17", "throughput": 4249.14, "total_tokens": 19465880} {"current_steps": 29845, "total_steps": 38160, "loss": 0.4901, "lr": 0.0001378232431181386, "epoch": 15.64203354297694, "percentage": 78.21, "elapsed_time": "1:16:21", "remaining_time": "0:21:16", "throughput": 4249.12, "total_tokens": 19468632} {"current_steps": 29850, "total_steps": 38160, "loss": 0.4199, "lr": 0.00013766561851226428, "epoch": 15.644654088050315, "percentage": 78.22, "elapsed_time": "1:16:22", "remaining_time": "0:21:15", "throughput": 4249.13, "total_tokens": 19471736} {"current_steps": 29855, "total_steps": 38160, "loss": 0.3944, "lr": 0.00013750806970260886, "epoch": 15.64727463312369, "percentage": 78.24, "elapsed_time": "1:16:23", "remaining_time": "0:21:14", "throughput": 4249.12, "total_tokens": 19474424} {"current_steps": 29860, "total_steps": 38160, "loss": 0.3601, "lr": 0.00013735059672212959, "epoch": 15.649895178197065, "percentage": 78.25, "elapsed_time": "1:16:23", "remaining_time": "0:21:14", "throughput": 4249.12, "total_tokens": 19477400} {"current_steps": 29865, "total_steps": 38160, "loss": 0.4007, "lr": 0.00013719319960376808, "epoch": 15.65251572327044, "percentage": 78.26, "elapsed_time": "1:16:24", "remaining_time": "0:21:13", "throughput": 4249.1, "total_tokens": 19480024} {"current_steps": 29870, "total_steps": 38160, "loss": 0.449, "lr": 0.00013703587838045017, "epoch": 15.655136268343815, "percentage": 78.28, "elapsed_time": "1:16:25", "remaining_time": "0:21:12", "throughput": 4249.12, "total_tokens": 19483256} {"current_steps": 29875, "total_steps": 38160, "loss": 0.3758, "lr": 0.00013687863308508568, "epoch": 15.65775681341719, "percentage": 78.29, "elapsed_time": "1:16:25", "remaining_time": "0:21:11", "throughput": 4249.15, "total_tokens": 19486392} {"current_steps": 29880, "total_steps": 38160, "loss": 0.4031, "lr": 0.00013672146375056849, "epoch": 15.660377358490566, "percentage": 78.3, "elapsed_time": "1:16:26", "remaining_time": "0:21:10", "throughput": 4249.17, "total_tokens": 19489464} {"current_steps": 29885, "total_steps": 38160, "loss": 0.4179, "lr": 0.00013656437040977643, "epoch": 15.66299790356394, "percentage": 78.31, "elapsed_time": "1:16:27", "remaining_time": "0:21:10", "throughput": 4249.23, "total_tokens": 19492952} {"current_steps": 29890, "total_steps": 38160, "loss": 0.4969, "lr": 0.00013640735309557178, "epoch": 15.665618448637316, "percentage": 78.33, "elapsed_time": "1:16:28", "remaining_time": "0:21:09", "throughput": 4249.24, "total_tokens": 19495928} {"current_steps": 29895, "total_steps": 38160, "loss": 0.4177, "lr": 0.00013625041184080078, "epoch": 15.668238993710691, "percentage": 78.34, "elapsed_time": "1:16:28", "remaining_time": "0:21:08", "throughput": 4249.34, "total_tokens": 19499800} {"current_steps": 29900, "total_steps": 38160, "loss": 0.3613, "lr": 0.00013609354667829378, "epoch": 15.670859538784066, "percentage": 78.35, "elapsed_time": "1:16:29", "remaining_time": "0:21:07", "throughput": 4249.52, "total_tokens": 19504408} {"current_steps": 29905, "total_steps": 38160, "loss": 0.3516, "lr": 0.00013593675764086521, "epoch": 15.673480083857442, "percentage": 78.37, "elapsed_time": "1:16:30", "remaining_time": "0:21:07", "throughput": 4249.55, "total_tokens": 19507576} {"current_steps": 29910, "total_steps": 38160, "loss": 0.6138, "lr": 0.00013578004476131356, "epoch": 15.676100628930818, "percentage": 78.38, "elapsed_time": "1:16:31", "remaining_time": "0:21:06", "throughput": 4249.58, "total_tokens": 19510712} {"current_steps": 29915, "total_steps": 38160, "loss": 0.344, "lr": 0.00013562340807242112, "epoch": 15.678721174004194, "percentage": 78.39, "elapsed_time": "1:16:31", "remaining_time": "0:21:05", "throughput": 4249.64, "total_tokens": 19514168} {"current_steps": 29920, "total_steps": 38160, "loss": 0.3582, "lr": 0.00013546684760695472, "epoch": 15.681341719077569, "percentage": 78.41, "elapsed_time": "1:16:32", "remaining_time": "0:21:04", "throughput": 4249.66, "total_tokens": 19517304} {"current_steps": 29925, "total_steps": 38160, "loss": 0.4013, "lr": 0.00013531036339766494, "epoch": 15.683962264150944, "percentage": 78.42, "elapsed_time": "1:16:33", "remaining_time": "0:21:04", "throughput": 4249.69, "total_tokens": 19520504} {"current_steps": 29930, "total_steps": 38160, "loss": 0.3786, "lr": 0.00013515395547728675, "epoch": 15.68658280922432, "percentage": 78.43, "elapsed_time": "1:16:34", "remaining_time": "0:21:03", "throughput": 4250.02, "total_tokens": 19527000} {"current_steps": 29935, "total_steps": 38160, "loss": 0.4399, "lr": 0.00013499762387853866, "epoch": 15.689203354297694, "percentage": 78.45, "elapsed_time": "1:16:35", "remaining_time": "0:21:02", "throughput": 4250.03, "total_tokens": 19530008} {"current_steps": 29940, "total_steps": 38160, "loss": 0.3225, "lr": 0.00013484136863412333, "epoch": 15.69182389937107, "percentage": 78.46, "elapsed_time": "1:16:35", "remaining_time": "0:21:01", "throughput": 4250.06, "total_tokens": 19533208} {"current_steps": 29945, "total_steps": 38160, "loss": 0.6403, "lr": 0.00013468518977672773, "epoch": 15.694444444444445, "percentage": 78.47, "elapsed_time": "1:16:36", "remaining_time": "0:21:01", "throughput": 4250.09, "total_tokens": 19536248} {"current_steps": 29950, "total_steps": 38160, "loss": 0.3863, "lr": 0.0001345290873390227, "epoch": 15.69706498951782, "percentage": 78.49, "elapsed_time": "1:16:37", "remaining_time": "0:21:00", "throughput": 4250.12, "total_tokens": 19539480} {"current_steps": 29955, "total_steps": 38160, "loss": 0.4757, "lr": 0.00013437306135366322, "epoch": 15.699685534591195, "percentage": 78.5, "elapsed_time": "1:16:38", "remaining_time": "0:20:59", "throughput": 4250.15, "total_tokens": 19542584} {"current_steps": 29960, "total_steps": 38160, "loss": 0.5484, "lr": 0.00013421711185328806, "epoch": 15.70230607966457, "percentage": 78.51, "elapsed_time": "1:16:38", "remaining_time": "0:20:58", "throughput": 4250.23, "total_tokens": 19546296} {"current_steps": 29965, "total_steps": 38160, "loss": 0.4585, "lr": 0.00013406123887051984, "epoch": 15.704926624737945, "percentage": 78.52, "elapsed_time": "1:16:39", "remaining_time": "0:20:57", "throughput": 4250.25, "total_tokens": 19549400} {"current_steps": 29970, "total_steps": 38160, "loss": 0.4628, "lr": 0.0001339054424379656, "epoch": 15.70754716981132, "percentage": 78.54, "elapsed_time": "1:16:40", "remaining_time": "0:20:57", "throughput": 4250.32, "total_tokens": 19552984} {"current_steps": 29975, "total_steps": 38160, "loss": 0.5381, "lr": 0.00013374972258821621, "epoch": 15.710167714884696, "percentage": 78.55, "elapsed_time": "1:16:40", "remaining_time": "0:20:56", "throughput": 4250.29, "total_tokens": 19555448} {"current_steps": 29980, "total_steps": 38160, "loss": 0.3856, "lr": 0.00013359407935384642, "epoch": 15.71278825995807, "percentage": 78.56, "elapsed_time": "1:16:41", "remaining_time": "0:20:55", "throughput": 4250.27, "total_tokens": 19558136} {"current_steps": 29985, "total_steps": 38160, "loss": 0.3508, "lr": 0.0001334385127674152, "epoch": 15.715408805031446, "percentage": 78.58, "elapsed_time": "1:16:42", "remaining_time": "0:20:54", "throughput": 4250.25, "total_tokens": 19560824} {"current_steps": 29990, "total_steps": 38160, "loss": 0.3116, "lr": 0.00013328302286146515, "epoch": 15.718029350104821, "percentage": 78.59, "elapsed_time": "1:16:43", "remaining_time": "0:20:53", "throughput": 4250.33, "total_tokens": 19564472} {"current_steps": 29995, "total_steps": 38160, "loss": 0.5351, "lr": 0.00013312760966852283, "epoch": 15.720649895178196, "percentage": 78.6, "elapsed_time": "1:16:43", "remaining_time": "0:20:53", "throughput": 4250.39, "total_tokens": 19567960} {"current_steps": 30000, "total_steps": 38160, "loss": 0.4008, "lr": 0.00013297227322109912, "epoch": 15.723270440251572, "percentage": 78.62, "elapsed_time": "1:16:44", "remaining_time": "0:20:52", "throughput": 4250.36, "total_tokens": 19570616} {"current_steps": 30005, "total_steps": 38160, "loss": 0.5636, "lr": 0.00013281701355168852, "epoch": 15.725890985324948, "percentage": 78.63, "elapsed_time": "1:16:45", "remaining_time": "0:20:51", "throughput": 4250.39, "total_tokens": 19573816} {"current_steps": 30010, "total_steps": 38160, "loss": 0.4705, "lr": 0.00013266183069276982, "epoch": 15.728511530398324, "percentage": 78.64, "elapsed_time": "1:16:45", "remaining_time": "0:20:50", "throughput": 4250.45, "total_tokens": 19577272} {"current_steps": 30015, "total_steps": 38160, "loss": 0.3418, "lr": 0.00013250672467680514, "epoch": 15.731132075471699, "percentage": 78.66, "elapsed_time": "1:16:46", "remaining_time": "0:20:50", "throughput": 4250.47, "total_tokens": 19580408} {"current_steps": 30020, "total_steps": 38160, "loss": 0.4097, "lr": 0.00013235169553624127, "epoch": 15.733752620545074, "percentage": 78.67, "elapsed_time": "1:16:47", "remaining_time": "0:20:49", "throughput": 4250.51, "total_tokens": 19583640} {"current_steps": 30025, "total_steps": 38160, "loss": 0.3944, "lr": 0.00013219674330350816, "epoch": 15.73637316561845, "percentage": 78.68, "elapsed_time": "1:16:48", "remaining_time": "0:20:48", "throughput": 4250.58, "total_tokens": 19587128} {"current_steps": 30030, "total_steps": 38160, "loss": 0.4226, "lr": 0.00013204186801102024, "epoch": 15.738993710691824, "percentage": 78.69, "elapsed_time": "1:16:48", "remaining_time": "0:20:47", "throughput": 4250.64, "total_tokens": 19590584} {"current_steps": 30035, "total_steps": 38160, "loss": 0.4225, "lr": 0.0001318870696911758, "epoch": 15.7416142557652, "percentage": 78.71, "elapsed_time": "1:16:49", "remaining_time": "0:20:46", "throughput": 4250.73, "total_tokens": 19594264} {"current_steps": 30040, "total_steps": 38160, "loss": 0.4624, "lr": 0.00013173234837635656, "epoch": 15.744234800838575, "percentage": 78.72, "elapsed_time": "1:16:50", "remaining_time": "0:20:46", "throughput": 4250.73, "total_tokens": 19597176} {"current_steps": 30045, "total_steps": 38160, "loss": 0.5331, "lr": 0.00013157770409892878, "epoch": 15.74685534591195, "percentage": 78.73, "elapsed_time": "1:16:50", "remaining_time": "0:20:45", "throughput": 4250.72, "total_tokens": 19599896} {"current_steps": 30050, "total_steps": 38160, "loss": 0.4131, "lr": 0.00013142313689124197, "epoch": 15.749475890985325, "percentage": 78.75, "elapsed_time": "1:16:51", "remaining_time": "0:20:44", "throughput": 4250.72, "total_tokens": 19602904} {"current_steps": 30055, "total_steps": 38160, "loss": 0.4576, "lr": 0.00013126864678562994, "epoch": 15.7520964360587, "percentage": 78.76, "elapsed_time": "1:16:52", "remaining_time": "0:20:43", "throughput": 4250.79, "total_tokens": 19606456} {"current_steps": 30060, "total_steps": 38160, "loss": 0.3397, "lr": 0.00013111423381441034, "epoch": 15.754716981132075, "percentage": 78.77, "elapsed_time": "1:16:53", "remaining_time": "0:20:43", "throughput": 4250.78, "total_tokens": 19609304} {"current_steps": 30065, "total_steps": 38160, "loss": 0.4078, "lr": 0.00013095989800988468, "epoch": 15.75733752620545, "percentage": 78.79, "elapsed_time": "1:16:53", "remaining_time": "0:20:42", "throughput": 4250.89, "total_tokens": 19613304} {"current_steps": 30070, "total_steps": 38160, "loss": 0.4266, "lr": 0.000130805639404338, "epoch": 15.759958071278826, "percentage": 78.8, "elapsed_time": "1:16:54", "remaining_time": "0:20:41", "throughput": 4250.97, "total_tokens": 19616952} {"current_steps": 30075, "total_steps": 38160, "loss": 0.3883, "lr": 0.0001306514580300397, "epoch": 15.7625786163522, "percentage": 78.81, "elapsed_time": "1:16:55", "remaining_time": "0:20:40", "throughput": 4250.99, "total_tokens": 19620056} {"current_steps": 30080, "total_steps": 38160, "loss": 0.3649, "lr": 0.00013049735391924244, "epoch": 15.765199161425576, "percentage": 78.83, "elapsed_time": "1:16:56", "remaining_time": "0:20:39", "throughput": 4251.02, "total_tokens": 19623096} {"current_steps": 30085, "total_steps": 38160, "loss": 0.6299, "lr": 0.00013034332710418328, "epoch": 15.767819706498951, "percentage": 78.84, "elapsed_time": "1:16:56", "remaining_time": "0:20:39", "throughput": 4250.98, "total_tokens": 19625624} {"current_steps": 30090, "total_steps": 38160, "loss": 0.4441, "lr": 0.00013018937761708298, "epoch": 15.770440251572326, "percentage": 78.85, "elapsed_time": "1:16:57", "remaining_time": "0:20:38", "throughput": 4250.96, "total_tokens": 19628312} {"current_steps": 30095, "total_steps": 38160, "loss": 0.3688, "lr": 0.0001300355054901457, "epoch": 15.773060796645701, "percentage": 78.87, "elapsed_time": "1:16:58", "remaining_time": "0:20:37", "throughput": 4251.04, "total_tokens": 19632056} {"current_steps": 30100, "total_steps": 38160, "loss": 0.4152, "lr": 0.0001298817107555599, "epoch": 15.775681341719078, "percentage": 78.88, "elapsed_time": "1:16:59", "remaining_time": "0:20:36", "throughput": 4251.29, "total_tokens": 19637560} {"current_steps": 30105, "total_steps": 38160, "loss": 0.4423, "lr": 0.0001297279934454978, "epoch": 15.778301886792454, "percentage": 78.89, "elapsed_time": "1:16:59", "remaining_time": "0:20:36", "throughput": 4251.31, "total_tokens": 19640600} {"current_steps": 30110, "total_steps": 38160, "loss": 0.4034, "lr": 0.000129574353592115, "epoch": 15.780922431865829, "percentage": 78.9, "elapsed_time": "1:17:00", "remaining_time": "0:20:35", "throughput": 4251.32, "total_tokens": 19643608} {"current_steps": 30115, "total_steps": 38160, "loss": 0.5074, "lr": 0.00012942079122755162, "epoch": 15.783542976939204, "percentage": 78.92, "elapsed_time": "1:17:01", "remaining_time": "0:20:34", "throughput": 4251.28, "total_tokens": 19646040} {"current_steps": 30120, "total_steps": 38160, "loss": 0.4496, "lr": 0.00012926730638393075, "epoch": 15.786163522012579, "percentage": 78.93, "elapsed_time": "1:17:01", "remaining_time": "0:20:33", "throughput": 4251.25, "total_tokens": 19648600} {"current_steps": 30125, "total_steps": 38160, "loss": 0.3166, "lr": 0.0001291138990933598, "epoch": 15.788784067085954, "percentage": 78.94, "elapsed_time": "1:17:02", "remaining_time": "0:20:32", "throughput": 4251.33, "total_tokens": 19652280} {"current_steps": 30130, "total_steps": 38160, "loss": 0.4502, "lr": 0.00012896056938792994, "epoch": 15.79140461215933, "percentage": 78.96, "elapsed_time": "1:17:03", "remaining_time": "0:20:32", "throughput": 4251.38, "total_tokens": 19655736} {"current_steps": 30135, "total_steps": 38160, "loss": 0.4979, "lr": 0.000128807317299716, "epoch": 15.794025157232705, "percentage": 78.97, "elapsed_time": "1:17:04", "remaining_time": "0:20:31", "throughput": 4251.36, "total_tokens": 19658456} {"current_steps": 30140, "total_steps": 38160, "loss": 0.4034, "lr": 0.00012865414286077637, "epoch": 15.79664570230608, "percentage": 78.98, "elapsed_time": "1:17:04", "remaining_time": "0:20:30", "throughput": 4251.4, "total_tokens": 19661688} {"current_steps": 30145, "total_steps": 38160, "loss": 0.4492, "lr": 0.00012850104610315365, "epoch": 15.799266247379455, "percentage": 79.0, "elapsed_time": "1:17:05", "remaining_time": "0:20:29", "throughput": 4251.49, "total_tokens": 19665400} {"current_steps": 30150, "total_steps": 38160, "loss": 0.4033, "lr": 0.00012834802705887372, "epoch": 15.80188679245283, "percentage": 79.01, "elapsed_time": "1:17:06", "remaining_time": "0:20:29", "throughput": 4251.52, "total_tokens": 19668472} {"current_steps": 30155, "total_steps": 38160, "loss": 0.3303, "lr": 0.00012819508575994643, "epoch": 15.804507337526205, "percentage": 79.02, "elapsed_time": "1:17:06", "remaining_time": "0:20:28", "throughput": 4251.59, "total_tokens": 19672088} {"current_steps": 30160, "total_steps": 38160, "loss": 0.4049, "lr": 0.0001280422222383656, "epoch": 15.80712788259958, "percentage": 79.04, "elapsed_time": "1:17:07", "remaining_time": "0:20:27", "throughput": 4251.68, "total_tokens": 19675864} {"current_steps": 30165, "total_steps": 38160, "loss": 0.3846, "lr": 0.00012788943652610818, "epoch": 15.809748427672956, "percentage": 79.05, "elapsed_time": "1:17:08", "remaining_time": "0:20:26", "throughput": 4251.83, "total_tokens": 19680216} {"current_steps": 30170, "total_steps": 38160, "loss": 0.5586, "lr": 0.0001277367286551356, "epoch": 15.81236897274633, "percentage": 79.06, "elapsed_time": "1:17:09", "remaining_time": "0:20:26", "throughput": 4251.86, "total_tokens": 19683480} {"current_steps": 30175, "total_steps": 38160, "loss": 0.5224, "lr": 0.00012758409865739213, "epoch": 15.814989517819706, "percentage": 79.07, "elapsed_time": "1:17:10", "remaining_time": "0:20:25", "throughput": 4251.94, "total_tokens": 19687160} {"current_steps": 30180, "total_steps": 38160, "loss": 0.5075, "lr": 0.00012743154656480655, "epoch": 15.817610062893081, "percentage": 79.09, "elapsed_time": "1:17:10", "remaining_time": "0:20:24", "throughput": 4251.98, "total_tokens": 19690424} {"current_steps": 30185, "total_steps": 38160, "loss": 0.414, "lr": 0.00012727907240929094, "epoch": 15.820230607966456, "percentage": 79.1, "elapsed_time": "1:17:11", "remaining_time": "0:20:23", "throughput": 4252.01, "total_tokens": 19693656} {"current_steps": 30190, "total_steps": 38160, "loss": 0.5463, "lr": 0.00012712667622274127, "epoch": 15.822851153039831, "percentage": 79.11, "elapsed_time": "1:17:12", "remaining_time": "0:20:22", "throughput": 4252.04, "total_tokens": 19696920} {"current_steps": 30195, "total_steps": 38160, "loss": 0.3071, "lr": 0.000126974358037037, "epoch": 15.825471698113208, "percentage": 79.13, "elapsed_time": "1:17:13", "remaining_time": "0:20:22", "throughput": 4252.06, "total_tokens": 19700088} {"current_steps": 30200, "total_steps": 38160, "loss": 0.3957, "lr": 0.00012682211788404114, "epoch": 15.828092243186584, "percentage": 79.14, "elapsed_time": "1:17:13", "remaining_time": "0:20:21", "throughput": 4252.1, "total_tokens": 19703320} {"current_steps": 30205, "total_steps": 38160, "loss": 0.4318, "lr": 0.0001266699557956008, "epoch": 15.830712788259959, "percentage": 79.15, "elapsed_time": "1:17:14", "remaining_time": "0:20:20", "throughput": 4252.09, "total_tokens": 19706168} {"current_steps": 30210, "total_steps": 38160, "loss": 0.3359, "lr": 0.00012651787180354657, "epoch": 15.833333333333334, "percentage": 79.17, "elapsed_time": "1:17:15", "remaining_time": "0:20:19", "throughput": 4252.09, "total_tokens": 19708984} {"current_steps": 30215, "total_steps": 38160, "loss": 0.4321, "lr": 0.00012636586593969262, "epoch": 15.835953878406709, "percentage": 79.18, "elapsed_time": "1:17:15", "remaining_time": "0:20:18", "throughput": 4252.1, "total_tokens": 19711928} {"current_steps": 30220, "total_steps": 38160, "loss": 0.4331, "lr": 0.000126213938235837, "epoch": 15.838574423480084, "percentage": 79.19, "elapsed_time": "1:17:16", "remaining_time": "0:20:18", "throughput": 4252.18, "total_tokens": 19715640} {"current_steps": 30225, "total_steps": 38160, "loss": 0.3873, "lr": 0.0001260620887237611, "epoch": 15.84119496855346, "percentage": 79.21, "elapsed_time": "1:17:17", "remaining_time": "0:20:17", "throughput": 4252.2, "total_tokens": 19718616} {"current_steps": 30230, "total_steps": 38160, "loss": 0.3962, "lr": 0.00012591031743523006, "epoch": 15.843815513626835, "percentage": 79.22, "elapsed_time": "1:17:17", "remaining_time": "0:20:16", "throughput": 4252.22, "total_tokens": 19721688} {"current_steps": 30235, "total_steps": 38160, "loss": 0.4294, "lr": 0.00012575862440199277, "epoch": 15.84643605870021, "percentage": 79.23, "elapsed_time": "1:17:18", "remaining_time": "0:20:15", "throughput": 4252.29, "total_tokens": 19725272} {"current_steps": 30240, "total_steps": 38160, "loss": 0.3444, "lr": 0.00012560700965578165, "epoch": 15.849056603773585, "percentage": 79.25, "elapsed_time": "1:17:19", "remaining_time": "0:20:15", "throughput": 4252.27, "total_tokens": 19727960} {"current_steps": 30245, "total_steps": 38160, "loss": 0.4998, "lr": 0.0001254554732283129, "epoch": 15.85167714884696, "percentage": 79.26, "elapsed_time": "1:17:20", "remaining_time": "0:20:14", "throughput": 4252.28, "total_tokens": 19730904} {"current_steps": 30250, "total_steps": 38160, "loss": 0.5072, "lr": 0.0001253040151512862, "epoch": 15.854297693920335, "percentage": 79.27, "elapsed_time": "1:17:20", "remaining_time": "0:20:13", "throughput": 4252.35, "total_tokens": 19734552} {"current_steps": 30255, "total_steps": 38160, "loss": 0.3913, "lr": 0.0001251526354563846, "epoch": 15.85691823899371, "percentage": 79.28, "elapsed_time": "1:17:21", "remaining_time": "0:20:12", "throughput": 4252.34, "total_tokens": 19737400} {"current_steps": 30260, "total_steps": 38160, "loss": 0.39, "lr": 0.0001250013341752752, "epoch": 15.859538784067086, "percentage": 79.3, "elapsed_time": "1:17:22", "remaining_time": "0:20:11", "throughput": 4252.4, "total_tokens": 19740792} {"current_steps": 30265, "total_steps": 38160, "loss": 0.4468, "lr": 0.00012485011133960843, "epoch": 15.86215932914046, "percentage": 79.31, "elapsed_time": "1:17:23", "remaining_time": "0:20:11", "throughput": 4252.45, "total_tokens": 19744248} {"current_steps": 30270, "total_steps": 38160, "loss": 0.3047, "lr": 0.00012469896698101863, "epoch": 15.864779874213836, "percentage": 79.32, "elapsed_time": "1:17:23", "remaining_time": "0:20:10", "throughput": 4252.41, "total_tokens": 19746744} {"current_steps": 30275, "total_steps": 38160, "loss": 0.4376, "lr": 0.00012454790113112325, "epoch": 15.867400419287211, "percentage": 79.34, "elapsed_time": "1:17:24", "remaining_time": "0:20:09", "throughput": 4252.42, "total_tokens": 19749688} {"current_steps": 30280, "total_steps": 38160, "loss": 0.3633, "lr": 0.00012439691382152345, "epoch": 15.870020964360586, "percentage": 79.35, "elapsed_time": "1:17:25", "remaining_time": "0:20:08", "throughput": 4252.49, "total_tokens": 19753208} {"current_steps": 30285, "total_steps": 38160, "loss": 0.4952, "lr": 0.00012424600508380412, "epoch": 15.872641509433961, "percentage": 79.36, "elapsed_time": "1:17:25", "remaining_time": "0:20:08", "throughput": 4252.54, "total_tokens": 19756568} {"current_steps": 30290, "total_steps": 38160, "loss": 0.4182, "lr": 0.00012409517494953377, "epoch": 15.875262054507338, "percentage": 79.38, "elapsed_time": "1:17:26", "remaining_time": "0:20:07", "throughput": 4252.55, "total_tokens": 19759576} {"current_steps": 30295, "total_steps": 38160, "loss": 0.3334, "lr": 0.00012394442345026418, "epoch": 15.877882599580714, "percentage": 79.39, "elapsed_time": "1:17:27", "remaining_time": "0:20:06", "throughput": 4252.68, "total_tokens": 19763608} {"current_steps": 30300, "total_steps": 38160, "loss": 0.6235, "lr": 0.00012379375061753118, "epoch": 15.880503144654089, "percentage": 79.4, "elapsed_time": "1:17:28", "remaining_time": "0:20:05", "throughput": 4252.71, "total_tokens": 19766808} {"current_steps": 30305, "total_steps": 38160, "loss": 0.3229, "lr": 0.00012364315648285353, "epoch": 15.883123689727464, "percentage": 79.42, "elapsed_time": "1:17:28", "remaining_time": "0:20:04", "throughput": 4252.71, "total_tokens": 19769752} {"current_steps": 30310, "total_steps": 38160, "loss": 0.5912, "lr": 0.00012349264107773363, "epoch": 15.885744234800839, "percentage": 79.43, "elapsed_time": "1:17:29", "remaining_time": "0:20:04", "throughput": 4252.74, "total_tokens": 19772920} {"current_steps": 30315, "total_steps": 38160, "loss": 0.4032, "lr": 0.00012334220443365785, "epoch": 15.888364779874214, "percentage": 79.44, "elapsed_time": "1:17:30", "remaining_time": "0:20:03", "throughput": 4252.72, "total_tokens": 19775512} {"current_steps": 30320, "total_steps": 38160, "loss": 0.5166, "lr": 0.00012319184658209575, "epoch": 15.89098532494759, "percentage": 79.45, "elapsed_time": "1:17:30", "remaining_time": "0:20:02", "throughput": 4252.77, "total_tokens": 19778968} {"current_steps": 30325, "total_steps": 38160, "loss": 0.3613, "lr": 0.00012304156755450063, "epoch": 15.893605870020965, "percentage": 79.47, "elapsed_time": "1:17:31", "remaining_time": "0:20:01", "throughput": 4252.75, "total_tokens": 19781656} {"current_steps": 30330, "total_steps": 38160, "loss": 0.472, "lr": 0.00012289136738230906, "epoch": 15.89622641509434, "percentage": 79.48, "elapsed_time": "1:17:32", "remaining_time": "0:20:01", "throughput": 4252.8, "total_tokens": 19785112} {"current_steps": 30335, "total_steps": 38160, "loss": 0.4482, "lr": 0.00012274124609694092, "epoch": 15.898846960167715, "percentage": 79.49, "elapsed_time": "1:17:32", "remaining_time": "0:20:00", "throughput": 4252.81, "total_tokens": 19788088} {"current_steps": 30340, "total_steps": 38160, "loss": 0.3019, "lr": 0.00012259120372980014, "epoch": 15.90146750524109, "percentage": 79.51, "elapsed_time": "1:17:33", "remaining_time": "0:19:59", "throughput": 4252.85, "total_tokens": 19791352} {"current_steps": 30345, "total_steps": 38160, "loss": 0.4165, "lr": 0.0001224412403122739, "epoch": 15.904088050314465, "percentage": 79.52, "elapsed_time": "1:17:34", "remaining_time": "0:19:58", "throughput": 4252.95, "total_tokens": 19795288} {"current_steps": 30350, "total_steps": 38160, "loss": 0.4378, "lr": 0.0001222913558757328, "epoch": 15.90670859538784, "percentage": 79.53, "elapsed_time": "1:17:35", "remaining_time": "0:19:57", "throughput": 4252.96, "total_tokens": 19798328} {"current_steps": 30355, "total_steps": 38160, "loss": 0.3209, "lr": 0.00012214155045153085, "epoch": 15.909329140461216, "percentage": 79.55, "elapsed_time": "1:17:35", "remaining_time": "0:19:57", "throughput": 4252.98, "total_tokens": 19801432} {"current_steps": 30360, "total_steps": 38160, "loss": 0.5068, "lr": 0.00012199182407100584, "epoch": 15.91194968553459, "percentage": 79.56, "elapsed_time": "1:17:36", "remaining_time": "0:19:56", "throughput": 4252.98, "total_tokens": 19804280} {"current_steps": 30365, "total_steps": 38160, "loss": 0.3706, "lr": 0.00012184217676547855, "epoch": 15.914570230607966, "percentage": 79.57, "elapsed_time": "1:17:37", "remaining_time": "0:19:55", "throughput": 4253.04, "total_tokens": 19807768} {"current_steps": 30370, "total_steps": 38160, "loss": 0.41, "lr": 0.00012169260856625358, "epoch": 15.917190775681341, "percentage": 79.59, "elapsed_time": "1:17:38", "remaining_time": "0:19:54", "throughput": 4253.03, "total_tokens": 19810616} {"current_steps": 30375, "total_steps": 38160, "loss": 0.364, "lr": 0.000121543119504619, "epoch": 15.919811320754716, "percentage": 79.6, "elapsed_time": "1:17:39", "remaining_time": "0:19:54", "throughput": 4253.28, "total_tokens": 19816472} {"current_steps": 30380, "total_steps": 38160, "loss": 0.3635, "lr": 0.00012139370961184626, "epoch": 15.922431865828091, "percentage": 79.61, "elapsed_time": "1:17:39", "remaining_time": "0:19:53", "throughput": 4253.34, "total_tokens": 19819928} {"current_steps": 30385, "total_steps": 38160, "loss": 0.4202, "lr": 0.00012124437891918994, "epoch": 15.925052410901468, "percentage": 79.63, "elapsed_time": "1:17:40", "remaining_time": "0:19:52", "throughput": 4253.43, "total_tokens": 19823704} {"current_steps": 30390, "total_steps": 38160, "loss": 0.4521, "lr": 0.0001210951274578887, "epoch": 15.927672955974844, "percentage": 79.64, "elapsed_time": "1:17:41", "remaining_time": "0:19:51", "throughput": 4253.41, "total_tokens": 19826456} {"current_steps": 30395, "total_steps": 38160, "loss": 0.4113, "lr": 0.00012094595525916379, "epoch": 15.930293501048219, "percentage": 79.65, "elapsed_time": "1:17:42", "remaining_time": "0:19:51", "throughput": 4253.46, "total_tokens": 19829848} {"current_steps": 30400, "total_steps": 38160, "loss": 0.4449, "lr": 0.0001207968623542206, "epoch": 15.932914046121594, "percentage": 79.66, "elapsed_time": "1:17:42", "remaining_time": "0:19:50", "throughput": 4253.48, "total_tokens": 19832856} {"current_steps": 30405, "total_steps": 38160, "loss": 0.38, "lr": 0.00012064784877424778, "epoch": 15.935534591194969, "percentage": 79.68, "elapsed_time": "1:17:43", "remaining_time": "0:19:49", "throughput": 4253.47, "total_tokens": 19835704} {"current_steps": 30410, "total_steps": 38160, "loss": 0.3946, "lr": 0.00012049891455041695, "epoch": 15.938155136268344, "percentage": 79.69, "elapsed_time": "1:17:44", "remaining_time": "0:19:48", "throughput": 4253.56, "total_tokens": 19839352} {"current_steps": 30415, "total_steps": 38160, "loss": 0.4124, "lr": 0.00012035005971388379, "epoch": 15.94077568134172, "percentage": 79.7, "elapsed_time": "1:17:44", "remaining_time": "0:19:47", "throughput": 4253.61, "total_tokens": 19842840} {"current_steps": 30420, "total_steps": 38160, "loss": 0.3755, "lr": 0.0001202012842957867, "epoch": 15.943396226415095, "percentage": 79.72, "elapsed_time": "1:17:45", "remaining_time": "0:19:47", "throughput": 4253.72, "total_tokens": 19846808} {"current_steps": 30425, "total_steps": 38160, "loss": 0.4183, "lr": 0.00012005258832724797, "epoch": 15.94601677148847, "percentage": 79.73, "elapsed_time": "1:17:46", "remaining_time": "0:19:46", "throughput": 4253.73, "total_tokens": 19849816} {"current_steps": 30430, "total_steps": 38160, "loss": 0.3338, "lr": 0.00011990397183937324, "epoch": 15.948637316561845, "percentage": 79.74, "elapsed_time": "1:17:47", "remaining_time": "0:19:45", "throughput": 4253.72, "total_tokens": 19852568} {"current_steps": 30435, "total_steps": 38160, "loss": 0.2887, "lr": 0.00011975543486325108, "epoch": 15.95125786163522, "percentage": 79.76, "elapsed_time": "1:17:48", "remaining_time": "0:19:44", "throughput": 4253.95, "total_tokens": 19857976} {"current_steps": 30440, "total_steps": 38160, "loss": 0.4413, "lr": 0.00011960697742995392, "epoch": 15.953878406708595, "percentage": 79.77, "elapsed_time": "1:17:48", "remaining_time": "0:19:44", "throughput": 4254.01, "total_tokens": 19861432} {"current_steps": 30445, "total_steps": 38160, "loss": 0.4873, "lr": 0.00011945859957053746, "epoch": 15.95649895178197, "percentage": 79.78, "elapsed_time": "1:17:49", "remaining_time": "0:19:43", "throughput": 4254.08, "total_tokens": 19865144} {"current_steps": 30450, "total_steps": 38160, "loss": 0.3584, "lr": 0.00011931030131604036, "epoch": 15.959119496855346, "percentage": 79.8, "elapsed_time": "1:17:50", "remaining_time": "0:19:42", "throughput": 4254.07, "total_tokens": 19867928} {"current_steps": 30455, "total_steps": 38160, "loss": 0.3943, "lr": 0.00011916208269748507, "epoch": 15.96174004192872, "percentage": 79.81, "elapsed_time": "1:17:50", "remaining_time": "0:19:41", "throughput": 4254.03, "total_tokens": 19870456} {"current_steps": 30460, "total_steps": 38160, "loss": 0.3862, "lr": 0.00011901394374587743, "epoch": 15.964360587002096, "percentage": 79.82, "elapsed_time": "1:17:51", "remaining_time": "0:19:40", "throughput": 4253.98, "total_tokens": 19872824} {"current_steps": 30465, "total_steps": 38160, "loss": 0.3379, "lr": 0.00011886588449220609, "epoch": 15.966981132075471, "percentage": 79.83, "elapsed_time": "1:17:52", "remaining_time": "0:19:40", "throughput": 4253.94, "total_tokens": 19875256} {"current_steps": 30470, "total_steps": 38160, "loss": 0.4733, "lr": 0.00011871790496744351, "epoch": 15.969601677148846, "percentage": 79.85, "elapsed_time": "1:17:52", "remaining_time": "0:19:39", "throughput": 4253.96, "total_tokens": 19878328} {"current_steps": 30475, "total_steps": 38160, "loss": 0.4774, "lr": 0.00011857000520254546, "epoch": 15.972222222222221, "percentage": 79.86, "elapsed_time": "1:17:53", "remaining_time": "0:19:38", "throughput": 4254.02, "total_tokens": 19881784} {"current_steps": 30480, "total_steps": 38160, "loss": 0.4487, "lr": 0.0001184221852284506, "epoch": 15.974842767295598, "percentage": 79.87, "elapsed_time": "1:17:54", "remaining_time": "0:19:37", "throughput": 4254.06, "total_tokens": 19885144} {"current_steps": 30485, "total_steps": 38160, "loss": 0.5031, "lr": 0.00011827444507608143, "epoch": 15.977463312368974, "percentage": 79.89, "elapsed_time": "1:17:55", "remaining_time": "0:19:37", "throughput": 4254.08, "total_tokens": 19888120} {"current_steps": 30490, "total_steps": 38160, "loss": 0.4972, "lr": 0.00011812678477634325, "epoch": 15.980083857442349, "percentage": 79.9, "elapsed_time": "1:17:55", "remaining_time": "0:19:36", "throughput": 4254.11, "total_tokens": 19891352} {"current_steps": 30495, "total_steps": 38160, "loss": 0.4906, "lr": 0.0001179792043601251, "epoch": 15.982704402515724, "percentage": 79.91, "elapsed_time": "1:17:56", "remaining_time": "0:19:35", "throughput": 4254.17, "total_tokens": 19894872} {"current_steps": 30500, "total_steps": 38160, "loss": 0.3853, "lr": 0.00011783170385829905, "epoch": 15.985324947589099, "percentage": 79.93, "elapsed_time": "1:17:57", "remaining_time": "0:19:34", "throughput": 4254.28, "total_tokens": 19898904} {"current_steps": 30505, "total_steps": 38160, "loss": 0.4504, "lr": 0.00011768428330172071, "epoch": 15.987945492662474, "percentage": 79.94, "elapsed_time": "1:17:58", "remaining_time": "0:19:33", "throughput": 4254.37, "total_tokens": 19902840} {"current_steps": 30510, "total_steps": 38160, "loss": 0.3715, "lr": 0.00011753694272122856, "epoch": 15.99056603773585, "percentage": 79.95, "elapsed_time": "1:17:58", "remaining_time": "0:19:33", "throughput": 4254.42, "total_tokens": 19906168} {"current_steps": 30515, "total_steps": 38160, "loss": 0.6486, "lr": 0.00011738968214764456, "epoch": 15.993186582809225, "percentage": 79.97, "elapsed_time": "1:17:59", "remaining_time": "0:19:32", "throughput": 4254.41, "total_tokens": 19908920} {"current_steps": 30520, "total_steps": 38160, "loss": 0.5054, "lr": 0.00011724250161177391, "epoch": 15.9958071278826, "percentage": 79.98, "elapsed_time": "1:18:00", "remaining_time": "0:19:31", "throughput": 4254.45, "total_tokens": 19912216} {"current_steps": 30525, "total_steps": 38160, "loss": 0.458, "lr": 0.00011709540114440525, "epoch": 15.998427672955975, "percentage": 79.99, "elapsed_time": "1:18:00", "remaining_time": "0:19:30", "throughput": 4254.44, "total_tokens": 19914904} {"current_steps": 30528, "total_steps": 38160, "eval_loss": 0.46345266699790955, "epoch": 16.0, "percentage": 80.0, "elapsed_time": "1:18:14", "remaining_time": "0:19:33", "throughput": 4242.03, "total_tokens": 19916008} {"current_steps": 30530, "total_steps": 38160, "loss": 0.4557, "lr": 0.00011694838077631043, "epoch": 16.00104821802935, "percentage": 80.01, "elapsed_time": "1:18:16", "remaining_time": "0:19:33", "throughput": 4240.47, "total_tokens": 19917032} {"current_steps": 30535, "total_steps": 38160, "loss": 0.5499, "lr": 0.0001168014405382441, "epoch": 16.003668763102727, "percentage": 80.02, "elapsed_time": "1:18:17", "remaining_time": "0:19:33", "throughput": 4240.48, "total_tokens": 19919976} {"current_steps": 30540, "total_steps": 38160, "loss": 0.4634, "lr": 0.0001166545804609448, "epoch": 16.0062893081761, "percentage": 80.03, "elapsed_time": "1:18:18", "remaining_time": "0:19:32", "throughput": 4240.42, "total_tokens": 19922312} {"current_steps": 30545, "total_steps": 38160, "loss": 0.5355, "lr": 0.00011650780057513367, "epoch": 16.008909853249477, "percentage": 80.04, "elapsed_time": "1:18:18", "remaining_time": "0:19:31", "throughput": 4240.33, "total_tokens": 19924392} {"current_steps": 30550, "total_steps": 38160, "loss": 0.4273, "lr": 0.00011636110091151553, "epoch": 16.01153039832285, "percentage": 80.06, "elapsed_time": "1:18:19", "remaining_time": "0:19:30", "throughput": 4240.35, "total_tokens": 19927528} {"current_steps": 30555, "total_steps": 38160, "loss": 0.4002, "lr": 0.00011621448150077834, "epoch": 16.014150943396228, "percentage": 80.07, "elapsed_time": "1:18:20", "remaining_time": "0:19:29", "throughput": 4240.4, "total_tokens": 19930920} {"current_steps": 30560, "total_steps": 38160, "loss": 0.3461, "lr": 0.0001160679423735933, "epoch": 16.0167714884696, "percentage": 80.08, "elapsed_time": "1:18:20", "remaining_time": "0:19:29", "throughput": 4240.43, "total_tokens": 19934152} {"current_steps": 30565, "total_steps": 38160, "loss": 0.3317, "lr": 0.00011592148356061455, "epoch": 16.019392033542978, "percentage": 80.1, "elapsed_time": "1:18:21", "remaining_time": "0:19:28", "throughput": 4240.55, "total_tokens": 19938216} {"current_steps": 30570, "total_steps": 38160, "loss": 0.5036, "lr": 0.00011577510509247951, "epoch": 16.02201257861635, "percentage": 80.11, "elapsed_time": "1:18:22", "remaining_time": "0:19:27", "throughput": 4240.64, "total_tokens": 19942088} {"current_steps": 30575, "total_steps": 38160, "loss": 0.7358, "lr": 0.00011562880699980904, "epoch": 16.02463312368973, "percentage": 80.12, "elapsed_time": "1:18:23", "remaining_time": "0:19:26", "throughput": 4240.62, "total_tokens": 19944744} {"current_steps": 30580, "total_steps": 38160, "loss": 0.4188, "lr": 0.00011548258931320704, "epoch": 16.0272536687631, "percentage": 80.14, "elapsed_time": "1:18:24", "remaining_time": "0:19:26", "throughput": 4240.67, "total_tokens": 19948360} {"current_steps": 30585, "total_steps": 38160, "loss": 0.4158, "lr": 0.00011533645206326049, "epoch": 16.02987421383648, "percentage": 80.15, "elapsed_time": "1:18:24", "remaining_time": "0:19:25", "throughput": 4240.65, "total_tokens": 19951016} {"current_steps": 30590, "total_steps": 38160, "loss": 0.4045, "lr": 0.00011519039528053999, "epoch": 16.032494758909852, "percentage": 80.16, "elapsed_time": "1:18:25", "remaining_time": "0:19:24", "throughput": 4240.7, "total_tokens": 19954376} {"current_steps": 30595, "total_steps": 38160, "loss": 0.4313, "lr": 0.00011504441899559837, "epoch": 16.03511530398323, "percentage": 80.18, "elapsed_time": "1:18:26", "remaining_time": "0:19:23", "throughput": 4240.75, "total_tokens": 19957864} {"current_steps": 30600, "total_steps": 38160, "loss": 0.3966, "lr": 0.00011489852323897249, "epoch": 16.037735849056602, "percentage": 80.19, "elapsed_time": "1:18:26", "remaining_time": "0:19:22", "throughput": 4240.8, "total_tokens": 19961256} {"current_steps": 30605, "total_steps": 38160, "loss": 0.3763, "lr": 0.0001147527080411821, "epoch": 16.04035639412998, "percentage": 80.2, "elapsed_time": "1:18:27", "remaining_time": "0:19:22", "throughput": 4240.86, "total_tokens": 19964744} {"current_steps": 30610, "total_steps": 38160, "loss": 0.4569, "lr": 0.00011460697343273002, "epoch": 16.042976939203353, "percentage": 80.21, "elapsed_time": "1:18:28", "remaining_time": "0:19:21", "throughput": 4240.93, "total_tokens": 19968232} {"current_steps": 30615, "total_steps": 38160, "loss": 0.3914, "lr": 0.00011446131944410249, "epoch": 16.04559748427673, "percentage": 80.23, "elapsed_time": "1:18:29", "remaining_time": "0:19:20", "throughput": 4240.94, "total_tokens": 19971176} {"current_steps": 30620, "total_steps": 38160, "loss": 0.4242, "lr": 0.00011431574610576844, "epoch": 16.048218029350103, "percentage": 80.24, "elapsed_time": "1:18:29", "remaining_time": "0:19:19", "throughput": 4241.02, "total_tokens": 19974888} {"current_steps": 30625, "total_steps": 38160, "loss": 0.3762, "lr": 0.00011417025344818005, "epoch": 16.05083857442348, "percentage": 80.25, "elapsed_time": "1:18:30", "remaining_time": "0:19:19", "throughput": 4241.02, "total_tokens": 19977864} {"current_steps": 30630, "total_steps": 38160, "loss": 0.4874, "lr": 0.00011402484150177289, "epoch": 16.053459119496857, "percentage": 80.27, "elapsed_time": "1:18:31", "remaining_time": "0:19:18", "throughput": 4241.11, "total_tokens": 19981640} {"current_steps": 30635, "total_steps": 38160, "loss": 0.5064, "lr": 0.00011387951029696542, "epoch": 16.05607966457023, "percentage": 80.28, "elapsed_time": "1:18:32", "remaining_time": "0:19:17", "throughput": 4241.22, "total_tokens": 19985640} {"current_steps": 30640, "total_steps": 38160, "loss": 0.3329, "lr": 0.00011373425986415941, "epoch": 16.058700209643607, "percentage": 80.29, "elapsed_time": "1:18:32", "remaining_time": "0:19:16", "throughput": 4241.25, "total_tokens": 19988776} {"current_steps": 30645, "total_steps": 38160, "loss": 0.4331, "lr": 0.00011358909023373953, "epoch": 16.06132075471698, "percentage": 80.31, "elapsed_time": "1:18:33", "remaining_time": "0:19:15", "throughput": 4241.28, "total_tokens": 19991976} {"current_steps": 30650, "total_steps": 38160, "loss": 0.3977, "lr": 0.00011344400143607342, "epoch": 16.063941299790358, "percentage": 80.32, "elapsed_time": "1:18:34", "remaining_time": "0:19:15", "throughput": 4241.3, "total_tokens": 19995048} {"current_steps": 30655, "total_steps": 38160, "loss": 0.4625, "lr": 0.00011329899350151212, "epoch": 16.06656184486373, "percentage": 80.33, "elapsed_time": "1:18:35", "remaining_time": "0:19:14", "throughput": 4241.31, "total_tokens": 19997992} {"current_steps": 30660, "total_steps": 38160, "loss": 0.3509, "lr": 0.00011315406646038973, "epoch": 16.069182389937108, "percentage": 80.35, "elapsed_time": "1:18:35", "remaining_time": "0:19:13", "throughput": 4241.26, "total_tokens": 20000520} {"current_steps": 30665, "total_steps": 38160, "loss": 0.5848, "lr": 0.0001130092203430232, "epoch": 16.07180293501048, "percentage": 80.36, "elapsed_time": "1:18:36", "remaining_time": "0:19:12", "throughput": 4241.23, "total_tokens": 20003176} {"current_steps": 30670, "total_steps": 38160, "loss": 0.5221, "lr": 0.00011286445517971289, "epoch": 16.07442348008386, "percentage": 80.37, "elapsed_time": "1:18:37", "remaining_time": "0:19:11", "throughput": 4241.3, "total_tokens": 20006664} {"current_steps": 30675, "total_steps": 38160, "loss": 0.4228, "lr": 0.00011271977100074188, "epoch": 16.07704402515723, "percentage": 80.39, "elapsed_time": "1:18:37", "remaining_time": "0:19:11", "throughput": 4241.28, "total_tokens": 20009320} {"current_steps": 30680, "total_steps": 38160, "loss": 0.3244, "lr": 0.00011257516783637633, "epoch": 16.07966457023061, "percentage": 80.4, "elapsed_time": "1:18:38", "remaining_time": "0:19:10", "throughput": 4241.23, "total_tokens": 20011656} {"current_steps": 30685, "total_steps": 38160, "loss": 0.4309, "lr": 0.00011243064571686573, "epoch": 16.082285115303982, "percentage": 80.41, "elapsed_time": "1:18:39", "remaining_time": "0:19:09", "throughput": 4241.29, "total_tokens": 20015304} {"current_steps": 30690, "total_steps": 38160, "loss": 0.3775, "lr": 0.00011228620467244238, "epoch": 16.08490566037736, "percentage": 80.42, "elapsed_time": "1:18:39", "remaining_time": "0:19:08", "throughput": 4241.32, "total_tokens": 20018504} {"current_steps": 30695, "total_steps": 38160, "loss": 0.3622, "lr": 0.00011214184473332183, "epoch": 16.087526205450732, "percentage": 80.44, "elapsed_time": "1:18:40", "remaining_time": "0:19:08", "throughput": 4241.3, "total_tokens": 20021096} {"current_steps": 30700, "total_steps": 38160, "loss": 0.4632, "lr": 0.0001119975659297025, "epoch": 16.09014675052411, "percentage": 80.45, "elapsed_time": "1:18:41", "remaining_time": "0:19:07", "throughput": 4241.29, "total_tokens": 20023912} {"current_steps": 30705, "total_steps": 38160, "loss": 0.4637, "lr": 0.00011185336829176568, "epoch": 16.092767295597483, "percentage": 80.46, "elapsed_time": "1:18:41", "remaining_time": "0:19:06", "throughput": 4241.29, "total_tokens": 20026792} {"current_steps": 30710, "total_steps": 38160, "loss": 0.4326, "lr": 0.00011170925184967601, "epoch": 16.09538784067086, "percentage": 80.48, "elapsed_time": "1:18:42", "remaining_time": "0:19:05", "throughput": 4241.2, "total_tokens": 20028840} {"current_steps": 30715, "total_steps": 38160, "loss": 0.4113, "lr": 0.00011156521663358094, "epoch": 16.098008385744233, "percentage": 80.49, "elapsed_time": "1:18:43", "remaining_time": "0:19:04", "throughput": 4241.24, "total_tokens": 20032072} {"current_steps": 30720, "total_steps": 38160, "loss": 0.375, "lr": 0.00011142126267361124, "epoch": 16.10062893081761, "percentage": 80.5, "elapsed_time": "1:18:43", "remaining_time": "0:19:04", "throughput": 4241.24, "total_tokens": 20034824} {"current_steps": 30725, "total_steps": 38160, "loss": 0.3139, "lr": 0.00011127738999988007, "epoch": 16.103249475890987, "percentage": 80.52, "elapsed_time": "1:18:44", "remaining_time": "0:19:03", "throughput": 4241.35, "total_tokens": 20038792} {"current_steps": 30730, "total_steps": 38160, "loss": 0.3267, "lr": 0.00011113359864248429, "epoch": 16.10587002096436, "percentage": 80.53, "elapsed_time": "1:18:45", "remaining_time": "0:19:02", "throughput": 4241.38, "total_tokens": 20042024} {"current_steps": 30735, "total_steps": 38160, "loss": 0.5344, "lr": 0.00011098988863150317, "epoch": 16.108490566037737, "percentage": 80.54, "elapsed_time": "1:18:46", "remaining_time": "0:19:01", "throughput": 4241.44, "total_tokens": 20045576} {"current_steps": 30740, "total_steps": 38160, "loss": 0.3486, "lr": 0.0001108462599969992, "epoch": 16.11111111111111, "percentage": 80.56, "elapsed_time": "1:18:46", "remaining_time": "0:19:00", "throughput": 4241.48, "total_tokens": 20048872} {"current_steps": 30745, "total_steps": 38160, "loss": 0.477, "lr": 0.000110702712769018, "epoch": 16.113731656184488, "percentage": 80.57, "elapsed_time": "1:18:47", "remaining_time": "0:19:00", "throughput": 4241.6, "total_tokens": 20053096} {"current_steps": 30750, "total_steps": 38160, "loss": 0.4297, "lr": 0.00011055924697758801, "epoch": 16.11635220125786, "percentage": 80.58, "elapsed_time": "1:18:48", "remaining_time": "0:18:59", "throughput": 4241.62, "total_tokens": 20056296} {"current_steps": 30755, "total_steps": 38160, "loss": 0.4966, "lr": 0.00011041586265272052, "epoch": 16.118972746331238, "percentage": 80.59, "elapsed_time": "1:18:49", "remaining_time": "0:18:58", "throughput": 4241.65, "total_tokens": 20059368} {"current_steps": 30760, "total_steps": 38160, "loss": 0.3069, "lr": 0.00011027255982441003, "epoch": 16.12159329140461, "percentage": 80.61, "elapsed_time": "1:18:49", "remaining_time": "0:18:57", "throughput": 4241.66, "total_tokens": 20062472} {"current_steps": 30765, "total_steps": 38160, "loss": 0.3563, "lr": 0.00011012933852263369, "epoch": 16.12421383647799, "percentage": 80.62, "elapsed_time": "1:18:50", "remaining_time": "0:18:57", "throughput": 4241.72, "total_tokens": 20066024} {"current_steps": 30770, "total_steps": 38160, "loss": 0.369, "lr": 0.00010998619877735184, "epoch": 16.12683438155136, "percentage": 80.63, "elapsed_time": "1:18:51", "remaining_time": "0:18:56", "throughput": 4241.73, "total_tokens": 20068968} {"current_steps": 30775, "total_steps": 38160, "loss": 0.4256, "lr": 0.0001098431406185078, "epoch": 16.12945492662474, "percentage": 80.65, "elapsed_time": "1:18:51", "remaining_time": "0:18:55", "throughput": 4241.72, "total_tokens": 20071720} {"current_steps": 30780, "total_steps": 38160, "loss": 0.641, "lr": 0.00010970016407602751, "epoch": 16.132075471698112, "percentage": 80.66, "elapsed_time": "1:18:52", "remaining_time": "0:18:54", "throughput": 4241.75, "total_tokens": 20074984} {"current_steps": 30785, "total_steps": 38160, "loss": 0.5468, "lr": 0.00010955726917982023, "epoch": 16.13469601677149, "percentage": 80.67, "elapsed_time": "1:18:53", "remaining_time": "0:18:53", "throughput": 4241.84, "total_tokens": 20078760} {"current_steps": 30790, "total_steps": 38160, "loss": 0.3812, "lr": 0.00010941445595977767, "epoch": 16.137316561844862, "percentage": 80.69, "elapsed_time": "1:18:54", "remaining_time": "0:18:53", "throughput": 4241.82, "total_tokens": 20081480} {"current_steps": 30795, "total_steps": 38160, "loss": 0.4524, "lr": 0.00010927172444577494, "epoch": 16.13993710691824, "percentage": 80.7, "elapsed_time": "1:18:54", "remaining_time": "0:18:52", "throughput": 4241.79, "total_tokens": 20084072} {"current_steps": 30800, "total_steps": 38160, "loss": 0.5374, "lr": 0.00010912907466766985, "epoch": 16.142557651991613, "percentage": 80.71, "elapsed_time": "1:18:55", "remaining_time": "0:18:51", "throughput": 4241.93, "total_tokens": 20088488} {"current_steps": 30805, "total_steps": 38160, "loss": 0.4173, "lr": 0.00010898650665530302, "epoch": 16.14517819706499, "percentage": 80.73, "elapsed_time": "1:18:56", "remaining_time": "0:18:50", "throughput": 4241.99, "total_tokens": 20092008} {"current_steps": 30810, "total_steps": 38160, "loss": 0.4724, "lr": 0.000108844020438498, "epoch": 16.147798742138363, "percentage": 80.74, "elapsed_time": "1:18:57", "remaining_time": "0:18:50", "throughput": 4241.97, "total_tokens": 20094664} {"current_steps": 30815, "total_steps": 38160, "loss": 0.3784, "lr": 0.00010870161604706152, "epoch": 16.15041928721174, "percentage": 80.75, "elapsed_time": "1:18:58", "remaining_time": "0:18:49", "throughput": 4242.32, "total_tokens": 20101640} {"current_steps": 30820, "total_steps": 38160, "loss": 0.4792, "lr": 0.00010855929351078264, "epoch": 16.153039832285117, "percentage": 80.77, "elapsed_time": "1:18:59", "remaining_time": "0:18:48", "throughput": 4242.35, "total_tokens": 20104840} {"current_steps": 30825, "total_steps": 38160, "loss": 0.4991, "lr": 0.00010841705285943382, "epoch": 16.15566037735849, "percentage": 80.78, "elapsed_time": "1:18:59", "remaining_time": "0:18:47", "throughput": 4242.42, "total_tokens": 20108456} {"current_steps": 30830, "total_steps": 38160, "loss": 0.5275, "lr": 0.0001082748941227702, "epoch": 16.158280922431867, "percentage": 80.79, "elapsed_time": "1:19:00", "remaining_time": "0:18:47", "throughput": 4242.37, "total_tokens": 20110792} {"current_steps": 30835, "total_steps": 38160, "loss": 0.3189, "lr": 0.00010813281733052959, "epoch": 16.16090146750524, "percentage": 80.8, "elapsed_time": "1:19:01", "remaining_time": "0:18:46", "throughput": 4242.33, "total_tokens": 20113256} {"current_steps": 30840, "total_steps": 38160, "loss": 0.3421, "lr": 0.00010799082251243292, "epoch": 16.163522012578618, "percentage": 80.82, "elapsed_time": "1:19:01", "remaining_time": "0:18:45", "throughput": 4242.35, "total_tokens": 20116424} {"current_steps": 30845, "total_steps": 38160, "loss": 0.4724, "lr": 0.00010784890969818407, "epoch": 16.16614255765199, "percentage": 80.83, "elapsed_time": "1:19:02", "remaining_time": "0:18:44", "throughput": 4242.43, "total_tokens": 20120200} {"current_steps": 30850, "total_steps": 38160, "loss": 0.4551, "lr": 0.00010770707891746928, "epoch": 16.168763102725368, "percentage": 80.84, "elapsed_time": "1:19:03", "remaining_time": "0:18:43", "throughput": 4242.39, "total_tokens": 20122664} {"current_steps": 30855, "total_steps": 38160, "loss": 0.4967, "lr": 0.00010756533019995817, "epoch": 16.17138364779874, "percentage": 80.86, "elapsed_time": "1:19:03", "remaining_time": "0:18:43", "throughput": 4242.36, "total_tokens": 20125224} {"current_steps": 30860, "total_steps": 38160, "loss": 0.4081, "lr": 0.0001074236635753027, "epoch": 16.17400419287212, "percentage": 80.87, "elapsed_time": "1:19:04", "remaining_time": "0:18:42", "throughput": 4242.43, "total_tokens": 20128968} {"current_steps": 30865, "total_steps": 38160, "loss": 0.3962, "lr": 0.00010728207907313809, "epoch": 16.17662473794549, "percentage": 80.88, "elapsed_time": "1:19:05", "remaining_time": "0:18:41", "throughput": 4242.42, "total_tokens": 20131656} {"current_steps": 30870, "total_steps": 38160, "loss": 0.4583, "lr": 0.0001071405767230822, "epoch": 16.17924528301887, "percentage": 80.9, "elapsed_time": "1:19:06", "remaining_time": "0:18:40", "throughput": 4242.43, "total_tokens": 20134696} {"current_steps": 30875, "total_steps": 38160, "loss": 0.5193, "lr": 0.0001069991565547358, "epoch": 16.181865828092242, "percentage": 80.91, "elapsed_time": "1:19:06", "remaining_time": "0:18:39", "throughput": 4242.39, "total_tokens": 20137192} {"current_steps": 30880, "total_steps": 38160, "loss": 0.3216, "lr": 0.00010685781859768223, "epoch": 16.18448637316562, "percentage": 80.92, "elapsed_time": "1:19:07", "remaining_time": "0:18:39", "throughput": 4242.46, "total_tokens": 20140712} {"current_steps": 30885, "total_steps": 38160, "loss": 0.5536, "lr": 0.00010671656288148768, "epoch": 16.187106918238992, "percentage": 80.94, "elapsed_time": "1:19:08", "remaining_time": "0:18:38", "throughput": 4242.45, "total_tokens": 20143496} {"current_steps": 30890, "total_steps": 38160, "loss": 0.3488, "lr": 0.00010657538943570138, "epoch": 16.18972746331237, "percentage": 80.95, "elapsed_time": "1:19:08", "remaining_time": "0:18:37", "throughput": 4242.64, "total_tokens": 20148296} {"current_steps": 30895, "total_steps": 38160, "loss": 0.4, "lr": 0.00010643429828985518, "epoch": 16.192348008385743, "percentage": 80.96, "elapsed_time": "1:19:09", "remaining_time": "0:18:36", "throughput": 4242.74, "total_tokens": 20152168} {"current_steps": 30900, "total_steps": 38160, "loss": 0.4881, "lr": 0.0001062932894734639, "epoch": 16.19496855345912, "percentage": 80.97, "elapsed_time": "1:19:10", "remaining_time": "0:18:36", "throughput": 4242.8, "total_tokens": 20155784} {"current_steps": 30905, "total_steps": 38160, "loss": 0.5365, "lr": 0.00010615236301602476, "epoch": 16.197589098532493, "percentage": 80.99, "elapsed_time": "1:19:11", "remaining_time": "0:18:35", "throughput": 4242.84, "total_tokens": 20159112} {"current_steps": 30910, "total_steps": 38160, "loss": 0.3815, "lr": 0.00010601151894701794, "epoch": 16.20020964360587, "percentage": 81.0, "elapsed_time": "1:19:12", "remaining_time": "0:18:34", "throughput": 4242.84, "total_tokens": 20162152} {"current_steps": 30915, "total_steps": 38160, "loss": 0.4943, "lr": 0.0001058707572959065, "epoch": 16.202830188679247, "percentage": 81.01, "elapsed_time": "1:19:12", "remaining_time": "0:18:33", "throughput": 4242.84, "total_tokens": 20165032} {"current_steps": 30920, "total_steps": 38160, "loss": 0.409, "lr": 0.00010573007809213614, "epoch": 16.20545073375262, "percentage": 81.03, "elapsed_time": "1:19:13", "remaining_time": "0:18:33", "throughput": 4242.86, "total_tokens": 20168136} {"current_steps": 30925, "total_steps": 38160, "loss": 0.3598, "lr": 0.00010558948136513536, "epoch": 16.208071278825997, "percentage": 81.04, "elapsed_time": "1:19:14", "remaining_time": "0:18:32", "throughput": 4242.9, "total_tokens": 20171368} {"current_steps": 30930, "total_steps": 38160, "loss": 0.2471, "lr": 0.00010544896714431557, "epoch": 16.21069182389937, "percentage": 81.05, "elapsed_time": "1:19:14", "remaining_time": "0:18:31", "throughput": 4242.94, "total_tokens": 20174664} {"current_steps": 30935, "total_steps": 38160, "loss": 0.6162, "lr": 0.0001053085354590706, "epoch": 16.213312368972748, "percentage": 81.07, "elapsed_time": "1:19:15", "remaining_time": "0:18:30", "throughput": 4242.91, "total_tokens": 20177224} {"current_steps": 30940, "total_steps": 38160, "loss": 0.3922, "lr": 0.00010516818633877695, "epoch": 16.21593291404612, "percentage": 81.08, "elapsed_time": "1:19:16", "remaining_time": "0:18:29", "throughput": 4242.92, "total_tokens": 20180200} {"current_steps": 30945, "total_steps": 38160, "loss": 0.3642, "lr": 0.00010502791981279425, "epoch": 16.218553459119498, "percentage": 81.09, "elapsed_time": "1:19:16", "remaining_time": "0:18:29", "throughput": 4242.97, "total_tokens": 20183592} {"current_steps": 30950, "total_steps": 38160, "loss": 0.4273, "lr": 0.00010488773591046469, "epoch": 16.22117400419287, "percentage": 81.11, "elapsed_time": "1:19:17", "remaining_time": "0:18:28", "throughput": 4243.0, "total_tokens": 20186760} {"current_steps": 30955, "total_steps": 38160, "loss": 0.4017, "lr": 0.0001047476346611132, "epoch": 16.22379454926625, "percentage": 81.12, "elapsed_time": "1:19:18", "remaining_time": "0:18:27", "throughput": 4243.01, "total_tokens": 20189864} {"current_steps": 30960, "total_steps": 38160, "loss": 0.4602, "lr": 0.00010460761609404724, "epoch": 16.22641509433962, "percentage": 81.13, "elapsed_time": "1:19:19", "remaining_time": "0:18:26", "throughput": 4243.04, "total_tokens": 20193096} {"current_steps": 30965, "total_steps": 38160, "loss": 0.396, "lr": 0.00010446768023855701, "epoch": 16.229035639413, "percentage": 81.15, "elapsed_time": "1:19:19", "remaining_time": "0:18:25", "throughput": 4243.05, "total_tokens": 20196136} {"current_steps": 30970, "total_steps": 38160, "loss": 0.4545, "lr": 0.00010432782712391559, "epoch": 16.231656184486372, "percentage": 81.16, "elapsed_time": "1:19:20", "remaining_time": "0:18:25", "throughput": 4243.14, "total_tokens": 20199880} {"current_steps": 30975, "total_steps": 38160, "loss": 0.4351, "lr": 0.00010418805677937871, "epoch": 16.23427672955975, "percentage": 81.17, "elapsed_time": "1:19:21", "remaining_time": "0:18:24", "throughput": 4243.24, "total_tokens": 20203752} {"current_steps": 30980, "total_steps": 38160, "loss": 0.3442, "lr": 0.00010404836923418465, "epoch": 16.236897274633122, "percentage": 81.18, "elapsed_time": "1:19:22", "remaining_time": "0:18:23", "throughput": 4243.26, "total_tokens": 20206760} {"current_steps": 30985, "total_steps": 38160, "loss": 0.4399, "lr": 0.00010390876451755477, "epoch": 16.2395178197065, "percentage": 81.2, "elapsed_time": "1:19:22", "remaining_time": "0:18:22", "throughput": 4243.21, "total_tokens": 20209096} {"current_steps": 30990, "total_steps": 38160, "loss": 0.3111, "lr": 0.0001037692426586922, "epoch": 16.242138364779873, "percentage": 81.21, "elapsed_time": "1:19:23", "remaining_time": "0:18:22", "throughput": 4243.26, "total_tokens": 20212520} {"current_steps": 30995, "total_steps": 38160, "loss": 0.3587, "lr": 0.0001036298036867837, "epoch": 16.24475890985325, "percentage": 81.22, "elapsed_time": "1:19:24", "remaining_time": "0:18:21", "throughput": 4243.28, "total_tokens": 20215720} {"current_steps": 31000, "total_steps": 38160, "loss": 0.317, "lr": 0.00010349044763099819, "epoch": 16.247379454926623, "percentage": 81.24, "elapsed_time": "1:19:24", "remaining_time": "0:18:20", "throughput": 4243.32, "total_tokens": 20219048} {"current_steps": 31005, "total_steps": 38160, "loss": 0.5751, "lr": 0.00010335117452048742, "epoch": 16.25, "percentage": 81.25, "elapsed_time": "1:19:25", "remaining_time": "0:18:19", "throughput": 4243.36, "total_tokens": 20222440} {"current_steps": 31010, "total_steps": 38160, "loss": 0.4434, "lr": 0.00010321198438438589, "epoch": 16.252620545073377, "percentage": 81.26, "elapsed_time": "1:19:26", "remaining_time": "0:18:18", "throughput": 4243.34, "total_tokens": 20225224} {"current_steps": 31015, "total_steps": 38160, "loss": 0.4626, "lr": 0.00010307287725181036, "epoch": 16.25524109014675, "percentage": 81.28, "elapsed_time": "1:19:27", "remaining_time": "0:18:18", "throughput": 4243.4, "total_tokens": 20228680} {"current_steps": 31020, "total_steps": 38160, "loss": 0.5654, "lr": 0.00010293385315186049, "epoch": 16.257861635220127, "percentage": 81.29, "elapsed_time": "1:19:27", "remaining_time": "0:18:17", "throughput": 4243.35, "total_tokens": 20231176} {"current_steps": 31025, "total_steps": 38160, "loss": 0.4239, "lr": 0.00010279491211361853, "epoch": 16.2604821802935, "percentage": 81.3, "elapsed_time": "1:19:28", "remaining_time": "0:18:16", "throughput": 4243.32, "total_tokens": 20233672} {"current_steps": 31030, "total_steps": 38160, "loss": 0.3132, "lr": 0.00010265605416614938, "epoch": 16.263102725366878, "percentage": 81.32, "elapsed_time": "1:19:29", "remaining_time": "0:18:15", "throughput": 4243.29, "total_tokens": 20236424} {"current_steps": 31035, "total_steps": 38160, "loss": 0.4503, "lr": 0.00010251727933850069, "epoch": 16.26572327044025, "percentage": 81.33, "elapsed_time": "1:19:29", "remaining_time": "0:18:15", "throughput": 4243.29, "total_tokens": 20239336} {"current_steps": 31040, "total_steps": 38160, "loss": 0.4309, "lr": 0.00010237858765970231, "epoch": 16.268343815513628, "percentage": 81.34, "elapsed_time": "1:19:30", "remaining_time": "0:18:14", "throughput": 4243.27, "total_tokens": 20242056} {"current_steps": 31045, "total_steps": 38160, "loss": 0.3691, "lr": 0.00010223997915876726, "epoch": 16.270964360587, "percentage": 81.35, "elapsed_time": "1:19:31", "remaining_time": "0:18:13", "throughput": 4243.31, "total_tokens": 20245384} {"current_steps": 31050, "total_steps": 38160, "loss": 0.4096, "lr": 0.00010210145386469049, "epoch": 16.27358490566038, "percentage": 81.37, "elapsed_time": "1:19:31", "remaining_time": "0:18:12", "throughput": 4243.38, "total_tokens": 20248936} {"current_steps": 31055, "total_steps": 38160, "loss": 0.3856, "lr": 0.00010196301180645012, "epoch": 16.27620545073375, "percentage": 81.38, "elapsed_time": "1:19:32", "remaining_time": "0:18:11", "throughput": 4243.54, "total_tokens": 20253416} {"current_steps": 31060, "total_steps": 38160, "loss": 0.4377, "lr": 0.0001018246530130067, "epoch": 16.27882599580713, "percentage": 81.39, "elapsed_time": "1:19:33", "remaining_time": "0:18:11", "throughput": 4243.61, "total_tokens": 20256968} {"current_steps": 31065, "total_steps": 38160, "loss": 0.5599, "lr": 0.00010168637751330328, "epoch": 16.281446540880502, "percentage": 81.41, "elapsed_time": "1:19:34", "remaining_time": "0:18:10", "throughput": 4243.6, "total_tokens": 20259752} {"current_steps": 31070, "total_steps": 38160, "loss": 0.4506, "lr": 0.00010154818533626552, "epoch": 16.28406708595388, "percentage": 81.42, "elapsed_time": "1:19:34", "remaining_time": "0:18:09", "throughput": 4243.6, "total_tokens": 20262600} {"current_steps": 31075, "total_steps": 38160, "loss": 0.3701, "lr": 0.00010141007651080153, "epoch": 16.286687631027252, "percentage": 81.43, "elapsed_time": "1:19:35", "remaining_time": "0:18:08", "throughput": 4243.64, "total_tokens": 20265896} {"current_steps": 31080, "total_steps": 38160, "loss": 0.4934, "lr": 0.00010127205106580212, "epoch": 16.28930817610063, "percentage": 81.45, "elapsed_time": "1:19:36", "remaining_time": "0:18:08", "throughput": 4243.67, "total_tokens": 20269224} {"current_steps": 31085, "total_steps": 38160, "loss": 0.3253, "lr": 0.0001011341090301407, "epoch": 16.291928721174003, "percentage": 81.46, "elapsed_time": "1:19:37", "remaining_time": "0:18:07", "throughput": 4243.66, "total_tokens": 20272072} {"current_steps": 31090, "total_steps": 38160, "loss": 0.4369, "lr": 0.00010099625043267336, "epoch": 16.29454926624738, "percentage": 81.47, "elapsed_time": "1:19:37", "remaining_time": "0:18:06", "throughput": 4243.71, "total_tokens": 20275400} {"current_steps": 31095, "total_steps": 38160, "loss": 0.4208, "lr": 0.00010085847530223812, "epoch": 16.297169811320753, "percentage": 81.49, "elapsed_time": "1:19:38", "remaining_time": "0:18:05", "throughput": 4243.83, "total_tokens": 20279560} {"current_steps": 31100, "total_steps": 38160, "loss": 0.4424, "lr": 0.00010072078366765641, "epoch": 16.29979035639413, "percentage": 81.5, "elapsed_time": "1:19:39", "remaining_time": "0:18:04", "throughput": 4243.86, "total_tokens": 20282728} {"current_steps": 31105, "total_steps": 38160, "loss": 0.5126, "lr": 0.00010058317555773139, "epoch": 16.302410901467507, "percentage": 81.51, "elapsed_time": "1:19:39", "remaining_time": "0:18:04", "throughput": 4243.82, "total_tokens": 20285224} {"current_steps": 31110, "total_steps": 38160, "loss": 0.3601, "lr": 0.00010044565100124925, "epoch": 16.30503144654088, "percentage": 81.53, "elapsed_time": "1:19:40", "remaining_time": "0:18:03", "throughput": 4243.86, "total_tokens": 20288552} {"current_steps": 31115, "total_steps": 38160, "loss": 0.4361, "lr": 0.00010030821002697871, "epoch": 16.307651991614257, "percentage": 81.54, "elapsed_time": "1:19:41", "remaining_time": "0:18:02", "throughput": 4244.0, "total_tokens": 20292776} {"current_steps": 31120, "total_steps": 38160, "loss": 0.5731, "lr": 0.00010017085266367054, "epoch": 16.31027253668763, "percentage": 81.55, "elapsed_time": "1:19:42", "remaining_time": "0:18:01", "throughput": 4243.95, "total_tokens": 20295208} {"current_steps": 31125, "total_steps": 38160, "loss": 0.4165, "lr": 0.00010003357894005854, "epoch": 16.312893081761008, "percentage": 81.56, "elapsed_time": "1:19:42", "remaining_time": "0:18:01", "throughput": 4243.94, "total_tokens": 20297960} {"current_steps": 31130, "total_steps": 38160, "loss": 0.5239, "lr": 9.989638888485885e-05, "epoch": 16.31551362683438, "percentage": 81.58, "elapsed_time": "1:19:43", "remaining_time": "0:18:00", "throughput": 4243.95, "total_tokens": 20300968} {"current_steps": 31135, "total_steps": 38160, "loss": 0.4736, "lr": 9.975928252676991e-05, "epoch": 16.318134171907758, "percentage": 81.59, "elapsed_time": "1:19:44", "remaining_time": "0:17:59", "throughput": 4244.03, "total_tokens": 20304648} {"current_steps": 31140, "total_steps": 38160, "loss": 0.4894, "lr": 9.962225989447288e-05, "epoch": 16.32075471698113, "percentage": 81.6, "elapsed_time": "1:19:45", "remaining_time": "0:17:58", "throughput": 4244.12, "total_tokens": 20308488} {"current_steps": 31145, "total_steps": 38160, "loss": 0.4695, "lr": 9.948532101663144e-05, "epoch": 16.32337526205451, "percentage": 81.62, "elapsed_time": "1:19:45", "remaining_time": "0:17:57", "throughput": 4244.13, "total_tokens": 20311560} {"current_steps": 31150, "total_steps": 38160, "loss": 0.4023, "lr": 9.934846592189134e-05, "epoch": 16.32599580712788, "percentage": 81.63, "elapsed_time": "1:19:46", "remaining_time": "0:17:57", "throughput": 4244.23, "total_tokens": 20315592} {"current_steps": 31155, "total_steps": 38160, "loss": 0.4931, "lr": 9.921169463888153e-05, "epoch": 16.32861635220126, "percentage": 81.64, "elapsed_time": "1:19:47", "remaining_time": "0:17:56", "throughput": 4244.32, "total_tokens": 20319304} {"current_steps": 31160, "total_steps": 38160, "loss": 0.3734, "lr": 9.907500719621253e-05, "epoch": 16.331236897274632, "percentage": 81.66, "elapsed_time": "1:19:48", "remaining_time": "0:17:55", "throughput": 4244.51, "total_tokens": 20324264} {"current_steps": 31165, "total_steps": 38160, "loss": 0.3387, "lr": 9.893840362247809e-05, "epoch": 16.33385744234801, "percentage": 81.67, "elapsed_time": "1:19:48", "remaining_time": "0:17:54", "throughput": 4244.47, "total_tokens": 20326696} {"current_steps": 31170, "total_steps": 38160, "loss": 0.5011, "lr": 9.880188394625417e-05, "epoch": 16.336477987421382, "percentage": 81.68, "elapsed_time": "1:19:49", "remaining_time": "0:17:54", "throughput": 4244.53, "total_tokens": 20330248} {"current_steps": 31175, "total_steps": 38160, "loss": 0.3321, "lr": 9.86654481960989e-05, "epoch": 16.33909853249476, "percentage": 81.7, "elapsed_time": "1:19:50", "remaining_time": "0:17:53", "throughput": 4244.47, "total_tokens": 20332552} {"current_steps": 31180, "total_steps": 38160, "loss": 0.479, "lr": 9.852909640055325e-05, "epoch": 16.341719077568133, "percentage": 81.71, "elapsed_time": "1:19:51", "remaining_time": "0:17:52", "throughput": 4244.46, "total_tokens": 20335304} {"current_steps": 31185, "total_steps": 38160, "loss": 0.5273, "lr": 9.839282858814047e-05, "epoch": 16.34433962264151, "percentage": 81.72, "elapsed_time": "1:19:51", "remaining_time": "0:17:51", "throughput": 4244.44, "total_tokens": 20337992} {"current_steps": 31190, "total_steps": 38160, "loss": 0.4119, "lr": 9.825664478736607e-05, "epoch": 16.346960167714883, "percentage": 81.73, "elapsed_time": "1:19:52", "remaining_time": "0:17:50", "throughput": 4244.42, "total_tokens": 20340680} {"current_steps": 31195, "total_steps": 38160, "loss": 0.3976, "lr": 9.812054502671835e-05, "epoch": 16.34958071278826, "percentage": 81.75, "elapsed_time": "1:19:53", "remaining_time": "0:17:50", "throughput": 4244.45, "total_tokens": 20343848} {"current_steps": 31200, "total_steps": 38160, "loss": 0.3512, "lr": 9.798452933466761e-05, "epoch": 16.352201257861637, "percentage": 81.76, "elapsed_time": "1:19:53", "remaining_time": "0:17:49", "throughput": 4244.47, "total_tokens": 20346792} {"current_steps": 31205, "total_steps": 38160, "loss": 0.4072, "lr": 9.784859773966693e-05, "epoch": 16.35482180293501, "percentage": 81.77, "elapsed_time": "1:19:54", "remaining_time": "0:17:48", "throughput": 4244.46, "total_tokens": 20349544} {"current_steps": 31210, "total_steps": 38160, "loss": 0.4851, "lr": 9.771275027015159e-05, "epoch": 16.357442348008387, "percentage": 81.79, "elapsed_time": "1:19:55", "remaining_time": "0:17:47", "throughput": 4244.5, "total_tokens": 20352904} {"current_steps": 31215, "total_steps": 38160, "loss": 0.3348, "lr": 9.757698695453954e-05, "epoch": 16.36006289308176, "percentage": 81.8, "elapsed_time": "1:19:55", "remaining_time": "0:17:47", "throughput": 4244.57, "total_tokens": 20356424} {"current_steps": 31220, "total_steps": 38160, "loss": 0.4245, "lr": 9.74413078212305e-05, "epoch": 16.362683438155138, "percentage": 81.81, "elapsed_time": "1:19:56", "remaining_time": "0:17:46", "throughput": 4244.68, "total_tokens": 20360264} {"current_steps": 31225, "total_steps": 38160, "loss": 0.4175, "lr": 9.730571289860746e-05, "epoch": 16.36530398322851, "percentage": 81.83, "elapsed_time": "1:19:57", "remaining_time": "0:17:45", "throughput": 4244.75, "total_tokens": 20363848} {"current_steps": 31230, "total_steps": 38160, "loss": 0.408, "lr": 9.717020221503493e-05, "epoch": 16.367924528301888, "percentage": 81.84, "elapsed_time": "1:19:58", "remaining_time": "0:17:44", "throughput": 4244.71, "total_tokens": 20366280} {"current_steps": 31235, "total_steps": 38160, "loss": 0.2796, "lr": 9.703477579886038e-05, "epoch": 16.37054507337526, "percentage": 81.85, "elapsed_time": "1:19:58", "remaining_time": "0:17:43", "throughput": 4244.84, "total_tokens": 20370568} {"current_steps": 31240, "total_steps": 38160, "loss": 0.4014, "lr": 9.689943367841347e-05, "epoch": 16.37316561844864, "percentage": 81.87, "elapsed_time": "1:19:59", "remaining_time": "0:17:43", "throughput": 4244.89, "total_tokens": 20373928} {"current_steps": 31245, "total_steps": 38160, "loss": 0.4361, "lr": 9.676417588200632e-05, "epoch": 16.37578616352201, "percentage": 81.88, "elapsed_time": "1:20:00", "remaining_time": "0:17:42", "throughput": 4244.86, "total_tokens": 20376488} {"current_steps": 31250, "total_steps": 38160, "loss": 0.3711, "lr": 9.662900243793321e-05, "epoch": 16.37840670859539, "percentage": 81.89, "elapsed_time": "1:20:00", "remaining_time": "0:17:41", "throughput": 4244.84, "total_tokens": 20379176} {"current_steps": 31255, "total_steps": 38160, "loss": 0.4894, "lr": 9.649391337447084e-05, "epoch": 16.381027253668762, "percentage": 81.91, "elapsed_time": "1:20:01", "remaining_time": "0:17:40", "throughput": 4244.8, "total_tokens": 20381736} {"current_steps": 31260, "total_steps": 38160, "loss": 0.3595, "lr": 9.635890871987829e-05, "epoch": 16.38364779874214, "percentage": 81.92, "elapsed_time": "1:20:02", "remaining_time": "0:17:40", "throughput": 4244.84, "total_tokens": 20385064} {"current_steps": 31265, "total_steps": 38160, "loss": 0.45, "lr": 9.622398850239705e-05, "epoch": 16.386268343815512, "percentage": 81.93, "elapsed_time": "1:20:03", "remaining_time": "0:17:39", "throughput": 4244.86, "total_tokens": 20388072} {"current_steps": 31270, "total_steps": 38160, "loss": 0.5099, "lr": 9.608915275025104e-05, "epoch": 16.38888888888889, "percentage": 81.94, "elapsed_time": "1:20:03", "remaining_time": "0:17:38", "throughput": 4244.88, "total_tokens": 20391080} {"current_steps": 31275, "total_steps": 38160, "loss": 0.4457, "lr": 9.595440149164619e-05, "epoch": 16.391509433962263, "percentage": 81.96, "elapsed_time": "1:20:04", "remaining_time": "0:17:37", "throughput": 4244.89, "total_tokens": 20394024} {"current_steps": 31280, "total_steps": 38160, "loss": 0.3565, "lr": 9.581973475477085e-05, "epoch": 16.39412997903564, "percentage": 81.97, "elapsed_time": "1:20:05", "remaining_time": "0:17:36", "throughput": 4244.96, "total_tokens": 20397672} {"current_steps": 31285, "total_steps": 38160, "loss": 0.5242, "lr": 9.568515256779587e-05, "epoch": 16.396750524109013, "percentage": 81.98, "elapsed_time": "1:20:05", "remaining_time": "0:17:36", "throughput": 4245.03, "total_tokens": 20401352} {"current_steps": 31290, "total_steps": 38160, "loss": 0.4035, "lr": 9.555065495887433e-05, "epoch": 16.39937106918239, "percentage": 82.0, "elapsed_time": "1:20:06", "remaining_time": "0:17:35", "throughput": 4245.01, "total_tokens": 20404008} {"current_steps": 31295, "total_steps": 38160, "loss": 0.5858, "lr": 9.541624195614152e-05, "epoch": 16.401991614255767, "percentage": 82.01, "elapsed_time": "1:20:07", "remaining_time": "0:17:34", "throughput": 4245.06, "total_tokens": 20407496} {"current_steps": 31300, "total_steps": 38160, "loss": 0.4291, "lr": 9.528191358771532e-05, "epoch": 16.40461215932914, "percentage": 82.02, "elapsed_time": "1:20:08", "remaining_time": "0:17:33", "throughput": 4245.09, "total_tokens": 20410696} {"current_steps": 31305, "total_steps": 38160, "loss": 0.4721, "lr": 9.514766988169549e-05, "epoch": 16.407232704402517, "percentage": 82.04, "elapsed_time": "1:20:08", "remaining_time": "0:17:33", "throughput": 4245.09, "total_tokens": 20413736} {"current_steps": 31310, "total_steps": 38160, "loss": 0.3869, "lr": 9.501351086616422e-05, "epoch": 16.40985324947589, "percentage": 82.05, "elapsed_time": "1:20:09", "remaining_time": "0:17:32", "throughput": 4245.14, "total_tokens": 20417160} {"current_steps": 31315, "total_steps": 38160, "loss": 0.4378, "lr": 9.487943656918613e-05, "epoch": 16.412473794549268, "percentage": 82.06, "elapsed_time": "1:20:10", "remaining_time": "0:17:31", "throughput": 4245.19, "total_tokens": 20420520} {"current_steps": 31320, "total_steps": 38160, "loss": 0.4157, "lr": 9.474544701880805e-05, "epoch": 16.41509433962264, "percentage": 82.08, "elapsed_time": "1:20:10", "remaining_time": "0:17:30", "throughput": 4245.17, "total_tokens": 20423272} {"current_steps": 31325, "total_steps": 38160, "loss": 0.409, "lr": 9.461154224305923e-05, "epoch": 16.417714884696018, "percentage": 82.09, "elapsed_time": "1:20:11", "remaining_time": "0:17:29", "throughput": 4245.18, "total_tokens": 20426216} {"current_steps": 31330, "total_steps": 38160, "loss": 0.4478, "lr": 9.447772226995082e-05, "epoch": 16.42033542976939, "percentage": 82.1, "elapsed_time": "1:20:12", "remaining_time": "0:17:29", "throughput": 4245.21, "total_tokens": 20429512} {"current_steps": 31335, "total_steps": 38160, "loss": 0.4889, "lr": 9.434398712747639e-05, "epoch": 16.42295597484277, "percentage": 82.11, "elapsed_time": "1:20:13", "remaining_time": "0:17:28", "throughput": 4245.27, "total_tokens": 20433064} {"current_steps": 31340, "total_steps": 38160, "loss": 0.466, "lr": 9.421033684361185e-05, "epoch": 16.42557651991614, "percentage": 82.13, "elapsed_time": "1:20:13", "remaining_time": "0:17:27", "throughput": 4245.29, "total_tokens": 20436232} {"current_steps": 31345, "total_steps": 38160, "loss": 0.4761, "lr": 9.407677144631533e-05, "epoch": 16.42819706498952, "percentage": 82.14, "elapsed_time": "1:20:14", "remaining_time": "0:17:26", "throughput": 4245.35, "total_tokens": 20439688} {"current_steps": 31350, "total_steps": 38160, "loss": 0.6238, "lr": 9.394329096352732e-05, "epoch": 16.430817610062892, "percentage": 82.15, "elapsed_time": "1:20:15", "remaining_time": "0:17:26", "throughput": 4245.38, "total_tokens": 20442888} {"current_steps": 31355, "total_steps": 38160, "loss": 0.4736, "lr": 9.380989542317037e-05, "epoch": 16.43343815513627, "percentage": 82.17, "elapsed_time": "1:20:16", "remaining_time": "0:17:25", "throughput": 4245.4, "total_tokens": 20445928} {"current_steps": 31360, "total_steps": 38160, "loss": 0.352, "lr": 9.367658485314907e-05, "epoch": 16.436058700209642, "percentage": 82.18, "elapsed_time": "1:20:16", "remaining_time": "0:17:24", "throughput": 4245.37, "total_tokens": 20448552} {"current_steps": 31365, "total_steps": 38160, "loss": 0.4178, "lr": 9.354335928135066e-05, "epoch": 16.43867924528302, "percentage": 82.19, "elapsed_time": "1:20:17", "remaining_time": "0:17:23", "throughput": 4245.35, "total_tokens": 20451304} {"current_steps": 31370, "total_steps": 38160, "loss": 0.4535, "lr": 9.341021873564432e-05, "epoch": 16.441299790356393, "percentage": 82.21, "elapsed_time": "1:20:18", "remaining_time": "0:17:22", "throughput": 4245.38, "total_tokens": 20454408} {"current_steps": 31375, "total_steps": 38160, "loss": 0.381, "lr": 9.327716324388164e-05, "epoch": 16.44392033542977, "percentage": 82.22, "elapsed_time": "1:20:18", "remaining_time": "0:17:22", "throughput": 4245.39, "total_tokens": 20457384} {"current_steps": 31380, "total_steps": 38160, "loss": 0.3917, "lr": 9.314419283389641e-05, "epoch": 16.446540880503143, "percentage": 82.23, "elapsed_time": "1:20:19", "remaining_time": "0:17:21", "throughput": 4245.4, "total_tokens": 20460456} {"current_steps": 31385, "total_steps": 38160, "loss": 0.3997, "lr": 9.30113075335044e-05, "epoch": 16.44916142557652, "percentage": 82.25, "elapsed_time": "1:20:20", "remaining_time": "0:17:20", "throughput": 4245.4, "total_tokens": 20463336} {"current_steps": 31390, "total_steps": 38160, "loss": 0.4723, "lr": 9.287850737050352e-05, "epoch": 16.451781970649897, "percentage": 82.26, "elapsed_time": "1:20:20", "remaining_time": "0:17:19", "throughput": 4245.37, "total_tokens": 20465928} {"current_steps": 31395, "total_steps": 38160, "loss": 0.4146, "lr": 9.274579237267422e-05, "epoch": 16.45440251572327, "percentage": 82.27, "elapsed_time": "1:20:21", "remaining_time": "0:17:18", "throughput": 4245.34, "total_tokens": 20468584} {"current_steps": 31400, "total_steps": 38160, "loss": 0.4563, "lr": 9.261316256777897e-05, "epoch": 16.457023060796647, "percentage": 82.29, "elapsed_time": "1:20:22", "remaining_time": "0:17:18", "throughput": 4245.33, "total_tokens": 20471336} {"current_steps": 31405, "total_steps": 38160, "loss": 0.3636, "lr": 9.24806179835625e-05, "epoch": 16.45964360587002, "percentage": 82.3, "elapsed_time": "1:20:22", "remaining_time": "0:17:17", "throughput": 4245.38, "total_tokens": 20474696} {"current_steps": 31410, "total_steps": 38160, "loss": 0.4297, "lr": 9.234815864775137e-05, "epoch": 16.462264150943398, "percentage": 82.31, "elapsed_time": "1:20:23", "remaining_time": "0:17:16", "throughput": 4245.4, "total_tokens": 20477832} {"current_steps": 31415, "total_steps": 38160, "loss": 0.5195, "lr": 9.221578458805485e-05, "epoch": 16.46488469601677, "percentage": 82.32, "elapsed_time": "1:20:24", "remaining_time": "0:17:15", "throughput": 4245.44, "total_tokens": 20481160} {"current_steps": 31420, "total_steps": 38160, "loss": 0.4483, "lr": 9.208349583216385e-05, "epoch": 16.467505241090148, "percentage": 82.34, "elapsed_time": "1:20:25", "remaining_time": "0:17:15", "throughput": 4245.5, "total_tokens": 20484648} {"current_steps": 31425, "total_steps": 38160, "loss": 0.2617, "lr": 9.195129240775174e-05, "epoch": 16.47012578616352, "percentage": 82.35, "elapsed_time": "1:20:25", "remaining_time": "0:17:14", "throughput": 4245.42, "total_tokens": 20486696} {"current_steps": 31430, "total_steps": 38160, "loss": 0.4182, "lr": 9.181917434247417e-05, "epoch": 16.4727463312369, "percentage": 82.36, "elapsed_time": "1:20:26", "remaining_time": "0:17:13", "throughput": 4245.43, "total_tokens": 20489640} {"current_steps": 31435, "total_steps": 38160, "loss": 0.5267, "lr": 9.168714166396835e-05, "epoch": 16.47536687631027, "percentage": 82.38, "elapsed_time": "1:20:26", "remaining_time": "0:17:12", "throughput": 4245.42, "total_tokens": 20492392} {"current_steps": 31440, "total_steps": 38160, "loss": 0.3923, "lr": 9.155519439985438e-05, "epoch": 16.47798742138365, "percentage": 82.39, "elapsed_time": "1:20:27", "remaining_time": "0:17:11", "throughput": 4245.39, "total_tokens": 20494984} {"current_steps": 31445, "total_steps": 38160, "loss": 0.409, "lr": 9.142333257773383e-05, "epoch": 16.480607966457022, "percentage": 82.4, "elapsed_time": "1:20:28", "remaining_time": "0:17:11", "throughput": 4245.39, "total_tokens": 20497832} {"current_steps": 31450, "total_steps": 38160, "loss": 0.3543, "lr": 9.12915562251908e-05, "epoch": 16.4832285115304, "percentage": 82.42, "elapsed_time": "1:20:28", "remaining_time": "0:17:10", "throughput": 4245.36, "total_tokens": 20500488} {"current_steps": 31455, "total_steps": 38160, "loss": 0.4616, "lr": 9.115986536979149e-05, "epoch": 16.485849056603772, "percentage": 82.43, "elapsed_time": "1:20:29", "remaining_time": "0:17:09", "throughput": 4245.38, "total_tokens": 20503688} {"current_steps": 31460, "total_steps": 38160, "loss": 0.3292, "lr": 9.10282600390841e-05, "epoch": 16.48846960167715, "percentage": 82.44, "elapsed_time": "1:20:30", "remaining_time": "0:17:08", "throughput": 4245.5, "total_tokens": 20507816} {"current_steps": 31465, "total_steps": 38160, "loss": 0.5437, "lr": 9.08967402605988e-05, "epoch": 16.491090146750523, "percentage": 82.46, "elapsed_time": "1:20:31", "remaining_time": "0:17:07", "throughput": 4245.53, "total_tokens": 20510920} {"current_steps": 31470, "total_steps": 38160, "loss": 0.4037, "lr": 9.07653060618483e-05, "epoch": 16.4937106918239, "percentage": 82.47, "elapsed_time": "1:20:31", "remaining_time": "0:17:07", "throughput": 4245.58, "total_tokens": 20514408} {"current_steps": 31475, "total_steps": 38160, "loss": 0.3909, "lr": 9.063395747032676e-05, "epoch": 16.496331236897273, "percentage": 82.48, "elapsed_time": "1:20:32", "remaining_time": "0:17:06", "throughput": 4245.69, "total_tokens": 20518472} {"current_steps": 31480, "total_steps": 38160, "loss": 0.5352, "lr": 9.050269451351112e-05, "epoch": 16.49895178197065, "percentage": 82.49, "elapsed_time": "1:20:33", "remaining_time": "0:17:05", "throughput": 4245.67, "total_tokens": 20521064} {"current_steps": 31485, "total_steps": 38160, "loss": 0.4856, "lr": 9.037151721886006e-05, "epoch": 16.501572327044027, "percentage": 82.51, "elapsed_time": "1:20:34", "remaining_time": "0:17:04", "throughput": 4245.65, "total_tokens": 20523784} {"current_steps": 31490, "total_steps": 38160, "loss": 0.4598, "lr": 9.024042561381424e-05, "epoch": 16.5041928721174, "percentage": 82.52, "elapsed_time": "1:20:34", "remaining_time": "0:17:04", "throughput": 4245.77, "total_tokens": 20527976} {"current_steps": 31495, "total_steps": 38160, "loss": 0.5437, "lr": 9.010941972579656e-05, "epoch": 16.506813417190777, "percentage": 82.53, "elapsed_time": "1:20:35", "remaining_time": "0:17:03", "throughput": 4245.85, "total_tokens": 20531784} {"current_steps": 31500, "total_steps": 38160, "loss": 0.4616, "lr": 8.99784995822121e-05, "epoch": 16.50943396226415, "percentage": 82.55, "elapsed_time": "1:20:36", "remaining_time": "0:17:02", "throughput": 4245.89, "total_tokens": 20535048} {"current_steps": 31505, "total_steps": 38160, "loss": 0.5221, "lr": 8.984766521044769e-05, "epoch": 16.512054507337528, "percentage": 82.56, "elapsed_time": "1:20:37", "remaining_time": "0:17:01", "throughput": 4245.86, "total_tokens": 20537672} {"current_steps": 31510, "total_steps": 38160, "loss": 0.3371, "lr": 8.971691663787252e-05, "epoch": 16.5146750524109, "percentage": 82.57, "elapsed_time": "1:20:37", "remaining_time": "0:17:00", "throughput": 4245.84, "total_tokens": 20540264} {"current_steps": 31515, "total_steps": 38160, "loss": 0.3705, "lr": 8.958625389183756e-05, "epoch": 16.517295597484278, "percentage": 82.59, "elapsed_time": "1:20:38", "remaining_time": "0:17:00", "throughput": 4245.84, "total_tokens": 20543208} {"current_steps": 31520, "total_steps": 38160, "loss": 0.401, "lr": 8.9455676999676e-05, "epoch": 16.51991614255765, "percentage": 82.6, "elapsed_time": "1:20:39", "remaining_time": "0:16:59", "throughput": 4245.9, "total_tokens": 20546632} {"current_steps": 31525, "total_steps": 38160, "loss": 0.5345, "lr": 8.932518598870309e-05, "epoch": 16.52253668763103, "percentage": 82.61, "elapsed_time": "1:20:39", "remaining_time": "0:16:58", "throughput": 4245.88, "total_tokens": 20549256} {"current_steps": 31530, "total_steps": 38160, "loss": 0.5228, "lr": 8.919478088621614e-05, "epoch": 16.5251572327044, "percentage": 82.63, "elapsed_time": "1:20:40", "remaining_time": "0:16:57", "throughput": 4245.85, "total_tokens": 20551880} {"current_steps": 31535, "total_steps": 38160, "loss": 0.4004, "lr": 8.906446171949422e-05, "epoch": 16.52777777777778, "percentage": 82.64, "elapsed_time": "1:20:41", "remaining_time": "0:16:57", "throughput": 4245.91, "total_tokens": 20555368} {"current_steps": 31540, "total_steps": 38160, "loss": 0.3146, "lr": 8.893422851579885e-05, "epoch": 16.530398322851152, "percentage": 82.65, "elapsed_time": "1:20:41", "remaining_time": "0:16:56", "throughput": 4245.86, "total_tokens": 20557864} {"current_steps": 31545, "total_steps": 38160, "loss": 0.3762, "lr": 8.8804081302373e-05, "epoch": 16.53301886792453, "percentage": 82.67, "elapsed_time": "1:20:42", "remaining_time": "0:16:55", "throughput": 4245.97, "total_tokens": 20561800} {"current_steps": 31550, "total_steps": 38160, "loss": 0.3875, "lr": 8.867402010644221e-05, "epoch": 16.535639412997902, "percentage": 82.68, "elapsed_time": "1:20:43", "remaining_time": "0:16:54", "throughput": 4246.01, "total_tokens": 20565128} {"current_steps": 31555, "total_steps": 38160, "loss": 0.3315, "lr": 8.854404495521389e-05, "epoch": 16.53825995807128, "percentage": 82.69, "elapsed_time": "1:20:44", "remaining_time": "0:16:53", "throughput": 4246.07, "total_tokens": 20568648} {"current_steps": 31560, "total_steps": 38160, "loss": 0.3787, "lr": 8.841415587587709e-05, "epoch": 16.540880503144653, "percentage": 82.7, "elapsed_time": "1:20:44", "remaining_time": "0:16:53", "throughput": 4246.09, "total_tokens": 20571816} {"current_steps": 31565, "total_steps": 38160, "loss": 0.5082, "lr": 8.828435289560344e-05, "epoch": 16.54350104821803, "percentage": 82.72, "elapsed_time": "1:20:45", "remaining_time": "0:16:52", "throughput": 4246.24, "total_tokens": 20576136} {"current_steps": 31570, "total_steps": 38160, "loss": 0.4798, "lr": 8.815463604154588e-05, "epoch": 16.546121593291403, "percentage": 82.73, "elapsed_time": "1:20:46", "remaining_time": "0:16:51", "throughput": 4246.18, "total_tokens": 20578472} {"current_steps": 31575, "total_steps": 38160, "loss": 0.5097, "lr": 8.80250053408399e-05, "epoch": 16.54874213836478, "percentage": 82.74, "elapsed_time": "1:20:47", "remaining_time": "0:16:50", "throughput": 4246.22, "total_tokens": 20581800} {"current_steps": 31580, "total_steps": 38160, "loss": 0.6167, "lr": 8.789546082060273e-05, "epoch": 16.551362683438157, "percentage": 82.76, "elapsed_time": "1:20:47", "remaining_time": "0:16:50", "throughput": 4246.18, "total_tokens": 20584296} {"current_steps": 31585, "total_steps": 38160, "loss": 0.4248, "lr": 8.776600250793371e-05, "epoch": 16.55398322851153, "percentage": 82.77, "elapsed_time": "1:20:48", "remaining_time": "0:16:49", "throughput": 4246.2, "total_tokens": 20587368} {"current_steps": 31590, "total_steps": 38160, "loss": 0.4979, "lr": 8.763663042991399e-05, "epoch": 16.556603773584907, "percentage": 82.78, "elapsed_time": "1:20:49", "remaining_time": "0:16:48", "throughput": 4246.22, "total_tokens": 20590504} {"current_steps": 31595, "total_steps": 38160, "loss": 0.45, "lr": 8.75073446136066e-05, "epoch": 16.55922431865828, "percentage": 82.8, "elapsed_time": "1:20:49", "remaining_time": "0:16:47", "throughput": 4246.22, "total_tokens": 20593448} {"current_steps": 31600, "total_steps": 38160, "loss": 0.4419, "lr": 8.737814508605674e-05, "epoch": 16.561844863731658, "percentage": 82.81, "elapsed_time": "1:20:50", "remaining_time": "0:16:46", "throughput": 4246.27, "total_tokens": 20596904} {"current_steps": 31605, "total_steps": 38160, "loss": 0.421, "lr": 8.724903187429145e-05, "epoch": 16.56446540880503, "percentage": 82.82, "elapsed_time": "1:20:51", "remaining_time": "0:16:46", "throughput": 4246.3, "total_tokens": 20600040} {"current_steps": 31610, "total_steps": 38160, "loss": 0.4465, "lr": 8.71200050053198e-05, "epoch": 16.567085953878408, "percentage": 82.84, "elapsed_time": "1:20:52", "remaining_time": "0:16:45", "throughput": 4246.31, "total_tokens": 20603112} {"current_steps": 31615, "total_steps": 38160, "loss": 0.4255, "lr": 8.699106450613287e-05, "epoch": 16.56970649895178, "percentage": 82.85, "elapsed_time": "1:20:52", "remaining_time": "0:16:44", "throughput": 4246.38, "total_tokens": 20606760} {"current_steps": 31620, "total_steps": 38160, "loss": 0.4056, "lr": 8.686221040370334e-05, "epoch": 16.572327044025158, "percentage": 82.86, "elapsed_time": "1:20:53", "remaining_time": "0:16:43", "throughput": 4246.41, "total_tokens": 20609896} {"current_steps": 31625, "total_steps": 38160, "loss": 0.4617, "lr": 8.673344272498596e-05, "epoch": 16.57494758909853, "percentage": 82.87, "elapsed_time": "1:20:54", "remaining_time": "0:16:43", "throughput": 4246.4, "total_tokens": 20612712} {"current_steps": 31630, "total_steps": 38160, "loss": 0.6805, "lr": 8.660476149691759e-05, "epoch": 16.57756813417191, "percentage": 82.89, "elapsed_time": "1:20:54", "remaining_time": "0:16:42", "throughput": 4246.48, "total_tokens": 20616488} {"current_steps": 31635, "total_steps": 38160, "loss": 0.5352, "lr": 8.647616674641684e-05, "epoch": 16.580188679245282, "percentage": 82.9, "elapsed_time": "1:20:55", "remaining_time": "0:16:41", "throughput": 4246.52, "total_tokens": 20619944} {"current_steps": 31640, "total_steps": 38160, "loss": 0.4306, "lr": 8.63476585003844e-05, "epoch": 16.58280922431866, "percentage": 82.91, "elapsed_time": "1:20:56", "remaining_time": "0:16:40", "throughput": 4246.53, "total_tokens": 20622952} {"current_steps": 31645, "total_steps": 38160, "loss": 0.335, "lr": 8.621923678570259e-05, "epoch": 16.585429769392032, "percentage": 82.93, "elapsed_time": "1:20:57", "remaining_time": "0:16:39", "throughput": 4246.57, "total_tokens": 20626248} {"current_steps": 31650, "total_steps": 38160, "loss": 0.3216, "lr": 8.609090162923567e-05, "epoch": 16.58805031446541, "percentage": 82.94, "elapsed_time": "1:20:57", "remaining_time": "0:16:39", "throughput": 4246.66, "total_tokens": 20630088} {"current_steps": 31655, "total_steps": 38160, "loss": 0.4351, "lr": 8.596265305783002e-05, "epoch": 16.590670859538783, "percentage": 82.95, "elapsed_time": "1:20:58", "remaining_time": "0:16:38", "throughput": 4246.65, "total_tokens": 20632840} {"current_steps": 31660, "total_steps": 38160, "loss": 0.4244, "lr": 8.583449109831375e-05, "epoch": 16.59329140461216, "percentage": 82.97, "elapsed_time": "1:20:59", "remaining_time": "0:16:37", "throughput": 4246.64, "total_tokens": 20635720} {"current_steps": 31665, "total_steps": 38160, "loss": 0.3579, "lr": 8.570641577749705e-05, "epoch": 16.595911949685533, "percentage": 82.98, "elapsed_time": "1:21:00", "remaining_time": "0:16:36", "throughput": 4246.72, "total_tokens": 20639400} {"current_steps": 31670, "total_steps": 38160, "loss": 0.4073, "lr": 8.557842712217162e-05, "epoch": 16.59853249475891, "percentage": 82.99, "elapsed_time": "1:21:00", "remaining_time": "0:16:36", "throughput": 4246.84, "total_tokens": 20643656} {"current_steps": 31675, "total_steps": 38160, "loss": 0.3979, "lr": 8.545052515911112e-05, "epoch": 16.601153039832283, "percentage": 83.01, "elapsed_time": "1:21:01", "remaining_time": "0:16:35", "throughput": 4246.82, "total_tokens": 20646504} {"current_steps": 31680, "total_steps": 38160, "loss": 0.5047, "lr": 8.532270991507136e-05, "epoch": 16.60377358490566, "percentage": 83.02, "elapsed_time": "1:21:02", "remaining_time": "0:16:34", "throughput": 4246.9, "total_tokens": 20650120} {"current_steps": 31685, "total_steps": 38160, "loss": 0.3785, "lr": 8.519498141678983e-05, "epoch": 16.606394129979037, "percentage": 83.03, "elapsed_time": "1:21:03", "remaining_time": "0:16:33", "throughput": 4246.91, "total_tokens": 20653064} {"current_steps": 31690, "total_steps": 38160, "loss": 0.4029, "lr": 8.506733969098579e-05, "epoch": 16.60901467505241, "percentage": 83.05, "elapsed_time": "1:21:03", "remaining_time": "0:16:33", "throughput": 4247.02, "total_tokens": 20657160} {"current_steps": 31695, "total_steps": 38160, "loss": 0.3342, "lr": 8.49397847643606e-05, "epoch": 16.611635220125788, "percentage": 83.06, "elapsed_time": "1:21:04", "remaining_time": "0:16:32", "throughput": 4247.01, "total_tokens": 20659912} {"current_steps": 31700, "total_steps": 38160, "loss": 0.3204, "lr": 8.481231666359723e-05, "epoch": 16.61425576519916, "percentage": 83.07, "elapsed_time": "1:21:05", "remaining_time": "0:16:31", "throughput": 4246.97, "total_tokens": 20662312} {"current_steps": 31705, "total_steps": 38160, "loss": 0.4215, "lr": 8.468493541536031e-05, "epoch": 16.616876310272538, "percentage": 83.08, "elapsed_time": "1:21:06", "remaining_time": "0:16:30", "throughput": 4247.07, "total_tokens": 20666248} {"current_steps": 31710, "total_steps": 38160, "loss": 0.4125, "lr": 8.455764104629681e-05, "epoch": 16.61949685534591, "percentage": 83.1, "elapsed_time": "1:21:06", "remaining_time": "0:16:29", "throughput": 4247.23, "total_tokens": 20670888} {"current_steps": 31715, "total_steps": 38160, "loss": 0.4029, "lr": 8.443043358303515e-05, "epoch": 16.622117400419288, "percentage": 83.11, "elapsed_time": "1:21:07", "remaining_time": "0:16:29", "throughput": 4247.19, "total_tokens": 20673320} {"current_steps": 31720, "total_steps": 38160, "loss": 0.3218, "lr": 8.430331305218585e-05, "epoch": 16.62473794549266, "percentage": 83.12, "elapsed_time": "1:21:08", "remaining_time": "0:16:28", "throughput": 4247.22, "total_tokens": 20676552} {"current_steps": 31725, "total_steps": 38160, "loss": 0.4071, "lr": 8.417627948034096e-05, "epoch": 16.62735849056604, "percentage": 83.14, "elapsed_time": "1:21:08", "remaining_time": "0:16:27", "throughput": 4247.16, "total_tokens": 20678792} {"current_steps": 31730, "total_steps": 38160, "loss": 0.3573, "lr": 8.404933289407424e-05, "epoch": 16.629979035639412, "percentage": 83.15, "elapsed_time": "1:21:09", "remaining_time": "0:16:26", "throughput": 4247.3, "total_tokens": 20683240} {"current_steps": 31735, "total_steps": 38160, "loss": 0.514, "lr": 8.392247331994174e-05, "epoch": 16.63259958071279, "percentage": 83.16, "elapsed_time": "1:21:10", "remaining_time": "0:16:26", "throughput": 4247.34, "total_tokens": 20686536} {"current_steps": 31740, "total_steps": 38160, "loss": 0.4604, "lr": 8.37957007844809e-05, "epoch": 16.635220125786162, "percentage": 83.18, "elapsed_time": "1:21:11", "remaining_time": "0:16:25", "throughput": 4247.37, "total_tokens": 20689832} {"current_steps": 31745, "total_steps": 38160, "loss": 0.492, "lr": 8.366901531421134e-05, "epoch": 16.63784067085954, "percentage": 83.19, "elapsed_time": "1:21:11", "remaining_time": "0:16:24", "throughput": 4247.36, "total_tokens": 20692648} {"current_steps": 31750, "total_steps": 38160, "loss": 0.4656, "lr": 8.354241693563385e-05, "epoch": 16.640461215932913, "percentage": 83.2, "elapsed_time": "1:21:12", "remaining_time": "0:16:23", "throughput": 4247.31, "total_tokens": 20695048} {"current_steps": 31755, "total_steps": 38160, "loss": 0.3932, "lr": 8.341590567523166e-05, "epoch": 16.64308176100629, "percentage": 83.22, "elapsed_time": "1:21:13", "remaining_time": "0:16:22", "throughput": 4247.35, "total_tokens": 20698216} {"current_steps": 31760, "total_steps": 38160, "loss": 0.4787, "lr": 8.328948155946924e-05, "epoch": 16.645702306079663, "percentage": 83.23, "elapsed_time": "1:21:14", "remaining_time": "0:16:22", "throughput": 4247.43, "total_tokens": 20702024} {"current_steps": 31765, "total_steps": 38160, "loss": 0.3199, "lr": 8.316314461479318e-05, "epoch": 16.64832285115304, "percentage": 83.24, "elapsed_time": "1:21:14", "remaining_time": "0:16:21", "throughput": 4247.44, "total_tokens": 20705032} {"current_steps": 31770, "total_steps": 38160, "loss": 0.3523, "lr": 8.303689486763177e-05, "epoch": 16.650943396226417, "percentage": 83.25, "elapsed_time": "1:21:15", "remaining_time": "0:16:20", "throughput": 4247.45, "total_tokens": 20708072} {"current_steps": 31775, "total_steps": 38160, "loss": 0.4122, "lr": 8.291073234439512e-05, "epoch": 16.65356394129979, "percentage": 83.27, "elapsed_time": "1:21:16", "remaining_time": "0:16:19", "throughput": 4247.49, "total_tokens": 20711432} {"current_steps": 31780, "total_steps": 38160, "loss": 0.5054, "lr": 8.27846570714747e-05, "epoch": 16.656184486373167, "percentage": 83.28, "elapsed_time": "1:21:16", "remaining_time": "0:16:19", "throughput": 4247.57, "total_tokens": 20715112} {"current_steps": 31785, "total_steps": 38160, "loss": 0.4, "lr": 8.265866907524427e-05, "epoch": 16.65880503144654, "percentage": 83.29, "elapsed_time": "1:21:17", "remaining_time": "0:16:18", "throughput": 4247.57, "total_tokens": 20718024} {"current_steps": 31790, "total_steps": 38160, "loss": 0.3858, "lr": 8.253276838205892e-05, "epoch": 16.661425576519918, "percentage": 83.31, "elapsed_time": "1:21:18", "remaining_time": "0:16:17", "throughput": 4247.6, "total_tokens": 20721192} {"current_steps": 31795, "total_steps": 38160, "loss": 0.3292, "lr": 8.240695501825568e-05, "epoch": 16.66404612159329, "percentage": 83.32, "elapsed_time": "1:21:18", "remaining_time": "0:16:16", "throughput": 4247.55, "total_tokens": 20723656} {"current_steps": 31800, "total_steps": 38160, "loss": 0.3287, "lr": 8.228122901015345e-05, "epoch": 16.666666666666668, "percentage": 83.33, "elapsed_time": "1:21:19", "remaining_time": "0:16:15", "throughput": 4247.51, "total_tokens": 20726088} {"current_steps": 31805, "total_steps": 38160, "loss": 0.3251, "lr": 8.21555903840524e-05, "epoch": 16.66928721174004, "percentage": 83.35, "elapsed_time": "1:21:20", "remaining_time": "0:16:15", "throughput": 4247.5, "total_tokens": 20728840} {"current_steps": 31810, "total_steps": 38160, "loss": 0.2877, "lr": 8.203003916623491e-05, "epoch": 16.671907756813418, "percentage": 83.36, "elapsed_time": "1:21:21", "remaining_time": "0:16:14", "throughput": 4247.58, "total_tokens": 20732424} {"current_steps": 31815, "total_steps": 38160, "loss": 0.32, "lr": 8.190457538296464e-05, "epoch": 16.67452830188679, "percentage": 83.37, "elapsed_time": "1:21:22", "remaining_time": "0:16:13", "throughput": 4247.85, "total_tokens": 20738184} {"current_steps": 31820, "total_steps": 38160, "loss": 0.3413, "lr": 8.177919906048736e-05, "epoch": 16.67714884696017, "percentage": 83.39, "elapsed_time": "1:21:23", "remaining_time": "0:16:12", "throughput": 4248.06, "total_tokens": 20743464} {"current_steps": 31825, "total_steps": 38160, "loss": 0.3967, "lr": 8.165391022503044e-05, "epoch": 16.679769392033542, "percentage": 83.4, "elapsed_time": "1:21:23", "remaining_time": "0:16:12", "throughput": 4248.08, "total_tokens": 20746536} {"current_steps": 31830, "total_steps": 38160, "loss": 0.4931, "lr": 8.152870890280261e-05, "epoch": 16.68238993710692, "percentage": 83.41, "elapsed_time": "1:21:24", "remaining_time": "0:16:11", "throughput": 4248.12, "total_tokens": 20749896} {"current_steps": 31835, "total_steps": 38160, "loss": 0.3837, "lr": 8.140359511999473e-05, "epoch": 16.685010482180292, "percentage": 83.43, "elapsed_time": "1:21:25", "remaining_time": "0:16:10", "throughput": 4248.19, "total_tokens": 20753448} {"current_steps": 31840, "total_steps": 38160, "loss": 0.4779, "lr": 8.127856890277923e-05, "epoch": 16.68763102725367, "percentage": 83.44, "elapsed_time": "1:21:26", "remaining_time": "0:16:09", "throughput": 4248.25, "total_tokens": 20757032} {"current_steps": 31845, "total_steps": 38160, "loss": 0.3452, "lr": 8.115363027730998e-05, "epoch": 16.690251572327043, "percentage": 83.45, "elapsed_time": "1:21:26", "remaining_time": "0:16:09", "throughput": 4248.28, "total_tokens": 20760136} {"current_steps": 31850, "total_steps": 38160, "loss": 0.4662, "lr": 8.102877926972286e-05, "epoch": 16.69287211740042, "percentage": 83.46, "elapsed_time": "1:21:27", "remaining_time": "0:16:08", "throughput": 4248.29, "total_tokens": 20763144} {"current_steps": 31855, "total_steps": 38160, "loss": 0.4614, "lr": 8.090401590613533e-05, "epoch": 16.695492662473793, "percentage": 83.48, "elapsed_time": "1:21:28", "remaining_time": "0:16:07", "throughput": 4248.32, "total_tokens": 20766248} {"current_steps": 31860, "total_steps": 38160, "loss": 0.4834, "lr": 8.077934021264627e-05, "epoch": 16.69811320754717, "percentage": 83.49, "elapsed_time": "1:21:28", "remaining_time": "0:16:06", "throughput": 4248.32, "total_tokens": 20769160} {"current_steps": 31865, "total_steps": 38160, "loss": 0.3697, "lr": 8.065475221533652e-05, "epoch": 16.700733752620543, "percentage": 83.5, "elapsed_time": "1:21:29", "remaining_time": "0:16:05", "throughput": 4248.45, "total_tokens": 20773384} {"current_steps": 31870, "total_steps": 38160, "loss": 0.5252, "lr": 8.053025194026858e-05, "epoch": 16.70335429769392, "percentage": 83.52, "elapsed_time": "1:21:30", "remaining_time": "0:16:05", "throughput": 4248.56, "total_tokens": 20777416} {"current_steps": 31875, "total_steps": 38160, "loss": 0.4834, "lr": 8.040583941348623e-05, "epoch": 16.705974842767297, "percentage": 83.53, "elapsed_time": "1:21:31", "remaining_time": "0:16:04", "throughput": 4248.61, "total_tokens": 20780808} {"current_steps": 31880, "total_steps": 38160, "loss": 0.2852, "lr": 8.028151466101541e-05, "epoch": 16.70859538784067, "percentage": 83.54, "elapsed_time": "1:21:31", "remaining_time": "0:16:03", "throughput": 4248.63, "total_tokens": 20784040} {"current_steps": 31885, "total_steps": 38160, "loss": 0.4147, "lr": 8.015727770886321e-05, "epoch": 16.711215932914047, "percentage": 83.56, "elapsed_time": "1:21:32", "remaining_time": "0:16:02", "throughput": 4248.64, "total_tokens": 20787144} {"current_steps": 31890, "total_steps": 38160, "loss": 0.4174, "lr": 8.00331285830187e-05, "epoch": 16.71383647798742, "percentage": 83.57, "elapsed_time": "1:21:33", "remaining_time": "0:16:02", "throughput": 4248.68, "total_tokens": 20790408} {"current_steps": 31895, "total_steps": 38160, "loss": 0.4499, "lr": 7.990906730945247e-05, "epoch": 16.716457023060798, "percentage": 83.58, "elapsed_time": "1:21:34", "remaining_time": "0:16:01", "throughput": 4248.73, "total_tokens": 20793768} {"current_steps": 31900, "total_steps": 38160, "loss": 0.3787, "lr": 7.978509391411681e-05, "epoch": 16.71907756813417, "percentage": 83.6, "elapsed_time": "1:21:35", "remaining_time": "0:16:00", "throughput": 4248.97, "total_tokens": 20799624} {"current_steps": 31905, "total_steps": 38160, "loss": 0.4669, "lr": 7.966120842294544e-05, "epoch": 16.721698113207548, "percentage": 83.61, "elapsed_time": "1:21:35", "remaining_time": "0:15:59", "throughput": 4248.94, "total_tokens": 20802152} {"current_steps": 31910, "total_steps": 38160, "loss": 0.4239, "lr": 7.953741086185368e-05, "epoch": 16.72431865828092, "percentage": 83.62, "elapsed_time": "1:21:36", "remaining_time": "0:15:59", "throughput": 4248.92, "total_tokens": 20804776} {"current_steps": 31915, "total_steps": 38160, "loss": 0.4564, "lr": 7.941370125673864e-05, "epoch": 16.7269392033543, "percentage": 83.63, "elapsed_time": "1:21:37", "remaining_time": "0:15:58", "throughput": 4248.94, "total_tokens": 20807880} {"current_steps": 31920, "total_steps": 38160, "loss": 0.4212, "lr": 7.9290079633479e-05, "epoch": 16.729559748427672, "percentage": 83.65, "elapsed_time": "1:21:37", "remaining_time": "0:15:57", "throughput": 4248.92, "total_tokens": 20810568} {"current_steps": 31925, "total_steps": 38160, "loss": 0.4194, "lr": 7.916654601793516e-05, "epoch": 16.73218029350105, "percentage": 83.66, "elapsed_time": "1:21:38", "remaining_time": "0:15:56", "throughput": 4249.09, "total_tokens": 20815368} {"current_steps": 31930, "total_steps": 38160, "loss": 0.5207, "lr": 7.904310043594859e-05, "epoch": 16.734800838574422, "percentage": 83.67, "elapsed_time": "1:21:39", "remaining_time": "0:15:55", "throughput": 4249.1, "total_tokens": 20818472} {"current_steps": 31935, "total_steps": 38160, "loss": 0.4371, "lr": 7.891974291334303e-05, "epoch": 16.7374213836478, "percentage": 83.69, "elapsed_time": "1:21:40", "remaining_time": "0:15:55", "throughput": 4249.18, "total_tokens": 20822120} {"current_steps": 31940, "total_steps": 38160, "loss": 0.4202, "lr": 7.879647347592322e-05, "epoch": 16.740041928721173, "percentage": 83.7, "elapsed_time": "1:21:40", "remaining_time": "0:15:54", "throughput": 4249.19, "total_tokens": 20825160} {"current_steps": 31945, "total_steps": 38160, "loss": 0.6133, "lr": 7.867329214947578e-05, "epoch": 16.74266247379455, "percentage": 83.71, "elapsed_time": "1:21:41", "remaining_time": "0:15:53", "throughput": 4249.37, "total_tokens": 20830056} {"current_steps": 31950, "total_steps": 38160, "loss": 0.4937, "lr": 7.855019895976889e-05, "epoch": 16.745283018867923, "percentage": 83.73, "elapsed_time": "1:21:42", "remaining_time": "0:15:52", "throughput": 4249.38, "total_tokens": 20833032} {"current_steps": 31955, "total_steps": 38160, "loss": 0.4166, "lr": 7.842719393255232e-05, "epoch": 16.7479035639413, "percentage": 83.74, "elapsed_time": "1:21:43", "remaining_time": "0:15:52", "throughput": 4249.39, "total_tokens": 20836200} {"current_steps": 31960, "total_steps": 38160, "loss": 0.4358, "lr": 7.830427709355725e-05, "epoch": 16.750524109014677, "percentage": 83.75, "elapsed_time": "1:21:44", "remaining_time": "0:15:51", "throughput": 4249.46, "total_tokens": 20839784} {"current_steps": 31965, "total_steps": 38160, "loss": 0.3612, "lr": 7.818144846849634e-05, "epoch": 16.75314465408805, "percentage": 83.77, "elapsed_time": "1:21:44", "remaining_time": "0:15:50", "throughput": 4249.49, "total_tokens": 20842952} {"current_steps": 31970, "total_steps": 38160, "loss": 0.4599, "lr": 7.805870808306403e-05, "epoch": 16.755765199161427, "percentage": 83.78, "elapsed_time": "1:21:45", "remaining_time": "0:15:49", "throughput": 4249.53, "total_tokens": 20846344} {"current_steps": 31975, "total_steps": 38160, "loss": 0.3897, "lr": 7.793605596293618e-05, "epoch": 16.7583857442348, "percentage": 83.79, "elapsed_time": "1:21:46", "remaining_time": "0:15:49", "throughput": 4249.56, "total_tokens": 20849512} {"current_steps": 31980, "total_steps": 38160, "loss": 0.5701, "lr": 7.781349213377048e-05, "epoch": 16.761006289308177, "percentage": 83.81, "elapsed_time": "1:21:47", "remaining_time": "0:15:48", "throughput": 4249.59, "total_tokens": 20852744} {"current_steps": 31985, "total_steps": 38160, "loss": 0.4866, "lr": 7.769101662120559e-05, "epoch": 16.76362683438155, "percentage": 83.82, "elapsed_time": "1:21:47", "remaining_time": "0:15:47", "throughput": 4249.67, "total_tokens": 20856392} {"current_steps": 31990, "total_steps": 38160, "loss": 0.4396, "lr": 7.756862945086196e-05, "epoch": 16.766247379454928, "percentage": 83.83, "elapsed_time": "1:21:48", "remaining_time": "0:15:46", "throughput": 4249.65, "total_tokens": 20859048} {"current_steps": 31995, "total_steps": 38160, "loss": 0.4158, "lr": 7.744633064834172e-05, "epoch": 16.7688679245283, "percentage": 83.84, "elapsed_time": "1:21:49", "remaining_time": "0:15:45", "throughput": 4249.65, "total_tokens": 20861992} {"current_steps": 32000, "total_steps": 38160, "loss": 0.4378, "lr": 7.732412023922836e-05, "epoch": 16.771488469601678, "percentage": 83.86, "elapsed_time": "1:21:49", "remaining_time": "0:15:45", "throughput": 4249.66, "total_tokens": 20864904} {"current_steps": 32005, "total_steps": 38160, "loss": 0.4499, "lr": 7.720199824908692e-05, "epoch": 16.77410901467505, "percentage": 83.87, "elapsed_time": "1:21:50", "remaining_time": "0:15:44", "throughput": 4249.67, "total_tokens": 20867976} {"current_steps": 32010, "total_steps": 38160, "loss": 0.4257, "lr": 7.707996470346402e-05, "epoch": 16.77672955974843, "percentage": 83.88, "elapsed_time": "1:21:51", "remaining_time": "0:15:43", "throughput": 4249.72, "total_tokens": 20871464} {"current_steps": 32015, "total_steps": 38160, "loss": 0.4788, "lr": 7.695801962788756e-05, "epoch": 16.779350104821802, "percentage": 83.9, "elapsed_time": "1:21:52", "remaining_time": "0:15:42", "throughput": 4249.78, "total_tokens": 20874984} {"current_steps": 32020, "total_steps": 38160, "loss": 0.3319, "lr": 7.683616304786695e-05, "epoch": 16.78197064989518, "percentage": 83.91, "elapsed_time": "1:21:52", "remaining_time": "0:15:42", "throughput": 4249.77, "total_tokens": 20877832} {"current_steps": 32025, "total_steps": 38160, "loss": 0.5321, "lr": 7.671439498889332e-05, "epoch": 16.784591194968552, "percentage": 83.92, "elapsed_time": "1:21:53", "remaining_time": "0:15:41", "throughput": 4249.81, "total_tokens": 20881096} {"current_steps": 32030, "total_steps": 38160, "loss": 0.4571, "lr": 7.65927154764392e-05, "epoch": 16.78721174004193, "percentage": 83.94, "elapsed_time": "1:21:54", "remaining_time": "0:15:40", "throughput": 4249.88, "total_tokens": 20884680} {"current_steps": 32035, "total_steps": 38160, "loss": 0.5452, "lr": 7.647112453595862e-05, "epoch": 16.789832285115303, "percentage": 83.95, "elapsed_time": "1:21:54", "remaining_time": "0:15:39", "throughput": 4249.92, "total_tokens": 20888008} {"current_steps": 32040, "total_steps": 38160, "loss": 0.3803, "lr": 7.634962219288688e-05, "epoch": 16.79245283018868, "percentage": 83.96, "elapsed_time": "1:21:55", "remaining_time": "0:15:38", "throughput": 4249.95, "total_tokens": 20891240} {"current_steps": 32045, "total_steps": 38160, "loss": 0.333, "lr": 7.622820847264083e-05, "epoch": 16.795073375262053, "percentage": 83.98, "elapsed_time": "1:21:56", "remaining_time": "0:15:38", "throughput": 4250.0, "total_tokens": 20894664} {"current_steps": 32050, "total_steps": 38160, "loss": 0.4919, "lr": 7.610688340061894e-05, "epoch": 16.79769392033543, "percentage": 83.99, "elapsed_time": "1:21:57", "remaining_time": "0:15:37", "throughput": 4250.01, "total_tokens": 20897608} {"current_steps": 32055, "total_steps": 38160, "loss": 0.4242, "lr": 7.598564700220101e-05, "epoch": 16.800314465408803, "percentage": 84.0, "elapsed_time": "1:21:57", "remaining_time": "0:15:36", "throughput": 4250.06, "total_tokens": 20901096} {"current_steps": 32060, "total_steps": 38160, "loss": 0.3958, "lr": 7.586449930274842e-05, "epoch": 16.80293501048218, "percentage": 84.01, "elapsed_time": "1:21:58", "remaining_time": "0:15:35", "throughput": 4250.12, "total_tokens": 20904520} {"current_steps": 32065, "total_steps": 38160, "loss": 0.3797, "lr": 7.574344032760367e-05, "epoch": 16.805555555555557, "percentage": 84.03, "elapsed_time": "1:21:59", "remaining_time": "0:15:35", "throughput": 4250.14, "total_tokens": 20907592} {"current_steps": 32070, "total_steps": 38160, "loss": 0.3992, "lr": 7.562247010209111e-05, "epoch": 16.80817610062893, "percentage": 84.04, "elapsed_time": "1:22:00", "remaining_time": "0:15:34", "throughput": 4250.26, "total_tokens": 20911752} {"current_steps": 32075, "total_steps": 38160, "loss": 0.4492, "lr": 7.550158865151618e-05, "epoch": 16.810796645702307, "percentage": 84.05, "elapsed_time": "1:22:00", "remaining_time": "0:15:33", "throughput": 4250.26, "total_tokens": 20914728} {"current_steps": 32080, "total_steps": 38160, "loss": 0.4088, "lr": 7.538079600116593e-05, "epoch": 16.81341719077568, "percentage": 84.07, "elapsed_time": "1:22:01", "remaining_time": "0:15:32", "throughput": 4250.28, "total_tokens": 20917704} {"current_steps": 32085, "total_steps": 38160, "loss": 0.4396, "lr": 7.526009217630886e-05, "epoch": 16.816037735849058, "percentage": 84.08, "elapsed_time": "1:22:02", "remaining_time": "0:15:31", "throughput": 4250.29, "total_tokens": 20920808} {"current_steps": 32090, "total_steps": 38160, "loss": 0.4045, "lr": 7.513947720219494e-05, "epoch": 16.81865828092243, "percentage": 84.09, "elapsed_time": "1:22:02", "remaining_time": "0:15:31", "throughput": 4250.28, "total_tokens": 20923528} {"current_steps": 32095, "total_steps": 38160, "loss": 0.3851, "lr": 7.501895110405533e-05, "epoch": 16.821278825995808, "percentage": 84.11, "elapsed_time": "1:22:03", "remaining_time": "0:15:30", "throughput": 4250.28, "total_tokens": 20926376} {"current_steps": 32100, "total_steps": 38160, "loss": 0.3906, "lr": 7.489851390710262e-05, "epoch": 16.82389937106918, "percentage": 84.12, "elapsed_time": "1:22:04", "remaining_time": "0:15:29", "throughput": 4250.31, "total_tokens": 20929672} {"current_steps": 32105, "total_steps": 38160, "loss": 0.4695, "lr": 7.477816563653095e-05, "epoch": 16.82651991614256, "percentage": 84.13, "elapsed_time": "1:22:04", "remaining_time": "0:15:28", "throughput": 4250.32, "total_tokens": 20932616} {"current_steps": 32110, "total_steps": 38160, "loss": 0.3254, "lr": 7.465790631751584e-05, "epoch": 16.829140461215932, "percentage": 84.15, "elapsed_time": "1:22:05", "remaining_time": "0:15:28", "throughput": 4250.31, "total_tokens": 20935400} {"current_steps": 32115, "total_steps": 38160, "loss": 0.358, "lr": 7.453773597521429e-05, "epoch": 16.83176100628931, "percentage": 84.16, "elapsed_time": "1:22:06", "remaining_time": "0:15:27", "throughput": 4250.35, "total_tokens": 20938824} {"current_steps": 32120, "total_steps": 38160, "loss": 0.5666, "lr": 7.44176546347643e-05, "epoch": 16.834381551362682, "percentage": 84.17, "elapsed_time": "1:22:07", "remaining_time": "0:15:26", "throughput": 4250.38, "total_tokens": 20941960} {"current_steps": 32125, "total_steps": 38160, "loss": 0.3979, "lr": 7.429766232128583e-05, "epoch": 16.83700209643606, "percentage": 84.19, "elapsed_time": "1:22:08", "remaining_time": "0:15:25", "throughput": 4250.69, "total_tokens": 20948712} {"current_steps": 32130, "total_steps": 38160, "loss": 0.4714, "lr": 7.417775905987956e-05, "epoch": 16.839622641509433, "percentage": 84.2, "elapsed_time": "1:22:08", "remaining_time": "0:15:25", "throughput": 4250.69, "total_tokens": 20951592} {"current_steps": 32135, "total_steps": 38160, "loss": 0.5156, "lr": 7.405794487562811e-05, "epoch": 16.84224318658281, "percentage": 84.21, "elapsed_time": "1:22:09", "remaining_time": "0:15:24", "throughput": 4250.82, "total_tokens": 20955880} {"current_steps": 32140, "total_steps": 38160, "loss": 0.401, "lr": 7.393821979359528e-05, "epoch": 16.844863731656183, "percentage": 84.22, "elapsed_time": "1:22:10", "remaining_time": "0:15:23", "throughput": 4250.85, "total_tokens": 20959112} {"current_steps": 32145, "total_steps": 38160, "loss": 0.2918, "lr": 7.3818583838826e-05, "epoch": 16.84748427672956, "percentage": 84.24, "elapsed_time": "1:22:11", "remaining_time": "0:15:22", "throughput": 4250.85, "total_tokens": 20961992} {"current_steps": 32150, "total_steps": 38160, "loss": 0.3319, "lr": 7.369903703634684e-05, "epoch": 16.850104821802937, "percentage": 84.25, "elapsed_time": "1:22:11", "remaining_time": "0:15:21", "throughput": 4250.83, "total_tokens": 20964776} {"current_steps": 32155, "total_steps": 38160, "loss": 0.4395, "lr": 7.357957941116572e-05, "epoch": 16.85272536687631, "percentage": 84.26, "elapsed_time": "1:22:12", "remaining_time": "0:15:21", "throughput": 4250.85, "total_tokens": 20967944} {"current_steps": 32160, "total_steps": 38160, "loss": 0.4465, "lr": 7.346021098827166e-05, "epoch": 16.855345911949687, "percentage": 84.28, "elapsed_time": "1:22:13", "remaining_time": "0:15:20", "throughput": 4250.95, "total_tokens": 20971976} {"current_steps": 32165, "total_steps": 38160, "loss": 0.391, "lr": 7.334093179263518e-05, "epoch": 16.85796645702306, "percentage": 84.29, "elapsed_time": "1:22:14", "remaining_time": "0:15:19", "throughput": 4250.98, "total_tokens": 20975208} {"current_steps": 32170, "total_steps": 38160, "loss": 0.4364, "lr": 7.322174184920837e-05, "epoch": 16.860587002096437, "percentage": 84.3, "elapsed_time": "1:22:14", "remaining_time": "0:15:18", "throughput": 4250.94, "total_tokens": 20977736} {"current_steps": 32175, "total_steps": 38160, "loss": 0.4207, "lr": 7.310264118292404e-05, "epoch": 16.86320754716981, "percentage": 84.32, "elapsed_time": "1:22:15", "remaining_time": "0:15:18", "throughput": 4251.05, "total_tokens": 20981704} {"current_steps": 32180, "total_steps": 38160, "loss": 0.5, "lr": 7.298362981869705e-05, "epoch": 16.865828092243188, "percentage": 84.33, "elapsed_time": "1:22:16", "remaining_time": "0:15:17", "throughput": 4251.17, "total_tokens": 20985992} {"current_steps": 32185, "total_steps": 38160, "loss": 0.5073, "lr": 7.286470778142284e-05, "epoch": 16.86844863731656, "percentage": 84.34, "elapsed_time": "1:22:17", "remaining_time": "0:15:16", "throughput": 4251.23, "total_tokens": 20989544} {"current_steps": 32190, "total_steps": 38160, "loss": 0.4781, "lr": 7.274587509597886e-05, "epoch": 16.871069182389938, "percentage": 84.36, "elapsed_time": "1:22:18", "remaining_time": "0:15:15", "throughput": 4251.56, "total_tokens": 20996392} {"current_steps": 32195, "total_steps": 38160, "loss": 0.4355, "lr": 7.262713178722346e-05, "epoch": 16.87368972746331, "percentage": 84.37, "elapsed_time": "1:22:19", "remaining_time": "0:15:15", "throughput": 4251.57, "total_tokens": 20999400} {"current_steps": 32200, "total_steps": 38160, "loss": 0.3671, "lr": 7.250847787999625e-05, "epoch": 16.87631027253669, "percentage": 84.38, "elapsed_time": "1:22:19", "remaining_time": "0:15:14", "throughput": 4251.52, "total_tokens": 21001704} {"current_steps": 32205, "total_steps": 38160, "loss": 0.4802, "lr": 7.238991339911844e-05, "epoch": 16.878930817610062, "percentage": 84.39, "elapsed_time": "1:22:20", "remaining_time": "0:15:13", "throughput": 4251.54, "total_tokens": 21004872} {"current_steps": 32210, "total_steps": 38160, "loss": 0.4991, "lr": 7.227143836939237e-05, "epoch": 16.88155136268344, "percentage": 84.41, "elapsed_time": "1:22:21", "remaining_time": "0:15:12", "throughput": 4251.85, "total_tokens": 21011656} {"current_steps": 32215, "total_steps": 38160, "loss": 0.4114, "lr": 7.215305281560153e-05, "epoch": 16.884171907756812, "percentage": 84.42, "elapsed_time": "1:22:22", "remaining_time": "0:15:12", "throughput": 4251.85, "total_tokens": 21014472} {"current_steps": 32220, "total_steps": 38160, "loss": 0.4183, "lr": 7.203475676251104e-05, "epoch": 16.88679245283019, "percentage": 84.43, "elapsed_time": "1:22:23", "remaining_time": "0:15:11", "throughput": 4251.91, "total_tokens": 21017960} {"current_steps": 32225, "total_steps": 38160, "loss": 0.4141, "lr": 7.191655023486682e-05, "epoch": 16.889412997903563, "percentage": 84.45, "elapsed_time": "1:22:23", "remaining_time": "0:15:10", "throughput": 4251.95, "total_tokens": 21021288} {"current_steps": 32230, "total_steps": 38160, "loss": 0.4435, "lr": 7.179843325739644e-05, "epoch": 16.89203354297694, "percentage": 84.46, "elapsed_time": "1:22:24", "remaining_time": "0:15:09", "throughput": 4252.01, "total_tokens": 21024872} {"current_steps": 32235, "total_steps": 38160, "loss": 0.3936, "lr": 7.168040585480861e-05, "epoch": 16.894654088050313, "percentage": 84.47, "elapsed_time": "1:22:25", "remaining_time": "0:15:08", "throughput": 4252.03, "total_tokens": 21028008} {"current_steps": 32240, "total_steps": 38160, "loss": 0.3015, "lr": 7.156246805179351e-05, "epoch": 16.89727463312369, "percentage": 84.49, "elapsed_time": "1:22:26", "remaining_time": "0:15:08", "throughput": 4252.03, "total_tokens": 21030920} {"current_steps": 32245, "total_steps": 38160, "loss": 0.4926, "lr": 7.144461987302208e-05, "epoch": 16.899895178197063, "percentage": 84.5, "elapsed_time": "1:22:26", "remaining_time": "0:15:07", "throughput": 4252.08, "total_tokens": 21034248} {"current_steps": 32250, "total_steps": 38160, "loss": 0.453, "lr": 7.132686134314714e-05, "epoch": 16.90251572327044, "percentage": 84.51, "elapsed_time": "1:22:27", "remaining_time": "0:15:06", "throughput": 4252.13, "total_tokens": 21037672} {"current_steps": 32255, "total_steps": 38160, "loss": 0.4737, "lr": 7.120919248680208e-05, "epoch": 16.905136268343817, "percentage": 84.53, "elapsed_time": "1:22:28", "remaining_time": "0:15:05", "throughput": 4252.2, "total_tokens": 21041192} {"current_steps": 32260, "total_steps": 38160, "loss": 0.3878, "lr": 7.109161332860203e-05, "epoch": 16.90775681341719, "percentage": 84.54, "elapsed_time": "1:22:29", "remaining_time": "0:15:05", "throughput": 4252.24, "total_tokens": 21044488} {"current_steps": 32265, "total_steps": 38160, "loss": 0.4858, "lr": 7.097412389314322e-05, "epoch": 16.910377358490567, "percentage": 84.55, "elapsed_time": "1:22:29", "remaining_time": "0:15:04", "throughput": 4252.27, "total_tokens": 21047752} {"current_steps": 32270, "total_steps": 38160, "loss": 0.3893, "lr": 7.085672420500322e-05, "epoch": 16.91299790356394, "percentage": 84.56, "elapsed_time": "1:22:30", "remaining_time": "0:15:03", "throughput": 4252.24, "total_tokens": 21050344} {"current_steps": 32275, "total_steps": 38160, "loss": 0.4681, "lr": 7.073941428874064e-05, "epoch": 16.915618448637318, "percentage": 84.58, "elapsed_time": "1:22:31", "remaining_time": "0:15:02", "throughput": 4252.24, "total_tokens": 21053288} {"current_steps": 32280, "total_steps": 38160, "loss": 0.4256, "lr": 7.062219416889514e-05, "epoch": 16.91823899371069, "percentage": 84.59, "elapsed_time": "1:22:31", "remaining_time": "0:15:02", "throughput": 4252.31, "total_tokens": 21056904} {"current_steps": 32285, "total_steps": 38160, "loss": 0.3571, "lr": 7.050506386998806e-05, "epoch": 16.920859538784068, "percentage": 84.6, "elapsed_time": "1:22:32", "remaining_time": "0:15:01", "throughput": 4252.32, "total_tokens": 21059848} {"current_steps": 32290, "total_steps": 38160, "loss": 0.3908, "lr": 7.038802341652172e-05, "epoch": 16.92348008385744, "percentage": 84.62, "elapsed_time": "1:22:33", "remaining_time": "0:15:00", "throughput": 4252.29, "total_tokens": 21062472} {"current_steps": 32295, "total_steps": 38160, "loss": 0.4149, "lr": 7.027107283297967e-05, "epoch": 16.92610062893082, "percentage": 84.63, "elapsed_time": "1:22:34", "remaining_time": "0:14:59", "throughput": 4252.49, "total_tokens": 21067752} {"current_steps": 32300, "total_steps": 38160, "loss": 0.47, "lr": 7.015421214382661e-05, "epoch": 16.928721174004192, "percentage": 84.64, "elapsed_time": "1:22:34", "remaining_time": "0:14:58", "throughput": 4252.5, "total_tokens": 21070632} {"current_steps": 32305, "total_steps": 38160, "loss": 0.4817, "lr": 7.003744137350827e-05, "epoch": 16.93134171907757, "percentage": 84.66, "elapsed_time": "1:22:35", "remaining_time": "0:14:58", "throughput": 4252.59, "total_tokens": 21074568} {"current_steps": 32310, "total_steps": 38160, "loss": 0.3873, "lr": 6.992076054645197e-05, "epoch": 16.933962264150942, "percentage": 84.67, "elapsed_time": "1:22:36", "remaining_time": "0:14:57", "throughput": 4252.57, "total_tokens": 21077288} {"current_steps": 32315, "total_steps": 38160, "loss": 0.3678, "lr": 6.980416968706594e-05, "epoch": 16.93658280922432, "percentage": 84.68, "elapsed_time": "1:22:36", "remaining_time": "0:14:56", "throughput": 4252.56, "total_tokens": 21079912} {"current_steps": 32320, "total_steps": 38160, "loss": 0.5207, "lr": 6.968766881973965e-05, "epoch": 16.939203354297693, "percentage": 84.7, "elapsed_time": "1:22:37", "remaining_time": "0:14:55", "throughput": 4252.66, "total_tokens": 21084040} {"current_steps": 32325, "total_steps": 38160, "loss": 0.4535, "lr": 6.957125796884395e-05, "epoch": 16.94182389937107, "percentage": 84.71, "elapsed_time": "1:22:38", "remaining_time": "0:14:55", "throughput": 4252.71, "total_tokens": 21087528} {"current_steps": 32330, "total_steps": 38160, "loss": 0.3694, "lr": 6.945493715873046e-05, "epoch": 16.944444444444443, "percentage": 84.72, "elapsed_time": "1:22:39", "remaining_time": "0:14:54", "throughput": 4252.76, "total_tokens": 21090888} {"current_steps": 32335, "total_steps": 38160, "loss": 0.4694, "lr": 6.933870641373208e-05, "epoch": 16.94706498951782, "percentage": 84.74, "elapsed_time": "1:22:40", "remaining_time": "0:14:53", "throughput": 4252.86, "total_tokens": 21094792} {"current_steps": 32340, "total_steps": 38160, "loss": 0.3855, "lr": 6.92225657581631e-05, "epoch": 16.949685534591197, "percentage": 84.75, "elapsed_time": "1:22:40", "remaining_time": "0:14:52", "throughput": 4252.86, "total_tokens": 21097736} {"current_steps": 32345, "total_steps": 38160, "loss": 0.3058, "lr": 6.910651521631877e-05, "epoch": 16.95230607966457, "percentage": 84.76, "elapsed_time": "1:22:41", "remaining_time": "0:14:51", "throughput": 4252.87, "total_tokens": 21100776} {"current_steps": 32350, "total_steps": 38160, "loss": 0.426, "lr": 6.899055481247568e-05, "epoch": 16.954926624737947, "percentage": 84.77, "elapsed_time": "1:22:42", "remaining_time": "0:14:51", "throughput": 4252.9, "total_tokens": 21104040} {"current_steps": 32355, "total_steps": 38160, "loss": 0.3484, "lr": 6.88746845708913e-05, "epoch": 16.95754716981132, "percentage": 84.79, "elapsed_time": "1:22:42", "remaining_time": "0:14:50", "throughput": 4252.9, "total_tokens": 21106856} {"current_steps": 32360, "total_steps": 38160, "loss": 0.4181, "lr": 6.87589045158043e-05, "epoch": 16.960167714884697, "percentage": 84.8, "elapsed_time": "1:22:43", "remaining_time": "0:14:49", "throughput": 4252.9, "total_tokens": 21109768} {"current_steps": 32365, "total_steps": 38160, "loss": 0.4037, "lr": 6.864321467143459e-05, "epoch": 16.96278825995807, "percentage": 84.81, "elapsed_time": "1:22:44", "remaining_time": "0:14:48", "throughput": 4252.98, "total_tokens": 21113512} {"current_steps": 32370, "total_steps": 38160, "loss": 0.4385, "lr": 6.852761506198319e-05, "epoch": 16.965408805031448, "percentage": 84.83, "elapsed_time": "1:22:45", "remaining_time": "0:14:48", "throughput": 4253.09, "total_tokens": 21117544} {"current_steps": 32375, "total_steps": 38160, "loss": 0.3988, "lr": 6.841210571163231e-05, "epoch": 16.96802935010482, "percentage": 84.84, "elapsed_time": "1:22:46", "remaining_time": "0:14:47", "throughput": 4253.23, "total_tokens": 21121864} {"current_steps": 32380, "total_steps": 38160, "loss": 0.4462, "lr": 6.829668664454513e-05, "epoch": 16.970649895178198, "percentage": 84.85, "elapsed_time": "1:22:46", "remaining_time": "0:14:46", "throughput": 4253.18, "total_tokens": 21124328} {"current_steps": 32385, "total_steps": 38160, "loss": 0.3302, "lr": 6.818135788486584e-05, "epoch": 16.97327044025157, "percentage": 84.87, "elapsed_time": "1:22:47", "remaining_time": "0:14:45", "throughput": 4253.19, "total_tokens": 21127336} {"current_steps": 32390, "total_steps": 38160, "loss": 0.3343, "lr": 6.806611945672004e-05, "epoch": 16.97589098532495, "percentage": 84.88, "elapsed_time": "1:22:48", "remaining_time": "0:14:45", "throughput": 4253.17, "total_tokens": 21129896} {"current_steps": 32395, "total_steps": 38160, "loss": 0.4391, "lr": 6.79509713842143e-05, "epoch": 16.978511530398322, "percentage": 84.89, "elapsed_time": "1:22:48", "remaining_time": "0:14:44", "throughput": 4253.22, "total_tokens": 21133512} {"current_steps": 32400, "total_steps": 38160, "loss": 0.4058, "lr": 6.783591369143626e-05, "epoch": 16.9811320754717, "percentage": 84.91, "elapsed_time": "1:22:49", "remaining_time": "0:14:43", "throughput": 4253.17, "total_tokens": 21135816} {"current_steps": 32405, "total_steps": 38160, "loss": 0.2922, "lr": 6.77209464024548e-05, "epoch": 16.983752620545072, "percentage": 84.92, "elapsed_time": "1:22:50", "remaining_time": "0:14:42", "throughput": 4253.15, "total_tokens": 21138536} {"current_steps": 32410, "total_steps": 38160, "loss": 0.4355, "lr": 6.760606954131965e-05, "epoch": 16.98637316561845, "percentage": 84.93, "elapsed_time": "1:22:50", "remaining_time": "0:14:41", "throughput": 4253.13, "total_tokens": 21141160} {"current_steps": 32415, "total_steps": 38160, "loss": 0.3992, "lr": 6.749128313206165e-05, "epoch": 16.988993710691823, "percentage": 84.94, "elapsed_time": "1:22:51", "remaining_time": "0:14:41", "throughput": 4253.08, "total_tokens": 21143624} {"current_steps": 32420, "total_steps": 38160, "loss": 0.4917, "lr": 6.737658719869288e-05, "epoch": 16.9916142557652, "percentage": 84.96, "elapsed_time": "1:22:52", "remaining_time": "0:14:40", "throughput": 4253.18, "total_tokens": 21147528} {"current_steps": 32425, "total_steps": 38160, "loss": 0.4281, "lr": 6.726198176520642e-05, "epoch": 16.994234800838573, "percentage": 84.97, "elapsed_time": "1:22:52", "remaining_time": "0:14:39", "throughput": 4253.18, "total_tokens": 21150376} {"current_steps": 32430, "total_steps": 38160, "loss": 0.464, "lr": 6.71474668555766e-05, "epoch": 16.99685534591195, "percentage": 84.98, "elapsed_time": "1:22:53", "remaining_time": "0:14:38", "throughput": 4253.34, "total_tokens": 21155016} {"current_steps": 32435, "total_steps": 38160, "loss": 0.2553, "lr": 6.703304249375836e-05, "epoch": 16.999475890985323, "percentage": 85.0, "elapsed_time": "1:22:54", "remaining_time": "0:14:38", "throughput": 4253.35, "total_tokens": 21157992} {"current_steps": 32436, "total_steps": 38160, "eval_loss": 0.46461933851242065, "epoch": 17.0, "percentage": 85.0, "elapsed_time": "1:23:08", "remaining_time": "0:14:40", "throughput": 4241.65, "total_tokens": 21158120} {"current_steps": 32440, "total_steps": 38160, "loss": 0.3022, "lr": 6.691870870368815e-05, "epoch": 17.0020964360587, "percentage": 85.01, "elapsed_time": "1:23:10", "remaining_time": "0:14:39", "throughput": 4240.31, "total_tokens": 21160712} {"current_steps": 32445, "total_steps": 38160, "loss": 0.386, "lr": 6.680446550928316e-05, "epoch": 17.004716981132077, "percentage": 85.02, "elapsed_time": "1:23:11", "remaining_time": "0:14:39", "throughput": 4240.3, "total_tokens": 21163528} {"current_steps": 32450, "total_steps": 38160, "loss": 0.5215, "lr": 6.669031293444177e-05, "epoch": 17.00733752620545, "percentage": 85.04, "elapsed_time": "1:23:11", "remaining_time": "0:14:38", "throughput": 4240.38, "total_tokens": 21167304} {"current_steps": 32455, "total_steps": 38160, "loss": 0.4331, "lr": 6.65762510030436e-05, "epoch": 17.009958071278827, "percentage": 85.05, "elapsed_time": "1:23:12", "remaining_time": "0:14:37", "throughput": 4240.44, "total_tokens": 21170792} {"current_steps": 32460, "total_steps": 38160, "loss": 0.3956, "lr": 6.646227973894886e-05, "epoch": 17.0125786163522, "percentage": 85.06, "elapsed_time": "1:23:13", "remaining_time": "0:14:36", "throughput": 4240.51, "total_tokens": 21174408} {"current_steps": 32465, "total_steps": 38160, "loss": 0.4642, "lr": 6.634839916599921e-05, "epoch": 17.015199161425578, "percentage": 85.08, "elapsed_time": "1:23:14", "remaining_time": "0:14:36", "throughput": 4240.6, "total_tokens": 21178248} {"current_steps": 32470, "total_steps": 38160, "loss": 0.3157, "lr": 6.623460930801701e-05, "epoch": 17.01781970649895, "percentage": 85.09, "elapsed_time": "1:23:14", "remaining_time": "0:14:35", "throughput": 4240.61, "total_tokens": 21181064} {"current_steps": 32475, "total_steps": 38160, "loss": 0.4595, "lr": 6.61209101888059e-05, "epoch": 17.020440251572328, "percentage": 85.1, "elapsed_time": "1:23:15", "remaining_time": "0:14:34", "throughput": 4240.65, "total_tokens": 21184296} {"current_steps": 32480, "total_steps": 38160, "loss": 0.4821, "lr": 6.600730183215043e-05, "epoch": 17.0230607966457, "percentage": 85.12, "elapsed_time": "1:23:16", "remaining_time": "0:14:33", "throughput": 4240.65, "total_tokens": 21187176} {"current_steps": 32485, "total_steps": 38160, "loss": 0.3277, "lr": 6.589378426181624e-05, "epoch": 17.02568134171908, "percentage": 85.13, "elapsed_time": "1:23:16", "remaining_time": "0:14:32", "throughput": 4240.62, "total_tokens": 21189800} {"current_steps": 32490, "total_steps": 38160, "loss": 0.4992, "lr": 6.578035750154976e-05, "epoch": 17.028301886792452, "percentage": 85.14, "elapsed_time": "1:23:18", "remaining_time": "0:14:32", "throughput": 4240.92, "total_tokens": 21196328} {"current_steps": 32495, "total_steps": 38160, "loss": 0.44, "lr": 6.566702157507875e-05, "epoch": 17.03092243186583, "percentage": 85.15, "elapsed_time": "1:23:18", "remaining_time": "0:14:31", "throughput": 4240.93, "total_tokens": 21199400} {"current_steps": 32500, "total_steps": 38160, "loss": 0.3607, "lr": 6.555377650611155e-05, "epoch": 17.033542976939202, "percentage": 85.17, "elapsed_time": "1:23:19", "remaining_time": "0:14:30", "throughput": 4240.91, "total_tokens": 21202248} {"current_steps": 32505, "total_steps": 38160, "loss": 0.5154, "lr": 6.544062231833792e-05, "epoch": 17.03616352201258, "percentage": 85.18, "elapsed_time": "1:23:20", "remaining_time": "0:14:29", "throughput": 4240.93, "total_tokens": 21205448} {"current_steps": 32510, "total_steps": 38160, "loss": 0.3544, "lr": 6.532755903542847e-05, "epoch": 17.038784067085953, "percentage": 85.19, "elapsed_time": "1:23:21", "remaining_time": "0:14:29", "throughput": 4241.03, "total_tokens": 21209576} {"current_steps": 32515, "total_steps": 38160, "loss": 0.4569, "lr": 6.521458668103458e-05, "epoch": 17.04140461215933, "percentage": 85.21, "elapsed_time": "1:23:21", "remaining_time": "0:14:28", "throughput": 4241.07, "total_tokens": 21212904} {"current_steps": 32520, "total_steps": 38160, "loss": 0.4073, "lr": 6.510170527878889e-05, "epoch": 17.044025157232703, "percentage": 85.22, "elapsed_time": "1:23:22", "remaining_time": "0:14:27", "throughput": 4241.11, "total_tokens": 21216104} {"current_steps": 32525, "total_steps": 38160, "loss": 0.4958, "lr": 6.498891485230491e-05, "epoch": 17.04664570230608, "percentage": 85.23, "elapsed_time": "1:23:23", "remaining_time": "0:14:26", "throughput": 4241.2, "total_tokens": 21220104} {"current_steps": 32530, "total_steps": 38160, "loss": 0.4923, "lr": 6.487621542517703e-05, "epoch": 17.049266247379453, "percentage": 85.25, "elapsed_time": "1:23:23", "remaining_time": "0:14:26", "throughput": 4241.2, "total_tokens": 21222920} {"current_steps": 32535, "total_steps": 38160, "loss": 0.387, "lr": 6.476360702098078e-05, "epoch": 17.05188679245283, "percentage": 85.26, "elapsed_time": "1:23:24", "remaining_time": "0:14:25", "throughput": 4241.25, "total_tokens": 21226408} {"current_steps": 32540, "total_steps": 38160, "loss": 0.5131, "lr": 6.465108966327243e-05, "epoch": 17.054507337526207, "percentage": 85.27, "elapsed_time": "1:23:25", "remaining_time": "0:14:24", "throughput": 4241.34, "total_tokens": 21230184} {"current_steps": 32545, "total_steps": 38160, "loss": 0.3885, "lr": 6.453866337558939e-05, "epoch": 17.05712788259958, "percentage": 85.29, "elapsed_time": "1:23:26", "remaining_time": "0:14:23", "throughput": 4241.36, "total_tokens": 21233288} {"current_steps": 32550, "total_steps": 38160, "loss": 0.4083, "lr": 6.442632818145011e-05, "epoch": 17.059748427672957, "percentage": 85.3, "elapsed_time": "1:23:26", "remaining_time": "0:14:22", "throughput": 4241.32, "total_tokens": 21235720} {"current_steps": 32555, "total_steps": 38160, "loss": 0.4184, "lr": 6.431408410435352e-05, "epoch": 17.06236897274633, "percentage": 85.31, "elapsed_time": "1:23:27", "remaining_time": "0:14:22", "throughput": 4241.29, "total_tokens": 21238408} {"current_steps": 32560, "total_steps": 38160, "loss": 0.3644, "lr": 6.420193116778e-05, "epoch": 17.064989517819708, "percentage": 85.32, "elapsed_time": "1:23:28", "remaining_time": "0:14:21", "throughput": 4241.43, "total_tokens": 21242632} {"current_steps": 32565, "total_steps": 38160, "loss": 0.3888, "lr": 6.408986939519074e-05, "epoch": 17.06761006289308, "percentage": 85.34, "elapsed_time": "1:23:29", "remaining_time": "0:14:20", "throughput": 4241.47, "total_tokens": 21246056} {"current_steps": 32570, "total_steps": 38160, "loss": 0.5273, "lr": 6.397789881002752e-05, "epoch": 17.070230607966458, "percentage": 85.35, "elapsed_time": "1:23:29", "remaining_time": "0:14:19", "throughput": 4241.47, "total_tokens": 21249032} {"current_steps": 32575, "total_steps": 38160, "loss": 0.4089, "lr": 6.386601943571352e-05, "epoch": 17.07285115303983, "percentage": 85.36, "elapsed_time": "1:23:30", "remaining_time": "0:14:19", "throughput": 4241.46, "total_tokens": 21251816} {"current_steps": 32580, "total_steps": 38160, "loss": 0.3586, "lr": 6.375423129565266e-05, "epoch": 17.07547169811321, "percentage": 85.38, "elapsed_time": "1:23:31", "remaining_time": "0:14:18", "throughput": 4241.61, "total_tokens": 21256200} {"current_steps": 32585, "total_steps": 38160, "loss": 0.4003, "lr": 6.36425344132296e-05, "epoch": 17.078092243186582, "percentage": 85.39, "elapsed_time": "1:23:32", "remaining_time": "0:14:17", "throughput": 4241.73, "total_tokens": 21260392} {"current_steps": 32590, "total_steps": 38160, "loss": 0.4628, "lr": 6.353092881181016e-05, "epoch": 17.08071278825996, "percentage": 85.4, "elapsed_time": "1:23:33", "remaining_time": "0:14:16", "throughput": 4241.83, "total_tokens": 21264296} {"current_steps": 32595, "total_steps": 38160, "loss": 0.4692, "lr": 6.341941451474082e-05, "epoch": 17.083333333333332, "percentage": 85.42, "elapsed_time": "1:23:33", "remaining_time": "0:14:16", "throughput": 4241.89, "total_tokens": 21267848} {"current_steps": 32600, "total_steps": 38160, "loss": 0.3766, "lr": 6.330799154534921e-05, "epoch": 17.08595387840671, "percentage": 85.43, "elapsed_time": "1:23:34", "remaining_time": "0:14:15", "throughput": 4241.95, "total_tokens": 21271560} {"current_steps": 32605, "total_steps": 38160, "loss": 0.451, "lr": 6.319665992694368e-05, "epoch": 17.088574423480082, "percentage": 85.44, "elapsed_time": "1:23:35", "remaining_time": "0:14:14", "throughput": 4241.97, "total_tokens": 21274760} {"current_steps": 32610, "total_steps": 38160, "loss": 0.3702, "lr": 6.308541968281373e-05, "epoch": 17.09119496855346, "percentage": 85.46, "elapsed_time": "1:23:35", "remaining_time": "0:14:13", "throughput": 4241.94, "total_tokens": 21277352} {"current_steps": 32615, "total_steps": 38160, "loss": 0.5639, "lr": 6.297427083622936e-05, "epoch": 17.093815513626833, "percentage": 85.47, "elapsed_time": "1:23:36", "remaining_time": "0:14:12", "throughput": 4241.94, "total_tokens": 21280168} {"current_steps": 32620, "total_steps": 38160, "loss": 0.4357, "lr": 6.28632134104416e-05, "epoch": 17.09643605870021, "percentage": 85.48, "elapsed_time": "1:23:37", "remaining_time": "0:14:12", "throughput": 4241.99, "total_tokens": 21283688} {"current_steps": 32625, "total_steps": 38160, "loss": 0.442, "lr": 6.275224742868247e-05, "epoch": 17.099056603773583, "percentage": 85.5, "elapsed_time": "1:23:38", "remaining_time": "0:14:11", "throughput": 4242.03, "total_tokens": 21286920} {"current_steps": 32630, "total_steps": 38160, "loss": 0.4369, "lr": 6.264137291416477e-05, "epoch": 17.10167714884696, "percentage": 85.51, "elapsed_time": "1:23:38", "remaining_time": "0:14:10", "throughput": 4242.11, "total_tokens": 21290600} {"current_steps": 32635, "total_steps": 38160, "loss": 0.4711, "lr": 6.253058989008226e-05, "epoch": 17.104297693920337, "percentage": 85.52, "elapsed_time": "1:23:39", "remaining_time": "0:14:09", "throughput": 4242.06, "total_tokens": 21293032} {"current_steps": 32640, "total_steps": 38160, "loss": 0.4518, "lr": 6.241989837960949e-05, "epoch": 17.10691823899371, "percentage": 85.53, "elapsed_time": "1:23:40", "remaining_time": "0:14:09", "throughput": 4242.07, "total_tokens": 21295976} {"current_steps": 32645, "total_steps": 38160, "loss": 0.4509, "lr": 6.230929840590177e-05, "epoch": 17.109538784067087, "percentage": 85.55, "elapsed_time": "1:23:40", "remaining_time": "0:14:08", "throughput": 4242.16, "total_tokens": 21299816} {"current_steps": 32650, "total_steps": 38160, "loss": 0.4198, "lr": 6.219878999209533e-05, "epoch": 17.11215932914046, "percentage": 85.56, "elapsed_time": "1:23:41", "remaining_time": "0:14:07", "throughput": 4242.16, "total_tokens": 21302696} {"current_steps": 32655, "total_steps": 38160, "loss": 0.4378, "lr": 6.208837316130733e-05, "epoch": 17.114779874213838, "percentage": 85.57, "elapsed_time": "1:23:42", "remaining_time": "0:14:06", "throughput": 4242.13, "total_tokens": 21305288} {"current_steps": 32660, "total_steps": 38160, "loss": 0.3509, "lr": 6.197804793663564e-05, "epoch": 17.11740041928721, "percentage": 85.59, "elapsed_time": "1:23:43", "remaining_time": "0:14:05", "throughput": 4242.2, "total_tokens": 21308808} {"current_steps": 32665, "total_steps": 38160, "loss": 0.394, "lr": 6.18678143411593e-05, "epoch": 17.120020964360588, "percentage": 85.6, "elapsed_time": "1:23:43", "remaining_time": "0:14:05", "throughput": 4242.23, "total_tokens": 21312008} {"current_steps": 32670, "total_steps": 38160, "loss": 0.4111, "lr": 6.175767239793767e-05, "epoch": 17.12264150943396, "percentage": 85.61, "elapsed_time": "1:23:44", "remaining_time": "0:14:04", "throughput": 4242.17, "total_tokens": 21314280} {"current_steps": 32675, "total_steps": 38160, "loss": 0.3724, "lr": 6.164762213001112e-05, "epoch": 17.12526205450734, "percentage": 85.63, "elapsed_time": "1:23:45", "remaining_time": "0:14:03", "throughput": 4242.14, "total_tokens": 21316808} {"current_steps": 32680, "total_steps": 38160, "loss": 0.418, "lr": 6.153766356040107e-05, "epoch": 17.127882599580712, "percentage": 85.64, "elapsed_time": "1:23:45", "remaining_time": "0:14:02", "throughput": 4242.23, "total_tokens": 21320712} {"current_steps": 32685, "total_steps": 38160, "loss": 0.4167, "lr": 6.142779671210951e-05, "epoch": 17.13050314465409, "percentage": 85.65, "elapsed_time": "1:23:46", "remaining_time": "0:14:02", "throughput": 4242.36, "total_tokens": 21324968} {"current_steps": 32690, "total_steps": 38160, "loss": 0.4208, "lr": 6.131802160811956e-05, "epoch": 17.133123689727462, "percentage": 85.67, "elapsed_time": "1:23:47", "remaining_time": "0:14:01", "throughput": 4242.42, "total_tokens": 21328360} {"current_steps": 32695, "total_steps": 38160, "loss": 0.4293, "lr": 6.120833827139466e-05, "epoch": 17.13574423480084, "percentage": 85.68, "elapsed_time": "1:23:48", "remaining_time": "0:14:00", "throughput": 4242.42, "total_tokens": 21331336} {"current_steps": 32700, "total_steps": 38160, "loss": 0.5429, "lr": 6.109874672487936e-05, "epoch": 17.138364779874212, "percentage": 85.69, "elapsed_time": "1:23:48", "remaining_time": "0:13:59", "throughput": 4242.43, "total_tokens": 21334344} {"current_steps": 32705, "total_steps": 38160, "loss": 0.4685, "lr": 6.098924699149894e-05, "epoch": 17.14098532494759, "percentage": 85.7, "elapsed_time": "1:23:49", "remaining_time": "0:13:58", "throughput": 4242.7, "total_tokens": 21340360} {"current_steps": 32710, "total_steps": 38160, "loss": 0.4121, "lr": 6.087983909415962e-05, "epoch": 17.143605870020963, "percentage": 85.72, "elapsed_time": "1:23:50", "remaining_time": "0:13:58", "throughput": 4242.7, "total_tokens": 21343176} {"current_steps": 32715, "total_steps": 38160, "loss": 0.4272, "lr": 6.077052305574815e-05, "epoch": 17.14622641509434, "percentage": 85.73, "elapsed_time": "1:23:51", "remaining_time": "0:13:57", "throughput": 4242.7, "total_tokens": 21346024} {"current_steps": 32720, "total_steps": 38160, "loss": 0.4041, "lr": 6.066129889913241e-05, "epoch": 17.148846960167713, "percentage": 85.74, "elapsed_time": "1:23:52", "remaining_time": "0:13:56", "throughput": 4242.81, "total_tokens": 21350120} {"current_steps": 32725, "total_steps": 38160, "loss": 0.5483, "lr": 6.0552166647160676e-05, "epoch": 17.15146750524109, "percentage": 85.76, "elapsed_time": "1:23:52", "remaining_time": "0:13:55", "throughput": 4242.87, "total_tokens": 21353608} {"current_steps": 32730, "total_steps": 38160, "loss": 0.4283, "lr": 6.044312632266208e-05, "epoch": 17.154088050314467, "percentage": 85.77, "elapsed_time": "1:23:53", "remaining_time": "0:13:55", "throughput": 4243.05, "total_tokens": 21358376} {"current_steps": 32735, "total_steps": 38160, "loss": 0.3568, "lr": 6.03341779484467e-05, "epoch": 17.15670859538784, "percentage": 85.78, "elapsed_time": "1:23:54", "remaining_time": "0:13:54", "throughput": 4243.04, "total_tokens": 21361128} {"current_steps": 32740, "total_steps": 38160, "loss": 0.4453, "lr": 6.022532154730537e-05, "epoch": 17.159329140461217, "percentage": 85.8, "elapsed_time": "1:23:55", "remaining_time": "0:13:53", "throughput": 4243.1, "total_tokens": 21364584} {"current_steps": 32745, "total_steps": 38160, "loss": 0.3939, "lr": 6.011655714200964e-05, "epoch": 17.16194968553459, "percentage": 85.81, "elapsed_time": "1:23:55", "remaining_time": "0:13:52", "throughput": 4243.18, "total_tokens": 21368168} {"current_steps": 32750, "total_steps": 38160, "loss": 0.3776, "lr": 6.0007884755311715e-05, "epoch": 17.164570230607968, "percentage": 85.82, "elapsed_time": "1:23:56", "remaining_time": "0:13:52", "throughput": 4243.24, "total_tokens": 21371752} {"current_steps": 32755, "total_steps": 38160, "loss": 0.5052, "lr": 5.989930440994451e-05, "epoch": 17.16719077568134, "percentage": 85.84, "elapsed_time": "1:23:57", "remaining_time": "0:13:51", "throughput": 4243.24, "total_tokens": 21374632} {"current_steps": 32760, "total_steps": 38160, "loss": 0.4309, "lr": 5.979081612862186e-05, "epoch": 17.169811320754718, "percentage": 85.85, "elapsed_time": "1:23:58", "remaining_time": "0:13:50", "throughput": 4243.25, "total_tokens": 21377608} {"current_steps": 32765, "total_steps": 38160, "loss": 0.4814, "lr": 5.968241993403834e-05, "epoch": 17.17243186582809, "percentage": 85.86, "elapsed_time": "1:23:58", "remaining_time": "0:13:49", "throughput": 4243.32, "total_tokens": 21381192} {"current_steps": 32770, "total_steps": 38160, "loss": 0.59, "lr": 5.957411584886924e-05, "epoch": 17.17505241090147, "percentage": 85.88, "elapsed_time": "1:23:59", "remaining_time": "0:13:48", "throughput": 4243.34, "total_tokens": 21384168} {"current_steps": 32775, "total_steps": 38160, "loss": 0.4088, "lr": 5.946590389577033e-05, "epoch": 17.177672955974842, "percentage": 85.89, "elapsed_time": "1:24:00", "remaining_time": "0:13:48", "throughput": 4243.36, "total_tokens": 21387240} {"current_steps": 32780, "total_steps": 38160, "loss": 0.3617, "lr": 5.935778409737857e-05, "epoch": 17.18029350104822, "percentage": 85.9, "elapsed_time": "1:24:00", "remaining_time": "0:13:47", "throughput": 4243.37, "total_tokens": 21390216} {"current_steps": 32785, "total_steps": 38160, "loss": 0.4383, "lr": 5.92497564763112e-05, "epoch": 17.182914046121592, "percentage": 85.91, "elapsed_time": "1:24:01", "remaining_time": "0:13:46", "throughput": 4243.41, "total_tokens": 21393544} {"current_steps": 32790, "total_steps": 38160, "loss": 0.4618, "lr": 5.914182105516641e-05, "epoch": 17.18553459119497, "percentage": 85.93, "elapsed_time": "1:24:02", "remaining_time": "0:13:45", "throughput": 4243.5, "total_tokens": 21397288} {"current_steps": 32795, "total_steps": 38160, "loss": 0.3427, "lr": 5.903397785652304e-05, "epoch": 17.188155136268342, "percentage": 85.94, "elapsed_time": "1:24:03", "remaining_time": "0:13:44", "throughput": 4243.47, "total_tokens": 21399912} {"current_steps": 32800, "total_steps": 38160, "loss": 0.4168, "lr": 5.8926226902940804e-05, "epoch": 17.19077568134172, "percentage": 85.95, "elapsed_time": "1:24:03", "remaining_time": "0:13:44", "throughput": 4243.45, "total_tokens": 21402472} {"current_steps": 32805, "total_steps": 38160, "loss": 0.3751, "lr": 5.88185682169598e-05, "epoch": 17.193396226415093, "percentage": 85.97, "elapsed_time": "1:24:04", "remaining_time": "0:13:43", "throughput": 4243.44, "total_tokens": 21405352} {"current_steps": 32810, "total_steps": 38160, "loss": 0.3594, "lr": 5.871100182110117e-05, "epoch": 17.19601677148847, "percentage": 85.98, "elapsed_time": "1:24:04", "remaining_time": "0:13:42", "throughput": 4243.42, "total_tokens": 21408008} {"current_steps": 32815, "total_steps": 38160, "loss": 0.5386, "lr": 5.8603527737866314e-05, "epoch": 17.198637316561843, "percentage": 85.99, "elapsed_time": "1:24:05", "remaining_time": "0:13:41", "throughput": 4243.52, "total_tokens": 21411880} {"current_steps": 32820, "total_steps": 38160, "loss": 0.4141, "lr": 5.849614598973779e-05, "epoch": 17.20125786163522, "percentage": 86.01, "elapsed_time": "1:24:06", "remaining_time": "0:13:41", "throughput": 4243.5, "total_tokens": 21414504} {"current_steps": 32825, "total_steps": 38160, "loss": 0.394, "lr": 5.8388856599178644e-05, "epoch": 17.203878406708597, "percentage": 86.02, "elapsed_time": "1:24:07", "remaining_time": "0:13:40", "throughput": 4243.52, "total_tokens": 21417608} {"current_steps": 32830, "total_steps": 38160, "loss": 0.4806, "lr": 5.8281659588632464e-05, "epoch": 17.20649895178197, "percentage": 86.03, "elapsed_time": "1:24:07", "remaining_time": "0:13:39", "throughput": 4243.54, "total_tokens": 21420712} {"current_steps": 32835, "total_steps": 38160, "loss": 0.6107, "lr": 5.817455498052382e-05, "epoch": 17.209119496855347, "percentage": 86.05, "elapsed_time": "1:24:08", "remaining_time": "0:13:38", "throughput": 4243.52, "total_tokens": 21423400} {"current_steps": 32840, "total_steps": 38160, "loss": 0.493, "lr": 5.806754279725751e-05, "epoch": 17.21174004192872, "percentage": 86.06, "elapsed_time": "1:24:09", "remaining_time": "0:13:37", "throughput": 4243.58, "total_tokens": 21426888} {"current_steps": 32845, "total_steps": 38160, "loss": 0.4502, "lr": 5.796062306121947e-05, "epoch": 17.214360587002098, "percentage": 86.07, "elapsed_time": "1:24:09", "remaining_time": "0:13:37", "throughput": 4243.59, "total_tokens": 21429736} {"current_steps": 32850, "total_steps": 38160, "loss": 0.4218, "lr": 5.785379579477607e-05, "epoch": 17.21698113207547, "percentage": 86.08, "elapsed_time": "1:24:10", "remaining_time": "0:13:36", "throughput": 4243.65, "total_tokens": 21433320} {"current_steps": 32855, "total_steps": 38160, "loss": 0.3902, "lr": 5.774706102027427e-05, "epoch": 17.219601677148848, "percentage": 86.1, "elapsed_time": "1:24:11", "remaining_time": "0:13:35", "throughput": 4243.68, "total_tokens": 21436584} {"current_steps": 32860, "total_steps": 38160, "loss": 0.5389, "lr": 5.7640418760041776e-05, "epoch": 17.22222222222222, "percentage": 86.11, "elapsed_time": "1:24:12", "remaining_time": "0:13:34", "throughput": 4243.69, "total_tokens": 21439528} {"current_steps": 32865, "total_steps": 38160, "loss": 0.3843, "lr": 5.753386903638713e-05, "epoch": 17.2248427672956, "percentage": 86.12, "elapsed_time": "1:24:12", "remaining_time": "0:13:34", "throughput": 4243.73, "total_tokens": 21442824} {"current_steps": 32870, "total_steps": 38160, "loss": 0.463, "lr": 5.7427411871599e-05, "epoch": 17.22746331236897, "percentage": 86.14, "elapsed_time": "1:24:13", "remaining_time": "0:13:33", "throughput": 4243.77, "total_tokens": 21446024} {"current_steps": 32875, "total_steps": 38160, "loss": 0.3175, "lr": 5.7321047287947235e-05, "epoch": 17.23008385744235, "percentage": 86.15, "elapsed_time": "1:24:14", "remaining_time": "0:13:32", "throughput": 4243.75, "total_tokens": 21448744} {"current_steps": 32880, "total_steps": 38160, "loss": 0.4293, "lr": 5.72147753076821e-05, "epoch": 17.232704402515722, "percentage": 86.16, "elapsed_time": "1:24:14", "remaining_time": "0:13:31", "throughput": 4243.76, "total_tokens": 21451688} {"current_steps": 32885, "total_steps": 38160, "loss": 0.392, "lr": 5.7108595953034306e-05, "epoch": 17.2353249475891, "percentage": 86.18, "elapsed_time": "1:24:15", "remaining_time": "0:13:30", "throughput": 4243.7, "total_tokens": 21453864} {"current_steps": 32890, "total_steps": 38160, "loss": 0.4352, "lr": 5.7002509246215415e-05, "epoch": 17.237945492662472, "percentage": 86.19, "elapsed_time": "1:24:16", "remaining_time": "0:13:30", "throughput": 4243.71, "total_tokens": 21456936} {"current_steps": 32895, "total_steps": 38160, "loss": 0.3835, "lr": 5.68965152094178e-05, "epoch": 17.24056603773585, "percentage": 86.2, "elapsed_time": "1:24:16", "remaining_time": "0:13:29", "throughput": 4243.77, "total_tokens": 21460424} {"current_steps": 32900, "total_steps": 38160, "loss": 0.41, "lr": 5.679061386481388e-05, "epoch": 17.243186582809223, "percentage": 86.22, "elapsed_time": "1:24:17", "remaining_time": "0:13:28", "throughput": 4243.75, "total_tokens": 21463016} {"current_steps": 32905, "total_steps": 38160, "loss": 0.3866, "lr": 5.6684805234557216e-05, "epoch": 17.2458071278826, "percentage": 86.23, "elapsed_time": "1:24:18", "remaining_time": "0:13:27", "throughput": 4243.81, "total_tokens": 21466632} {"current_steps": 32910, "total_steps": 38160, "loss": 0.4129, "lr": 5.65790893407816e-05, "epoch": 17.248427672955973, "percentage": 86.24, "elapsed_time": "1:24:19", "remaining_time": "0:13:27", "throughput": 4243.82, "total_tokens": 21469544} {"current_steps": 32915, "total_steps": 38160, "loss": 0.351, "lr": 5.647346620560168e-05, "epoch": 17.25104821802935, "percentage": 86.26, "elapsed_time": "1:24:19", "remaining_time": "0:13:26", "throughput": 4243.79, "total_tokens": 21472040} {"current_steps": 32920, "total_steps": 38160, "loss": 0.3674, "lr": 5.6367935851112605e-05, "epoch": 17.253668763102727, "percentage": 86.27, "elapsed_time": "1:24:20", "remaining_time": "0:13:25", "throughput": 4243.87, "total_tokens": 21475784} {"current_steps": 32925, "total_steps": 38160, "loss": 0.3636, "lr": 5.626249829939023e-05, "epoch": 17.2562893081761, "percentage": 86.28, "elapsed_time": "1:24:21", "remaining_time": "0:13:24", "throughput": 4243.97, "total_tokens": 21479656} {"current_steps": 32930, "total_steps": 38160, "loss": 0.3983, "lr": 5.6157153572490795e-05, "epoch": 17.258909853249477, "percentage": 86.29, "elapsed_time": "1:24:21", "remaining_time": "0:13:23", "throughput": 4243.99, "total_tokens": 21482824} {"current_steps": 32935, "total_steps": 38160, "loss": 0.4061, "lr": 5.6051901692451115e-05, "epoch": 17.26153039832285, "percentage": 86.31, "elapsed_time": "1:24:22", "remaining_time": "0:13:23", "throughput": 4243.99, "total_tokens": 21485672} {"current_steps": 32940, "total_steps": 38160, "loss": 0.3703, "lr": 5.5946742681288744e-05, "epoch": 17.264150943396228, "percentage": 86.32, "elapsed_time": "1:24:23", "remaining_time": "0:13:22", "throughput": 4244.0, "total_tokens": 21488616} {"current_steps": 32945, "total_steps": 38160, "loss": 0.3906, "lr": 5.5841676561001805e-05, "epoch": 17.2667714884696, "percentage": 86.33, "elapsed_time": "1:24:23", "remaining_time": "0:13:21", "throughput": 4243.94, "total_tokens": 21490952} {"current_steps": 32950, "total_steps": 38160, "loss": 0.4118, "lr": 5.573670335356901e-05, "epoch": 17.269392033542978, "percentage": 86.35, "elapsed_time": "1:24:24", "remaining_time": "0:13:20", "throughput": 4243.93, "total_tokens": 21493832} {"current_steps": 32955, "total_steps": 38160, "loss": 0.3978, "lr": 5.563182308094933e-05, "epoch": 17.27201257861635, "percentage": 86.36, "elapsed_time": "1:24:25", "remaining_time": "0:13:20", "throughput": 4243.88, "total_tokens": 21496136} {"current_steps": 32960, "total_steps": 38160, "loss": 0.4674, "lr": 5.552703576508272e-05, "epoch": 17.27463312368973, "percentage": 86.37, "elapsed_time": "1:24:25", "remaining_time": "0:13:19", "throughput": 4243.92, "total_tokens": 21499432} {"current_steps": 32965, "total_steps": 38160, "loss": 0.5719, "lr": 5.5422341427889324e-05, "epoch": 17.2772536687631, "percentage": 86.39, "elapsed_time": "1:24:26", "remaining_time": "0:13:18", "throughput": 4243.94, "total_tokens": 21502472} {"current_steps": 32970, "total_steps": 38160, "loss": 0.3526, "lr": 5.531774009127011e-05, "epoch": 17.27987421383648, "percentage": 86.4, "elapsed_time": "1:24:27", "remaining_time": "0:13:17", "throughput": 4244.01, "total_tokens": 21506088} {"current_steps": 32975, "total_steps": 38160, "loss": 0.3815, "lr": 5.521323177710647e-05, "epoch": 17.282494758909852, "percentage": 86.41, "elapsed_time": "1:24:28", "remaining_time": "0:13:16", "throughput": 4244.0, "total_tokens": 21508904} {"current_steps": 32980, "total_steps": 38160, "loss": 0.3538, "lr": 5.510881650726046e-05, "epoch": 17.28511530398323, "percentage": 86.43, "elapsed_time": "1:24:28", "remaining_time": "0:13:16", "throughput": 4243.99, "total_tokens": 21511624} {"current_steps": 32985, "total_steps": 38160, "loss": 0.3559, "lr": 5.50044943035744e-05, "epoch": 17.287735849056602, "percentage": 86.44, "elapsed_time": "1:24:29", "remaining_time": "0:13:15", "throughput": 4243.99, "total_tokens": 21514504} {"current_steps": 32990, "total_steps": 38160, "loss": 0.5067, "lr": 5.490026518787128e-05, "epoch": 17.29035639412998, "percentage": 86.45, "elapsed_time": "1:24:30", "remaining_time": "0:13:14", "throughput": 4243.98, "total_tokens": 21517256} {"current_steps": 32995, "total_steps": 38160, "loss": 0.3926, "lr": 5.47961291819547e-05, "epoch": 17.292976939203353, "percentage": 86.46, "elapsed_time": "1:24:30", "remaining_time": "0:13:13", "throughput": 4244.02, "total_tokens": 21520648} {"current_steps": 33000, "total_steps": 38160, "loss": 0.3751, "lr": 5.46920863076088e-05, "epoch": 17.29559748427673, "percentage": 86.48, "elapsed_time": "1:24:31", "remaining_time": "0:13:13", "throughput": 4244.03, "total_tokens": 21523688} {"current_steps": 33005, "total_steps": 38160, "loss": 0.4624, "lr": 5.4588136586598056e-05, "epoch": 17.298218029350103, "percentage": 86.49, "elapsed_time": "1:24:32", "remaining_time": "0:13:12", "throughput": 4244.07, "total_tokens": 21527016} {"current_steps": 33010, "total_steps": 38160, "loss": 0.3704, "lr": 5.44842800406678e-05, "epoch": 17.30083857442348, "percentage": 86.5, "elapsed_time": "1:24:32", "remaining_time": "0:13:11", "throughput": 4244.12, "total_tokens": 21530408} {"current_steps": 33015, "total_steps": 38160, "loss": 0.4828, "lr": 5.438051669154326e-05, "epoch": 17.303459119496857, "percentage": 86.52, "elapsed_time": "1:24:33", "remaining_time": "0:13:10", "throughput": 4244.12, "total_tokens": 21533288} {"current_steps": 33020, "total_steps": 38160, "loss": 0.4014, "lr": 5.427684656093074e-05, "epoch": 17.30607966457023, "percentage": 86.53, "elapsed_time": "1:24:34", "remaining_time": "0:13:09", "throughput": 4244.15, "total_tokens": 21536520} {"current_steps": 33025, "total_steps": 38160, "loss": 0.4764, "lr": 5.417326967051683e-05, "epoch": 17.308700209643607, "percentage": 86.54, "elapsed_time": "1:24:35", "remaining_time": "0:13:09", "throughput": 4244.14, "total_tokens": 21539304} {"current_steps": 33030, "total_steps": 38160, "loss": 0.3808, "lr": 5.4069786041968663e-05, "epoch": 17.31132075471698, "percentage": 86.56, "elapsed_time": "1:24:35", "remaining_time": "0:13:08", "throughput": 4244.16, "total_tokens": 21542472} {"current_steps": 33035, "total_steps": 38160, "loss": 0.4685, "lr": 5.39663956969339e-05, "epoch": 17.313941299790358, "percentage": 86.57, "elapsed_time": "1:24:36", "remaining_time": "0:13:07", "throughput": 4244.2, "total_tokens": 21545736} {"current_steps": 33040, "total_steps": 38160, "loss": 0.5184, "lr": 5.3863098657040534e-05, "epoch": 17.31656184486373, "percentage": 86.58, "elapsed_time": "1:24:37", "remaining_time": "0:13:06", "throughput": 4244.21, "total_tokens": 21548744} {"current_steps": 33045, "total_steps": 38160, "loss": 0.527, "lr": 5.375989494389705e-05, "epoch": 17.319182389937108, "percentage": 86.6, "elapsed_time": "1:24:37", "remaining_time": "0:13:05", "throughput": 4244.21, "total_tokens": 21551592} {"current_steps": 33050, "total_steps": 38160, "loss": 0.4336, "lr": 5.365678457909257e-05, "epoch": 17.32180293501048, "percentage": 86.61, "elapsed_time": "1:24:38", "remaining_time": "0:13:05", "throughput": 4244.19, "total_tokens": 21554216} {"current_steps": 33055, "total_steps": 38160, "loss": 0.3176, "lr": 5.3553767584196555e-05, "epoch": 17.32442348008386, "percentage": 86.62, "elapsed_time": "1:24:39", "remaining_time": "0:13:04", "throughput": 4244.17, "total_tokens": 21556776} {"current_steps": 33060, "total_steps": 38160, "loss": 0.4414, "lr": 5.3450843980759166e-05, "epoch": 17.32704402515723, "percentage": 86.64, "elapsed_time": "1:24:39", "remaining_time": "0:13:03", "throughput": 4244.19, "total_tokens": 21559976} {"current_steps": 33065, "total_steps": 38160, "loss": 0.4347, "lr": 5.3348013790310736e-05, "epoch": 17.32966457023061, "percentage": 86.65, "elapsed_time": "1:24:40", "remaining_time": "0:13:02", "throughput": 4244.19, "total_tokens": 21562792} {"current_steps": 33070, "total_steps": 38160, "loss": 0.5078, "lr": 5.324527703436199e-05, "epoch": 17.332285115303982, "percentage": 86.66, "elapsed_time": "1:24:41", "remaining_time": "0:13:02", "throughput": 4244.2, "total_tokens": 21565736} {"current_steps": 33075, "total_steps": 38160, "loss": 0.3595, "lr": 5.314263373440448e-05, "epoch": 17.33490566037736, "percentage": 86.67, "elapsed_time": "1:24:42", "remaining_time": "0:13:01", "throughput": 4244.31, "total_tokens": 21569864} {"current_steps": 33080, "total_steps": 38160, "loss": 0.2607, "lr": 5.304008391190995e-05, "epoch": 17.337526205450732, "percentage": 86.69, "elapsed_time": "1:24:42", "remaining_time": "0:13:00", "throughput": 4244.32, "total_tokens": 21572776} {"current_steps": 33085, "total_steps": 38160, "loss": 0.5977, "lr": 5.293762758833071e-05, "epoch": 17.34014675052411, "percentage": 86.7, "elapsed_time": "1:24:43", "remaining_time": "0:12:59", "throughput": 4244.41, "total_tokens": 21576584} {"current_steps": 33090, "total_steps": 38160, "loss": 0.4244, "lr": 5.283526478509953e-05, "epoch": 17.342767295597483, "percentage": 86.71, "elapsed_time": "1:24:44", "remaining_time": "0:12:58", "throughput": 4244.41, "total_tokens": 21579496} {"current_steps": 33095, "total_steps": 38160, "loss": 0.4943, "lr": 5.273299552362942e-05, "epoch": 17.34538784067086, "percentage": 86.73, "elapsed_time": "1:24:44", "remaining_time": "0:12:58", "throughput": 4244.39, "total_tokens": 21582120} {"current_steps": 33100, "total_steps": 38160, "loss": 0.479, "lr": 5.263081982531381e-05, "epoch": 17.348008385744233, "percentage": 86.74, "elapsed_time": "1:24:45", "remaining_time": "0:12:57", "throughput": 4244.42, "total_tokens": 21585224} {"current_steps": 33105, "total_steps": 38160, "loss": 0.3173, "lr": 5.2528737711526885e-05, "epoch": 17.35062893081761, "percentage": 86.75, "elapsed_time": "1:24:46", "remaining_time": "0:12:56", "throughput": 4244.44, "total_tokens": 21588264} {"current_steps": 33110, "total_steps": 38160, "loss": 0.4901, "lr": 5.2426749203623005e-05, "epoch": 17.353249475890987, "percentage": 86.77, "elapsed_time": "1:24:46", "remaining_time": "0:12:55", "throughput": 4244.47, "total_tokens": 21591464} {"current_steps": 33115, "total_steps": 38160, "loss": 0.4028, "lr": 5.23248543229371e-05, "epoch": 17.35587002096436, "percentage": 86.78, "elapsed_time": "1:24:47", "remaining_time": "0:12:55", "throughput": 4244.44, "total_tokens": 21594024} {"current_steps": 33120, "total_steps": 38160, "loss": 0.4915, "lr": 5.222305309078429e-05, "epoch": 17.358490566037737, "percentage": 86.79, "elapsed_time": "1:24:48", "remaining_time": "0:12:54", "throughput": 4244.43, "total_tokens": 21596776} {"current_steps": 33125, "total_steps": 38160, "loss": 0.2863, "lr": 5.2121345528460205e-05, "epoch": 17.36111111111111, "percentage": 86.81, "elapsed_time": "1:24:49", "remaining_time": "0:12:53", "throughput": 4244.5, "total_tokens": 21600392} {"current_steps": 33130, "total_steps": 38160, "loss": 0.5997, "lr": 5.201973165724094e-05, "epoch": 17.363731656184488, "percentage": 86.82, "elapsed_time": "1:24:49", "remaining_time": "0:12:52", "throughput": 4244.55, "total_tokens": 21603880} {"current_steps": 33135, "total_steps": 38160, "loss": 0.4048, "lr": 5.1918211498382996e-05, "epoch": 17.36635220125786, "percentage": 86.83, "elapsed_time": "1:24:50", "remaining_time": "0:12:51", "throughput": 4244.54, "total_tokens": 21606600} {"current_steps": 33140, "total_steps": 38160, "loss": 0.5321, "lr": 5.181678507312332e-05, "epoch": 17.368972746331238, "percentage": 86.84, "elapsed_time": "1:24:51", "remaining_time": "0:12:51", "throughput": 4244.67, "total_tokens": 21610856} {"current_steps": 33145, "total_steps": 38160, "loss": 0.3787, "lr": 5.171545240267894e-05, "epoch": 17.37159329140461, "percentage": 86.86, "elapsed_time": "1:24:52", "remaining_time": "0:12:50", "throughput": 4244.79, "total_tokens": 21615016} {"current_steps": 33150, "total_steps": 38160, "loss": 0.4646, "lr": 5.161421350824774e-05, "epoch": 17.37421383647799, "percentage": 86.87, "elapsed_time": "1:24:52", "remaining_time": "0:12:49", "throughput": 4244.89, "total_tokens": 21618920} {"current_steps": 33155, "total_steps": 38160, "loss": 0.3266, "lr": 5.151306841100756e-05, "epoch": 17.37683438155136, "percentage": 86.88, "elapsed_time": "1:24:53", "remaining_time": "0:12:48", "throughput": 4244.92, "total_tokens": 21621960} {"current_steps": 33160, "total_steps": 38160, "loss": 0.4023, "lr": 5.141201713211679e-05, "epoch": 17.37945492662474, "percentage": 86.9, "elapsed_time": "1:24:54", "remaining_time": "0:12:48", "throughput": 4244.89, "total_tokens": 21624584} {"current_steps": 33165, "total_steps": 38160, "loss": 0.3914, "lr": 5.1311059692714324e-05, "epoch": 17.382075471698112, "percentage": 86.91, "elapsed_time": "1:24:55", "remaining_time": "0:12:47", "throughput": 4244.96, "total_tokens": 21628200} {"current_steps": 33170, "total_steps": 38160, "loss": 0.3089, "lr": 5.1210196113919306e-05, "epoch": 17.38469601677149, "percentage": 86.92, "elapsed_time": "1:24:55", "remaining_time": "0:12:46", "throughput": 4244.94, "total_tokens": 21630792} {"current_steps": 33175, "total_steps": 38160, "loss": 0.5198, "lr": 5.110942641683114e-05, "epoch": 17.387316561844862, "percentage": 86.94, "elapsed_time": "1:24:56", "remaining_time": "0:12:45", "throughput": 4244.93, "total_tokens": 21633480} {"current_steps": 33180, "total_steps": 38160, "loss": 0.4214, "lr": 5.10087506225298e-05, "epoch": 17.38993710691824, "percentage": 86.95, "elapsed_time": "1:24:57", "remaining_time": "0:12:45", "throughput": 4244.95, "total_tokens": 21636584} {"current_steps": 33185, "total_steps": 38160, "loss": 0.4284, "lr": 5.090816875207543e-05, "epoch": 17.392557651991613, "percentage": 86.96, "elapsed_time": "1:24:57", "remaining_time": "0:12:44", "throughput": 4244.97, "total_tokens": 21639624} {"current_steps": 33190, "total_steps": 38160, "loss": 0.5439, "lr": 5.0807680826508604e-05, "epoch": 17.39517819706499, "percentage": 86.98, "elapsed_time": "1:24:58", "remaining_time": "0:12:43", "throughput": 4244.96, "total_tokens": 21642248} {"current_steps": 33195, "total_steps": 38160, "loss": 0.5228, "lr": 5.070728686685039e-05, "epoch": 17.397798742138363, "percentage": 86.99, "elapsed_time": "1:24:59", "remaining_time": "0:12:42", "throughput": 4244.99, "total_tokens": 21645576} {"current_steps": 33200, "total_steps": 38160, "loss": 0.5018, "lr": 5.0606986894101925e-05, "epoch": 17.40041928721174, "percentage": 87.0, "elapsed_time": "1:24:59", "remaining_time": "0:12:41", "throughput": 4245.01, "total_tokens": 21648712} {"current_steps": 33205, "total_steps": 38160, "loss": 0.4804, "lr": 5.0506780929244875e-05, "epoch": 17.403039832285117, "percentage": 87.02, "elapsed_time": "1:25:00", "remaining_time": "0:12:41", "throughput": 4245.02, "total_tokens": 21651624} {"current_steps": 33210, "total_steps": 38160, "loss": 0.5293, "lr": 5.040666899324109e-05, "epoch": 17.40566037735849, "percentage": 87.03, "elapsed_time": "1:25:01", "remaining_time": "0:12:40", "throughput": 4245.11, "total_tokens": 21655624} {"current_steps": 33215, "total_steps": 38160, "loss": 0.4831, "lr": 5.0306651107032916e-05, "epoch": 17.408280922431867, "percentage": 87.04, "elapsed_time": "1:25:01", "remaining_time": "0:12:39", "throughput": 4245.13, "total_tokens": 21658632} {"current_steps": 33220, "total_steps": 38160, "loss": 0.3506, "lr": 5.020672729154308e-05, "epoch": 17.41090146750524, "percentage": 87.05, "elapsed_time": "1:25:02", "remaining_time": "0:12:38", "throughput": 4245.15, "total_tokens": 21661736} {"current_steps": 33225, "total_steps": 38160, "loss": 0.4854, "lr": 5.010689756767428e-05, "epoch": 17.413522012578618, "percentage": 87.07, "elapsed_time": "1:25:03", "remaining_time": "0:12:38", "throughput": 4245.17, "total_tokens": 21664776} {"current_steps": 33230, "total_steps": 38160, "loss": 0.4165, "lr": 5.000716195630983e-05, "epoch": 17.41614255765199, "percentage": 87.08, "elapsed_time": "1:25:04", "remaining_time": "0:12:37", "throughput": 4245.18, "total_tokens": 21667752} {"current_steps": 33235, "total_steps": 38160, "loss": 0.5431, "lr": 4.990752047831343e-05, "epoch": 17.418763102725368, "percentage": 87.09, "elapsed_time": "1:25:04", "remaining_time": "0:12:36", "throughput": 4245.31, "total_tokens": 21672168} {"current_steps": 33240, "total_steps": 38160, "loss": 0.4762, "lr": 4.980797315452873e-05, "epoch": 17.42138364779874, "percentage": 87.11, "elapsed_time": "1:25:05", "remaining_time": "0:12:35", "throughput": 4245.26, "total_tokens": 21674472} {"current_steps": 33245, "total_steps": 38160, "loss": 0.6127, "lr": 4.9708520005779965e-05, "epoch": 17.42400419287212, "percentage": 87.12, "elapsed_time": "1:25:06", "remaining_time": "0:12:34", "throughput": 4245.28, "total_tokens": 21677608} {"current_steps": 33250, "total_steps": 38160, "loss": 0.4198, "lr": 4.960916105287172e-05, "epoch": 17.42662473794549, "percentage": 87.13, "elapsed_time": "1:25:06", "remaining_time": "0:12:34", "throughput": 4245.29, "total_tokens": 21680552} {"current_steps": 33255, "total_steps": 38160, "loss": 0.4861, "lr": 4.950989631658859e-05, "epoch": 17.42924528301887, "percentage": 87.15, "elapsed_time": "1:25:07", "remaining_time": "0:12:33", "throughput": 4245.22, "total_tokens": 21682696} {"current_steps": 33260, "total_steps": 38160, "loss": 0.4762, "lr": 4.941072581769562e-05, "epoch": 17.431865828092242, "percentage": 87.16, "elapsed_time": "1:25:08", "remaining_time": "0:12:32", "throughput": 4245.35, "total_tokens": 21686920} {"current_steps": 33265, "total_steps": 38160, "loss": 0.3148, "lr": 4.931164957693834e-05, "epoch": 17.43448637316562, "percentage": 87.17, "elapsed_time": "1:25:09", "remaining_time": "0:12:31", "throughput": 4245.32, "total_tokens": 21689416} {"current_steps": 33270, "total_steps": 38160, "loss": 0.2847, "lr": 4.921266761504217e-05, "epoch": 17.437106918238992, "percentage": 87.19, "elapsed_time": "1:25:09", "remaining_time": "0:12:31", "throughput": 4245.42, "total_tokens": 21693480} {"current_steps": 33275, "total_steps": 38160, "loss": 0.4305, "lr": 4.9113779952713155e-05, "epoch": 17.43972746331237, "percentage": 87.2, "elapsed_time": "1:25:10", "remaining_time": "0:12:30", "throughput": 4245.41, "total_tokens": 21696296} {"current_steps": 33280, "total_steps": 38160, "loss": 0.3671, "lr": 4.90149866106373e-05, "epoch": 17.442348008385743, "percentage": 87.21, "elapsed_time": "1:25:11", "remaining_time": "0:12:29", "throughput": 4245.63, "total_tokens": 21702088} {"current_steps": 33285, "total_steps": 38160, "loss": 0.4839, "lr": 4.8916287609481137e-05, "epoch": 17.44496855345912, "percentage": 87.22, "elapsed_time": "1:25:12", "remaining_time": "0:12:28", "throughput": 4245.65, "total_tokens": 21705160} {"current_steps": 33290, "total_steps": 38160, "loss": 0.4909, "lr": 4.8817682969891366e-05, "epoch": 17.447589098532493, "percentage": 87.24, "elapsed_time": "1:25:13", "remaining_time": "0:12:27", "throughput": 4245.68, "total_tokens": 21708328} {"current_steps": 33295, "total_steps": 38160, "loss": 0.5671, "lr": 4.8719172712495095e-05, "epoch": 17.45020964360587, "percentage": 87.25, "elapsed_time": "1:25:14", "remaining_time": "0:12:27", "throughput": 4245.91, "total_tokens": 21713768} {"current_steps": 33300, "total_steps": 38160, "loss": 0.3934, "lr": 4.862075685789935e-05, "epoch": 17.452830188679247, "percentage": 87.26, "elapsed_time": "1:25:14", "remaining_time": "0:12:26", "throughput": 4245.95, "total_tokens": 21717192} {"current_steps": 33305, "total_steps": 38160, "loss": 0.471, "lr": 4.8522435426691604e-05, "epoch": 17.45545073375262, "percentage": 87.28, "elapsed_time": "1:25:15", "remaining_time": "0:12:25", "throughput": 4246.05, "total_tokens": 21721384} {"current_steps": 33310, "total_steps": 38160, "loss": 0.4155, "lr": 4.842420843943962e-05, "epoch": 17.458071278825997, "percentage": 87.29, "elapsed_time": "1:25:16", "remaining_time": "0:12:24", "throughput": 4246.06, "total_tokens": 21724392} {"current_steps": 33315, "total_steps": 38160, "loss": 0.5012, "lr": 4.8326075916691415e-05, "epoch": 17.46069182389937, "percentage": 87.3, "elapsed_time": "1:25:17", "remaining_time": "0:12:24", "throughput": 4246.06, "total_tokens": 21727208} {"current_steps": 33320, "total_steps": 38160, "loss": 0.3648, "lr": 4.822803787897523e-05, "epoch": 17.463312368972748, "percentage": 87.32, "elapsed_time": "1:25:17", "remaining_time": "0:12:23", "throughput": 4246.05, "total_tokens": 21729960} {"current_steps": 33325, "total_steps": 38160, "loss": 0.4283, "lr": 4.813009434679932e-05, "epoch": 17.46593291404612, "percentage": 87.33, "elapsed_time": "1:25:18", "remaining_time": "0:12:22", "throughput": 4246.17, "total_tokens": 21734216} {"current_steps": 33330, "total_steps": 38160, "loss": 0.5188, "lr": 4.803224534065259e-05, "epoch": 17.468553459119498, "percentage": 87.34, "elapsed_time": "1:25:19", "remaining_time": "0:12:21", "throughput": 4246.28, "total_tokens": 21738152} {"current_steps": 33335, "total_steps": 38160, "loss": 0.483, "lr": 4.793449088100371e-05, "epoch": 17.47117400419287, "percentage": 87.36, "elapsed_time": "1:25:20", "remaining_time": "0:12:21", "throughput": 4246.33, "total_tokens": 21741576} {"current_steps": 33340, "total_steps": 38160, "loss": 0.328, "lr": 4.783683098830188e-05, "epoch": 17.47379454926625, "percentage": 87.37, "elapsed_time": "1:25:20", "remaining_time": "0:12:20", "throughput": 4246.4, "total_tokens": 21745224} {"current_steps": 33345, "total_steps": 38160, "loss": 0.5175, "lr": 4.7739265682976485e-05, "epoch": 17.47641509433962, "percentage": 87.38, "elapsed_time": "1:25:21", "remaining_time": "0:12:19", "throughput": 4246.44, "total_tokens": 21748424} {"current_steps": 33350, "total_steps": 38160, "loss": 0.4269, "lr": 4.764179498543714e-05, "epoch": 17.479035639413, "percentage": 87.4, "elapsed_time": "1:25:22", "remaining_time": "0:12:18", "throughput": 4246.44, "total_tokens": 21751336} {"current_steps": 33355, "total_steps": 38160, "loss": 0.3598, "lr": 4.754441891607347e-05, "epoch": 17.481656184486372, "percentage": 87.41, "elapsed_time": "1:25:22", "remaining_time": "0:12:17", "throughput": 4246.48, "total_tokens": 21754568} {"current_steps": 33360, "total_steps": 38160, "loss": 0.3643, "lr": 4.7447137495255424e-05, "epoch": 17.48427672955975, "percentage": 87.42, "elapsed_time": "1:25:23", "remaining_time": "0:12:17", "throughput": 4246.52, "total_tokens": 21757832} {"current_steps": 33365, "total_steps": 38160, "loss": 0.3252, "lr": 4.7349950743333206e-05, "epoch": 17.486897274633122, "percentage": 87.43, "elapsed_time": "1:25:24", "remaining_time": "0:12:16", "throughput": 4246.54, "total_tokens": 21760968} {"current_steps": 33370, "total_steps": 38160, "loss": 0.3677, "lr": 4.725285868063722e-05, "epoch": 17.4895178197065, "percentage": 87.45, "elapsed_time": "1:25:25", "remaining_time": "0:12:15", "throughput": 4246.65, "total_tokens": 21765160} {"current_steps": 33375, "total_steps": 38160, "loss": 0.5912, "lr": 4.715586132747801e-05, "epoch": 17.492138364779873, "percentage": 87.46, "elapsed_time": "1:25:26", "remaining_time": "0:12:14", "throughput": 4246.69, "total_tokens": 21768584} {"current_steps": 33380, "total_steps": 38160, "loss": 0.4237, "lr": 4.705895870414634e-05, "epoch": 17.49475890985325, "percentage": 87.47, "elapsed_time": "1:25:26", "remaining_time": "0:12:14", "throughput": 4246.68, "total_tokens": 21771304} {"current_steps": 33385, "total_steps": 38160, "loss": 0.508, "lr": 4.696215083091299e-05, "epoch": 17.497379454926623, "percentage": 87.49, "elapsed_time": "1:25:27", "remaining_time": "0:12:13", "throughput": 4246.72, "total_tokens": 21774568} {"current_steps": 33390, "total_steps": 38160, "loss": 0.5091, "lr": 4.686543772802915e-05, "epoch": 17.5, "percentage": 87.5, "elapsed_time": "1:25:28", "remaining_time": "0:12:12", "throughput": 4246.73, "total_tokens": 21777608} {"current_steps": 33395, "total_steps": 38160, "loss": 0.3965, "lr": 4.6768819415726085e-05, "epoch": 17.502620545073377, "percentage": 87.51, "elapsed_time": "1:25:28", "remaining_time": "0:12:11", "throughput": 4246.82, "total_tokens": 21781288} {"current_steps": 33400, "total_steps": 38160, "loss": 0.4878, "lr": 4.667229591421529e-05, "epoch": 17.50524109014675, "percentage": 87.53, "elapsed_time": "1:25:29", "remaining_time": "0:12:11", "throughput": 4246.81, "total_tokens": 21784168} {"current_steps": 33405, "total_steps": 38160, "loss": 0.4145, "lr": 4.657586724368845e-05, "epoch": 17.507861635220127, "percentage": 87.54, "elapsed_time": "1:25:30", "remaining_time": "0:12:10", "throughput": 4246.79, "total_tokens": 21786760} {"current_steps": 33410, "total_steps": 38160, "loss": 0.4018, "lr": 4.647953342431726e-05, "epoch": 17.5104821802935, "percentage": 87.55, "elapsed_time": "1:25:30", "remaining_time": "0:12:09", "throughput": 4246.77, "total_tokens": 21789352} {"current_steps": 33415, "total_steps": 38160, "loss": 0.4819, "lr": 4.63832944762535e-05, "epoch": 17.513102725366878, "percentage": 87.57, "elapsed_time": "1:25:31", "remaining_time": "0:12:08", "throughput": 4246.78, "total_tokens": 21792296} {"current_steps": 33420, "total_steps": 38160, "loss": 0.3734, "lr": 4.628715041962944e-05, "epoch": 17.51572327044025, "percentage": 87.58, "elapsed_time": "1:25:32", "remaining_time": "0:12:07", "throughput": 4246.75, "total_tokens": 21794824} {"current_steps": 33425, "total_steps": 38160, "loss": 0.4251, "lr": 4.619110127455728e-05, "epoch": 17.518343815513628, "percentage": 87.59, "elapsed_time": "1:25:32", "remaining_time": "0:12:07", "throughput": 4246.77, "total_tokens": 21797928} {"current_steps": 33430, "total_steps": 38160, "loss": 0.6305, "lr": 4.6095147061129494e-05, "epoch": 17.520964360587, "percentage": 87.6, "elapsed_time": "1:25:33", "remaining_time": "0:12:06", "throughput": 4246.82, "total_tokens": 21801352} {"current_steps": 33435, "total_steps": 38160, "loss": 0.4136, "lr": 4.599928779941853e-05, "epoch": 17.52358490566038, "percentage": 87.62, "elapsed_time": "1:25:34", "remaining_time": "0:12:05", "throughput": 4246.96, "total_tokens": 21805768} {"current_steps": 33440, "total_steps": 38160, "loss": 0.3404, "lr": 4.590352350947691e-05, "epoch": 17.52620545073375, "percentage": 87.63, "elapsed_time": "1:25:35", "remaining_time": "0:12:04", "throughput": 4246.96, "total_tokens": 21808648} {"current_steps": 33445, "total_steps": 38160, "loss": 0.4684, "lr": 4.580785421133759e-05, "epoch": 17.52882599580713, "percentage": 87.64, "elapsed_time": "1:25:35", "remaining_time": "0:12:04", "throughput": 4246.92, "total_tokens": 21811080} {"current_steps": 33450, "total_steps": 38160, "loss": 0.336, "lr": 4.571227992501348e-05, "epoch": 17.531446540880502, "percentage": 87.66, "elapsed_time": "1:25:36", "remaining_time": "0:12:03", "throughput": 4246.98, "total_tokens": 21814568} {"current_steps": 33455, "total_steps": 38160, "loss": 0.4212, "lr": 4.561680067049773e-05, "epoch": 17.53406708595388, "percentage": 87.67, "elapsed_time": "1:25:37", "remaining_time": "0:12:02", "throughput": 4246.97, "total_tokens": 21817416} {"current_steps": 33460, "total_steps": 38160, "loss": 0.4055, "lr": 4.552141646776331e-05, "epoch": 17.536687631027252, "percentage": 87.68, "elapsed_time": "1:25:37", "remaining_time": "0:12:01", "throughput": 4247.0, "total_tokens": 21820648} {"current_steps": 33465, "total_steps": 38160, "loss": 0.4766, "lr": 4.542612733676365e-05, "epoch": 17.53930817610063, "percentage": 87.7, "elapsed_time": "1:25:38", "remaining_time": "0:12:00", "throughput": 4247.0, "total_tokens": 21823560} {"current_steps": 33470, "total_steps": 38160, "loss": 0.5102, "lr": 4.533093329743204e-05, "epoch": 17.541928721174003, "percentage": 87.71, "elapsed_time": "1:25:39", "remaining_time": "0:12:00", "throughput": 4247.07, "total_tokens": 21827208} {"current_steps": 33475, "total_steps": 38160, "loss": 0.5166, "lr": 4.523583436968204e-05, "epoch": 17.54454926624738, "percentage": 87.72, "elapsed_time": "1:25:40", "remaining_time": "0:11:59", "throughput": 4247.07, "total_tokens": 21830120} {"current_steps": 33480, "total_steps": 38160, "loss": 0.43, "lr": 4.514083057340723e-05, "epoch": 17.547169811320753, "percentage": 87.74, "elapsed_time": "1:25:40", "remaining_time": "0:11:58", "throughput": 4247.07, "total_tokens": 21833064} {"current_steps": 33485, "total_steps": 38160, "loss": 0.4397, "lr": 4.504592192848151e-05, "epoch": 17.54979035639413, "percentage": 87.75, "elapsed_time": "1:25:41", "remaining_time": "0:11:57", "throughput": 4247.05, "total_tokens": 21835752} {"current_steps": 33490, "total_steps": 38160, "loss": 0.5432, "lr": 4.495110845475847e-05, "epoch": 17.552410901467507, "percentage": 87.76, "elapsed_time": "1:25:42", "remaining_time": "0:11:57", "throughput": 4247.06, "total_tokens": 21838664} {"current_steps": 33495, "total_steps": 38160, "loss": 0.4565, "lr": 4.4856390172072045e-05, "epoch": 17.55503144654088, "percentage": 87.78, "elapsed_time": "1:25:42", "remaining_time": "0:11:56", "throughput": 4247.11, "total_tokens": 21842184} {"current_steps": 33500, "total_steps": 38160, "loss": 0.4242, "lr": 4.476176710023622e-05, "epoch": 17.557651991614257, "percentage": 87.79, "elapsed_time": "1:25:43", "remaining_time": "0:11:55", "throughput": 4247.12, "total_tokens": 21845224} {"current_steps": 33505, "total_steps": 38160, "loss": 0.6302, "lr": 4.4667239259045035e-05, "epoch": 17.56027253668763, "percentage": 87.8, "elapsed_time": "1:25:44", "remaining_time": "0:11:54", "throughput": 4247.17, "total_tokens": 21848552} {"current_steps": 33510, "total_steps": 38160, "loss": 0.4343, "lr": 4.457280666827285e-05, "epoch": 17.562893081761008, "percentage": 87.81, "elapsed_time": "1:25:44", "remaining_time": "0:11:53", "throughput": 4247.12, "total_tokens": 21850856} {"current_steps": 33515, "total_steps": 38160, "loss": 0.3459, "lr": 4.447846934767358e-05, "epoch": 17.56551362683438, "percentage": 87.83, "elapsed_time": "1:25:45", "remaining_time": "0:11:53", "throughput": 4247.3, "total_tokens": 21856104} {"current_steps": 33520, "total_steps": 38160, "loss": 0.3168, "lr": 4.4384227316981774e-05, "epoch": 17.568134171907758, "percentage": 87.84, "elapsed_time": "1:25:46", "remaining_time": "0:11:52", "throughput": 4247.25, "total_tokens": 21858440} {"current_steps": 33525, "total_steps": 38160, "loss": 0.7186, "lr": 4.4290080595911555e-05, "epoch": 17.57075471698113, "percentage": 87.85, "elapsed_time": "1:25:47", "remaining_time": "0:11:51", "throughput": 4247.23, "total_tokens": 21861064} {"current_steps": 33530, "total_steps": 38160, "loss": 0.2812, "lr": 4.419602920415749e-05, "epoch": 17.57337526205451, "percentage": 87.87, "elapsed_time": "1:25:47", "remaining_time": "0:11:50", "throughput": 4247.22, "total_tokens": 21863848} {"current_steps": 33535, "total_steps": 38160, "loss": 0.4325, "lr": 4.410207316139408e-05, "epoch": 17.57599580712788, "percentage": 87.88, "elapsed_time": "1:25:48", "remaining_time": "0:11:50", "throughput": 4247.26, "total_tokens": 21867208} {"current_steps": 33540, "total_steps": 38160, "loss": 0.3927, "lr": 4.400821248727577e-05, "epoch": 17.57861635220126, "percentage": 87.89, "elapsed_time": "1:25:49", "remaining_time": "0:11:49", "throughput": 4247.43, "total_tokens": 21871944} {"current_steps": 33545, "total_steps": 38160, "loss": 0.2418, "lr": 4.391444720143717e-05, "epoch": 17.581236897274632, "percentage": 87.91, "elapsed_time": "1:25:50", "remaining_time": "0:11:48", "throughput": 4247.42, "total_tokens": 21874728} {"current_steps": 33550, "total_steps": 38160, "loss": 0.3814, "lr": 4.382077732349299e-05, "epoch": 17.58385744234801, "percentage": 87.92, "elapsed_time": "1:25:50", "remaining_time": "0:11:47", "throughput": 4247.39, "total_tokens": 21877320} {"current_steps": 33555, "total_steps": 38160, "loss": 0.3933, "lr": 4.372720287303772e-05, "epoch": 17.586477987421382, "percentage": 87.93, "elapsed_time": "1:25:51", "remaining_time": "0:11:46", "throughput": 4247.41, "total_tokens": 21880488} {"current_steps": 33560, "total_steps": 38160, "loss": 0.4753, "lr": 4.3633723869646204e-05, "epoch": 17.58909853249476, "percentage": 87.95, "elapsed_time": "1:25:52", "remaining_time": "0:11:46", "throughput": 4247.38, "total_tokens": 21883080} {"current_steps": 33565, "total_steps": 38160, "loss": 0.5058, "lr": 4.3540340332873184e-05, "epoch": 17.591719077568133, "percentage": 87.96, "elapsed_time": "1:25:52", "remaining_time": "0:11:45", "throughput": 4247.43, "total_tokens": 21886536} {"current_steps": 33570, "total_steps": 38160, "loss": 0.4338, "lr": 4.3447052282253375e-05, "epoch": 17.59433962264151, "percentage": 87.97, "elapsed_time": "1:25:53", "remaining_time": "0:11:44", "throughput": 4247.48, "total_tokens": 21889896} {"current_steps": 33575, "total_steps": 38160, "loss": 0.414, "lr": 4.335385973730166e-05, "epoch": 17.596960167714883, "percentage": 87.98, "elapsed_time": "1:25:54", "remaining_time": "0:11:43", "throughput": 4247.52, "total_tokens": 21893256} {"current_steps": 33580, "total_steps": 38160, "loss": 0.432, "lr": 4.3260762717512726e-05, "epoch": 17.59958071278826, "percentage": 88.0, "elapsed_time": "1:25:55", "remaining_time": "0:11:43", "throughput": 4247.53, "total_tokens": 21896328} {"current_steps": 33585, "total_steps": 38160, "loss": 0.5007, "lr": 4.316776124236144e-05, "epoch": 17.602201257861637, "percentage": 88.01, "elapsed_time": "1:25:55", "remaining_time": "0:11:42", "throughput": 4247.51, "total_tokens": 21898856} {"current_steps": 33590, "total_steps": 38160, "loss": 0.4096, "lr": 4.307485533130279e-05, "epoch": 17.60482180293501, "percentage": 88.02, "elapsed_time": "1:25:56", "remaining_time": "0:11:41", "throughput": 4247.53, "total_tokens": 21901992} {"current_steps": 33595, "total_steps": 38160, "loss": 0.3407, "lr": 4.298204500377145e-05, "epoch": 17.607442348008387, "percentage": 88.04, "elapsed_time": "1:25:57", "remaining_time": "0:11:40", "throughput": 4247.54, "total_tokens": 21904904} {"current_steps": 33600, "total_steps": 38160, "loss": 0.3532, "lr": 4.288933027918235e-05, "epoch": 17.61006289308176, "percentage": 88.05, "elapsed_time": "1:25:57", "remaining_time": "0:11:39", "throughput": 4247.63, "total_tokens": 21908808} {"current_steps": 33605, "total_steps": 38160, "loss": 0.4137, "lr": 4.279671117693046e-05, "epoch": 17.612683438155138, "percentage": 88.06, "elapsed_time": "1:25:58", "remaining_time": "0:11:39", "throughput": 4247.63, "total_tokens": 21911720} {"current_steps": 33610, "total_steps": 38160, "loss": 0.3514, "lr": 4.270418771639045e-05, "epoch": 17.61530398322851, "percentage": 88.08, "elapsed_time": "1:25:59", "remaining_time": "0:11:38", "throughput": 4247.57, "total_tokens": 21914024} {"current_steps": 33615, "total_steps": 38160, "loss": 0.3577, "lr": 4.2611759916917345e-05, "epoch": 17.617924528301888, "percentage": 88.09, "elapsed_time": "1:25:59", "remaining_time": "0:11:37", "throughput": 4247.54, "total_tokens": 21916648} {"current_steps": 33620, "total_steps": 38160, "loss": 0.4317, "lr": 4.251942779784579e-05, "epoch": 17.62054507337526, "percentage": 88.1, "elapsed_time": "1:26:00", "remaining_time": "0:11:36", "throughput": 4247.6, "total_tokens": 21920136} {"current_steps": 33625, "total_steps": 38160, "loss": 0.3757, "lr": 4.242719137849077e-05, "epoch": 17.62316561844864, "percentage": 88.12, "elapsed_time": "1:26:01", "remaining_time": "0:11:36", "throughput": 4247.72, "total_tokens": 21924168} {"current_steps": 33630, "total_steps": 38160, "loss": 0.435, "lr": 4.233505067814702e-05, "epoch": 17.62578616352201, "percentage": 88.13, "elapsed_time": "1:26:02", "remaining_time": "0:11:35", "throughput": 4248.07, "total_tokens": 21931656} {"current_steps": 33635, "total_steps": 38160, "loss": 0.3862, "lr": 4.224300571608947e-05, "epoch": 17.62840670859539, "percentage": 88.14, "elapsed_time": "1:26:03", "remaining_time": "0:11:34", "throughput": 4248.03, "total_tokens": 21934184} {"current_steps": 33640, "total_steps": 38160, "loss": 0.4582, "lr": 4.215105651157264e-05, "epoch": 17.631027253668762, "percentage": 88.16, "elapsed_time": "1:26:04", "remaining_time": "0:11:33", "throughput": 4248.19, "total_tokens": 21938856} {"current_steps": 33645, "total_steps": 38160, "loss": 0.3665, "lr": 4.2059203083831434e-05, "epoch": 17.63364779874214, "percentage": 88.17, "elapsed_time": "1:26:04", "remaining_time": "0:11:33", "throughput": 4248.19, "total_tokens": 21941736} {"current_steps": 33650, "total_steps": 38160, "loss": 0.4745, "lr": 4.196744545208042e-05, "epoch": 17.636268343815512, "percentage": 88.18, "elapsed_time": "1:26:05", "remaining_time": "0:11:32", "throughput": 4248.25, "total_tokens": 21945256} {"current_steps": 33655, "total_steps": 38160, "loss": 0.4169, "lr": 4.187578363551431e-05, "epoch": 17.63888888888889, "percentage": 88.19, "elapsed_time": "1:26:06", "remaining_time": "0:11:31", "throughput": 4248.18, "total_tokens": 21947432} {"current_steps": 33660, "total_steps": 38160, "loss": 0.5223, "lr": 4.17842176533077e-05, "epoch": 17.641509433962263, "percentage": 88.21, "elapsed_time": "1:26:07", "remaining_time": "0:11:30", "throughput": 4248.2, "total_tokens": 21950664} {"current_steps": 33665, "total_steps": 38160, "loss": 0.4849, "lr": 4.1692747524615274e-05, "epoch": 17.64412997903564, "percentage": 88.22, "elapsed_time": "1:26:07", "remaining_time": "0:11:30", "throughput": 4248.22, "total_tokens": 21953704} {"current_steps": 33670, "total_steps": 38160, "loss": 0.3503, "lr": 4.160137326857138e-05, "epoch": 17.646750524109013, "percentage": 88.23, "elapsed_time": "1:26:08", "remaining_time": "0:11:29", "throughput": 4248.25, "total_tokens": 21956936} {"current_steps": 33675, "total_steps": 38160, "loss": 0.4268, "lr": 4.151009490429042e-05, "epoch": 17.64937106918239, "percentage": 88.25, "elapsed_time": "1:26:09", "remaining_time": "0:11:28", "throughput": 4248.28, "total_tokens": 21960200} {"current_steps": 33680, "total_steps": 38160, "loss": 0.3981, "lr": 4.141891245086687e-05, "epoch": 17.651991614255767, "percentage": 88.26, "elapsed_time": "1:26:09", "remaining_time": "0:11:27", "throughput": 4248.26, "total_tokens": 21962824} {"current_steps": 33685, "total_steps": 38160, "loss": 0.4149, "lr": 4.132782592737511e-05, "epoch": 17.65461215932914, "percentage": 88.27, "elapsed_time": "1:26:10", "remaining_time": "0:11:26", "throughput": 4248.32, "total_tokens": 21966504} {"current_steps": 33690, "total_steps": 38160, "loss": 0.3953, "lr": 4.123683535286943e-05, "epoch": 17.657232704402517, "percentage": 88.29, "elapsed_time": "1:26:11", "remaining_time": "0:11:26", "throughput": 4248.45, "total_tokens": 21970664} {"current_steps": 33695, "total_steps": 38160, "loss": 0.3442, "lr": 4.114594074638395e-05, "epoch": 17.65985324947589, "percentage": 88.3, "elapsed_time": "1:26:12", "remaining_time": "0:11:25", "throughput": 4248.52, "total_tokens": 21974312} {"current_steps": 33700, "total_steps": 38160, "loss": 0.5069, "lr": 4.105514212693268e-05, "epoch": 17.662473794549268, "percentage": 88.31, "elapsed_time": "1:26:12", "remaining_time": "0:11:24", "throughput": 4248.53, "total_tokens": 21977288} {"current_steps": 33705, "total_steps": 38160, "loss": 0.4446, "lr": 4.096443951350976e-05, "epoch": 17.66509433962264, "percentage": 88.33, "elapsed_time": "1:26:13", "remaining_time": "0:11:23", "throughput": 4248.49, "total_tokens": 21979720} {"current_steps": 33710, "total_steps": 38160, "loss": 0.4035, "lr": 4.0873832925089116e-05, "epoch": 17.667714884696018, "percentage": 88.34, "elapsed_time": "1:26:14", "remaining_time": "0:11:23", "throughput": 4248.49, "total_tokens": 21982600} {"current_steps": 33715, "total_steps": 38160, "loss": 0.4224, "lr": 4.0783322380624656e-05, "epoch": 17.67033542976939, "percentage": 88.35, "elapsed_time": "1:26:14", "remaining_time": "0:11:22", "throughput": 4248.55, "total_tokens": 21986184} {"current_steps": 33720, "total_steps": 38160, "loss": 0.4869, "lr": 4.069290789905023e-05, "epoch": 17.67295597484277, "percentage": 88.36, "elapsed_time": "1:26:15", "remaining_time": "0:11:21", "throughput": 4248.57, "total_tokens": 21989352} {"current_steps": 33725, "total_steps": 38160, "loss": 0.4093, "lr": 4.060258949927942e-05, "epoch": 17.67557651991614, "percentage": 88.38, "elapsed_time": "1:26:16", "remaining_time": "0:11:20", "throughput": 4248.56, "total_tokens": 21992072} {"current_steps": 33730, "total_steps": 38160, "loss": 0.4825, "lr": 4.051236720020568e-05, "epoch": 17.67819706498952, "percentage": 88.39, "elapsed_time": "1:26:17", "remaining_time": "0:11:19", "throughput": 4248.67, "total_tokens": 21996200} {"current_steps": 33735, "total_steps": 38160, "loss": 0.4365, "lr": 4.042224102070263e-05, "epoch": 17.680817610062892, "percentage": 88.4, "elapsed_time": "1:26:17", "remaining_time": "0:11:19", "throughput": 4248.63, "total_tokens": 21998728} {"current_steps": 33740, "total_steps": 38160, "loss": 0.446, "lr": 4.033221097962364e-05, "epoch": 17.68343815513627, "percentage": 88.42, "elapsed_time": "1:26:18", "remaining_time": "0:11:18", "throughput": 4248.63, "total_tokens": 22001480} {"current_steps": 33745, "total_steps": 38160, "loss": 0.5611, "lr": 4.0242277095802025e-05, "epoch": 17.686058700209642, "percentage": 88.43, "elapsed_time": "1:26:19", "remaining_time": "0:11:17", "throughput": 4248.76, "total_tokens": 22005800} {"current_steps": 33750, "total_steps": 38160, "loss": 0.3337, "lr": 4.015243938805086e-05, "epoch": 17.68867924528302, "percentage": 88.44, "elapsed_time": "1:26:20", "remaining_time": "0:11:16", "throughput": 4248.81, "total_tokens": 22009096} {"current_steps": 33755, "total_steps": 38160, "loss": 0.3987, "lr": 4.006269787516304e-05, "epoch": 17.691299790356393, "percentage": 88.46, "elapsed_time": "1:26:20", "remaining_time": "0:11:16", "throughput": 4248.81, "total_tokens": 22012072} {"current_steps": 33760, "total_steps": 38160, "loss": 0.5173, "lr": 3.9973052575911606e-05, "epoch": 17.69392033542977, "percentage": 88.47, "elapsed_time": "1:26:21", "remaining_time": "0:11:15", "throughput": 4248.85, "total_tokens": 22015304} {"current_steps": 33765, "total_steps": 38160, "loss": 0.3618, "lr": 3.988350350904929e-05, "epoch": 17.696540880503143, "percentage": 88.48, "elapsed_time": "1:26:22", "remaining_time": "0:11:14", "throughput": 4248.92, "total_tokens": 22019016} {"current_steps": 33770, "total_steps": 38160, "loss": 0.4613, "lr": 3.979405069330882e-05, "epoch": 17.69916142557652, "percentage": 88.5, "elapsed_time": "1:26:22", "remaining_time": "0:11:13", "throughput": 4248.93, "total_tokens": 22021992} {"current_steps": 33775, "total_steps": 38160, "loss": 0.3605, "lr": 3.970469414740269e-05, "epoch": 17.701781970649897, "percentage": 88.51, "elapsed_time": "1:26:23", "remaining_time": "0:11:12", "throughput": 4248.92, "total_tokens": 22024808} {"current_steps": 33780, "total_steps": 38160, "loss": 0.447, "lr": 3.961543389002309e-05, "epoch": 17.70440251572327, "percentage": 88.52, "elapsed_time": "1:26:24", "remaining_time": "0:11:12", "throughput": 4248.89, "total_tokens": 22027336} {"current_steps": 33785, "total_steps": 38160, "loss": 0.3993, "lr": 3.952626993984243e-05, "epoch": 17.707023060796647, "percentage": 88.54, "elapsed_time": "1:26:24", "remaining_time": "0:11:11", "throughput": 4248.91, "total_tokens": 22030440} {"current_steps": 33790, "total_steps": 38160, "loss": 0.5759, "lr": 3.943720231551268e-05, "epoch": 17.70964360587002, "percentage": 88.55, "elapsed_time": "1:26:25", "remaining_time": "0:11:10", "throughput": 4248.9, "total_tokens": 22033160} {"current_steps": 33795, "total_steps": 38160, "loss": 0.264, "lr": 3.934823103566587e-05, "epoch": 17.712264150943398, "percentage": 88.56, "elapsed_time": "1:26:26", "remaining_time": "0:11:09", "throughput": 4248.87, "total_tokens": 22035720} {"current_steps": 33800, "total_steps": 38160, "loss": 0.5306, "lr": 3.925935611891379e-05, "epoch": 17.71488469601677, "percentage": 88.57, "elapsed_time": "1:26:26", "remaining_time": "0:11:09", "throughput": 4248.87, "total_tokens": 22038664} {"current_steps": 33805, "total_steps": 38160, "loss": 0.3585, "lr": 3.917057758384801e-05, "epoch": 17.717505241090148, "percentage": 88.59, "elapsed_time": "1:26:27", "remaining_time": "0:11:08", "throughput": 4248.88, "total_tokens": 22041512} {"current_steps": 33810, "total_steps": 38160, "loss": 0.4144, "lr": 3.9081895449039896e-05, "epoch": 17.72012578616352, "percentage": 88.6, "elapsed_time": "1:26:28", "remaining_time": "0:11:07", "throughput": 4248.96, "total_tokens": 22045320} {"current_steps": 33815, "total_steps": 38160, "loss": 0.318, "lr": 3.899330973304083e-05, "epoch": 17.7227463312369, "percentage": 88.61, "elapsed_time": "1:26:29", "remaining_time": "0:11:06", "throughput": 4248.97, "total_tokens": 22048232} {"current_steps": 33820, "total_steps": 38160, "loss": 0.3757, "lr": 3.8904820454381875e-05, "epoch": 17.72536687631027, "percentage": 88.63, "elapsed_time": "1:26:29", "remaining_time": "0:11:05", "throughput": 4249.01, "total_tokens": 22051528} {"current_steps": 33825, "total_steps": 38160, "loss": 0.4555, "lr": 3.881642763157417e-05, "epoch": 17.72798742138365, "percentage": 88.64, "elapsed_time": "1:26:30", "remaining_time": "0:11:05", "throughput": 4248.99, "total_tokens": 22054248} {"current_steps": 33830, "total_steps": 38160, "loss": 0.3298, "lr": 3.872813128310826e-05, "epoch": 17.730607966457022, "percentage": 88.65, "elapsed_time": "1:26:31", "remaining_time": "0:11:04", "throughput": 4249.12, "total_tokens": 22058600} {"current_steps": 33835, "total_steps": 38160, "loss": 0.3919, "lr": 3.8639931427454866e-05, "epoch": 17.7332285115304, "percentage": 88.67, "elapsed_time": "1:26:32", "remaining_time": "0:11:03", "throughput": 4249.16, "total_tokens": 22061896} {"current_steps": 33840, "total_steps": 38160, "loss": 0.5423, "lr": 3.855182808306429e-05, "epoch": 17.735849056603772, "percentage": 88.68, "elapsed_time": "1:26:32", "remaining_time": "0:11:02", "throughput": 4249.21, "total_tokens": 22065192} {"current_steps": 33845, "total_steps": 38160, "loss": 0.4837, "lr": 3.8463821268366784e-05, "epoch": 17.73846960167715, "percentage": 88.69, "elapsed_time": "1:26:33", "remaining_time": "0:11:02", "throughput": 4249.23, "total_tokens": 22068296} {"current_steps": 33850, "total_steps": 38160, "loss": 0.4747, "lr": 3.837591100177246e-05, "epoch": 17.741090146750523, "percentage": 88.71, "elapsed_time": "1:26:34", "remaining_time": "0:11:01", "throughput": 4249.3, "total_tokens": 22071976} {"current_steps": 33855, "total_steps": 38160, "loss": 0.5166, "lr": 3.828809730167099e-05, "epoch": 17.7437106918239, "percentage": 88.72, "elapsed_time": "1:26:35", "remaining_time": "0:11:00", "throughput": 4249.37, "total_tokens": 22075656} {"current_steps": 33860, "total_steps": 38160, "loss": 0.374, "lr": 3.820038018643218e-05, "epoch": 17.746331236897273, "percentage": 88.73, "elapsed_time": "1:26:35", "remaining_time": "0:10:59", "throughput": 4249.48, "total_tokens": 22079816} {"current_steps": 33865, "total_steps": 38160, "loss": 0.4275, "lr": 3.8112759674405254e-05, "epoch": 17.74895178197065, "percentage": 88.74, "elapsed_time": "1:26:36", "remaining_time": "0:10:59", "throughput": 4249.47, "total_tokens": 22082472} {"current_steps": 33870, "total_steps": 38160, "loss": 0.432, "lr": 3.802523578391953e-05, "epoch": 17.751572327044027, "percentage": 88.76, "elapsed_time": "1:26:37", "remaining_time": "0:10:58", "throughput": 4249.52, "total_tokens": 22086024} {"current_steps": 33875, "total_steps": 38160, "loss": 0.4463, "lr": 3.793780853328399e-05, "epoch": 17.7541928721174, "percentage": 88.77, "elapsed_time": "1:26:38", "remaining_time": "0:10:57", "throughput": 4249.61, "total_tokens": 22090024} {"current_steps": 33880, "total_steps": 38160, "loss": 0.3431, "lr": 3.785047794078744e-05, "epoch": 17.756813417190777, "percentage": 88.78, "elapsed_time": "1:26:38", "remaining_time": "0:10:56", "throughput": 4249.59, "total_tokens": 22092680} {"current_steps": 33885, "total_steps": 38160, "loss": 0.4919, "lr": 3.776324402469844e-05, "epoch": 17.75943396226415, "percentage": 88.8, "elapsed_time": "1:26:39", "remaining_time": "0:10:55", "throughput": 4249.55, "total_tokens": 22095112} {"current_steps": 33890, "total_steps": 38160, "loss": 0.4714, "lr": 3.767610680326533e-05, "epoch": 17.762054507337528, "percentage": 88.81, "elapsed_time": "1:26:40", "remaining_time": "0:10:55", "throughput": 4249.61, "total_tokens": 22098696} {"current_steps": 33895, "total_steps": 38160, "loss": 0.4554, "lr": 3.7589066294716145e-05, "epoch": 17.7646750524109, "percentage": 88.82, "elapsed_time": "1:26:40", "remaining_time": "0:10:54", "throughput": 4249.65, "total_tokens": 22102024} {"current_steps": 33900, "total_steps": 38160, "loss": 0.4158, "lr": 3.750212251725882e-05, "epoch": 17.767295597484278, "percentage": 88.84, "elapsed_time": "1:26:41", "remaining_time": "0:10:53", "throughput": 4249.67, "total_tokens": 22105064} {"current_steps": 33905, "total_steps": 38160, "loss": 0.549, "lr": 3.741527548908113e-05, "epoch": 17.76991614255765, "percentage": 88.85, "elapsed_time": "1:26:42", "remaining_time": "0:10:52", "throughput": 4249.75, "total_tokens": 22108968} {"current_steps": 33910, "total_steps": 38160, "loss": 0.3701, "lr": 3.732852522835023e-05, "epoch": 17.77253668763103, "percentage": 88.86, "elapsed_time": "1:26:43", "remaining_time": "0:10:52", "throughput": 4249.88, "total_tokens": 22113288} {"current_steps": 33915, "total_steps": 38160, "loss": 0.4783, "lr": 3.724187175321342e-05, "epoch": 17.7751572327044, "percentage": 88.88, "elapsed_time": "1:26:44", "remaining_time": "0:10:51", "throughput": 4250.03, "total_tokens": 22117768} {"current_steps": 33920, "total_steps": 38160, "loss": 0.3971, "lr": 3.71553150817977e-05, "epoch": 17.77777777777778, "percentage": 88.89, "elapsed_time": "1:26:44", "remaining_time": "0:10:50", "throughput": 4250.05, "total_tokens": 22120936} {"current_steps": 33925, "total_steps": 38160, "loss": 0.3334, "lr": 3.70688552322096e-05, "epoch": 17.780398322851152, "percentage": 88.9, "elapsed_time": "1:26:45", "remaining_time": "0:10:49", "throughput": 4250.13, "total_tokens": 22124616} {"current_steps": 33930, "total_steps": 38160, "loss": 0.3985, "lr": 3.698249222253569e-05, "epoch": 17.78301886792453, "percentage": 88.92, "elapsed_time": "1:26:46", "remaining_time": "0:10:49", "throughput": 4250.18, "total_tokens": 22128072} {"current_steps": 33935, "total_steps": 38160, "loss": 0.3996, "lr": 3.6896226070841863e-05, "epoch": 17.785639412997902, "percentage": 88.93, "elapsed_time": "1:26:47", "remaining_time": "0:10:48", "throughput": 4250.22, "total_tokens": 22131272} {"current_steps": 33940, "total_steps": 38160, "loss": 0.3389, "lr": 3.681005679517424e-05, "epoch": 17.78825995807128, "percentage": 88.94, "elapsed_time": "1:26:47", "remaining_time": "0:10:47", "throughput": 4250.28, "total_tokens": 22134888} {"current_steps": 33945, "total_steps": 38160, "loss": 0.3487, "lr": 3.6723984413558455e-05, "epoch": 17.790880503144653, "percentage": 88.95, "elapsed_time": "1:26:48", "remaining_time": "0:10:46", "throughput": 4250.25, "total_tokens": 22137480} {"current_steps": 33950, "total_steps": 38160, "loss": 0.4273, "lr": 3.663800894399971e-05, "epoch": 17.79350104821803, "percentage": 88.97, "elapsed_time": "1:26:49", "remaining_time": "0:10:45", "throughput": 4250.31, "total_tokens": 22141000} {"current_steps": 33955, "total_steps": 38160, "loss": 0.3113, "lr": 3.655213040448318e-05, "epoch": 17.796121593291403, "percentage": 88.98, "elapsed_time": "1:26:49", "remaining_time": "0:10:45", "throughput": 4250.3, "total_tokens": 22143752} {"current_steps": 33960, "total_steps": 38160, "loss": 0.4087, "lr": 3.6466348812973723e-05, "epoch": 17.79874213836478, "percentage": 88.99, "elapsed_time": "1:26:50", "remaining_time": "0:10:44", "throughput": 4250.36, "total_tokens": 22147272} {"current_steps": 33965, "total_steps": 38160, "loss": 0.3059, "lr": 3.6380664187415815e-05, "epoch": 17.801362683438157, "percentage": 89.01, "elapsed_time": "1:26:51", "remaining_time": "0:10:43", "throughput": 4250.43, "total_tokens": 22151080} {"current_steps": 33970, "total_steps": 38160, "loss": 0.3676, "lr": 3.6295076545733663e-05, "epoch": 17.80398322851153, "percentage": 89.02, "elapsed_time": "1:26:52", "remaining_time": "0:10:42", "throughput": 4250.49, "total_tokens": 22154664} {"current_steps": 33975, "total_steps": 38160, "loss": 0.383, "lr": 3.6209585905831344e-05, "epoch": 17.806603773584907, "percentage": 89.03, "elapsed_time": "1:26:52", "remaining_time": "0:10:42", "throughput": 4250.5, "total_tokens": 22157608} {"current_steps": 33980, "total_steps": 38160, "loss": 0.4763, "lr": 3.6124192285592385e-05, "epoch": 17.80922431865828, "percentage": 89.05, "elapsed_time": "1:26:53", "remaining_time": "0:10:41", "throughput": 4250.46, "total_tokens": 22160136} {"current_steps": 33985, "total_steps": 38160, "loss": 0.3736, "lr": 3.6038895702880324e-05, "epoch": 17.811844863731658, "percentage": 89.06, "elapsed_time": "1:26:54", "remaining_time": "0:10:40", "throughput": 4250.41, "total_tokens": 22162376} {"current_steps": 33990, "total_steps": 38160, "loss": 0.6033, "lr": 3.595369617553806e-05, "epoch": 17.81446540880503, "percentage": 89.07, "elapsed_time": "1:26:55", "remaining_time": "0:10:39", "throughput": 4250.5, "total_tokens": 22166376} {"current_steps": 33995, "total_steps": 38160, "loss": 0.367, "lr": 3.58685937213884e-05, "epoch": 17.817085953878408, "percentage": 89.09, "elapsed_time": "1:26:55", "remaining_time": "0:10:39", "throughput": 4250.49, "total_tokens": 22169128} {"current_steps": 34000, "total_steps": 38160, "loss": 0.476, "lr": 3.5783588358233863e-05, "epoch": 17.81970649895178, "percentage": 89.1, "elapsed_time": "1:26:56", "remaining_time": "0:10:38", "throughput": 4250.64, "total_tokens": 22173544} {"current_steps": 34005, "total_steps": 38160, "loss": 0.4014, "lr": 3.569868010385663e-05, "epoch": 17.822327044025158, "percentage": 89.11, "elapsed_time": "1:26:57", "remaining_time": "0:10:37", "throughput": 4250.66, "total_tokens": 22176712} {"current_steps": 34010, "total_steps": 38160, "loss": 0.3747, "lr": 3.5613868976018535e-05, "epoch": 17.82494758909853, "percentage": 89.12, "elapsed_time": "1:26:57", "remaining_time": "0:10:36", "throughput": 4250.67, "total_tokens": 22179816} {"current_steps": 34015, "total_steps": 38160, "loss": 0.3955, "lr": 3.5529154992460955e-05, "epoch": 17.82756813417191, "percentage": 89.14, "elapsed_time": "1:26:58", "remaining_time": "0:10:35", "throughput": 4250.7, "total_tokens": 22182888} {"current_steps": 34020, "total_steps": 38160, "loss": 0.4791, "lr": 3.544453817090521e-05, "epoch": 17.830188679245282, "percentage": 89.15, "elapsed_time": "1:26:59", "remaining_time": "0:10:35", "throughput": 4250.77, "total_tokens": 22186472} {"current_steps": 34025, "total_steps": 38160, "loss": 0.3967, "lr": 3.536001852905207e-05, "epoch": 17.83280922431866, "percentage": 89.16, "elapsed_time": "1:27:00", "remaining_time": "0:10:34", "throughput": 4250.76, "total_tokens": 22189320} {"current_steps": 34030, "total_steps": 38160, "loss": 0.4389, "lr": 3.527559608458225e-05, "epoch": 17.835429769392032, "percentage": 89.18, "elapsed_time": "1:27:00", "remaining_time": "0:10:33", "throughput": 4250.75, "total_tokens": 22192200} {"current_steps": 34035, "total_steps": 38160, "loss": 0.3336, "lr": 3.5191270855155886e-05, "epoch": 17.83805031446541, "percentage": 89.19, "elapsed_time": "1:27:01", "remaining_time": "0:10:32", "throughput": 4250.72, "total_tokens": 22194696} {"current_steps": 34040, "total_steps": 38160, "loss": 0.3677, "lr": 3.510704285841293e-05, "epoch": 17.840670859538783, "percentage": 89.2, "elapsed_time": "1:27:02", "remaining_time": "0:10:32", "throughput": 4250.68, "total_tokens": 22197192} {"current_steps": 34045, "total_steps": 38160, "loss": 0.3994, "lr": 3.502291211197267e-05, "epoch": 17.84329140461216, "percentage": 89.22, "elapsed_time": "1:27:02", "remaining_time": "0:10:31", "throughput": 4250.67, "total_tokens": 22199976} {"current_steps": 34050, "total_steps": 38160, "loss": 0.4316, "lr": 3.493887863343448e-05, "epoch": 17.845911949685533, "percentage": 89.23, "elapsed_time": "1:27:03", "remaining_time": "0:10:30", "throughput": 4250.7, "total_tokens": 22203176} {"current_steps": 34055, "total_steps": 38160, "loss": 0.3028, "lr": 3.485494244037718e-05, "epoch": 17.84853249475891, "percentage": 89.24, "elapsed_time": "1:27:04", "remaining_time": "0:10:29", "throughput": 4250.82, "total_tokens": 22207368} {"current_steps": 34060, "total_steps": 38160, "loss": 0.4525, "lr": 3.477110355035934e-05, "epoch": 17.851153039832283, "percentage": 89.26, "elapsed_time": "1:27:04", "remaining_time": "0:10:28", "throughput": 4250.84, "total_tokens": 22210376} {"current_steps": 34065, "total_steps": 38160, "loss": 0.3839, "lr": 3.468736198091904e-05, "epoch": 17.85377358490566, "percentage": 89.27, "elapsed_time": "1:27:05", "remaining_time": "0:10:28", "throughput": 4250.97, "total_tokens": 22214856} {"current_steps": 34070, "total_steps": 38160, "loss": 0.367, "lr": 3.4603717749573935e-05, "epoch": 17.856394129979037, "percentage": 89.28, "elapsed_time": "1:27:06", "remaining_time": "0:10:27", "throughput": 4251.05, "total_tokens": 22218504} {"current_steps": 34075, "total_steps": 38160, "loss": 0.399, "lr": 3.452017087382159e-05, "epoch": 17.85901467505241, "percentage": 89.3, "elapsed_time": "1:27:07", "remaining_time": "0:10:26", "throughput": 4251.04, "total_tokens": 22221384} {"current_steps": 34080, "total_steps": 38160, "loss": 0.4946, "lr": 3.443672137113901e-05, "epoch": 17.861635220125788, "percentage": 89.31, "elapsed_time": "1:27:08", "remaining_time": "0:10:25", "throughput": 4251.14, "total_tokens": 22225480} {"current_steps": 34085, "total_steps": 38160, "loss": 0.4887, "lr": 3.4353369258983025e-05, "epoch": 17.86425576519916, "percentage": 89.32, "elapsed_time": "1:27:08", "remaining_time": "0:10:25", "throughput": 4251.15, "total_tokens": 22228488} {"current_steps": 34090, "total_steps": 38160, "loss": 0.4372, "lr": 3.4270114554789735e-05, "epoch": 17.866876310272538, "percentage": 89.33, "elapsed_time": "1:27:09", "remaining_time": "0:10:24", "throughput": 4251.2, "total_tokens": 22231912} {"current_steps": 34095, "total_steps": 38160, "loss": 0.4489, "lr": 3.41869572759751e-05, "epoch": 17.86949685534591, "percentage": 89.35, "elapsed_time": "1:27:10", "remaining_time": "0:10:23", "throughput": 4251.23, "total_tokens": 22235144} {"current_steps": 34100, "total_steps": 38160, "loss": 0.5227, "lr": 3.410389743993475e-05, "epoch": 17.872117400419288, "percentage": 89.36, "elapsed_time": "1:27:10", "remaining_time": "0:10:22", "throughput": 4251.24, "total_tokens": 22238088} {"current_steps": 34105, "total_steps": 38160, "loss": 0.5143, "lr": 3.40209350640438e-05, "epoch": 17.87473794549266, "percentage": 89.37, "elapsed_time": "1:27:11", "remaining_time": "0:10:22", "throughput": 4251.32, "total_tokens": 22241800} {"current_steps": 34110, "total_steps": 38160, "loss": 0.4693, "lr": 3.3938070165657084e-05, "epoch": 17.87735849056604, "percentage": 89.39, "elapsed_time": "1:27:12", "remaining_time": "0:10:21", "throughput": 4251.39, "total_tokens": 22245512} {"current_steps": 34115, "total_steps": 38160, "loss": 0.478, "lr": 3.385530276210902e-05, "epoch": 17.879979035639412, "percentage": 89.4, "elapsed_time": "1:27:13", "remaining_time": "0:10:20", "throughput": 4251.39, "total_tokens": 22248328} {"current_steps": 34120, "total_steps": 38160, "loss": 0.5029, "lr": 3.377263287071358e-05, "epoch": 17.88259958071279, "percentage": 89.41, "elapsed_time": "1:27:14", "remaining_time": "0:10:19", "throughput": 4251.53, "total_tokens": 22252744} {"current_steps": 34125, "total_steps": 38160, "loss": 0.3428, "lr": 3.369006050876428e-05, "epoch": 17.885220125786162, "percentage": 89.43, "elapsed_time": "1:27:14", "remaining_time": "0:10:18", "throughput": 4251.7, "total_tokens": 22257544} {"current_steps": 34130, "total_steps": 38160, "loss": 0.4121, "lr": 3.3607585693534394e-05, "epoch": 17.88784067085954, "percentage": 89.44, "elapsed_time": "1:27:15", "remaining_time": "0:10:18", "throughput": 4251.69, "total_tokens": 22260456} {"current_steps": 34135, "total_steps": 38160, "loss": 0.4543, "lr": 3.352520844227663e-05, "epoch": 17.890461215932913, "percentage": 89.45, "elapsed_time": "1:27:16", "remaining_time": "0:10:17", "throughput": 4251.78, "total_tokens": 22264328} {"current_steps": 34140, "total_steps": 38160, "loss": 0.3397, "lr": 3.344292877222355e-05, "epoch": 17.89308176100629, "percentage": 89.47, "elapsed_time": "1:27:17", "remaining_time": "0:10:16", "throughput": 4251.77, "total_tokens": 22267080} {"current_steps": 34145, "total_steps": 38160, "loss": 0.3141, "lr": 3.336074670058703e-05, "epoch": 17.895702306079663, "percentage": 89.48, "elapsed_time": "1:27:17", "remaining_time": "0:10:15", "throughput": 4251.8, "total_tokens": 22270248} {"current_steps": 34150, "total_steps": 38160, "loss": 0.4327, "lr": 3.327866224455844e-05, "epoch": 17.89832285115304, "percentage": 89.49, "elapsed_time": "1:27:18", "remaining_time": "0:10:15", "throughput": 4251.87, "total_tokens": 22273960} {"current_steps": 34155, "total_steps": 38160, "loss": 0.4219, "lr": 3.3196675421309165e-05, "epoch": 17.900943396226417, "percentage": 89.5, "elapsed_time": "1:27:19", "remaining_time": "0:10:14", "throughput": 4251.9, "total_tokens": 22277256} {"current_steps": 34160, "total_steps": 38160, "loss": 0.4711, "lr": 3.3114786247989744e-05, "epoch": 17.90356394129979, "percentage": 89.52, "elapsed_time": "1:27:20", "remaining_time": "0:10:13", "throughput": 4251.92, "total_tokens": 22280424} {"current_steps": 34165, "total_steps": 38160, "loss": 0.3693, "lr": 3.303299474173066e-05, "epoch": 17.906184486373167, "percentage": 89.53, "elapsed_time": "1:27:20", "remaining_time": "0:10:12", "throughput": 4252.04, "total_tokens": 22284808} {"current_steps": 34170, "total_steps": 38160, "loss": 0.3745, "lr": 3.2951300919641544e-05, "epoch": 17.90880503144654, "percentage": 89.54, "elapsed_time": "1:27:21", "remaining_time": "0:10:12", "throughput": 4252.06, "total_tokens": 22287912} {"current_steps": 34175, "total_steps": 38160, "loss": 0.4772, "lr": 3.2869704798811964e-05, "epoch": 17.911425576519918, "percentage": 89.56, "elapsed_time": "1:27:22", "remaining_time": "0:10:11", "throughput": 4252.1, "total_tokens": 22291112} {"current_steps": 34180, "total_steps": 38160, "loss": 0.4556, "lr": 3.2788206396310746e-05, "epoch": 17.91404612159329, "percentage": 89.57, "elapsed_time": "1:27:23", "remaining_time": "0:10:10", "throughput": 4252.12, "total_tokens": 22294280} {"current_steps": 34185, "total_steps": 38160, "loss": 0.3222, "lr": 3.270680572918655e-05, "epoch": 17.916666666666668, "percentage": 89.58, "elapsed_time": "1:27:23", "remaining_time": "0:10:09", "throughput": 4252.15, "total_tokens": 22297640} {"current_steps": 34190, "total_steps": 38160, "loss": 0.3496, "lr": 3.262550281446741e-05, "epoch": 17.91928721174004, "percentage": 89.6, "elapsed_time": "1:27:24", "remaining_time": "0:10:08", "throughput": 4252.17, "total_tokens": 22300712} {"current_steps": 34195, "total_steps": 38160, "loss": 0.3601, "lr": 3.2544297669161115e-05, "epoch": 17.921907756813418, "percentage": 89.61, "elapsed_time": "1:27:25", "remaining_time": "0:10:08", "throughput": 4252.21, "total_tokens": 22304072} {"current_steps": 34200, "total_steps": 38160, "loss": 0.5652, "lr": 3.2463190310254633e-05, "epoch": 17.92452830188679, "percentage": 89.62, "elapsed_time": "1:27:26", "remaining_time": "0:10:07", "throughput": 4252.24, "total_tokens": 22307336} {"current_steps": 34205, "total_steps": 38160, "loss": 0.3937, "lr": 3.238218075471483e-05, "epoch": 17.92714884696017, "percentage": 89.64, "elapsed_time": "1:27:26", "remaining_time": "0:10:06", "throughput": 4252.24, "total_tokens": 22310216} {"current_steps": 34210, "total_steps": 38160, "loss": 0.3836, "lr": 3.230126901948788e-05, "epoch": 17.929769392033542, "percentage": 89.65, "elapsed_time": "1:27:27", "remaining_time": "0:10:05", "throughput": 4252.34, "total_tokens": 22314216} {"current_steps": 34215, "total_steps": 38160, "loss": 0.3365, "lr": 3.222045512149968e-05, "epoch": 17.93238993710692, "percentage": 89.66, "elapsed_time": "1:27:28", "remaining_time": "0:10:05", "throughput": 4252.37, "total_tokens": 22317416} {"current_steps": 34220, "total_steps": 38160, "loss": 0.3958, "lr": 3.213973907765566e-05, "epoch": 17.935010482180292, "percentage": 89.68, "elapsed_time": "1:27:28", "remaining_time": "0:10:04", "throughput": 4252.38, "total_tokens": 22320456} {"current_steps": 34225, "total_steps": 38160, "loss": 0.3224, "lr": 3.205912090484048e-05, "epoch": 17.93763102725367, "percentage": 89.69, "elapsed_time": "1:27:29", "remaining_time": "0:10:03", "throughput": 4252.36, "total_tokens": 22323048} {"current_steps": 34230, "total_steps": 38160, "loss": 0.3407, "lr": 3.1978600619918754e-05, "epoch": 17.940251572327043, "percentage": 89.7, "elapsed_time": "1:27:30", "remaining_time": "0:10:02", "throughput": 4252.42, "total_tokens": 22326568} {"current_steps": 34235, "total_steps": 38160, "loss": 0.444, "lr": 3.189817823973423e-05, "epoch": 17.94287211740042, "percentage": 89.71, "elapsed_time": "1:27:31", "remaining_time": "0:10:02", "throughput": 4252.45, "total_tokens": 22329864} {"current_steps": 34240, "total_steps": 38160, "loss": 0.6116, "lr": 3.18178537811104e-05, "epoch": 17.945492662473793, "percentage": 89.73, "elapsed_time": "1:27:31", "remaining_time": "0:10:01", "throughput": 4252.48, "total_tokens": 22333000} {"current_steps": 34245, "total_steps": 38160, "loss": 0.3624, "lr": 3.1737627260850335e-05, "epoch": 17.94811320754717, "percentage": 89.74, "elapsed_time": "1:27:32", "remaining_time": "0:10:00", "throughput": 4252.52, "total_tokens": 22336328} {"current_steps": 34250, "total_steps": 38160, "loss": 0.3301, "lr": 3.1657498695736364e-05, "epoch": 17.950733752620543, "percentage": 89.75, "elapsed_time": "1:27:33", "remaining_time": "0:09:59", "throughput": 4252.49, "total_tokens": 22338920} {"current_steps": 34255, "total_steps": 38160, "loss": 0.6485, "lr": 3.157746810253054e-05, "epoch": 17.95335429769392, "percentage": 89.77, "elapsed_time": "1:27:33", "remaining_time": "0:09:58", "throughput": 4252.55, "total_tokens": 22342568} {"current_steps": 34260, "total_steps": 38160, "loss": 0.4342, "lr": 3.149753549797446e-05, "epoch": 17.955974842767297, "percentage": 89.78, "elapsed_time": "1:27:34", "remaining_time": "0:09:58", "throughput": 4252.56, "total_tokens": 22345512} {"current_steps": 34265, "total_steps": 38160, "loss": 0.4907, "lr": 3.141770089878887e-05, "epoch": 17.95859538784067, "percentage": 89.79, "elapsed_time": "1:27:35", "remaining_time": "0:09:57", "throughput": 4252.57, "total_tokens": 22348488} {"current_steps": 34270, "total_steps": 38160, "loss": 0.3645, "lr": 3.1337964321674354e-05, "epoch": 17.961215932914047, "percentage": 89.81, "elapsed_time": "1:27:36", "remaining_time": "0:09:56", "throughput": 4252.62, "total_tokens": 22351848} {"current_steps": 34275, "total_steps": 38160, "loss": 0.3634, "lr": 3.125832578331106e-05, "epoch": 17.96383647798742, "percentage": 89.82, "elapsed_time": "1:27:36", "remaining_time": "0:09:55", "throughput": 4252.62, "total_tokens": 22354856} {"current_steps": 34280, "total_steps": 38160, "loss": 0.2964, "lr": 3.117878530035823e-05, "epoch": 17.966457023060798, "percentage": 89.83, "elapsed_time": "1:27:37", "remaining_time": "0:09:55", "throughput": 4252.66, "total_tokens": 22358152} {"current_steps": 34285, "total_steps": 38160, "loss": 0.4622, "lr": 3.1099342889454875e-05, "epoch": 17.96907756813417, "percentage": 89.85, "elapsed_time": "1:27:38", "remaining_time": "0:09:54", "throughput": 4252.71, "total_tokens": 22361704} {"current_steps": 34290, "total_steps": 38160, "loss": 0.5186, "lr": 3.1019998567219597e-05, "epoch": 17.971698113207548, "percentage": 89.86, "elapsed_time": "1:27:38", "remaining_time": "0:09:53", "throughput": 4252.72, "total_tokens": 22364680} {"current_steps": 34295, "total_steps": 38160, "loss": 0.3527, "lr": 3.0940752350250125e-05, "epoch": 17.97431865828092, "percentage": 89.87, "elapsed_time": "1:27:39", "remaining_time": "0:09:52", "throughput": 4252.74, "total_tokens": 22367752} {"current_steps": 34300, "total_steps": 38160, "loss": 0.406, "lr": 3.0861604255124074e-05, "epoch": 17.9769392033543, "percentage": 89.88, "elapsed_time": "1:27:40", "remaining_time": "0:09:51", "throughput": 4252.74, "total_tokens": 22370632} {"current_steps": 34305, "total_steps": 38160, "loss": 0.3948, "lr": 3.0782554298398045e-05, "epoch": 17.979559748427672, "percentage": 89.9, "elapsed_time": "1:27:40", "remaining_time": "0:09:51", "throughput": 4252.72, "total_tokens": 22373224} {"current_steps": 34310, "total_steps": 38160, "loss": 0.4143, "lr": 3.070360249660859e-05, "epoch": 17.98218029350105, "percentage": 89.91, "elapsed_time": "1:27:42", "remaining_time": "0:09:50", "throughput": 4252.99, "total_tokens": 22379816} {"current_steps": 34315, "total_steps": 38160, "loss": 0.3397, "lr": 3.0624748866271535e-05, "epoch": 17.984800838574422, "percentage": 89.92, "elapsed_time": "1:27:42", "remaining_time": "0:09:49", "throughput": 4253.03, "total_tokens": 22383112} {"current_steps": 34320, "total_steps": 38160, "loss": 0.5399, "lr": 3.0545993423882036e-05, "epoch": 17.9874213836478, "percentage": 89.94, "elapsed_time": "1:27:43", "remaining_time": "0:09:48", "throughput": 4253.08, "total_tokens": 22386472} {"current_steps": 34325, "total_steps": 38160, "loss": 0.4827, "lr": 3.046733618591496e-05, "epoch": 17.990041928721173, "percentage": 89.95, "elapsed_time": "1:27:44", "remaining_time": "0:09:48", "throughput": 4253.04, "total_tokens": 22388968} {"current_steps": 34330, "total_steps": 38160, "loss": 0.3535, "lr": 3.0388777168824434e-05, "epoch": 17.99266247379455, "percentage": 89.96, "elapsed_time": "1:27:44", "remaining_time": "0:09:47", "throughput": 4253.05, "total_tokens": 22392008} {"current_steps": 34335, "total_steps": 38160, "loss": 0.3516, "lr": 3.0310316389044022e-05, "epoch": 17.995283018867923, "percentage": 89.98, "elapsed_time": "1:27:45", "remaining_time": "0:09:46", "throughput": 4253.06, "total_tokens": 22394984} {"current_steps": 34340, "total_steps": 38160, "loss": 0.4614, "lr": 3.0231953862986995e-05, "epoch": 17.9979035639413, "percentage": 89.99, "elapsed_time": "1:27:46", "remaining_time": "0:09:45", "throughput": 4253.11, "total_tokens": 22398376} {"current_steps": 34344, "total_steps": 38160, "eval_loss": 0.46658554673194885, "epoch": 18.0, "percentage": 90.0, "elapsed_time": "1:28:00", "remaining_time": "0:09:46", "throughput": 4242.01, "total_tokens": 22400368} {"current_steps": 34345, "total_steps": 38160, "loss": 0.6094, "lr": 3.0153689607045842e-05, "epoch": 18.000524109014677, "percentage": 90.0, "elapsed_time": "1:28:02", "remaining_time": "0:09:46", "throughput": 4240.66, "total_tokens": 22400816} {"current_steps": 34350, "total_steps": 38160, "loss": 0.4229, "lr": 3.0075523637592474e-05, "epoch": 18.00314465408805, "percentage": 90.02, "elapsed_time": "1:28:03", "remaining_time": "0:09:45", "throughput": 4240.67, "total_tokens": 22403888} {"current_steps": 34355, "total_steps": 38160, "loss": 0.4744, "lr": 2.999745597097847e-05, "epoch": 18.005765199161427, "percentage": 90.03, "elapsed_time": "1:28:03", "remaining_time": "0:09:45", "throughput": 4240.8, "total_tokens": 22408208} {"current_steps": 34360, "total_steps": 38160, "loss": 0.4145, "lr": 2.9919486623534497e-05, "epoch": 18.0083857442348, "percentage": 90.04, "elapsed_time": "1:28:04", "remaining_time": "0:09:44", "throughput": 4240.86, "total_tokens": 22411856} {"current_steps": 34365, "total_steps": 38160, "loss": 0.3884, "lr": 2.9841615611571005e-05, "epoch": 18.011006289308177, "percentage": 90.06, "elapsed_time": "1:28:05", "remaining_time": "0:09:43", "throughput": 4240.88, "total_tokens": 22415248} {"current_steps": 34370, "total_steps": 38160, "loss": 0.4467, "lr": 2.9763842951377628e-05, "epoch": 18.01362683438155, "percentage": 90.07, "elapsed_time": "1:28:06", "remaining_time": "0:09:42", "throughput": 4240.89, "total_tokens": 22418416} {"current_steps": 34375, "total_steps": 38160, "loss": 0.403, "lr": 2.968616865922369e-05, "epoch": 18.016247379454928, "percentage": 90.08, "elapsed_time": "1:28:06", "remaining_time": "0:09:42", "throughput": 4240.91, "total_tokens": 22421456} {"current_steps": 34380, "total_steps": 38160, "loss": 0.2892, "lr": 2.960859275135758e-05, "epoch": 18.0188679245283, "percentage": 90.09, "elapsed_time": "1:28:07", "remaining_time": "0:09:41", "throughput": 4240.92, "total_tokens": 22424464} {"current_steps": 34385, "total_steps": 38160, "loss": 0.3506, "lr": 2.9531115244007367e-05, "epoch": 18.021488469601678, "percentage": 90.11, "elapsed_time": "1:28:08", "remaining_time": "0:09:40", "throughput": 4240.91, "total_tokens": 22427152} {"current_steps": 34390, "total_steps": 38160, "loss": 0.3666, "lr": 2.945373615338037e-05, "epoch": 18.02410901467505, "percentage": 90.12, "elapsed_time": "1:28:09", "remaining_time": "0:09:39", "throughput": 4241.05, "total_tokens": 22431696} {"current_steps": 34395, "total_steps": 38160, "loss": 0.5684, "lr": 2.9376455495663534e-05, "epoch": 18.02672955974843, "percentage": 90.13, "elapsed_time": "1:28:09", "remaining_time": "0:09:39", "throughput": 4241.06, "total_tokens": 22434704} {"current_steps": 34400, "total_steps": 38160, "loss": 0.4663, "lr": 2.9299273287023144e-05, "epoch": 18.029350104821802, "percentage": 90.15, "elapsed_time": "1:28:10", "remaining_time": "0:09:38", "throughput": 4241.08, "total_tokens": 22437776} {"current_steps": 34405, "total_steps": 38160, "loss": 0.3512, "lr": 2.922218954360473e-05, "epoch": 18.03197064989518, "percentage": 90.16, "elapsed_time": "1:28:11", "remaining_time": "0:09:37", "throughput": 4241.1, "total_tokens": 22440912} {"current_steps": 34410, "total_steps": 38160, "loss": 0.4478, "lr": 2.9145204281533278e-05, "epoch": 18.034591194968552, "percentage": 90.17, "elapsed_time": "1:28:12", "remaining_time": "0:09:36", "throughput": 4241.12, "total_tokens": 22444112} {"current_steps": 34415, "total_steps": 38160, "loss": 0.4255, "lr": 2.9068317516913244e-05, "epoch": 18.03721174004193, "percentage": 90.19, "elapsed_time": "1:28:12", "remaining_time": "0:09:35", "throughput": 4241.22, "total_tokens": 22448080} {"current_steps": 34420, "total_steps": 38160, "loss": 0.412, "lr": 2.8991529265828542e-05, "epoch": 18.039832285115303, "percentage": 90.2, "elapsed_time": "1:28:13", "remaining_time": "0:09:35", "throughput": 4241.19, "total_tokens": 22450800} {"current_steps": 34425, "total_steps": 38160, "loss": 0.484, "lr": 2.891483954434243e-05, "epoch": 18.04245283018868, "percentage": 90.21, "elapsed_time": "1:28:14", "remaining_time": "0:09:34", "throughput": 4241.2, "total_tokens": 22453648} {"current_steps": 34430, "total_steps": 38160, "loss": 0.3794, "lr": 2.8838248368497465e-05, "epoch": 18.045073375262053, "percentage": 90.23, "elapsed_time": "1:28:15", "remaining_time": "0:09:33", "throughput": 4241.35, "total_tokens": 22458480} {"current_steps": 34435, "total_steps": 38160, "loss": 0.4342, "lr": 2.8761755754315667e-05, "epoch": 18.04769392033543, "percentage": 90.24, "elapsed_time": "1:28:15", "remaining_time": "0:09:32", "throughput": 4241.39, "total_tokens": 22461840} {"current_steps": 34440, "total_steps": 38160, "loss": 0.2968, "lr": 2.8685361717798286e-05, "epoch": 18.050314465408807, "percentage": 90.25, "elapsed_time": "1:28:16", "remaining_time": "0:09:32", "throughput": 4241.43, "total_tokens": 22465104} {"current_steps": 34445, "total_steps": 38160, "loss": 0.4147, "lr": 2.8609066274926265e-05, "epoch": 18.05293501048218, "percentage": 90.26, "elapsed_time": "1:28:17", "remaining_time": "0:09:31", "throughput": 4241.52, "total_tokens": 22468976} {"current_steps": 34450, "total_steps": 38160, "loss": 0.3654, "lr": 2.8532869441659615e-05, "epoch": 18.055555555555557, "percentage": 90.28, "elapsed_time": "1:28:18", "remaining_time": "0:09:30", "throughput": 4241.51, "total_tokens": 22471888} {"current_steps": 34455, "total_steps": 38160, "loss": 0.4113, "lr": 2.8456771233937973e-05, "epoch": 18.05817610062893, "percentage": 90.29, "elapsed_time": "1:28:18", "remaining_time": "0:09:29", "throughput": 4241.51, "total_tokens": 22474640} {"current_steps": 34460, "total_steps": 38160, "loss": 0.5413, "lr": 2.838077166768016e-05, "epoch": 18.060796645702307, "percentage": 90.3, "elapsed_time": "1:28:19", "remaining_time": "0:09:28", "throughput": 4241.47, "total_tokens": 22477168} {"current_steps": 34465, "total_steps": 38160, "loss": 0.5416, "lr": 2.8304870758784296e-05, "epoch": 18.06341719077568, "percentage": 90.32, "elapsed_time": "1:28:20", "remaining_time": "0:09:28", "throughput": 4241.48, "total_tokens": 22480240} {"current_steps": 34470, "total_steps": 38160, "loss": 0.4499, "lr": 2.822906852312812e-05, "epoch": 18.066037735849058, "percentage": 90.33, "elapsed_time": "1:28:20", "remaining_time": "0:09:27", "throughput": 4241.5, "total_tokens": 22483344} {"current_steps": 34475, "total_steps": 38160, "loss": 0.3865, "lr": 2.8153364976568563e-05, "epoch": 18.06865828092243, "percentage": 90.34, "elapsed_time": "1:28:21", "remaining_time": "0:09:26", "throughput": 4241.47, "total_tokens": 22485840} {"current_steps": 34480, "total_steps": 38160, "loss": 0.4024, "lr": 2.8077760134941955e-05, "epoch": 18.071278825995808, "percentage": 90.36, "elapsed_time": "1:28:22", "remaining_time": "0:09:25", "throughput": 4241.53, "total_tokens": 22489392} {"current_steps": 34485, "total_steps": 38160, "loss": 0.3471, "lr": 2.800225401406392e-05, "epoch": 18.07389937106918, "percentage": 90.37, "elapsed_time": "1:28:22", "remaining_time": "0:09:25", "throughput": 4241.47, "total_tokens": 22491696} {"current_steps": 34490, "total_steps": 38160, "loss": 0.4333, "lr": 2.7926846629729607e-05, "epoch": 18.07651991614256, "percentage": 90.38, "elapsed_time": "1:28:23", "remaining_time": "0:09:24", "throughput": 4241.46, "total_tokens": 22494448} {"current_steps": 34495, "total_steps": 38160, "loss": 0.4007, "lr": 2.7851537997713174e-05, "epoch": 18.079140461215932, "percentage": 90.4, "elapsed_time": "1:28:24", "remaining_time": "0:09:23", "throughput": 4241.46, "total_tokens": 22497264} {"current_steps": 34500, "total_steps": 38160, "loss": 0.3384, "lr": 2.7776328133768458e-05, "epoch": 18.08176100628931, "percentage": 90.41, "elapsed_time": "1:28:24", "remaining_time": "0:09:22", "throughput": 4241.46, "total_tokens": 22500080} {"current_steps": 34505, "total_steps": 38160, "loss": 0.4492, "lr": 2.770121705362849e-05, "epoch": 18.084381551362682, "percentage": 90.42, "elapsed_time": "1:28:25", "remaining_time": "0:09:21", "throughput": 4241.48, "total_tokens": 22503152} {"current_steps": 34510, "total_steps": 38160, "loss": 0.4776, "lr": 2.7626204773005704e-05, "epoch": 18.08700209643606, "percentage": 90.44, "elapsed_time": "1:28:26", "remaining_time": "0:09:21", "throughput": 4241.51, "total_tokens": 22506288} {"current_steps": 34515, "total_steps": 38160, "loss": 0.4782, "lr": 2.7551291307591765e-05, "epoch": 18.089622641509433, "percentage": 90.45, "elapsed_time": "1:28:26", "remaining_time": "0:09:20", "throughput": 4241.45, "total_tokens": 22508496} {"current_steps": 34520, "total_steps": 38160, "loss": 0.4567, "lr": 2.7476476673057636e-05, "epoch": 18.09224318658281, "percentage": 90.46, "elapsed_time": "1:28:27", "remaining_time": "0:09:19", "throughput": 4241.55, "total_tokens": 22512496} {"current_steps": 34525, "total_steps": 38160, "loss": 0.4225, "lr": 2.740176088505375e-05, "epoch": 18.094863731656183, "percentage": 90.47, "elapsed_time": "1:28:28", "remaining_time": "0:09:18", "throughput": 4241.6, "total_tokens": 22515888} {"current_steps": 34530, "total_steps": 38160, "loss": 0.3824, "lr": 2.7327143959209765e-05, "epoch": 18.09748427672956, "percentage": 90.49, "elapsed_time": "1:28:29", "remaining_time": "0:09:18", "throughput": 4241.62, "total_tokens": 22518928} {"current_steps": 34535, "total_steps": 38160, "loss": 0.3789, "lr": 2.725262591113481e-05, "epoch": 18.100104821802937, "percentage": 90.5, "elapsed_time": "1:28:29", "remaining_time": "0:09:17", "throughput": 4241.73, "total_tokens": 22523120} {"current_steps": 34540, "total_steps": 38160, "loss": 0.3732, "lr": 2.7178206756417078e-05, "epoch": 18.10272536687631, "percentage": 90.51, "elapsed_time": "1:28:30", "remaining_time": "0:09:16", "throughput": 4241.68, "total_tokens": 22525392} {"current_steps": 34545, "total_steps": 38160, "loss": 0.3853, "lr": 2.7103886510624344e-05, "epoch": 18.105345911949687, "percentage": 90.53, "elapsed_time": "1:28:31", "remaining_time": "0:09:15", "throughput": 4241.65, "total_tokens": 22527920} {"current_steps": 34550, "total_steps": 38160, "loss": 0.4668, "lr": 2.7029665189303387e-05, "epoch": 18.10796645702306, "percentage": 90.54, "elapsed_time": "1:28:31", "remaining_time": "0:09:15", "throughput": 4241.7, "total_tokens": 22531472} {"current_steps": 34555, "total_steps": 38160, "loss": 0.4821, "lr": 2.6955542807980515e-05, "epoch": 18.110587002096437, "percentage": 90.55, "elapsed_time": "1:28:32", "remaining_time": "0:09:14", "throughput": 4241.72, "total_tokens": 22534672} {"current_steps": 34560, "total_steps": 38160, "loss": 0.4549, "lr": 2.688151938216138e-05, "epoch": 18.11320754716981, "percentage": 90.57, "elapsed_time": "1:28:33", "remaining_time": "0:09:13", "throughput": 4241.71, "total_tokens": 22537424} {"current_steps": 34565, "total_steps": 38160, "loss": 0.5083, "lr": 2.6807594927330703e-05, "epoch": 18.115828092243188, "percentage": 90.58, "elapsed_time": "1:28:34", "remaining_time": "0:09:12", "throughput": 4241.77, "total_tokens": 22540944} {"current_steps": 34570, "total_steps": 38160, "loss": 0.3702, "lr": 2.6733769458952727e-05, "epoch": 18.11844863731656, "percentage": 90.59, "elapsed_time": "1:28:34", "remaining_time": "0:09:11", "throughput": 4241.82, "total_tokens": 22544368} {"current_steps": 34575, "total_steps": 38160, "loss": 0.4153, "lr": 2.6660042992470934e-05, "epoch": 18.121069182389938, "percentage": 90.61, "elapsed_time": "1:28:35", "remaining_time": "0:09:11", "throughput": 4241.85, "total_tokens": 22547568} {"current_steps": 34580, "total_steps": 38160, "loss": 0.4046, "lr": 2.658641554330793e-05, "epoch": 18.12368972746331, "percentage": 90.62, "elapsed_time": "1:28:36", "remaining_time": "0:09:10", "throughput": 4241.95, "total_tokens": 22551504} {"current_steps": 34585, "total_steps": 38160, "loss": 0.409, "lr": 2.6512887126865782e-05, "epoch": 18.12631027253669, "percentage": 90.63, "elapsed_time": "1:28:36", "remaining_time": "0:09:09", "throughput": 4241.95, "total_tokens": 22554416} {"current_steps": 34590, "total_steps": 38160, "loss": 0.2697, "lr": 2.6439457758525908e-05, "epoch": 18.128930817610062, "percentage": 90.64, "elapsed_time": "1:28:37", "remaining_time": "0:09:08", "throughput": 4241.95, "total_tokens": 22557232} {"current_steps": 34595, "total_steps": 38160, "loss": 0.3729, "lr": 2.6366127453648748e-05, "epoch": 18.13155136268344, "percentage": 90.66, "elapsed_time": "1:28:38", "remaining_time": "0:09:08", "throughput": 4242.03, "total_tokens": 22560976} {"current_steps": 34600, "total_steps": 38160, "loss": 0.5576, "lr": 2.6292896227574303e-05, "epoch": 18.134171907756812, "percentage": 90.67, "elapsed_time": "1:28:39", "remaining_time": "0:09:07", "throughput": 4242.07, "total_tokens": 22564272} {"current_steps": 34605, "total_steps": 38160, "loss": 0.6959, "lr": 2.6219764095621547e-05, "epoch": 18.13679245283019, "percentage": 90.68, "elapsed_time": "1:28:39", "remaining_time": "0:09:06", "throughput": 4242.08, "total_tokens": 22567280} {"current_steps": 34610, "total_steps": 38160, "loss": 0.4199, "lr": 2.6146731073088958e-05, "epoch": 18.139412997903563, "percentage": 90.7, "elapsed_time": "1:28:40", "remaining_time": "0:09:05", "throughput": 4242.16, "total_tokens": 22571120} {"current_steps": 34615, "total_steps": 38160, "loss": 0.38, "lr": 2.607379717525432e-05, "epoch": 18.14203354297694, "percentage": 90.71, "elapsed_time": "1:28:41", "remaining_time": "0:09:04", "throughput": 4242.21, "total_tokens": 22574672} {"current_steps": 34620, "total_steps": 38160, "loss": 0.4761, "lr": 2.6000962417374373e-05, "epoch": 18.144654088050313, "percentage": 90.72, "elapsed_time": "1:28:42", "remaining_time": "0:09:04", "throughput": 4242.21, "total_tokens": 22577616} {"current_steps": 34625, "total_steps": 38160, "loss": 0.4897, "lr": 2.5928226814685485e-05, "epoch": 18.14727463312369, "percentage": 90.74, "elapsed_time": "1:28:42", "remaining_time": "0:09:03", "throughput": 4242.16, "total_tokens": 22579888} {"current_steps": 34630, "total_steps": 38160, "loss": 0.4687, "lr": 2.585559038240304e-05, "epoch": 18.149895178197063, "percentage": 90.75, "elapsed_time": "1:28:43", "remaining_time": "0:09:02", "throughput": 4242.17, "total_tokens": 22582896} {"current_steps": 34635, "total_steps": 38160, "loss": 0.3422, "lr": 2.5783053135721714e-05, "epoch": 18.15251572327044, "percentage": 90.76, "elapsed_time": "1:28:44", "remaining_time": "0:09:01", "throughput": 4242.15, "total_tokens": 22585616} {"current_steps": 34640, "total_steps": 38160, "loss": 0.5253, "lr": 2.571061508981565e-05, "epoch": 18.155136268343817, "percentage": 90.78, "elapsed_time": "1:28:44", "remaining_time": "0:09:01", "throughput": 4242.14, "total_tokens": 22588496} {"current_steps": 34645, "total_steps": 38160, "loss": 0.4101, "lr": 2.5638276259837778e-05, "epoch": 18.15775681341719, "percentage": 90.79, "elapsed_time": "1:28:45", "remaining_time": "0:09:00", "throughput": 4242.11, "total_tokens": 22590896} {"current_steps": 34650, "total_steps": 38160, "loss": 0.7325, "lr": 2.5566036660920778e-05, "epoch": 18.160377358490567, "percentage": 90.8, "elapsed_time": "1:28:45", "remaining_time": "0:08:59", "throughput": 4242.04, "total_tokens": 22593104} {"current_steps": 34655, "total_steps": 38160, "loss": 0.4124, "lr": 2.5493896308176223e-05, "epoch": 18.16299790356394, "percentage": 90.81, "elapsed_time": "1:28:46", "remaining_time": "0:08:58", "throughput": 4242.1, "total_tokens": 22596656} {"current_steps": 34660, "total_steps": 38160, "loss": 0.4359, "lr": 2.542185521669521e-05, "epoch": 18.165618448637318, "percentage": 90.83, "elapsed_time": "1:28:47", "remaining_time": "0:08:57", "throughput": 4242.08, "total_tokens": 22599312} {"current_steps": 34665, "total_steps": 38160, "loss": 0.3336, "lr": 2.534991340154774e-05, "epoch": 18.16823899371069, "percentage": 90.84, "elapsed_time": "1:28:48", "remaining_time": "0:08:57", "throughput": 4242.18, "total_tokens": 22603440} {"current_steps": 34670, "total_steps": 38160, "loss": 0.4386, "lr": 2.5278070877783332e-05, "epoch": 18.170859538784068, "percentage": 90.85, "elapsed_time": "1:28:48", "remaining_time": "0:08:56", "throughput": 4242.2, "total_tokens": 22606512} {"current_steps": 34675, "total_steps": 38160, "loss": 0.5036, "lr": 2.520632766043052e-05, "epoch": 18.17348008385744, "percentage": 90.87, "elapsed_time": "1:28:49", "remaining_time": "0:08:55", "throughput": 4242.22, "total_tokens": 22609584} {"current_steps": 34680, "total_steps": 38160, "loss": 0.4587, "lr": 2.513468376449729e-05, "epoch": 18.17610062893082, "percentage": 90.88, "elapsed_time": "1:28:50", "remaining_time": "0:08:54", "throughput": 4242.31, "total_tokens": 22613712} {"current_steps": 34685, "total_steps": 38160, "loss": 0.3843, "lr": 2.506313920497061e-05, "epoch": 18.178721174004192, "percentage": 90.89, "elapsed_time": "1:28:51", "remaining_time": "0:08:54", "throughput": 4242.35, "total_tokens": 22617008} {"current_steps": 34690, "total_steps": 38160, "loss": 0.282, "lr": 2.4991693996816888e-05, "epoch": 18.18134171907757, "percentage": 90.91, "elapsed_time": "1:28:51", "remaining_time": "0:08:53", "throughput": 4242.36, "total_tokens": 22620112} {"current_steps": 34695, "total_steps": 38160, "loss": 0.3383, "lr": 2.4920348154981677e-05, "epoch": 18.183962264150942, "percentage": 90.92, "elapsed_time": "1:28:52", "remaining_time": "0:08:52", "throughput": 4242.33, "total_tokens": 22622608} {"current_steps": 34700, "total_steps": 38160, "loss": 0.5241, "lr": 2.4849101694389477e-05, "epoch": 18.18658280922432, "percentage": 90.93, "elapsed_time": "1:28:53", "remaining_time": "0:08:51", "throughput": 4242.4, "total_tokens": 22626416} {"current_steps": 34705, "total_steps": 38160, "loss": 0.326, "lr": 2.4777954629944478e-05, "epoch": 18.189203354297693, "percentage": 90.95, "elapsed_time": "1:28:54", "remaining_time": "0:08:51", "throughput": 4242.42, "total_tokens": 22629328} {"current_steps": 34710, "total_steps": 38160, "loss": 0.5246, "lr": 2.4706906976529718e-05, "epoch": 18.19182389937107, "percentage": 90.96, "elapsed_time": "1:28:54", "remaining_time": "0:08:50", "throughput": 4242.41, "total_tokens": 22632144} {"current_steps": 34715, "total_steps": 38160, "loss": 0.4111, "lr": 2.4635958749007648e-05, "epoch": 18.194444444444443, "percentage": 90.97, "elapsed_time": "1:28:55", "remaining_time": "0:08:49", "throughput": 4242.4, "total_tokens": 22634992} {"current_steps": 34720, "total_steps": 38160, "loss": 0.3829, "lr": 2.456510996221978e-05, "epoch": 18.19706498951782, "percentage": 90.99, "elapsed_time": "1:28:56", "remaining_time": "0:08:48", "throughput": 4242.43, "total_tokens": 22638256} {"current_steps": 34725, "total_steps": 38160, "loss": 0.4402, "lr": 2.4494360630986756e-05, "epoch": 18.199685534591197, "percentage": 91.0, "elapsed_time": "1:28:56", "remaining_time": "0:08:47", "throughput": 4242.47, "total_tokens": 22641712} {"current_steps": 34730, "total_steps": 38160, "loss": 0.4189, "lr": 2.4423710770108687e-05, "epoch": 18.20230607966457, "percentage": 91.01, "elapsed_time": "1:28:57", "remaining_time": "0:08:47", "throughput": 4242.6, "total_tokens": 22645904} {"current_steps": 34735, "total_steps": 38160, "loss": 0.4479, "lr": 2.435316039436464e-05, "epoch": 18.204926624737947, "percentage": 91.02, "elapsed_time": "1:28:58", "remaining_time": "0:08:46", "throughput": 4242.6, "total_tokens": 22648944} {"current_steps": 34740, "total_steps": 38160, "loss": 0.4419, "lr": 2.428270951851297e-05, "epoch": 18.20754716981132, "percentage": 91.04, "elapsed_time": "1:28:59", "remaining_time": "0:08:45", "throughput": 4242.61, "total_tokens": 22651888} {"current_steps": 34745, "total_steps": 38160, "loss": 0.4568, "lr": 2.421235815729128e-05, "epoch": 18.210167714884697, "percentage": 91.05, "elapsed_time": "1:28:59", "remaining_time": "0:08:44", "throughput": 4242.63, "total_tokens": 22655120} {"current_steps": 34750, "total_steps": 38160, "loss": 0.7387, "lr": 2.414210632541619e-05, "epoch": 18.21278825995807, "percentage": 91.06, "elapsed_time": "1:29:00", "remaining_time": "0:08:44", "throughput": 4242.71, "total_tokens": 22658928} {"current_steps": 34755, "total_steps": 38160, "loss": 0.4457, "lr": 2.40719540375835e-05, "epoch": 18.215408805031448, "percentage": 91.08, "elapsed_time": "1:29:01", "remaining_time": "0:08:43", "throughput": 4242.75, "total_tokens": 22662288} {"current_steps": 34760, "total_steps": 38160, "loss": 0.3886, "lr": 2.4001901308468353e-05, "epoch": 18.21802935010482, "percentage": 91.09, "elapsed_time": "1:29:02", "remaining_time": "0:08:42", "throughput": 4242.72, "total_tokens": 22664848} {"current_steps": 34765, "total_steps": 38160, "loss": 0.3537, "lr": 2.3931948152724982e-05, "epoch": 18.220649895178198, "percentage": 91.1, "elapsed_time": "1:29:02", "remaining_time": "0:08:41", "throughput": 4242.68, "total_tokens": 22667376} {"current_steps": 34770, "total_steps": 38160, "loss": 0.4802, "lr": 2.386209458498684e-05, "epoch": 18.22327044025157, "percentage": 91.12, "elapsed_time": "1:29:03", "remaining_time": "0:08:40", "throughput": 4242.78, "total_tokens": 22671440} {"current_steps": 34775, "total_steps": 38160, "loss": 0.4087, "lr": 2.3792340619866458e-05, "epoch": 18.22589098532495, "percentage": 91.13, "elapsed_time": "1:29:04", "remaining_time": "0:08:40", "throughput": 4242.87, "total_tokens": 22675408} {"current_steps": 34780, "total_steps": 38160, "loss": 0.3748, "lr": 2.3722686271955507e-05, "epoch": 18.228511530398322, "percentage": 91.14, "elapsed_time": "1:29:05", "remaining_time": "0:08:39", "throughput": 4242.86, "total_tokens": 22678224} {"current_steps": 34785, "total_steps": 38160, "loss": 0.3309, "lr": 2.365313155582488e-05, "epoch": 18.2311320754717, "percentage": 91.16, "elapsed_time": "1:29:05", "remaining_time": "0:08:38", "throughput": 4242.92, "total_tokens": 22681712} {"current_steps": 34790, "total_steps": 38160, "loss": 0.2974, "lr": 2.358367648602472e-05, "epoch": 18.233752620545072, "percentage": 91.17, "elapsed_time": "1:29:06", "remaining_time": "0:08:37", "throughput": 4242.95, "total_tokens": 22685008} {"current_steps": 34795, "total_steps": 38160, "loss": 0.4638, "lr": 2.3514321077084234e-05, "epoch": 18.23637316561845, "percentage": 91.18, "elapsed_time": "1:29:07", "remaining_time": "0:08:37", "throughput": 4242.99, "total_tokens": 22688368} {"current_steps": 34800, "total_steps": 38160, "loss": 0.4309, "lr": 2.3445065343511763e-05, "epoch": 18.238993710691823, "percentage": 91.19, "elapsed_time": "1:29:07", "remaining_time": "0:08:36", "throughput": 4242.98, "total_tokens": 22691184} {"current_steps": 34805, "total_steps": 38160, "loss": 0.4477, "lr": 2.3375909299794717e-05, "epoch": 18.2416142557652, "percentage": 91.21, "elapsed_time": "1:29:08", "remaining_time": "0:08:35", "throughput": 4243.06, "total_tokens": 22695024} {"current_steps": 34810, "total_steps": 38160, "loss": 0.4103, "lr": 2.330685296039986e-05, "epoch": 18.244234800838573, "percentage": 91.22, "elapsed_time": "1:29:09", "remaining_time": "0:08:34", "throughput": 4243.16, "total_tokens": 22699088} {"current_steps": 34815, "total_steps": 38160, "loss": 0.3671, "lr": 2.3237896339772914e-05, "epoch": 18.24685534591195, "percentage": 91.23, "elapsed_time": "1:29:10", "remaining_time": "0:08:34", "throughput": 4243.21, "total_tokens": 22702480} {"current_steps": 34820, "total_steps": 38160, "loss": 0.2956, "lr": 2.3169039452338892e-05, "epoch": 18.249475890985323, "percentage": 91.25, "elapsed_time": "1:29:11", "remaining_time": "0:08:33", "throughput": 4243.24, "total_tokens": 22705840} {"current_steps": 34825, "total_steps": 38160, "loss": 0.4418, "lr": 2.3100282312501886e-05, "epoch": 18.2520964360587, "percentage": 91.26, "elapsed_time": "1:29:11", "remaining_time": "0:08:32", "throughput": 4243.24, "total_tokens": 22708752} {"current_steps": 34830, "total_steps": 38160, "loss": 0.4557, "lr": 2.3031624934645113e-05, "epoch": 18.254716981132077, "percentage": 91.27, "elapsed_time": "1:29:12", "remaining_time": "0:08:31", "throughput": 4243.21, "total_tokens": 22711504} {"current_steps": 34835, "total_steps": 38160, "loss": 0.6007, "lr": 2.296306733313075e-05, "epoch": 18.25733752620545, "percentage": 91.29, "elapsed_time": "1:29:13", "remaining_time": "0:08:30", "throughput": 4243.22, "total_tokens": 22714384} {"current_steps": 34840, "total_steps": 38160, "loss": 0.447, "lr": 2.289460952230038e-05, "epoch": 18.259958071278827, "percentage": 91.3, "elapsed_time": "1:29:13", "remaining_time": "0:08:30", "throughput": 4243.3, "total_tokens": 22718192} {"current_steps": 34845, "total_steps": 38160, "loss": 0.4613, "lr": 2.2826251516474604e-05, "epoch": 18.2625786163522, "percentage": 91.31, "elapsed_time": "1:29:14", "remaining_time": "0:08:29", "throughput": 4243.34, "total_tokens": 22721616} {"current_steps": 34850, "total_steps": 38160, "loss": 0.5123, "lr": 2.2757993329953152e-05, "epoch": 18.265199161425578, "percentage": 91.33, "elapsed_time": "1:29:15", "remaining_time": "0:08:28", "throughput": 4243.35, "total_tokens": 22724624} {"current_steps": 34855, "total_steps": 38160, "loss": 0.4834, "lr": 2.2689834977014822e-05, "epoch": 18.26781970649895, "percentage": 91.34, "elapsed_time": "1:29:16", "remaining_time": "0:08:27", "throughput": 4243.35, "total_tokens": 22727600} {"current_steps": 34860, "total_steps": 38160, "loss": 0.2946, "lr": 2.2621776471917598e-05, "epoch": 18.270440251572328, "percentage": 91.35, "elapsed_time": "1:29:16", "remaining_time": "0:08:27", "throughput": 4243.37, "total_tokens": 22730608} {"current_steps": 34865, "total_steps": 38160, "loss": 0.4198, "lr": 2.255381782889848e-05, "epoch": 18.2730607966457, "percentage": 91.37, "elapsed_time": "1:29:17", "remaining_time": "0:08:26", "throughput": 4243.37, "total_tokens": 22733424} {"current_steps": 34870, "total_steps": 38160, "loss": 0.397, "lr": 2.2485959062173654e-05, "epoch": 18.27568134171908, "percentage": 91.38, "elapsed_time": "1:29:18", "remaining_time": "0:08:25", "throughput": 4243.43, "total_tokens": 22737008} {"current_steps": 34875, "total_steps": 38160, "loss": 0.4014, "lr": 2.2418200185938485e-05, "epoch": 18.278301886792452, "percentage": 91.39, "elapsed_time": "1:29:18", "remaining_time": "0:08:24", "throughput": 4243.46, "total_tokens": 22740272} {"current_steps": 34880, "total_steps": 38160, "loss": 0.3965, "lr": 2.235054121436725e-05, "epoch": 18.28092243186583, "percentage": 91.4, "elapsed_time": "1:29:19", "remaining_time": "0:08:24", "throughput": 4243.57, "total_tokens": 22744464} {"current_steps": 34885, "total_steps": 38160, "loss": 0.4315, "lr": 2.2282982161613562e-05, "epoch": 18.283542976939202, "percentage": 91.42, "elapsed_time": "1:29:20", "remaining_time": "0:08:23", "throughput": 4243.55, "total_tokens": 22747152} {"current_steps": 34890, "total_steps": 38160, "loss": 0.4046, "lr": 2.221552304180985e-05, "epoch": 18.28616352201258, "percentage": 91.43, "elapsed_time": "1:29:21", "remaining_time": "0:08:22", "throughput": 4243.67, "total_tokens": 22751408} {"current_steps": 34895, "total_steps": 38160, "loss": 0.4814, "lr": 2.2148163869067816e-05, "epoch": 18.288784067085953, "percentage": 91.44, "elapsed_time": "1:29:22", "remaining_time": "0:08:21", "throughput": 4243.79, "total_tokens": 22755568} {"current_steps": 34900, "total_steps": 38160, "loss": 0.3868, "lr": 2.2080904657478305e-05, "epoch": 18.29140461215933, "percentage": 91.46, "elapsed_time": "1:29:22", "remaining_time": "0:08:20", "throughput": 4243.8, "total_tokens": 22758576} {"current_steps": 34905, "total_steps": 38160, "loss": 0.4292, "lr": 2.201374542111123e-05, "epoch": 18.294025157232703, "percentage": 91.47, "elapsed_time": "1:29:23", "remaining_time": "0:08:20", "throughput": 4243.87, "total_tokens": 22762128} {"current_steps": 34910, "total_steps": 38160, "loss": 0.4068, "lr": 2.1946686174015407e-05, "epoch": 18.29664570230608, "percentage": 91.48, "elapsed_time": "1:29:24", "remaining_time": "0:08:19", "throughput": 4243.85, "total_tokens": 22764784} {"current_steps": 34915, "total_steps": 38160, "loss": 0.426, "lr": 2.1879726930218946e-05, "epoch": 18.299266247379457, "percentage": 91.5, "elapsed_time": "1:29:24", "remaining_time": "0:08:18", "throughput": 4243.91, "total_tokens": 22768304} {"current_steps": 34920, "total_steps": 38160, "loss": 0.3971, "lr": 2.1812867703728866e-05, "epoch": 18.30188679245283, "percentage": 91.51, "elapsed_time": "1:29:25", "remaining_time": "0:08:17", "throughput": 4243.95, "total_tokens": 22771632} {"current_steps": 34925, "total_steps": 38160, "loss": 0.3411, "lr": 2.1746108508531426e-05, "epoch": 18.304507337526207, "percentage": 91.52, "elapsed_time": "1:29:26", "remaining_time": "0:08:17", "throughput": 4244.0, "total_tokens": 22774928} {"current_steps": 34930, "total_steps": 38160, "loss": 0.3557, "lr": 2.1679449358591952e-05, "epoch": 18.30712788259958, "percentage": 91.54, "elapsed_time": "1:29:27", "remaining_time": "0:08:16", "throughput": 4244.07, "total_tokens": 22778640} {"current_steps": 34935, "total_steps": 38160, "loss": 0.3278, "lr": 2.1612890267854624e-05, "epoch": 18.309748427672957, "percentage": 91.55, "elapsed_time": "1:29:27", "remaining_time": "0:08:15", "throughput": 4244.1, "total_tokens": 22781936} {"current_steps": 34940, "total_steps": 38160, "loss": 0.3724, "lr": 2.1546431250242914e-05, "epoch": 18.31236897274633, "percentage": 91.56, "elapsed_time": "1:29:28", "remaining_time": "0:08:14", "throughput": 4244.07, "total_tokens": 22784528} {"current_steps": 34945, "total_steps": 38160, "loss": 0.3077, "lr": 2.1480072319659427e-05, "epoch": 18.314989517819708, "percentage": 91.57, "elapsed_time": "1:29:29", "remaining_time": "0:08:14", "throughput": 4244.32, "total_tokens": 22790704} {"current_steps": 34950, "total_steps": 38160, "loss": 0.4542, "lr": 2.1413813489985447e-05, "epoch": 18.31761006289308, "percentage": 91.59, "elapsed_time": "1:29:30", "remaining_time": "0:08:13", "throughput": 4244.38, "total_tokens": 22794320} {"current_steps": 34955, "total_steps": 38160, "loss": 0.4753, "lr": 2.1347654775081716e-05, "epoch": 18.320230607966458, "percentage": 91.6, "elapsed_time": "1:29:31", "remaining_time": "0:08:12", "throughput": 4244.49, "total_tokens": 22798544} {"current_steps": 34960, "total_steps": 38160, "loss": 0.3972, "lr": 2.1281596188787834e-05, "epoch": 18.32285115303983, "percentage": 91.61, "elapsed_time": "1:29:31", "remaining_time": "0:08:11", "throughput": 4244.49, "total_tokens": 22801392} {"current_steps": 34965, "total_steps": 38160, "loss": 0.4025, "lr": 2.121563774492252e-05, "epoch": 18.32547169811321, "percentage": 91.63, "elapsed_time": "1:29:32", "remaining_time": "0:08:10", "throughput": 4244.54, "total_tokens": 22804880} {"current_steps": 34970, "total_steps": 38160, "loss": 0.608, "lr": 2.114977945728358e-05, "epoch": 18.328092243186582, "percentage": 91.64, "elapsed_time": "1:29:33", "remaining_time": "0:08:10", "throughput": 4244.57, "total_tokens": 22808112} {"current_steps": 34975, "total_steps": 38160, "loss": 0.4494, "lr": 2.1084021339647707e-05, "epoch": 18.33071278825996, "percentage": 91.65, "elapsed_time": "1:29:34", "remaining_time": "0:08:09", "throughput": 4244.85, "total_tokens": 22814544} {"current_steps": 34980, "total_steps": 38160, "loss": 0.3492, "lr": 2.1018363405770792e-05, "epoch": 18.333333333333332, "percentage": 91.67, "elapsed_time": "1:29:35", "remaining_time": "0:08:08", "throughput": 4244.84, "total_tokens": 22817200} {"current_steps": 34985, "total_steps": 38160, "loss": 0.3357, "lr": 2.095280566938784e-05, "epoch": 18.33595387840671, "percentage": 91.68, "elapsed_time": "1:29:35", "remaining_time": "0:08:07", "throughput": 4244.84, "total_tokens": 22820048} {"current_steps": 34990, "total_steps": 38160, "loss": 0.3754, "lr": 2.0887348144212615e-05, "epoch": 18.338574423480082, "percentage": 91.69, "elapsed_time": "1:29:36", "remaining_time": "0:08:07", "throughput": 4244.87, "total_tokens": 22823280} {"current_steps": 34995, "total_steps": 38160, "loss": 0.4762, "lr": 2.08219908439381e-05, "epoch": 18.34119496855346, "percentage": 91.71, "elapsed_time": "1:29:37", "remaining_time": "0:08:06", "throughput": 4244.88, "total_tokens": 22826224} {"current_steps": 35000, "total_steps": 38160, "loss": 0.3158, "lr": 2.075673378223647e-05, "epoch": 18.343815513626833, "percentage": 91.72, "elapsed_time": "1:29:38", "remaining_time": "0:08:05", "throughput": 4244.9, "total_tokens": 22829360} {"current_steps": 35005, "total_steps": 38160, "loss": 0.3997, "lr": 2.069157697275853e-05, "epoch": 18.34643605870021, "percentage": 91.73, "elapsed_time": "1:29:38", "remaining_time": "0:08:04", "throughput": 4244.93, "total_tokens": 22832688} {"current_steps": 35010, "total_steps": 38160, "loss": 0.3555, "lr": 2.0626520429134543e-05, "epoch": 18.349056603773583, "percentage": 91.75, "elapsed_time": "1:29:39", "remaining_time": "0:08:04", "throughput": 4244.98, "total_tokens": 22836176} {"current_steps": 35015, "total_steps": 38160, "loss": 0.3097, "lr": 2.0561564164973458e-05, "epoch": 18.35167714884696, "percentage": 91.76, "elapsed_time": "1:29:40", "remaining_time": "0:08:03", "throughput": 4244.99, "total_tokens": 22839088} {"current_steps": 35020, "total_steps": 38160, "loss": 0.4021, "lr": 2.04967081938634e-05, "epoch": 18.354297693920337, "percentage": 91.77, "elapsed_time": "1:29:40", "remaining_time": "0:08:02", "throughput": 4245.03, "total_tokens": 22842384} {"current_steps": 35025, "total_steps": 38160, "loss": 0.4408, "lr": 2.043195252937152e-05, "epoch": 18.35691823899371, "percentage": 91.78, "elapsed_time": "1:29:41", "remaining_time": "0:08:01", "throughput": 4245.02, "total_tokens": 22845232} {"current_steps": 35030, "total_steps": 38160, "loss": 0.4412, "lr": 2.0367297185044043e-05, "epoch": 18.359538784067087, "percentage": 91.8, "elapsed_time": "1:29:42", "remaining_time": "0:08:00", "throughput": 4245.01, "total_tokens": 22848016} {"current_steps": 35035, "total_steps": 38160, "loss": 0.5107, "lr": 2.030274217440603e-05, "epoch": 18.36215932914046, "percentage": 91.81, "elapsed_time": "1:29:42", "remaining_time": "0:08:00", "throughput": 4244.99, "total_tokens": 22850672} {"current_steps": 35040, "total_steps": 38160, "loss": 0.2978, "lr": 2.0238287510961628e-05, "epoch": 18.364779874213838, "percentage": 91.82, "elapsed_time": "1:29:43", "remaining_time": "0:07:59", "throughput": 4244.99, "total_tokens": 22853584} {"current_steps": 35045, "total_steps": 38160, "loss": 0.3747, "lr": 2.017393320819405e-05, "epoch": 18.36740041928721, "percentage": 91.84, "elapsed_time": "1:29:44", "remaining_time": "0:07:58", "throughput": 4245.06, "total_tokens": 22857424} {"current_steps": 35050, "total_steps": 38160, "loss": 0.3845, "lr": 2.010967927956553e-05, "epoch": 18.370020964360588, "percentage": 91.85, "elapsed_time": "1:29:45", "remaining_time": "0:07:57", "throughput": 4245.17, "total_tokens": 22861456} {"current_steps": 35055, "total_steps": 38160, "loss": 0.3705, "lr": 2.00455257385172e-05, "epoch": 18.37264150943396, "percentage": 91.86, "elapsed_time": "1:29:46", "remaining_time": "0:07:57", "throughput": 4245.21, "total_tokens": 22864752} {"current_steps": 35060, "total_steps": 38160, "loss": 0.3471, "lr": 1.9981472598469386e-05, "epoch": 18.37526205450734, "percentage": 91.88, "elapsed_time": "1:29:46", "remaining_time": "0:07:56", "throughput": 4245.3, "total_tokens": 22868624} {"current_steps": 35065, "total_steps": 38160, "loss": 0.4729, "lr": 1.9917519872821142e-05, "epoch": 18.377882599580712, "percentage": 91.89, "elapsed_time": "1:29:47", "remaining_time": "0:07:55", "throughput": 4245.33, "total_tokens": 22871760} {"current_steps": 35070, "total_steps": 38160, "loss": 0.3713, "lr": 1.9853667574950605e-05, "epoch": 18.38050314465409, "percentage": 91.9, "elapsed_time": "1:29:48", "remaining_time": "0:07:54", "throughput": 4245.38, "total_tokens": 22875248} {"current_steps": 35075, "total_steps": 38160, "loss": 0.4612, "lr": 1.978991571821498e-05, "epoch": 18.383123689727462, "percentage": 91.92, "elapsed_time": "1:29:49", "remaining_time": "0:07:53", "throughput": 4245.42, "total_tokens": 22878640} {"current_steps": 35080, "total_steps": 38160, "loss": 0.377, "lr": 1.972626431595048e-05, "epoch": 18.38574423480084, "percentage": 91.93, "elapsed_time": "1:29:49", "remaining_time": "0:07:53", "throughput": 4245.43, "total_tokens": 22881584} {"current_steps": 35085, "total_steps": 38160, "loss": 0.3947, "lr": 1.9662713381472295e-05, "epoch": 18.388364779874212, "percentage": 91.94, "elapsed_time": "1:29:50", "remaining_time": "0:07:52", "throughput": 4245.42, "total_tokens": 22884368} {"current_steps": 35090, "total_steps": 38160, "loss": 0.509, "lr": 1.959926292807451e-05, "epoch": 18.39098532494759, "percentage": 91.95, "elapsed_time": "1:29:50", "remaining_time": "0:07:51", "throughput": 4245.4, "total_tokens": 22886896} {"current_steps": 35095, "total_steps": 38160, "loss": 0.4735, "lr": 1.9535912969030178e-05, "epoch": 18.393605870020963, "percentage": 91.97, "elapsed_time": "1:29:51", "remaining_time": "0:07:50", "throughput": 4245.46, "total_tokens": 22890448} {"current_steps": 35100, "total_steps": 38160, "loss": 0.4035, "lr": 1.947266351759136e-05, "epoch": 18.39622641509434, "percentage": 91.98, "elapsed_time": "1:29:52", "remaining_time": "0:07:50", "throughput": 4245.53, "total_tokens": 22894224} {"current_steps": 35105, "total_steps": 38160, "loss": 0.5141, "lr": 1.940951458698925e-05, "epoch": 18.398846960167713, "percentage": 91.99, "elapsed_time": "1:29:53", "remaining_time": "0:07:49", "throughput": 4245.57, "total_tokens": 22897680} {"current_steps": 35110, "total_steps": 38160, "loss": 0.4072, "lr": 1.9346466190433842e-05, "epoch": 18.40146750524109, "percentage": 92.01, "elapsed_time": "1:29:54", "remaining_time": "0:07:48", "throughput": 4245.6, "total_tokens": 22900880} {"current_steps": 35115, "total_steps": 38160, "loss": 0.4257, "lr": 1.9283518341114136e-05, "epoch": 18.404088050314467, "percentage": 92.02, "elapsed_time": "1:29:54", "remaining_time": "0:07:47", "throughput": 4245.62, "total_tokens": 22903984} {"current_steps": 35120, "total_steps": 38160, "loss": 0.5028, "lr": 1.9220671052198047e-05, "epoch": 18.40670859538784, "percentage": 92.03, "elapsed_time": "1:29:55", "remaining_time": "0:07:47", "throughput": 4245.66, "total_tokens": 22907216} {"current_steps": 35125, "total_steps": 38160, "loss": 0.5816, "lr": 1.9157924336832556e-05, "epoch": 18.409329140461217, "percentage": 92.05, "elapsed_time": "1:29:56", "remaining_time": "0:07:46", "throughput": 4245.68, "total_tokens": 22910352} {"current_steps": 35130, "total_steps": 38160, "loss": 0.6077, "lr": 1.909527820814355e-05, "epoch": 18.41194968553459, "percentage": 92.06, "elapsed_time": "1:29:56", "remaining_time": "0:07:45", "throughput": 4245.73, "total_tokens": 22913776} {"current_steps": 35135, "total_steps": 38160, "loss": 0.5534, "lr": 1.9032732679235886e-05, "epoch": 18.414570230607968, "percentage": 92.07, "elapsed_time": "1:29:57", "remaining_time": "0:07:44", "throughput": 4245.82, "total_tokens": 22917584} {"current_steps": 35140, "total_steps": 38160, "loss": 0.4127, "lr": 1.8970287763193428e-05, "epoch": 18.41719077568134, "percentage": 92.09, "elapsed_time": "1:29:58", "remaining_time": "0:07:43", "throughput": 4245.84, "total_tokens": 22920592} {"current_steps": 35145, "total_steps": 38160, "loss": 0.4117, "lr": 1.8907943473078892e-05, "epoch": 18.419811320754718, "percentage": 92.1, "elapsed_time": "1:29:59", "remaining_time": "0:07:43", "throughput": 4245.82, "total_tokens": 22923248} {"current_steps": 35150, "total_steps": 38160, "loss": 0.3661, "lr": 1.884569982193396e-05, "epoch": 18.42243186582809, "percentage": 92.11, "elapsed_time": "1:29:59", "remaining_time": "0:07:42", "throughput": 4245.89, "total_tokens": 22926832} {"current_steps": 35155, "total_steps": 38160, "loss": 0.4296, "lr": 1.8783556822779267e-05, "epoch": 18.42505241090147, "percentage": 92.13, "elapsed_time": "1:30:00", "remaining_time": "0:07:41", "throughput": 4245.94, "total_tokens": 22930256} {"current_steps": 35160, "total_steps": 38160, "loss": 0.5727, "lr": 1.8721514488614532e-05, "epoch": 18.427672955974842, "percentage": 92.14, "elapsed_time": "1:30:01", "remaining_time": "0:07:40", "throughput": 4245.98, "total_tokens": 22933552} {"current_steps": 35165, "total_steps": 38160, "loss": 0.3944, "lr": 1.8659572832418315e-05, "epoch": 18.43029350104822, "percentage": 92.15, "elapsed_time": "1:30:01", "remaining_time": "0:07:40", "throughput": 4245.95, "total_tokens": 22936112} {"current_steps": 35170, "total_steps": 38160, "loss": 0.5773, "lr": 1.8597731867148026e-05, "epoch": 18.432914046121592, "percentage": 92.16, "elapsed_time": "1:30:02", "remaining_time": "0:07:39", "throughput": 4245.97, "total_tokens": 22939376} {"current_steps": 35175, "total_steps": 38160, "loss": 0.3923, "lr": 1.8535991605740043e-05, "epoch": 18.43553459119497, "percentage": 92.18, "elapsed_time": "1:30:03", "remaining_time": "0:07:38", "throughput": 4245.98, "total_tokens": 22942416} {"current_steps": 35180, "total_steps": 38160, "loss": 0.4708, "lr": 1.8474352061109757e-05, "epoch": 18.438155136268342, "percentage": 92.19, "elapsed_time": "1:30:04", "remaining_time": "0:07:37", "throughput": 4246.0, "total_tokens": 22945520} {"current_steps": 35185, "total_steps": 38160, "loss": 0.4677, "lr": 1.8412813246151515e-05, "epoch": 18.44077568134172, "percentage": 92.2, "elapsed_time": "1:30:04", "remaining_time": "0:07:36", "throughput": 4245.99, "total_tokens": 22948240} {"current_steps": 35190, "total_steps": 38160, "loss": 0.4811, "lr": 1.8351375173738584e-05, "epoch": 18.443396226415093, "percentage": 92.22, "elapsed_time": "1:30:05", "remaining_time": "0:07:36", "throughput": 4246.02, "total_tokens": 22951536} {"current_steps": 35195, "total_steps": 38160, "loss": 0.4009, "lr": 1.829003785672295e-05, "epoch": 18.44601677148847, "percentage": 92.23, "elapsed_time": "1:30:06", "remaining_time": "0:07:35", "throughput": 4246.1, "total_tokens": 22955280} {"current_steps": 35200, "total_steps": 38160, "loss": 0.4267, "lr": 1.8228801307935806e-05, "epoch": 18.448637316561843, "percentage": 92.24, "elapsed_time": "1:30:06", "remaining_time": "0:07:34", "throughput": 4246.13, "total_tokens": 22958576} {"current_steps": 35205, "total_steps": 38160, "loss": 0.4438, "lr": 1.8167665540187063e-05, "epoch": 18.45125786163522, "percentage": 92.26, "elapsed_time": "1:30:07", "remaining_time": "0:07:33", "throughput": 4246.12, "total_tokens": 22961328} {"current_steps": 35210, "total_steps": 38160, "loss": 0.3014, "lr": 1.8106630566265604e-05, "epoch": 18.453878406708597, "percentage": 92.27, "elapsed_time": "1:30:08", "remaining_time": "0:07:33", "throughput": 4246.18, "total_tokens": 22964880} {"current_steps": 35215, "total_steps": 38160, "loss": 0.405, "lr": 1.8045696398939326e-05, "epoch": 18.45649895178197, "percentage": 92.28, "elapsed_time": "1:30:09", "remaining_time": "0:07:32", "throughput": 4246.27, "total_tokens": 22968848} {"current_steps": 35220, "total_steps": 38160, "loss": 0.5101, "lr": 1.7984863050955036e-05, "epoch": 18.459119496855347, "percentage": 92.3, "elapsed_time": "1:30:10", "remaining_time": "0:07:31", "throughput": 4246.38, "total_tokens": 22972944} {"current_steps": 35225, "total_steps": 38160, "loss": 0.4701, "lr": 1.7924130535038162e-05, "epoch": 18.46174004192872, "percentage": 92.31, "elapsed_time": "1:30:10", "remaining_time": "0:07:30", "throughput": 4246.42, "total_tokens": 22976208} {"current_steps": 35230, "total_steps": 38160, "loss": 0.4033, "lr": 1.7863498863893433e-05, "epoch": 18.464360587002098, "percentage": 92.32, "elapsed_time": "1:30:11", "remaining_time": "0:07:30", "throughput": 4246.41, "total_tokens": 22978832} {"current_steps": 35235, "total_steps": 38160, "loss": 0.5057, "lr": 1.7802968050204203e-05, "epoch": 18.46698113207547, "percentage": 92.33, "elapsed_time": "1:30:12", "remaining_time": "0:07:29", "throughput": 4246.43, "total_tokens": 22982096} {"current_steps": 35240, "total_steps": 38160, "loss": 0.5859, "lr": 1.7742538106632844e-05, "epoch": 18.469601677148848, "percentage": 92.35, "elapsed_time": "1:30:12", "remaining_time": "0:07:28", "throughput": 4246.52, "total_tokens": 22986032} {"current_steps": 35245, "total_steps": 38160, "loss": 0.3565, "lr": 1.7682209045820684e-05, "epoch": 18.47222222222222, "percentage": 92.36, "elapsed_time": "1:30:13", "remaining_time": "0:07:27", "throughput": 4246.53, "total_tokens": 22989168} {"current_steps": 35250, "total_steps": 38160, "loss": 0.4738, "lr": 1.76219808803878e-05, "epoch": 18.4748427672956, "percentage": 92.37, "elapsed_time": "1:30:14", "remaining_time": "0:07:26", "throughput": 4246.6, "total_tokens": 22992784} {"current_steps": 35255, "total_steps": 38160, "loss": 0.3464, "lr": 1.7561853622933278e-05, "epoch": 18.47746331236897, "percentage": 92.39, "elapsed_time": "1:30:15", "remaining_time": "0:07:26", "throughput": 4246.62, "total_tokens": 22995824} {"current_steps": 35260, "total_steps": 38160, "loss": 0.4793, "lr": 1.7501827286035e-05, "epoch": 18.48008385744235, "percentage": 92.4, "elapsed_time": "1:30:15", "remaining_time": "0:07:25", "throughput": 4246.64, "total_tokens": 22998928} {"current_steps": 35265, "total_steps": 38160, "loss": 0.3338, "lr": 1.7441901882249754e-05, "epoch": 18.482704402515722, "percentage": 92.41, "elapsed_time": "1:30:16", "remaining_time": "0:07:24", "throughput": 4246.61, "total_tokens": 23001424} {"current_steps": 35270, "total_steps": 38160, "loss": 0.3866, "lr": 1.7382077424113464e-05, "epoch": 18.4853249475891, "percentage": 92.43, "elapsed_time": "1:30:17", "remaining_time": "0:07:23", "throughput": 4246.65, "total_tokens": 23004784} {"current_steps": 35275, "total_steps": 38160, "loss": 0.3582, "lr": 1.7322353924140498e-05, "epoch": 18.487945492662472, "percentage": 92.44, "elapsed_time": "1:30:17", "remaining_time": "0:07:23", "throughput": 4246.68, "total_tokens": 23008048} {"current_steps": 35280, "total_steps": 38160, "loss": 0.2952, "lr": 1.7262731394824372e-05, "epoch": 18.49056603773585, "percentage": 92.45, "elapsed_time": "1:30:18", "remaining_time": "0:07:22", "throughput": 4246.63, "total_tokens": 23010416} {"current_steps": 35285, "total_steps": 38160, "loss": 0.4329, "lr": 1.7203209848637603e-05, "epoch": 18.493186582809223, "percentage": 92.47, "elapsed_time": "1:30:19", "remaining_time": "0:07:21", "throughput": 4246.66, "total_tokens": 23013616} {"current_steps": 35290, "total_steps": 38160, "loss": 0.4018, "lr": 1.7143789298031175e-05, "epoch": 18.4958071278826, "percentage": 92.48, "elapsed_time": "1:30:20", "remaining_time": "0:07:20", "throughput": 4246.77, "total_tokens": 23017808} {"current_steps": 35295, "total_steps": 38160, "loss": 0.3369, "lr": 1.708446975543537e-05, "epoch": 18.498427672955973, "percentage": 92.49, "elapsed_time": "1:30:20", "remaining_time": "0:07:20", "throughput": 4246.78, "total_tokens": 23020720} {"current_steps": 35300, "total_steps": 38160, "loss": 0.3027, "lr": 1.7025251233259098e-05, "epoch": 18.50104821802935, "percentage": 92.51, "elapsed_time": "1:30:21", "remaining_time": "0:07:19", "throughput": 4246.86, "total_tokens": 23024560} {"current_steps": 35305, "total_steps": 38160, "loss": 0.4093, "lr": 1.6966133743890166e-05, "epoch": 18.503668763102727, "percentage": 92.52, "elapsed_time": "1:30:22", "remaining_time": "0:07:18", "throughput": 4246.9, "total_tokens": 23027856} {"current_steps": 35310, "total_steps": 38160, "loss": 0.3726, "lr": 1.690711729969535e-05, "epoch": 18.5062893081761, "percentage": 92.53, "elapsed_time": "1:30:22", "remaining_time": "0:07:17", "throughput": 4246.92, "total_tokens": 23031024} {"current_steps": 35315, "total_steps": 38160, "loss": 0.3525, "lr": 1.684820191302022e-05, "epoch": 18.508909853249477, "percentage": 92.54, "elapsed_time": "1:30:23", "remaining_time": "0:07:16", "throughput": 4246.94, "total_tokens": 23034192} {"current_steps": 35320, "total_steps": 38160, "loss": 0.4685, "lr": 1.6789387596189087e-05, "epoch": 18.51153039832285, "percentage": 92.56, "elapsed_time": "1:30:24", "remaining_time": "0:07:16", "throughput": 4246.99, "total_tokens": 23037680} {"current_steps": 35325, "total_steps": 38160, "loss": 0.4078, "lr": 1.6730674361505382e-05, "epoch": 18.514150943396228, "percentage": 92.57, "elapsed_time": "1:30:25", "remaining_time": "0:07:15", "throughput": 4247.01, "total_tokens": 23040784} {"current_steps": 35330, "total_steps": 38160, "loss": 0.3935, "lr": 1.6672062221251117e-05, "epoch": 18.5167714884696, "percentage": 92.58, "elapsed_time": "1:30:25", "remaining_time": "0:07:14", "throughput": 4247.03, "total_tokens": 23043888} {"current_steps": 35335, "total_steps": 38160, "loss": 0.4532, "lr": 1.6613551187687314e-05, "epoch": 18.519392033542978, "percentage": 92.6, "elapsed_time": "1:30:26", "remaining_time": "0:07:13", "throughput": 4247.04, "total_tokens": 23046928} {"current_steps": 35340, "total_steps": 38160, "loss": 0.34, "lr": 1.6555141273053907e-05, "epoch": 18.52201257861635, "percentage": 92.61, "elapsed_time": "1:30:27", "remaining_time": "0:07:13", "throughput": 4247.23, "total_tokens": 23052016} {"current_steps": 35345, "total_steps": 38160, "loss": 0.4066, "lr": 1.6496832489569457e-05, "epoch": 18.52463312368973, "percentage": 92.62, "elapsed_time": "1:30:28", "remaining_time": "0:07:12", "throughput": 4247.29, "total_tokens": 23055632} {"current_steps": 35350, "total_steps": 38160, "loss": 0.4199, "lr": 1.643862484943165e-05, "epoch": 18.5272536687631, "percentage": 92.64, "elapsed_time": "1:30:29", "remaining_time": "0:07:11", "throughput": 4247.3, "total_tokens": 23058640} {"current_steps": 35355, "total_steps": 38160, "loss": 0.4618, "lr": 1.6380518364816687e-05, "epoch": 18.52987421383648, "percentage": 92.65, "elapsed_time": "1:30:29", "remaining_time": "0:07:10", "throughput": 4247.3, "total_tokens": 23061488} {"current_steps": 35360, "total_steps": 38160, "loss": 0.3365, "lr": 1.632251304787985e-05, "epoch": 18.532494758909852, "percentage": 92.66, "elapsed_time": "1:30:30", "remaining_time": "0:07:10", "throughput": 4247.27, "total_tokens": 23064016} {"current_steps": 35365, "total_steps": 38160, "loss": 0.3891, "lr": 1.6264608910755153e-05, "epoch": 18.53511530398323, "percentage": 92.68, "elapsed_time": "1:30:30", "remaining_time": "0:07:09", "throughput": 4247.24, "total_tokens": 23066576} {"current_steps": 35370, "total_steps": 38160, "loss": 0.4386, "lr": 1.6206805965555627e-05, "epoch": 18.537735849056602, "percentage": 92.69, "elapsed_time": "1:30:31", "remaining_time": "0:07:08", "throughput": 4247.29, "total_tokens": 23069936} {"current_steps": 35375, "total_steps": 38160, "loss": 0.7166, "lr": 1.614910422437288e-05, "epoch": 18.54035639412998, "percentage": 92.7, "elapsed_time": "1:30:32", "remaining_time": "0:07:07", "throughput": 4247.32, "total_tokens": 23073392} {"current_steps": 35380, "total_steps": 38160, "loss": 0.4112, "lr": 1.6091503699277477e-05, "epoch": 18.542976939203353, "percentage": 92.71, "elapsed_time": "1:30:33", "remaining_time": "0:07:06", "throughput": 4247.56, "total_tokens": 23079568} {"current_steps": 35385, "total_steps": 38160, "loss": 0.329, "lr": 1.6034004402318726e-05, "epoch": 18.54559748427673, "percentage": 92.73, "elapsed_time": "1:30:34", "remaining_time": "0:07:06", "throughput": 4247.56, "total_tokens": 23082480} {"current_steps": 35390, "total_steps": 38160, "loss": 0.3841, "lr": 1.5976606345524836e-05, "epoch": 18.548218029350103, "percentage": 92.74, "elapsed_time": "1:30:34", "remaining_time": "0:07:05", "throughput": 4247.55, "total_tokens": 23085328} {"current_steps": 35395, "total_steps": 38160, "loss": 0.447, "lr": 1.5919309540902927e-05, "epoch": 18.55083857442348, "percentage": 92.75, "elapsed_time": "1:30:35", "remaining_time": "0:07:04", "throughput": 4247.54, "total_tokens": 23088208} {"current_steps": 35400, "total_steps": 38160, "loss": 0.3579, "lr": 1.5862114000438797e-05, "epoch": 18.553459119496857, "percentage": 92.77, "elapsed_time": "1:30:36", "remaining_time": "0:07:03", "throughput": 4247.57, "total_tokens": 23091376} {"current_steps": 35405, "total_steps": 38160, "loss": 0.4901, "lr": 1.5805019736097104e-05, "epoch": 18.55607966457023, "percentage": 92.78, "elapsed_time": "1:30:37", "remaining_time": "0:07:03", "throughput": 4247.62, "total_tokens": 23094832} {"current_steps": 35410, "total_steps": 38160, "loss": 0.347, "lr": 1.5748026759821232e-05, "epoch": 18.558700209643607, "percentage": 92.79, "elapsed_time": "1:30:37", "remaining_time": "0:07:02", "throughput": 4247.62, "total_tokens": 23097808} {"current_steps": 35415, "total_steps": 38160, "loss": 0.5002, "lr": 1.5691135083533537e-05, "epoch": 18.56132075471698, "percentage": 92.81, "elapsed_time": "1:30:38", "remaining_time": "0:07:01", "throughput": 4247.59, "total_tokens": 23100464} {"current_steps": 35420, "total_steps": 38160, "loss": 0.3637, "lr": 1.5634344719135052e-05, "epoch": 18.563941299790358, "percentage": 92.82, "elapsed_time": "1:30:39", "remaining_time": "0:07:00", "throughput": 4247.63, "total_tokens": 23103760} {"current_steps": 35425, "total_steps": 38160, "loss": 0.4174, "lr": 1.5577655678505776e-05, "epoch": 18.56656184486373, "percentage": 92.83, "elapsed_time": "1:30:39", "remaining_time": "0:06:59", "throughput": 4247.65, "total_tokens": 23106832} {"current_steps": 35430, "total_steps": 38160, "loss": 0.4753, "lr": 1.5521067973504442e-05, "epoch": 18.569182389937108, "percentage": 92.85, "elapsed_time": "1:30:40", "remaining_time": "0:06:59", "throughput": 4247.74, "total_tokens": 23110832} {"current_steps": 35435, "total_steps": 38160, "loss": 0.3034, "lr": 1.546458161596831e-05, "epoch": 18.57180293501048, "percentage": 92.86, "elapsed_time": "1:30:41", "remaining_time": "0:06:58", "throughput": 4247.77, "total_tokens": 23113968} {"current_steps": 35440, "total_steps": 38160, "loss": 0.4055, "lr": 1.5408196617713866e-05, "epoch": 18.57442348008386, "percentage": 92.87, "elapsed_time": "1:30:42", "remaining_time": "0:06:57", "throughput": 4247.77, "total_tokens": 23116944} {"current_steps": 35445, "total_steps": 38160, "loss": 0.4864, "lr": 1.5351912990536175e-05, "epoch": 18.57704402515723, "percentage": 92.89, "elapsed_time": "1:30:42", "remaining_time": "0:06:56", "throughput": 4247.81, "total_tokens": 23120112} {"current_steps": 35450, "total_steps": 38160, "loss": 0.4781, "lr": 1.5295730746209103e-05, "epoch": 18.57966457023061, "percentage": 92.9, "elapsed_time": "1:30:43", "remaining_time": "0:06:56", "throughput": 4247.9, "total_tokens": 23124176} {"current_steps": 35455, "total_steps": 38160, "loss": 0.378, "lr": 1.5239649896485463e-05, "epoch": 18.582285115303982, "percentage": 92.91, "elapsed_time": "1:30:44", "remaining_time": "0:06:55", "throughput": 4247.88, "total_tokens": 23126832} {"current_steps": 35460, "total_steps": 38160, "loss": 0.4183, "lr": 1.5183670453096598e-05, "epoch": 18.58490566037736, "percentage": 92.92, "elapsed_time": "1:30:45", "remaining_time": "0:06:54", "throughput": 4247.9, "total_tokens": 23129904} {"current_steps": 35465, "total_steps": 38160, "loss": 0.4015, "lr": 1.5127792427752696e-05, "epoch": 18.587526205450732, "percentage": 92.94, "elapsed_time": "1:30:45", "remaining_time": "0:06:53", "throughput": 4247.93, "total_tokens": 23133200} {"current_steps": 35470, "total_steps": 38160, "loss": 0.3552, "lr": 1.507201583214296e-05, "epoch": 18.59014675052411, "percentage": 92.95, "elapsed_time": "1:30:46", "remaining_time": "0:06:53", "throughput": 4247.96, "total_tokens": 23136496} {"current_steps": 35475, "total_steps": 38160, "loss": 0.349, "lr": 1.5016340677935169e-05, "epoch": 18.592767295597483, "percentage": 92.96, "elapsed_time": "1:30:47", "remaining_time": "0:06:52", "throughput": 4247.98, "total_tokens": 23139472} {"current_steps": 35480, "total_steps": 38160, "loss": 0.3955, "lr": 1.4960766976775953e-05, "epoch": 18.59538784067086, "percentage": 92.98, "elapsed_time": "1:30:47", "remaining_time": "0:06:51", "throughput": 4247.97, "total_tokens": 23142384} {"current_steps": 35485, "total_steps": 38160, "loss": 0.4373, "lr": 1.4905294740290677e-05, "epoch": 18.598008385744233, "percentage": 92.99, "elapsed_time": "1:30:48", "remaining_time": "0:06:50", "throughput": 4247.98, "total_tokens": 23145328} {"current_steps": 35490, "total_steps": 38160, "loss": 0.4296, "lr": 1.4849923980083391e-05, "epoch": 18.60062893081761, "percentage": 93.0, "elapsed_time": "1:30:49", "remaining_time": "0:06:49", "throughput": 4248.03, "total_tokens": 23148912} {"current_steps": 35495, "total_steps": 38160, "loss": 0.4428, "lr": 1.4794654707737164e-05, "epoch": 18.603249475890987, "percentage": 93.02, "elapsed_time": "1:30:49", "remaining_time": "0:06:49", "throughput": 4248.02, "total_tokens": 23151632} {"current_steps": 35500, "total_steps": 38160, "loss": 0.3877, "lr": 1.4739486934813696e-05, "epoch": 18.60587002096436, "percentage": 93.03, "elapsed_time": "1:30:50", "remaining_time": "0:06:48", "throughput": 4247.98, "total_tokens": 23154032} {"current_steps": 35505, "total_steps": 38160, "loss": 0.4348, "lr": 1.468442067285336e-05, "epoch": 18.608490566037737, "percentage": 93.04, "elapsed_time": "1:30:51", "remaining_time": "0:06:47", "throughput": 4247.98, "total_tokens": 23156976} {"current_steps": 35510, "total_steps": 38160, "loss": 0.4224, "lr": 1.4629455933375501e-05, "epoch": 18.61111111111111, "percentage": 93.06, "elapsed_time": "1:30:51", "remaining_time": "0:06:46", "throughput": 4247.95, "total_tokens": 23159472} {"current_steps": 35515, "total_steps": 38160, "loss": 0.5039, "lr": 1.4574592727878089e-05, "epoch": 18.613731656184488, "percentage": 93.07, "elapsed_time": "1:30:52", "remaining_time": "0:06:46", "throughput": 4247.96, "total_tokens": 23162672} {"current_steps": 35520, "total_steps": 38160, "loss": 0.4714, "lr": 1.4519831067837774e-05, "epoch": 18.61635220125786, "percentage": 93.08, "elapsed_time": "1:30:53", "remaining_time": "0:06:45", "throughput": 4247.96, "total_tokens": 23165456} {"current_steps": 35525, "total_steps": 38160, "loss": 0.4144, "lr": 1.4465170964710172e-05, "epoch": 18.618972746331238, "percentage": 93.09, "elapsed_time": "1:30:54", "remaining_time": "0:06:44", "throughput": 4247.98, "total_tokens": 23168656} {"current_steps": 35530, "total_steps": 38160, "loss": 0.4298, "lr": 1.441061242992947e-05, "epoch": 18.62159329140461, "percentage": 93.11, "elapsed_time": "1:30:54", "remaining_time": "0:06:43", "throughput": 4248.0, "total_tokens": 23171856} {"current_steps": 35535, "total_steps": 38160, "loss": 0.3604, "lr": 1.4356155474908871e-05, "epoch": 18.62421383647799, "percentage": 93.12, "elapsed_time": "1:30:55", "remaining_time": "0:06:43", "throughput": 4248.1, "total_tokens": 23175856} {"current_steps": 35540, "total_steps": 38160, "loss": 0.4788, "lr": 1.4301800111039986e-05, "epoch": 18.62683438155136, "percentage": 93.13, "elapsed_time": "1:30:56", "remaining_time": "0:06:42", "throughput": 4248.11, "total_tokens": 23178928} {"current_steps": 35545, "total_steps": 38160, "loss": 0.472, "lr": 1.4247546349693386e-05, "epoch": 18.62945492662474, "percentage": 93.15, "elapsed_time": "1:30:57", "remaining_time": "0:06:41", "throughput": 4248.16, "total_tokens": 23182384} {"current_steps": 35550, "total_steps": 38160, "loss": 0.2986, "lr": 1.4193394202218268e-05, "epoch": 18.632075471698112, "percentage": 93.16, "elapsed_time": "1:30:57", "remaining_time": "0:06:40", "throughput": 4248.24, "total_tokens": 23186192} {"current_steps": 35555, "total_steps": 38160, "loss": 0.4596, "lr": 1.413934367994274e-05, "epoch": 18.63469601677149, "percentage": 93.17, "elapsed_time": "1:30:58", "remaining_time": "0:06:39", "throughput": 4248.41, "total_tokens": 23191056} {"current_steps": 35560, "total_steps": 38160, "loss": 0.4185, "lr": 1.408539479417359e-05, "epoch": 18.637316561844862, "percentage": 93.19, "elapsed_time": "1:30:59", "remaining_time": "0:06:39", "throughput": 4248.43, "total_tokens": 23194160} {"current_steps": 35565, "total_steps": 38160, "loss": 0.3927, "lr": 1.4031547556196178e-05, "epoch": 18.63993710691824, "percentage": 93.2, "elapsed_time": "1:31:00", "remaining_time": "0:06:38", "throughput": 4248.47, "total_tokens": 23197392} {"current_steps": 35570, "total_steps": 38160, "loss": 0.3783, "lr": 1.3977801977274828e-05, "epoch": 18.642557651991613, "percentage": 93.21, "elapsed_time": "1:31:00", "remaining_time": "0:06:37", "throughput": 4248.53, "total_tokens": 23201008} {"current_steps": 35575, "total_steps": 38160, "loss": 0.3483, "lr": 1.3924158068652437e-05, "epoch": 18.64517819706499, "percentage": 93.23, "elapsed_time": "1:31:02", "remaining_time": "0:06:36", "throughput": 4248.84, "total_tokens": 23208176} {"current_steps": 35580, "total_steps": 38160, "loss": 0.4237, "lr": 1.3870615841550693e-05, "epoch": 18.647798742138363, "percentage": 93.24, "elapsed_time": "1:31:02", "remaining_time": "0:06:36", "throughput": 4248.81, "total_tokens": 23210768} {"current_steps": 35585, "total_steps": 38160, "loss": 0.655, "lr": 1.3817175307170138e-05, "epoch": 18.65041928721174, "percentage": 93.25, "elapsed_time": "1:31:03", "remaining_time": "0:06:35", "throughput": 4248.88, "total_tokens": 23214480} {"current_steps": 35590, "total_steps": 38160, "loss": 0.38, "lr": 1.3763836476689828e-05, "epoch": 18.653039832285117, "percentage": 93.27, "elapsed_time": "1:31:04", "remaining_time": "0:06:34", "throughput": 4248.88, "total_tokens": 23217296} {"current_steps": 35595, "total_steps": 38160, "loss": 0.3501, "lr": 1.3710599361267617e-05, "epoch": 18.65566037735849, "percentage": 93.28, "elapsed_time": "1:31:05", "remaining_time": "0:06:33", "throughput": 4248.89, "total_tokens": 23220272} {"current_steps": 35600, "total_steps": 38160, "loss": 0.3514, "lr": 1.3657463972040207e-05, "epoch": 18.658280922431867, "percentage": 93.29, "elapsed_time": "1:31:05", "remaining_time": "0:06:33", "throughput": 4249.05, "total_tokens": 23224912} {"current_steps": 35605, "total_steps": 38160, "loss": 0.3482, "lr": 1.3604430320122762e-05, "epoch": 18.66090146750524, "percentage": 93.3, "elapsed_time": "1:31:06", "remaining_time": "0:06:32", "throughput": 4249.03, "total_tokens": 23227600} {"current_steps": 35610, "total_steps": 38160, "loss": 0.5449, "lr": 1.355149841660941e-05, "epoch": 18.663522012578618, "percentage": 93.32, "elapsed_time": "1:31:07", "remaining_time": "0:06:31", "throughput": 4249.04, "total_tokens": 23230576} {"current_steps": 35615, "total_steps": 38160, "loss": 0.5222, "lr": 1.3498668272572955e-05, "epoch": 18.66614255765199, "percentage": 93.33, "elapsed_time": "1:31:07", "remaining_time": "0:06:30", "throughput": 4249.03, "total_tokens": 23233360} {"current_steps": 35620, "total_steps": 38160, "loss": 0.6085, "lr": 1.3445939899064729e-05, "epoch": 18.668763102725368, "percentage": 93.34, "elapsed_time": "1:31:08", "remaining_time": "0:06:29", "throughput": 4249.13, "total_tokens": 23237328} {"current_steps": 35625, "total_steps": 38160, "loss": 0.3555, "lr": 1.3393313307115019e-05, "epoch": 18.67138364779874, "percentage": 93.36, "elapsed_time": "1:31:09", "remaining_time": "0:06:29", "throughput": 4249.16, "total_tokens": 23240592} {"current_steps": 35630, "total_steps": 38160, "loss": 0.4175, "lr": 1.3340788507732626e-05, "epoch": 18.67400419287212, "percentage": 93.37, "elapsed_time": "1:31:10", "remaining_time": "0:06:28", "throughput": 4249.14, "total_tokens": 23243472} {"current_steps": 35635, "total_steps": 38160, "loss": 0.3939, "lr": 1.328836551190521e-05, "epoch": 18.67662473794549, "percentage": 93.38, "elapsed_time": "1:31:10", "remaining_time": "0:06:27", "throughput": 4249.11, "total_tokens": 23246032} {"current_steps": 35640, "total_steps": 38160, "loss": 0.3871, "lr": 1.323604433059905e-05, "epoch": 18.67924528301887, "percentage": 93.4, "elapsed_time": "1:31:11", "remaining_time": "0:06:26", "throughput": 4249.05, "total_tokens": 23248304} {"current_steps": 35645, "total_steps": 38160, "loss": 0.4204, "lr": 1.3183824974759063e-05, "epoch": 18.681865828092242, "percentage": 93.41, "elapsed_time": "1:31:12", "remaining_time": "0:06:26", "throughput": 4249.08, "total_tokens": 23251632} {"current_steps": 35650, "total_steps": 38160, "loss": 0.3709, "lr": 1.3131707455309006e-05, "epoch": 18.68448637316562, "percentage": 93.42, "elapsed_time": "1:31:12", "remaining_time": "0:06:25", "throughput": 4249.15, "total_tokens": 23255216} {"current_steps": 35655, "total_steps": 38160, "loss": 0.5033, "lr": 1.307969178315127e-05, "epoch": 18.687106918238992, "percentage": 93.44, "elapsed_time": "1:31:13", "remaining_time": "0:06:24", "throughput": 4249.21, "total_tokens": 23258736} {"current_steps": 35660, "total_steps": 38160, "loss": 0.3184, "lr": 1.3027777969166932e-05, "epoch": 18.68972746331237, "percentage": 93.45, "elapsed_time": "1:31:14", "remaining_time": "0:06:23", "throughput": 4249.24, "total_tokens": 23261872} {"current_steps": 35665, "total_steps": 38160, "loss": 0.5256, "lr": 1.2975966024215746e-05, "epoch": 18.692348008385743, "percentage": 93.46, "elapsed_time": "1:31:15", "remaining_time": "0:06:23", "throughput": 4249.27, "total_tokens": 23265008} {"current_steps": 35670, "total_steps": 38160, "loss": 0.3927, "lr": 1.2924255959136267e-05, "epoch": 18.69496855345912, "percentage": 93.47, "elapsed_time": "1:31:15", "remaining_time": "0:06:22", "throughput": 4249.35, "total_tokens": 23268912} {"current_steps": 35675, "total_steps": 38160, "loss": 0.2467, "lr": 1.2872647784745561e-05, "epoch": 18.697589098532493, "percentage": 93.49, "elapsed_time": "1:31:16", "remaining_time": "0:06:21", "throughput": 4249.32, "total_tokens": 23271344} {"current_steps": 35680, "total_steps": 38160, "loss": 0.4069, "lr": 1.282114151183944e-05, "epoch": 18.70020964360587, "percentage": 93.5, "elapsed_time": "1:31:17", "remaining_time": "0:06:20", "throughput": 4249.39, "total_tokens": 23274960} {"current_steps": 35685, "total_steps": 38160, "loss": 0.4416, "lr": 1.2769737151192562e-05, "epoch": 18.702830188679247, "percentage": 93.51, "elapsed_time": "1:31:17", "remaining_time": "0:06:19", "throughput": 4249.42, "total_tokens": 23278160} {"current_steps": 35690, "total_steps": 38160, "loss": 0.4615, "lr": 1.2718434713558047e-05, "epoch": 18.70545073375262, "percentage": 93.53, "elapsed_time": "1:31:18", "remaining_time": "0:06:19", "throughput": 4249.5, "total_tokens": 23282192} {"current_steps": 35695, "total_steps": 38160, "loss": 0.3885, "lr": 1.2667234209667755e-05, "epoch": 18.708071278825997, "percentage": 93.54, "elapsed_time": "1:31:19", "remaining_time": "0:06:18", "throughput": 4249.56, "total_tokens": 23285648} {"current_steps": 35700, "total_steps": 38160, "loss": 0.6108, "lr": 1.2616135650232286e-05, "epoch": 18.71069182389937, "percentage": 93.55, "elapsed_time": "1:31:20", "remaining_time": "0:06:17", "throughput": 4249.54, "total_tokens": 23288304} {"current_steps": 35705, "total_steps": 38160, "loss": 0.384, "lr": 1.2565139045940866e-05, "epoch": 18.713312368972748, "percentage": 93.57, "elapsed_time": "1:31:20", "remaining_time": "0:06:16", "throughput": 4249.56, "total_tokens": 23291408} {"current_steps": 35710, "total_steps": 38160, "loss": 0.4041, "lr": 1.2514244407461462e-05, "epoch": 18.71593291404612, "percentage": 93.58, "elapsed_time": "1:31:21", "remaining_time": "0:06:16", "throughput": 4249.57, "total_tokens": 23294448} {"current_steps": 35715, "total_steps": 38160, "loss": 0.4618, "lr": 1.2463451745440501e-05, "epoch": 18.718553459119498, "percentage": 93.59, "elapsed_time": "1:31:22", "remaining_time": "0:06:15", "throughput": 4249.57, "total_tokens": 23297232} {"current_steps": 35720, "total_steps": 38160, "loss": 0.4629, "lr": 1.241276107050343e-05, "epoch": 18.72117400419287, "percentage": 93.61, "elapsed_time": "1:31:23", "remaining_time": "0:06:14", "throughput": 4249.67, "total_tokens": 23301264} {"current_steps": 35725, "total_steps": 38160, "loss": 0.4489, "lr": 1.236217239325399e-05, "epoch": 18.72379454926625, "percentage": 93.62, "elapsed_time": "1:31:23", "remaining_time": "0:06:13", "throughput": 4249.72, "total_tokens": 23304720} {"current_steps": 35730, "total_steps": 38160, "loss": 0.4643, "lr": 1.2311685724274768e-05, "epoch": 18.72641509433962, "percentage": 93.63, "elapsed_time": "1:31:24", "remaining_time": "0:06:13", "throughput": 4249.79, "total_tokens": 23308592} {"current_steps": 35735, "total_steps": 38160, "loss": 0.8562, "lr": 1.2261301074127096e-05, "epoch": 18.729035639413, "percentage": 93.65, "elapsed_time": "1:31:25", "remaining_time": "0:06:12", "throughput": 4249.85, "total_tokens": 23312080} {"current_steps": 35740, "total_steps": 38160, "loss": 0.6608, "lr": 1.2211018453350874e-05, "epoch": 18.731656184486372, "percentage": 93.66, "elapsed_time": "1:31:26", "remaining_time": "0:06:11", "throughput": 4249.83, "total_tokens": 23314800} {"current_steps": 35745, "total_steps": 38160, "loss": 0.5304, "lr": 1.2160837872464581e-05, "epoch": 18.73427672955975, "percentage": 93.67, "elapsed_time": "1:31:26", "remaining_time": "0:06:10", "throughput": 4249.84, "total_tokens": 23317840} {"current_steps": 35750, "total_steps": 38160, "loss": 0.4351, "lr": 1.2110759341965428e-05, "epoch": 18.736897274633122, "percentage": 93.68, "elapsed_time": "1:31:27", "remaining_time": "0:06:09", "throughput": 4249.89, "total_tokens": 23321200} {"current_steps": 35755, "total_steps": 38160, "loss": 0.5064, "lr": 1.2060782872329256e-05, "epoch": 18.7395178197065, "percentage": 93.7, "elapsed_time": "1:31:28", "remaining_time": "0:06:09", "throughput": 4249.86, "total_tokens": 23323824} {"current_steps": 35760, "total_steps": 38160, "loss": 0.4459, "lr": 1.2010908474010595e-05, "epoch": 18.742138364779873, "percentage": 93.71, "elapsed_time": "1:31:28", "remaining_time": "0:06:08", "throughput": 4249.88, "total_tokens": 23326928} {"current_steps": 35765, "total_steps": 38160, "loss": 0.5196, "lr": 1.1961136157442654e-05, "epoch": 18.74475890985325, "percentage": 93.72, "elapsed_time": "1:31:29", "remaining_time": "0:06:07", "throughput": 4249.95, "total_tokens": 23330576} {"current_steps": 35770, "total_steps": 38160, "loss": 0.4839, "lr": 1.1911465933037214e-05, "epoch": 18.747379454926623, "percentage": 93.74, "elapsed_time": "1:31:30", "remaining_time": "0:06:06", "throughput": 4250.06, "total_tokens": 23334832} {"current_steps": 35775, "total_steps": 38160, "loss": 0.3525, "lr": 1.1861897811184686e-05, "epoch": 18.75, "percentage": 93.75, "elapsed_time": "1:31:31", "remaining_time": "0:06:06", "throughput": 4250.04, "total_tokens": 23337488} {"current_steps": 35780, "total_steps": 38160, "loss": 0.3354, "lr": 1.1812431802254109e-05, "epoch": 18.752620545073377, "percentage": 93.76, "elapsed_time": "1:31:31", "remaining_time": "0:06:05", "throughput": 4250.12, "total_tokens": 23341296} {"current_steps": 35785, "total_steps": 38160, "loss": 0.4981, "lr": 1.1763067916593262e-05, "epoch": 18.75524109014675, "percentage": 93.78, "elapsed_time": "1:31:33", "remaining_time": "0:06:04", "throughput": 4250.4, "total_tokens": 23348144} {"current_steps": 35790, "total_steps": 38160, "loss": 0.3961, "lr": 1.1713806164528496e-05, "epoch": 18.757861635220127, "percentage": 93.79, "elapsed_time": "1:31:33", "remaining_time": "0:06:03", "throughput": 4250.48, "total_tokens": 23352080} {"current_steps": 35795, "total_steps": 38160, "loss": 0.2556, "lr": 1.1664646556364844e-05, "epoch": 18.7604821802935, "percentage": 93.8, "elapsed_time": "1:31:34", "remaining_time": "0:06:03", "throughput": 4250.52, "total_tokens": 23355536} {"current_steps": 35800, "total_steps": 38160, "loss": 0.3476, "lr": 1.161558910238597e-05, "epoch": 18.763102725366878, "percentage": 93.82, "elapsed_time": "1:31:35", "remaining_time": "0:06:02", "throughput": 4250.5, "total_tokens": 23358160} {"current_steps": 35805, "total_steps": 38160, "loss": 0.5274, "lr": 1.1566633812854e-05, "epoch": 18.76572327044025, "percentage": 93.83, "elapsed_time": "1:31:36", "remaining_time": "0:06:01", "throughput": 4250.53, "total_tokens": 23361296} {"current_steps": 35810, "total_steps": 38160, "loss": 0.4236, "lr": 1.151778069800985e-05, "epoch": 18.768343815513628, "percentage": 93.84, "elapsed_time": "1:31:36", "remaining_time": "0:06:00", "throughput": 4250.62, "total_tokens": 23365264} {"current_steps": 35815, "total_steps": 38160, "loss": 0.3163, "lr": 1.1469029768073125e-05, "epoch": 18.770964360587, "percentage": 93.85, "elapsed_time": "1:31:37", "remaining_time": "0:05:59", "throughput": 4250.63, "total_tokens": 23368208} {"current_steps": 35820, "total_steps": 38160, "loss": 0.4608, "lr": 1.1420381033241889e-05, "epoch": 18.77358490566038, "percentage": 93.87, "elapsed_time": "1:31:38", "remaining_time": "0:05:59", "throughput": 4250.63, "total_tokens": 23371248} {"current_steps": 35825, "total_steps": 38160, "loss": 0.3427, "lr": 1.1371834503693002e-05, "epoch": 18.77620545073375, "percentage": 93.88, "elapsed_time": "1:31:39", "remaining_time": "0:05:58", "throughput": 4250.71, "total_tokens": 23374960} {"current_steps": 35830, "total_steps": 38160, "loss": 0.3504, "lr": 1.1323390189581784e-05, "epoch": 18.77882599580713, "percentage": 93.89, "elapsed_time": "1:31:39", "remaining_time": "0:05:57", "throughput": 4250.78, "total_tokens": 23378832} {"current_steps": 35835, "total_steps": 38160, "loss": 0.514, "lr": 1.127504810104213e-05, "epoch": 18.781446540880502, "percentage": 93.91, "elapsed_time": "1:31:40", "remaining_time": "0:05:56", "throughput": 4250.81, "total_tokens": 23382032} {"current_steps": 35840, "total_steps": 38160, "loss": 0.3865, "lr": 1.1226808248186782e-05, "epoch": 18.78406708595388, "percentage": 93.92, "elapsed_time": "1:31:41", "remaining_time": "0:05:56", "throughput": 4250.85, "total_tokens": 23385456} {"current_steps": 35845, "total_steps": 38160, "loss": 0.4484, "lr": 1.1178670641106891e-05, "epoch": 18.786687631027252, "percentage": 93.93, "elapsed_time": "1:31:42", "remaining_time": "0:05:55", "throughput": 4250.87, "total_tokens": 23388592} {"current_steps": 35850, "total_steps": 38160, "loss": 0.4082, "lr": 1.1130635289872403e-05, "epoch": 18.78930817610063, "percentage": 93.95, "elapsed_time": "1:31:42", "remaining_time": "0:05:54", "throughput": 4250.9, "total_tokens": 23391824} {"current_steps": 35855, "total_steps": 38160, "loss": 0.4023, "lr": 1.1082702204531725e-05, "epoch": 18.791928721174003, "percentage": 93.96, "elapsed_time": "1:31:43", "remaining_time": "0:05:53", "throughput": 4250.93, "total_tokens": 23394896} {"current_steps": 35860, "total_steps": 38160, "loss": 0.3763, "lr": 1.1034871395111778e-05, "epoch": 18.79454926624738, "percentage": 93.97, "elapsed_time": "1:31:44", "remaining_time": "0:05:53", "throughput": 4251.09, "total_tokens": 23399888} {"current_steps": 35865, "total_steps": 38160, "loss": 0.3961, "lr": 1.0987142871618394e-05, "epoch": 18.797169811320753, "percentage": 93.99, "elapsed_time": "1:31:45", "remaining_time": "0:05:52", "throughput": 4251.1, "total_tokens": 23402832} {"current_steps": 35870, "total_steps": 38160, "loss": 0.5302, "lr": 1.0939516644035696e-05, "epoch": 18.79979035639413, "percentage": 94.0, "elapsed_time": "1:31:45", "remaining_time": "0:05:51", "throughput": 4251.12, "total_tokens": 23405968} {"current_steps": 35875, "total_steps": 38160, "loss": 0.5617, "lr": 1.0891992722326716e-05, "epoch": 18.802410901467507, "percentage": 94.01, "elapsed_time": "1:31:46", "remaining_time": "0:05:50", "throughput": 4251.11, "total_tokens": 23408656} {"current_steps": 35880, "total_steps": 38160, "loss": 0.59, "lr": 1.0844571116432778e-05, "epoch": 18.80503144654088, "percentage": 94.03, "elapsed_time": "1:31:47", "remaining_time": "0:05:49", "throughput": 4251.14, "total_tokens": 23411952} {"current_steps": 35885, "total_steps": 38160, "loss": 0.4504, "lr": 1.0797251836274003e-05, "epoch": 18.807651991614257, "percentage": 94.04, "elapsed_time": "1:31:47", "remaining_time": "0:05:49", "throughput": 4251.15, "total_tokens": 23414896} {"current_steps": 35890, "total_steps": 38160, "loss": 0.5086, "lr": 1.0750034891748972e-05, "epoch": 18.81027253668763, "percentage": 94.05, "elapsed_time": "1:31:48", "remaining_time": "0:05:48", "throughput": 4251.18, "total_tokens": 23418224} {"current_steps": 35895, "total_steps": 38160, "loss": 0.3793, "lr": 1.0702920292735009e-05, "epoch": 18.812893081761008, "percentage": 94.06, "elapsed_time": "1:31:49", "remaining_time": "0:05:47", "throughput": 4251.18, "total_tokens": 23421008} {"current_steps": 35900, "total_steps": 38160, "loss": 0.3846, "lr": 1.0655908049087893e-05, "epoch": 18.81551362683438, "percentage": 94.08, "elapsed_time": "1:31:49", "remaining_time": "0:05:46", "throughput": 4251.17, "total_tokens": 23423792} {"current_steps": 35905, "total_steps": 38160, "loss": 0.4634, "lr": 1.0608998170642149e-05, "epoch": 18.818134171907758, "percentage": 94.09, "elapsed_time": "1:31:50", "remaining_time": "0:05:46", "throughput": 4251.14, "total_tokens": 23426320} {"current_steps": 35910, "total_steps": 38160, "loss": 0.4991, "lr": 1.0562190667210703e-05, "epoch": 18.82075471698113, "percentage": 94.1, "elapsed_time": "1:31:51", "remaining_time": "0:05:45", "throughput": 4251.19, "total_tokens": 23429840} {"current_steps": 35915, "total_steps": 38160, "loss": 0.3364, "lr": 1.0515485548585113e-05, "epoch": 18.82337526205451, "percentage": 94.12, "elapsed_time": "1:31:52", "remaining_time": "0:05:44", "throughput": 4251.17, "total_tokens": 23432720} {"current_steps": 35920, "total_steps": 38160, "loss": 0.3472, "lr": 1.0468882824535676e-05, "epoch": 18.82599580712788, "percentage": 94.13, "elapsed_time": "1:31:52", "remaining_time": "0:05:43", "throughput": 4251.25, "total_tokens": 23436592} {"current_steps": 35925, "total_steps": 38160, "loss": 0.3523, "lr": 1.0422382504811034e-05, "epoch": 18.82861635220126, "percentage": 94.14, "elapsed_time": "1:31:53", "remaining_time": "0:05:43", "throughput": 4251.29, "total_tokens": 23439856} {"current_steps": 35930, "total_steps": 38160, "loss": 0.3457, "lr": 1.0375984599138633e-05, "epoch": 18.831236897274632, "percentage": 94.16, "elapsed_time": "1:31:54", "remaining_time": "0:05:42", "throughput": 4251.29, "total_tokens": 23442832} {"current_steps": 35935, "total_steps": 38160, "loss": 0.3674, "lr": 1.0329689117224261e-05, "epoch": 18.83385744234801, "percentage": 94.17, "elapsed_time": "1:31:55", "remaining_time": "0:05:41", "throughput": 4251.35, "total_tokens": 23446416} {"current_steps": 35940, "total_steps": 38160, "loss": 0.399, "lr": 1.0283496068752507e-05, "epoch": 18.836477987421382, "percentage": 94.18, "elapsed_time": "1:31:55", "remaining_time": "0:05:40", "throughput": 4251.34, "total_tokens": 23449104} {"current_steps": 35945, "total_steps": 38160, "loss": 0.4735, "lr": 1.0237405463386418e-05, "epoch": 18.83909853249476, "percentage": 94.2, "elapsed_time": "1:31:56", "remaining_time": "0:05:39", "throughput": 4251.36, "total_tokens": 23452272} {"current_steps": 35950, "total_steps": 38160, "loss": 0.4437, "lr": 1.0191417310767503e-05, "epoch": 18.841719077568133, "percentage": 94.21, "elapsed_time": "1:31:57", "remaining_time": "0:05:39", "throughput": 4251.35, "total_tokens": 23455088} {"current_steps": 35955, "total_steps": 38160, "loss": 0.4573, "lr": 1.0145531620516179e-05, "epoch": 18.84433962264151, "percentage": 94.22, "elapsed_time": "1:31:57", "remaining_time": "0:05:38", "throughput": 4251.41, "total_tokens": 23458704} {"current_steps": 35960, "total_steps": 38160, "loss": 0.4269, "lr": 1.009974840223099e-05, "epoch": 18.846960167714883, "percentage": 94.23, "elapsed_time": "1:31:58", "remaining_time": "0:05:37", "throughput": 4251.5, "total_tokens": 23462704} {"current_steps": 35965, "total_steps": 38160, "loss": 0.3427, "lr": 1.0054067665489386e-05, "epoch": 18.84958071278826, "percentage": 94.25, "elapsed_time": "1:31:59", "remaining_time": "0:05:36", "throughput": 4251.48, "total_tokens": 23465328} {"current_steps": 35970, "total_steps": 38160, "loss": 0.4781, "lr": 1.0008489419847278e-05, "epoch": 18.852201257861637, "percentage": 94.26, "elapsed_time": "1:32:00", "remaining_time": "0:05:36", "throughput": 4251.55, "total_tokens": 23468912} {"current_steps": 35975, "total_steps": 38160, "loss": 0.3724, "lr": 9.963013674839038e-06, "epoch": 18.85482180293501, "percentage": 94.27, "elapsed_time": "1:32:00", "remaining_time": "0:05:35", "throughput": 4251.56, "total_tokens": 23471984} {"current_steps": 35980, "total_steps": 38160, "loss": 0.3482, "lr": 9.91764043997767e-06, "epoch": 18.857442348008387, "percentage": 94.29, "elapsed_time": "1:32:01", "remaining_time": "0:05:34", "throughput": 4251.63, "total_tokens": 23475888} {"current_steps": 35985, "total_steps": 38160, "loss": 0.3959, "lr": 9.872369724754804e-06, "epoch": 18.86006289308176, "percentage": 94.3, "elapsed_time": "1:32:02", "remaining_time": "0:05:33", "throughput": 4251.63, "total_tokens": 23478704} {"current_steps": 35990, "total_steps": 38160, "loss": 0.3791, "lr": 9.827201538640473e-06, "epoch": 18.862683438155138, "percentage": 94.31, "elapsed_time": "1:32:02", "remaining_time": "0:05:33", "throughput": 4251.59, "total_tokens": 23481136} {"current_steps": 35995, "total_steps": 38160, "loss": 0.3275, "lr": 9.782135891083455e-06, "epoch": 18.86530398322851, "percentage": 94.33, "elapsed_time": "1:32:03", "remaining_time": "0:05:32", "throughput": 4251.53, "total_tokens": 23483408} {"current_steps": 36000, "total_steps": 38160, "loss": 0.4428, "lr": 9.737172791510873e-06, "epoch": 18.867924528301888, "percentage": 94.34, "elapsed_time": "1:32:04", "remaining_time": "0:05:31", "throughput": 4251.63, "total_tokens": 23487568} {"current_steps": 36005, "total_steps": 38160, "loss": 0.486, "lr": 9.692312249328483e-06, "epoch": 18.87054507337526, "percentage": 94.35, "elapsed_time": "1:32:05", "remaining_time": "0:05:30", "throughput": 4251.63, "total_tokens": 23490512} {"current_steps": 36010, "total_steps": 38160, "loss": 0.4898, "lr": 9.647554273920722e-06, "epoch": 18.87316561844864, "percentage": 94.37, "elapsed_time": "1:32:05", "remaining_time": "0:05:29", "throughput": 4251.66, "total_tokens": 23493680} {"current_steps": 36015, "total_steps": 38160, "loss": 0.4379, "lr": 9.602898874650323e-06, "epoch": 18.87578616352201, "percentage": 94.38, "elapsed_time": "1:32:06", "remaining_time": "0:05:29", "throughput": 4251.75, "total_tokens": 23497680} {"current_steps": 36020, "total_steps": 38160, "loss": 0.4638, "lr": 9.558346060858759e-06, "epoch": 18.87840670859539, "percentage": 94.39, "elapsed_time": "1:32:07", "remaining_time": "0:05:28", "throughput": 4251.74, "total_tokens": 23500464} {"current_steps": 36025, "total_steps": 38160, "loss": 0.3628, "lr": 9.51389584186596e-06, "epoch": 18.881027253668762, "percentage": 94.41, "elapsed_time": "1:32:07", "remaining_time": "0:05:27", "throughput": 4251.73, "total_tokens": 23503184} {"current_steps": 36030, "total_steps": 38160, "loss": 0.4666, "lr": 9.469548226970326e-06, "epoch": 18.88364779874214, "percentage": 94.42, "elapsed_time": "1:32:08", "remaining_time": "0:05:26", "throughput": 4251.72, "total_tokens": 23506064} {"current_steps": 36035, "total_steps": 38160, "loss": 0.4821, "lr": 9.425303225448989e-06, "epoch": 18.886268343815512, "percentage": 94.43, "elapsed_time": "1:32:09", "remaining_time": "0:05:26", "throughput": 4251.71, "total_tokens": 23508848} {"current_steps": 36040, "total_steps": 38160, "loss": 0.4835, "lr": 9.381160846557435e-06, "epoch": 18.88888888888889, "percentage": 94.44, "elapsed_time": "1:32:10", "remaining_time": "0:05:25", "throughput": 4251.77, "total_tokens": 23512432} {"current_steps": 36045, "total_steps": 38160, "loss": 0.5042, "lr": 9.337121099529722e-06, "epoch": 18.891509433962263, "percentage": 94.46, "elapsed_time": "1:32:10", "remaining_time": "0:05:24", "throughput": 4251.76, "total_tokens": 23515312} {"current_steps": 36050, "total_steps": 38160, "loss": 0.4751, "lr": 9.293183993578535e-06, "epoch": 18.89412997903564, "percentage": 94.47, "elapsed_time": "1:32:11", "remaining_time": "0:05:23", "throughput": 4251.83, "total_tokens": 23519024} {"current_steps": 36055, "total_steps": 38160, "loss": 0.3286, "lr": 9.249349537894968e-06, "epoch": 18.896750524109013, "percentage": 94.48, "elapsed_time": "1:32:12", "remaining_time": "0:05:22", "throughput": 4251.85, "total_tokens": 23522032} {"current_steps": 36060, "total_steps": 38160, "loss": 0.5296, "lr": 9.205617741648686e-06, "epoch": 18.89937106918239, "percentage": 94.5, "elapsed_time": "1:32:12", "remaining_time": "0:05:22", "throughput": 4251.85, "total_tokens": 23524912} {"current_steps": 36065, "total_steps": 38160, "loss": 0.3009, "lr": 9.161988613987982e-06, "epoch": 18.901991614255767, "percentage": 94.51, "elapsed_time": "1:32:13", "remaining_time": "0:05:21", "throughput": 4251.86, "total_tokens": 23527984} {"current_steps": 36070, "total_steps": 38160, "loss": 0.4853, "lr": 9.118462164039387e-06, "epoch": 18.90461215932914, "percentage": 94.52, "elapsed_time": "1:32:14", "remaining_time": "0:05:20", "throughput": 4251.94, "total_tokens": 23531792} {"current_steps": 36075, "total_steps": 38160, "loss": 0.415, "lr": 9.07503840090823e-06, "epoch": 18.907232704402517, "percentage": 94.54, "elapsed_time": "1:32:15", "remaining_time": "0:05:19", "throughput": 4252.01, "total_tokens": 23535504} {"current_steps": 36080, "total_steps": 38160, "loss": 0.4045, "lr": 9.031717333678303e-06, "epoch": 18.90985324947589, "percentage": 94.55, "elapsed_time": "1:32:15", "remaining_time": "0:05:19", "throughput": 4252.06, "total_tokens": 23538864} {"current_steps": 36085, "total_steps": 38160, "loss": 0.4879, "lr": 8.988498971411851e-06, "epoch": 18.912473794549268, "percentage": 94.56, "elapsed_time": "1:32:16", "remaining_time": "0:05:18", "throughput": 4252.14, "total_tokens": 23542736} {"current_steps": 36090, "total_steps": 38160, "loss": 0.4748, "lr": 8.945383323149647e-06, "epoch": 18.91509433962264, "percentage": 94.58, "elapsed_time": "1:32:17", "remaining_time": "0:05:17", "throughput": 4252.3, "total_tokens": 23547504} {"current_steps": 36095, "total_steps": 38160, "loss": 0.3808, "lr": 8.902370397911031e-06, "epoch": 18.917714884696018, "percentage": 94.59, "elapsed_time": "1:32:18", "remaining_time": "0:05:16", "throughput": 4252.28, "total_tokens": 23550224} {"current_steps": 36100, "total_steps": 38160, "loss": 0.5029, "lr": 8.859460204693748e-06, "epoch": 18.92033542976939, "percentage": 94.6, "elapsed_time": "1:32:18", "remaining_time": "0:05:16", "throughput": 4252.32, "total_tokens": 23553488} {"current_steps": 36105, "total_steps": 38160, "loss": 0.5101, "lr": 8.816652752474175e-06, "epoch": 18.92295597484277, "percentage": 94.61, "elapsed_time": "1:32:19", "remaining_time": "0:05:15", "throughput": 4252.35, "total_tokens": 23556816} {"current_steps": 36110, "total_steps": 38160, "loss": 0.3153, "lr": 8.773948050207148e-06, "epoch": 18.92557651991614, "percentage": 94.63, "elapsed_time": "1:32:20", "remaining_time": "0:05:14", "throughput": 4252.32, "total_tokens": 23559280} {"current_steps": 36115, "total_steps": 38160, "loss": 0.5044, "lr": 8.731346106826021e-06, "epoch": 18.92819706498952, "percentage": 94.64, "elapsed_time": "1:32:21", "remaining_time": "0:05:13", "throughput": 4252.33, "total_tokens": 23562416} {"current_steps": 36120, "total_steps": 38160, "loss": 0.3342, "lr": 8.6888469312425e-06, "epoch": 18.930817610062892, "percentage": 94.65, "elapsed_time": "1:32:21", "remaining_time": "0:05:12", "throughput": 4252.39, "total_tokens": 23566032} {"current_steps": 36125, "total_steps": 38160, "loss": 0.484, "lr": 8.646450532347083e-06, "epoch": 18.93343815513627, "percentage": 94.67, "elapsed_time": "1:32:22", "remaining_time": "0:05:12", "throughput": 4252.39, "total_tokens": 23568880} {"current_steps": 36130, "total_steps": 38160, "loss": 0.3792, "lr": 8.604156919008565e-06, "epoch": 18.936058700209642, "percentage": 94.68, "elapsed_time": "1:32:23", "remaining_time": "0:05:11", "throughput": 4252.34, "total_tokens": 23571216} {"current_steps": 36135, "total_steps": 38160, "loss": 0.5367, "lr": 8.561966100074258e-06, "epoch": 18.93867924528302, "percentage": 94.69, "elapsed_time": "1:32:23", "remaining_time": "0:05:10", "throughput": 4252.45, "total_tokens": 23575216} {"current_steps": 36140, "total_steps": 38160, "loss": 0.401, "lr": 8.519878084370048e-06, "epoch": 18.941299790356393, "percentage": 94.71, "elapsed_time": "1:32:24", "remaining_time": "0:05:09", "throughput": 4252.49, "total_tokens": 23578576} {"current_steps": 36145, "total_steps": 38160, "loss": 0.3816, "lr": 8.477892880700222e-06, "epoch": 18.94392033542977, "percentage": 94.72, "elapsed_time": "1:32:25", "remaining_time": "0:05:09", "throughput": 4252.43, "total_tokens": 23580848} {"current_steps": 36150, "total_steps": 38160, "loss": 0.5002, "lr": 8.436010497847646e-06, "epoch": 18.946540880503143, "percentage": 94.73, "elapsed_time": "1:32:25", "remaining_time": "0:05:08", "throughput": 4252.41, "total_tokens": 23583440} {"current_steps": 36155, "total_steps": 38160, "loss": 0.3324, "lr": 8.39423094457359e-06, "epoch": 18.94916142557652, "percentage": 94.75, "elapsed_time": "1:32:26", "remaining_time": "0:05:07", "throughput": 4252.44, "total_tokens": 23586640} {"current_steps": 36160, "total_steps": 38160, "loss": 0.3794, "lr": 8.352554229617892e-06, "epoch": 18.951781970649897, "percentage": 94.76, "elapsed_time": "1:32:27", "remaining_time": "0:05:06", "throughput": 4252.48, "total_tokens": 23589968} {"current_steps": 36165, "total_steps": 38160, "loss": 0.3504, "lr": 8.310980361698861e-06, "epoch": 18.95440251572327, "percentage": 94.77, "elapsed_time": "1:32:27", "remaining_time": "0:05:06", "throughput": 4252.44, "total_tokens": 23592368} {"current_steps": 36170, "total_steps": 38160, "loss": 0.3765, "lr": 8.26950934951326e-06, "epoch": 18.957023060796647, "percentage": 94.79, "elapsed_time": "1:32:28", "remaining_time": "0:05:05", "throughput": 4252.44, "total_tokens": 23595248} {"current_steps": 36175, "total_steps": 38160, "loss": 0.4357, "lr": 8.22814120173626e-06, "epoch": 18.95964360587002, "percentage": 94.8, "elapsed_time": "1:32:29", "remaining_time": "0:05:04", "throughput": 4252.47, "total_tokens": 23598384} {"current_steps": 36180, "total_steps": 38160, "loss": 0.481, "lr": 8.186875927021775e-06, "epoch": 18.962264150943398, "percentage": 94.81, "elapsed_time": "1:32:30", "remaining_time": "0:05:03", "throughput": 4252.53, "total_tokens": 23602128} {"current_steps": 36185, "total_steps": 38160, "loss": 0.316, "lr": 8.145713534001897e-06, "epoch": 18.96488469601677, "percentage": 94.82, "elapsed_time": "1:32:30", "remaining_time": "0:05:02", "throughput": 4252.55, "total_tokens": 23605232} {"current_steps": 36190, "total_steps": 38160, "loss": 0.3828, "lr": 8.104654031287406e-06, "epoch": 18.967505241090148, "percentage": 94.84, "elapsed_time": "1:32:31", "remaining_time": "0:05:02", "throughput": 4252.56, "total_tokens": 23608272} {"current_steps": 36195, "total_steps": 38160, "loss": 0.3777, "lr": 8.063697427467486e-06, "epoch": 18.97012578616352, "percentage": 94.85, "elapsed_time": "1:32:32", "remaining_time": "0:05:01", "throughput": 4252.51, "total_tokens": 23610576} {"current_steps": 36200, "total_steps": 38160, "loss": 0.4814, "lr": 8.022843731109675e-06, "epoch": 18.9727463312369, "percentage": 94.86, "elapsed_time": "1:32:32", "remaining_time": "0:05:00", "throughput": 4252.56, "total_tokens": 23614000} {"current_steps": 36205, "total_steps": 38160, "loss": 0.3688, "lr": 7.982092950760245e-06, "epoch": 18.97536687631027, "percentage": 94.88, "elapsed_time": "1:32:33", "remaining_time": "0:04:59", "throughput": 4252.59, "total_tokens": 23617264} {"current_steps": 36210, "total_steps": 38160, "loss": 0.4542, "lr": 7.941445094943711e-06, "epoch": 18.97798742138365, "percentage": 94.89, "elapsed_time": "1:32:34", "remaining_time": "0:04:59", "throughput": 4252.59, "total_tokens": 23620240} {"current_steps": 36215, "total_steps": 38160, "loss": 0.3813, "lr": 7.900900172163107e-06, "epoch": 18.980607966457022, "percentage": 94.9, "elapsed_time": "1:32:35", "remaining_time": "0:04:58", "throughput": 4252.6, "total_tokens": 23623216} {"current_steps": 36220, "total_steps": 38160, "loss": 0.3715, "lr": 7.860458190900144e-06, "epoch": 18.9832285115304, "percentage": 94.92, "elapsed_time": "1:32:35", "remaining_time": "0:04:57", "throughput": 4252.6, "total_tokens": 23626064} {"current_steps": 36225, "total_steps": 38160, "loss": 0.4644, "lr": 7.820119159614669e-06, "epoch": 18.985849056603772, "percentage": 94.93, "elapsed_time": "1:32:36", "remaining_time": "0:04:56", "throughput": 4252.64, "total_tokens": 23629360} {"current_steps": 36230, "total_steps": 38160, "loss": 0.4304, "lr": 7.779883086745098e-06, "epoch": 18.98846960167715, "percentage": 94.94, "elapsed_time": "1:32:37", "remaining_time": "0:04:56", "throughput": 4252.6, "total_tokens": 23631792} {"current_steps": 36235, "total_steps": 38160, "loss": 0.3842, "lr": 7.739749980708533e-06, "epoch": 18.991090146750523, "percentage": 94.96, "elapsed_time": "1:32:37", "remaining_time": "0:04:55", "throughput": 4252.74, "total_tokens": 23636400} {"current_steps": 36240, "total_steps": 38160, "loss": 0.4036, "lr": 7.6997198499002e-06, "epoch": 18.9937106918239, "percentage": 94.97, "elapsed_time": "1:32:38", "remaining_time": "0:04:54", "throughput": 4252.73, "total_tokens": 23639056} {"current_steps": 36245, "total_steps": 38160, "loss": 0.3463, "lr": 7.659792702694068e-06, "epoch": 18.996331236897273, "percentage": 94.98, "elapsed_time": "1:32:39", "remaining_time": "0:04:53", "throughput": 4252.79, "total_tokens": 23642672} {"current_steps": 36250, "total_steps": 38160, "loss": 0.402, "lr": 7.619968547442346e-06, "epoch": 18.99895178197065, "percentage": 94.99, "elapsed_time": "1:32:39", "remaining_time": "0:04:52", "throughput": 4252.72, "total_tokens": 23644848} {"current_steps": 36252, "total_steps": 38160, "eval_loss": 0.46669089794158936, "epoch": 19.0, "percentage": 95.0, "elapsed_time": "1:32:53", "remaining_time": "0:04:53", "throughput": 4242.19, "total_tokens": 23645440} {"current_steps": 36255, "total_steps": 38160, "loss": 0.3034, "lr": 7.580247392475926e-06, "epoch": 19.001572327044027, "percentage": 95.01, "elapsed_time": "1:32:56", "remaining_time": "0:04:52", "throughput": 4240.83, "total_tokens": 23647040} {"current_steps": 36260, "total_steps": 38160, "loss": 0.4126, "lr": 7.540629246103825e-06, "epoch": 19.0041928721174, "percentage": 95.02, "elapsed_time": "1:32:56", "remaining_time": "0:04:52", "throughput": 4240.82, "total_tokens": 23649760} {"current_steps": 36265, "total_steps": 38160, "loss": 0.3458, "lr": 7.501114116613861e-06, "epoch": 19.006813417190777, "percentage": 95.03, "elapsed_time": "1:32:57", "remaining_time": "0:04:51", "throughput": 4240.82, "total_tokens": 23652672} {"current_steps": 36270, "total_steps": 38160, "loss": 0.4088, "lr": 7.461702012272087e-06, "epoch": 19.00943396226415, "percentage": 95.05, "elapsed_time": "1:32:58", "remaining_time": "0:04:50", "throughput": 4240.83, "total_tokens": 23655584} {"current_steps": 36275, "total_steps": 38160, "loss": 0.4572, "lr": 7.422392941323075e-06, "epoch": 19.012054507337528, "percentage": 95.06, "elapsed_time": "1:32:58", "remaining_time": "0:04:49", "throughput": 4240.81, "total_tokens": 23658496} {"current_steps": 36280, "total_steps": 38160, "loss": 0.3665, "lr": 7.383186911989858e-06, "epoch": 19.0146750524109, "percentage": 95.07, "elapsed_time": "1:32:59", "remaining_time": "0:04:49", "throughput": 4240.77, "total_tokens": 23660928} {"current_steps": 36285, "total_steps": 38160, "loss": 0.6045, "lr": 7.344083932473822e-06, "epoch": 19.017295597484278, "percentage": 95.09, "elapsed_time": "1:33:00", "remaining_time": "0:04:48", "throughput": 4240.81, "total_tokens": 23664448} {"current_steps": 36290, "total_steps": 38160, "loss": 0.5478, "lr": 7.305084010954976e-06, "epoch": 19.01991614255765, "percentage": 95.1, "elapsed_time": "1:33:00", "remaining_time": "0:04:47", "throughput": 4240.88, "total_tokens": 23668128} {"current_steps": 36295, "total_steps": 38160, "loss": 0.4284, "lr": 7.26618715559152e-06, "epoch": 19.02253668763103, "percentage": 95.11, "elapsed_time": "1:33:01", "remaining_time": "0:04:46", "throughput": 4240.97, "total_tokens": 23672128} {"current_steps": 36300, "total_steps": 38160, "loss": 0.3928, "lr": 7.227393374520386e-06, "epoch": 19.0251572327044, "percentage": 95.13, "elapsed_time": "1:33:02", "remaining_time": "0:04:46", "throughput": 4241.01, "total_tokens": 23675392} {"current_steps": 36305, "total_steps": 38160, "loss": 0.471, "lr": 7.18870267585664e-06, "epoch": 19.02777777777778, "percentage": 95.14, "elapsed_time": "1:33:03", "remaining_time": "0:04:45", "throughput": 4241.08, "total_tokens": 23679136} {"current_steps": 36310, "total_steps": 38160, "loss": 0.4341, "lr": 7.150115067694085e-06, "epoch": 19.030398322851152, "percentage": 95.15, "elapsed_time": "1:33:03", "remaining_time": "0:04:44", "throughput": 4241.07, "total_tokens": 23681920} {"current_steps": 36315, "total_steps": 38160, "loss": 0.3693, "lr": 7.111630558104653e-06, "epoch": 19.03301886792453, "percentage": 95.17, "elapsed_time": "1:33:04", "remaining_time": "0:04:43", "throughput": 4241.16, "total_tokens": 23685824} {"current_steps": 36320, "total_steps": 38160, "loss": 0.4818, "lr": 7.073249155138961e-06, "epoch": 19.035639412997902, "percentage": 95.18, "elapsed_time": "1:33:05", "remaining_time": "0:04:42", "throughput": 4241.22, "total_tokens": 23689344} {"current_steps": 36325, "total_steps": 38160, "loss": 0.3727, "lr": 7.0349708668259736e-06, "epoch": 19.03825995807128, "percentage": 95.19, "elapsed_time": "1:33:06", "remaining_time": "0:04:42", "throughput": 4241.24, "total_tokens": 23692384} {"current_steps": 36330, "total_steps": 38160, "loss": 0.3992, "lr": 6.996795701173009e-06, "epoch": 19.040880503144653, "percentage": 95.2, "elapsed_time": "1:33:06", "remaining_time": "0:04:41", "throughput": 4241.3, "total_tokens": 23695936} {"current_steps": 36335, "total_steps": 38160, "loss": 0.4489, "lr": 6.958723666165901e-06, "epoch": 19.04350104821803, "percentage": 95.22, "elapsed_time": "1:33:07", "remaining_time": "0:04:40", "throughput": 4241.3, "total_tokens": 23698848} {"current_steps": 36340, "total_steps": 38160, "loss": 0.3901, "lr": 6.9207547697689446e-06, "epoch": 19.046121593291403, "percentage": 95.23, "elapsed_time": "1:33:08", "remaining_time": "0:04:39", "throughput": 4241.36, "total_tokens": 23702464} {"current_steps": 36345, "total_steps": 38160, "loss": 0.3496, "lr": 6.882889019924676e-06, "epoch": 19.04874213836478, "percentage": 95.24, "elapsed_time": "1:33:09", "remaining_time": "0:04:39", "throughput": 4241.36, "total_tokens": 23705344} {"current_steps": 36350, "total_steps": 38160, "loss": 0.4499, "lr": 6.84512642455426e-06, "epoch": 19.051362683438157, "percentage": 95.26, "elapsed_time": "1:33:09", "remaining_time": "0:04:38", "throughput": 4241.42, "total_tokens": 23708992} {"current_steps": 36355, "total_steps": 38160, "loss": 0.3377, "lr": 6.8074669915572095e-06, "epoch": 19.05398322851153, "percentage": 95.27, "elapsed_time": "1:33:10", "remaining_time": "0:04:37", "throughput": 4241.43, "total_tokens": 23711808} {"current_steps": 36360, "total_steps": 38160, "loss": 0.5293, "lr": 6.769910728811391e-06, "epoch": 19.056603773584907, "percentage": 95.28, "elapsed_time": "1:33:11", "remaining_time": "0:04:36", "throughput": 4241.44, "total_tokens": 23714720} {"current_steps": 36365, "total_steps": 38160, "loss": 0.5391, "lr": 6.73245764417324e-06, "epoch": 19.05922431865828, "percentage": 95.3, "elapsed_time": "1:33:11", "remaining_time": "0:04:36", "throughput": 4241.47, "total_tokens": 23717984} {"current_steps": 36370, "total_steps": 38160, "loss": 0.437, "lr": 6.695107745477435e-06, "epoch": 19.061844863731658, "percentage": 95.31, "elapsed_time": "1:33:12", "remaining_time": "0:04:35", "throughput": 4241.49, "total_tokens": 23721184} {"current_steps": 36375, "total_steps": 38160, "loss": 0.4458, "lr": 6.657861040537117e-06, "epoch": 19.06446540880503, "percentage": 95.32, "elapsed_time": "1:33:13", "remaining_time": "0:04:34", "throughput": 4241.51, "total_tokens": 23724384} {"current_steps": 36380, "total_steps": 38160, "loss": 0.4599, "lr": 6.620717537143994e-06, "epoch": 19.067085953878408, "percentage": 95.34, "elapsed_time": "1:33:14", "remaining_time": "0:04:33", "throughput": 4241.54, "total_tokens": 23727680} {"current_steps": 36385, "total_steps": 38160, "loss": 0.5164, "lr": 6.583677243067965e-06, "epoch": 19.06970649895178, "percentage": 95.35, "elapsed_time": "1:33:14", "remaining_time": "0:04:32", "throughput": 4241.54, "total_tokens": 23730464} {"current_steps": 36390, "total_steps": 38160, "loss": 0.3298, "lr": 6.546740166057441e-06, "epoch": 19.072327044025158, "percentage": 95.36, "elapsed_time": "1:33:15", "remaining_time": "0:04:32", "throughput": 4241.58, "total_tokens": 23733888} {"current_steps": 36395, "total_steps": 38160, "loss": 0.4311, "lr": 6.5099063138392975e-06, "epoch": 19.07494758909853, "percentage": 95.37, "elapsed_time": "1:33:16", "remaining_time": "0:04:31", "throughput": 4241.58, "total_tokens": 23736736} {"current_steps": 36400, "total_steps": 38160, "loss": 0.4452, "lr": 6.473175694118705e-06, "epoch": 19.07756813417191, "percentage": 95.39, "elapsed_time": "1:33:16", "remaining_time": "0:04:30", "throughput": 4241.6, "total_tokens": 23739872} {"current_steps": 36405, "total_steps": 38160, "loss": 0.3497, "lr": 6.436548314579349e-06, "epoch": 19.080188679245282, "percentage": 95.4, "elapsed_time": "1:33:17", "remaining_time": "0:04:29", "throughput": 4241.58, "total_tokens": 23742592} {"current_steps": 36410, "total_steps": 38160, "loss": 0.5368, "lr": 6.400024182883158e-06, "epoch": 19.08280922431866, "percentage": 95.41, "elapsed_time": "1:33:18", "remaining_time": "0:04:29", "throughput": 4241.73, "total_tokens": 23747296} {"current_steps": 36415, "total_steps": 38160, "loss": 0.4247, "lr": 6.363603306670629e-06, "epoch": 19.085429769392032, "percentage": 95.43, "elapsed_time": "1:33:19", "remaining_time": "0:04:28", "throughput": 4241.79, "total_tokens": 23751040} {"current_steps": 36420, "total_steps": 38160, "loss": 0.4725, "lr": 6.327285693560614e-06, "epoch": 19.08805031446541, "percentage": 95.44, "elapsed_time": "1:33:20", "remaining_time": "0:04:27", "throughput": 4241.87, "total_tokens": 23754976} {"current_steps": 36425, "total_steps": 38160, "loss": 0.5075, "lr": 6.2910713511503125e-06, "epoch": 19.090670859538783, "percentage": 95.45, "elapsed_time": "1:33:20", "remaining_time": "0:04:26", "throughput": 4241.92, "total_tokens": 23758464} {"current_steps": 36430, "total_steps": 38160, "loss": 0.4728, "lr": 6.254960287015332e-06, "epoch": 19.09329140461216, "percentage": 95.47, "elapsed_time": "1:33:21", "remaining_time": "0:04:26", "throughput": 4242.04, "total_tokens": 23762880} {"current_steps": 36435, "total_steps": 38160, "loss": 0.5596, "lr": 6.218952508709741e-06, "epoch": 19.095911949685533, "percentage": 95.48, "elapsed_time": "1:33:22", "remaining_time": "0:04:25", "throughput": 4242.03, "total_tokens": 23765664} {"current_steps": 36440, "total_steps": 38160, "loss": 0.573, "lr": 6.183048023765903e-06, "epoch": 19.09853249475891, "percentage": 95.49, "elapsed_time": "1:33:23", "remaining_time": "0:04:24", "throughput": 4242.15, "total_tokens": 23770016} {"current_steps": 36445, "total_steps": 38160, "loss": 0.4412, "lr": 6.147246839694698e-06, "epoch": 19.101153039832287, "percentage": 95.51, "elapsed_time": "1:33:24", "remaining_time": "0:04:23", "throughput": 4242.19, "total_tokens": 23773408} {"current_steps": 36450, "total_steps": 38160, "loss": 0.3591, "lr": 6.111548963985247e-06, "epoch": 19.10377358490566, "percentage": 95.52, "elapsed_time": "1:33:24", "remaining_time": "0:04:22", "throughput": 4242.21, "total_tokens": 23776672} {"current_steps": 36455, "total_steps": 38160, "loss": 0.3477, "lr": 6.075954404105188e-06, "epoch": 19.106394129979037, "percentage": 95.53, "elapsed_time": "1:33:25", "remaining_time": "0:04:22", "throughput": 4242.19, "total_tokens": 23779264} {"current_steps": 36460, "total_steps": 38160, "loss": 0.4582, "lr": 6.040463167500509e-06, "epoch": 19.10901467505241, "percentage": 95.55, "elapsed_time": "1:33:26", "remaining_time": "0:04:21", "throughput": 4242.27, "total_tokens": 23783104} {"current_steps": 36465, "total_steps": 38160, "loss": 0.3454, "lr": 6.005075261595494e-06, "epoch": 19.111635220125788, "percentage": 95.56, "elapsed_time": "1:33:26", "remaining_time": "0:04:20", "throughput": 4242.27, "total_tokens": 23785856} {"current_steps": 36470, "total_steps": 38160, "loss": 0.3494, "lr": 5.969790693792998e-06, "epoch": 19.11425576519916, "percentage": 95.57, "elapsed_time": "1:33:27", "remaining_time": "0:04:19", "throughput": 4242.32, "total_tokens": 23789344} {"current_steps": 36475, "total_steps": 38160, "loss": 0.4377, "lr": 5.9346094714740615e-06, "epoch": 19.116876310272538, "percentage": 95.58, "elapsed_time": "1:33:28", "remaining_time": "0:04:19", "throughput": 4242.39, "total_tokens": 23793056} {"current_steps": 36480, "total_steps": 38160, "loss": 0.496, "lr": 5.8995316019982425e-06, "epoch": 19.11949685534591, "percentage": 95.6, "elapsed_time": "1:33:29", "remaining_time": "0:04:18", "throughput": 4242.36, "total_tokens": 23795552} {"current_steps": 36485, "total_steps": 38160, "loss": 0.3878, "lr": 5.8645570927034485e-06, "epoch": 19.122117400419288, "percentage": 95.61, "elapsed_time": "1:33:29", "remaining_time": "0:04:17", "throughput": 4242.32, "total_tokens": 23797920} {"current_steps": 36490, "total_steps": 38160, "loss": 0.4982, "lr": 5.8296859509058275e-06, "epoch": 19.12473794549266, "percentage": 95.62, "elapsed_time": "1:33:30", "remaining_time": "0:04:16", "throughput": 4242.33, "total_tokens": 23800864} {"current_steps": 36495, "total_steps": 38160, "loss": 0.4003, "lr": 5.794918183900155e-06, "epoch": 19.12735849056604, "percentage": 95.64, "elapsed_time": "1:33:31", "remaining_time": "0:04:15", "throughput": 4242.39, "total_tokens": 23804480} {"current_steps": 36500, "total_steps": 38160, "loss": 0.3456, "lr": 5.760253798959447e-06, "epoch": 19.129979035639412, "percentage": 95.65, "elapsed_time": "1:33:31", "remaining_time": "0:04:15", "throughput": 4242.38, "total_tokens": 23807296} {"current_steps": 36505, "total_steps": 38160, "loss": 0.3211, "lr": 5.725692803335015e-06, "epoch": 19.13259958071279, "percentage": 95.66, "elapsed_time": "1:33:32", "remaining_time": "0:04:14", "throughput": 4242.41, "total_tokens": 23810432} {"current_steps": 36510, "total_steps": 38160, "loss": 0.3634, "lr": 5.691235204256739e-06, "epoch": 19.135220125786162, "percentage": 95.68, "elapsed_time": "1:33:33", "remaining_time": "0:04:13", "throughput": 4242.39, "total_tokens": 23813088} {"current_steps": 36515, "total_steps": 38160, "loss": 0.6378, "lr": 5.65688100893258e-06, "epoch": 19.13784067085954, "percentage": 95.69, "elapsed_time": "1:33:33", "remaining_time": "0:04:12", "throughput": 4242.38, "total_tokens": 23815968} {"current_steps": 36520, "total_steps": 38160, "loss": 0.419, "lr": 5.622630224549174e-06, "epoch": 19.140461215932913, "percentage": 95.7, "elapsed_time": "1:33:34", "remaining_time": "0:04:12", "throughput": 4242.44, "total_tokens": 23819392} {"current_steps": 36525, "total_steps": 38160, "loss": 0.532, "lr": 5.588482858271404e-06, "epoch": 19.14308176100629, "percentage": 95.72, "elapsed_time": "1:33:35", "remaining_time": "0:04:11", "throughput": 4242.43, "total_tokens": 23822144} {"current_steps": 36530, "total_steps": 38160, "loss": 0.4649, "lr": 5.554438917242444e-06, "epoch": 19.145702306079663, "percentage": 95.73, "elapsed_time": "1:33:36", "remaining_time": "0:04:10", "throughput": 4242.53, "total_tokens": 23826144} {"current_steps": 36535, "total_steps": 38160, "loss": 0.4344, "lr": 5.520498408583985e-06, "epoch": 19.14832285115304, "percentage": 95.74, "elapsed_time": "1:33:36", "remaining_time": "0:04:09", "throughput": 4242.58, "total_tokens": 23829536} {"current_steps": 36540, "total_steps": 38160, "loss": 0.3224, "lr": 5.486661339395904e-06, "epoch": 19.150943396226417, "percentage": 95.75, "elapsed_time": "1:33:37", "remaining_time": "0:04:09", "throughput": 4242.66, "total_tokens": 23833408} {"current_steps": 36545, "total_steps": 38160, "loss": 0.335, "lr": 5.452927716756595e-06, "epoch": 19.15356394129979, "percentage": 95.77, "elapsed_time": "1:33:38", "remaining_time": "0:04:08", "throughput": 4242.62, "total_tokens": 23835808} {"current_steps": 36550, "total_steps": 38160, "loss": 0.5183, "lr": 5.419297547722635e-06, "epoch": 19.156184486373167, "percentage": 95.78, "elapsed_time": "1:33:38", "remaining_time": "0:04:07", "throughput": 4242.62, "total_tokens": 23838624} {"current_steps": 36555, "total_steps": 38160, "loss": 0.3105, "lr": 5.385770839329229e-06, "epoch": 19.15880503144654, "percentage": 95.79, "elapsed_time": "1:33:39", "remaining_time": "0:04:06", "throughput": 4242.6, "total_tokens": 23841312} {"current_steps": 36560, "total_steps": 38160, "loss": 0.3949, "lr": 5.352347598589713e-06, "epoch": 19.161425576519918, "percentage": 95.81, "elapsed_time": "1:33:40", "remaining_time": "0:04:05", "throughput": 4242.62, "total_tokens": 23844416} {"current_steps": 36565, "total_steps": 38160, "loss": 0.3408, "lr": 5.319027832495826e-06, "epoch": 19.16404612159329, "percentage": 95.82, "elapsed_time": "1:33:40", "remaining_time": "0:04:05", "throughput": 4242.65, "total_tokens": 23847744} {"current_steps": 36570, "total_steps": 38160, "loss": 0.5108, "lr": 5.285811548017661e-06, "epoch": 19.166666666666668, "percentage": 95.83, "elapsed_time": "1:33:41", "remaining_time": "0:04:04", "throughput": 4242.62, "total_tokens": 23850144} {"current_steps": 36575, "total_steps": 38160, "loss": 0.556, "lr": 5.252698752103713e-06, "epoch": 19.16928721174004, "percentage": 95.85, "elapsed_time": "1:33:42", "remaining_time": "0:04:03", "throughput": 4242.69, "total_tokens": 23853952} {"current_steps": 36580, "total_steps": 38160, "loss": 0.4346, "lr": 5.219689451680832e-06, "epoch": 19.171907756813418, "percentage": 95.86, "elapsed_time": "1:33:43", "remaining_time": "0:04:02", "throughput": 4242.73, "total_tokens": 23857376} {"current_steps": 36585, "total_steps": 38160, "loss": 0.4513, "lr": 5.186783653654214e-06, "epoch": 19.17452830188679, "percentage": 95.87, "elapsed_time": "1:33:43", "remaining_time": "0:04:02", "throughput": 4242.79, "total_tokens": 23861056} {"current_steps": 36590, "total_steps": 38160, "loss": 0.335, "lr": 5.153981364907245e-06, "epoch": 19.17714884696017, "percentage": 95.89, "elapsed_time": "1:33:44", "remaining_time": "0:04:01", "throughput": 4242.78, "total_tokens": 23863968} {"current_steps": 36595, "total_steps": 38160, "loss": 0.3893, "lr": 5.121282592301935e-06, "epoch": 19.179769392033542, "percentage": 95.9, "elapsed_time": "1:33:45", "remaining_time": "0:04:00", "throughput": 4242.78, "total_tokens": 23866912} {"current_steps": 36600, "total_steps": 38160, "loss": 0.3297, "lr": 5.088687342678422e-06, "epoch": 19.18238993710692, "percentage": 95.91, "elapsed_time": "1:33:45", "remaining_time": "0:03:59", "throughput": 4242.78, "total_tokens": 23869856} {"current_steps": 36605, "total_steps": 38160, "loss": 0.4246, "lr": 5.056195622855253e-06, "epoch": 19.185010482180292, "percentage": 95.93, "elapsed_time": "1:33:46", "remaining_time": "0:03:59", "throughput": 4242.81, "total_tokens": 23873088} {"current_steps": 36610, "total_steps": 38160, "loss": 0.3707, "lr": 5.023807439629324e-06, "epoch": 19.18763102725367, "percentage": 95.94, "elapsed_time": "1:33:47", "remaining_time": "0:03:58", "throughput": 4242.83, "total_tokens": 23876160} {"current_steps": 36615, "total_steps": 38160, "loss": 0.473, "lr": 4.991522799775938e-06, "epoch": 19.190251572327043, "percentage": 95.95, "elapsed_time": "1:33:48", "remaining_time": "0:03:57", "throughput": 4242.81, "total_tokens": 23878880} {"current_steps": 36620, "total_steps": 38160, "loss": 0.347, "lr": 4.9593417100485816e-06, "epoch": 19.19287211740042, "percentage": 95.96, "elapsed_time": "1:33:48", "remaining_time": "0:03:56", "throughput": 4242.9, "total_tokens": 23882912} {"current_steps": 36625, "total_steps": 38160, "loss": 0.3699, "lr": 4.927264177179258e-06, "epoch": 19.195492662473793, "percentage": 95.98, "elapsed_time": "1:33:49", "remaining_time": "0:03:55", "throughput": 4242.96, "total_tokens": 23886560} {"current_steps": 36630, "total_steps": 38160, "loss": 0.5331, "lr": 4.895290207878156e-06, "epoch": 19.19811320754717, "percentage": 95.99, "elapsed_time": "1:33:50", "remaining_time": "0:03:55", "throughput": 4242.98, "total_tokens": 23889728} {"current_steps": 36635, "total_steps": 38160, "loss": 0.4265, "lr": 4.863419808833924e-06, "epoch": 19.200733752620547, "percentage": 96.0, "elapsed_time": "1:33:51", "remaining_time": "0:03:54", "throughput": 4243.05, "total_tokens": 23893408} {"current_steps": 36640, "total_steps": 38160, "loss": 0.3684, "lr": 4.831652986713453e-06, "epoch": 19.20335429769392, "percentage": 96.02, "elapsed_time": "1:33:51", "remaining_time": "0:03:53", "throughput": 4243.1, "total_tokens": 23896960} {"current_steps": 36645, "total_steps": 38160, "loss": 0.3784, "lr": 4.799989748161926e-06, "epoch": 19.205974842767297, "percentage": 96.03, "elapsed_time": "1:33:52", "remaining_time": "0:03:52", "throughput": 4243.1, "total_tokens": 23899936} {"current_steps": 36650, "total_steps": 38160, "loss": 0.3593, "lr": 4.768430099803101e-06, "epoch": 19.20859538784067, "percentage": 96.04, "elapsed_time": "1:33:53", "remaining_time": "0:03:52", "throughput": 4243.14, "total_tokens": 23903360} {"current_steps": 36655, "total_steps": 38160, "loss": 0.3543, "lr": 4.736974048238696e-06, "epoch": 19.211215932914047, "percentage": 96.06, "elapsed_time": "1:33:54", "remaining_time": "0:03:51", "throughput": 4243.17, "total_tokens": 23906784} {"current_steps": 36660, "total_steps": 38160, "loss": 0.2881, "lr": 4.705621600049115e-06, "epoch": 19.21383647798742, "percentage": 96.07, "elapsed_time": "1:33:54", "remaining_time": "0:03:50", "throughput": 4243.22, "total_tokens": 23910240} {"current_steps": 36665, "total_steps": 38160, "loss": 0.4108, "lr": 4.674372761792889e-06, "epoch": 19.216457023060798, "percentage": 96.08, "elapsed_time": "1:33:55", "remaining_time": "0:03:49", "throughput": 4243.27, "total_tokens": 23913888} {"current_steps": 36670, "total_steps": 38160, "loss": 0.3626, "lr": 4.6432275400069e-06, "epoch": 19.21907756813417, "percentage": 96.1, "elapsed_time": "1:33:56", "remaining_time": "0:03:49", "throughput": 4243.31, "total_tokens": 23917312} {"current_steps": 36675, "total_steps": 38160, "loss": 0.3997, "lr": 4.6121859412063264e-06, "epoch": 19.221698113207548, "percentage": 96.11, "elapsed_time": "1:33:57", "remaining_time": "0:03:48", "throughput": 4243.29, "total_tokens": 23920032} {"current_steps": 36680, "total_steps": 38160, "loss": 0.4931, "lr": 4.581247971884861e-06, "epoch": 19.22431865828092, "percentage": 96.12, "elapsed_time": "1:33:57", "remaining_time": "0:03:47", "throughput": 4243.37, "total_tokens": 23924000} {"current_steps": 36685, "total_steps": 38160, "loss": 0.3236, "lr": 4.550413638514217e-06, "epoch": 19.2269392033543, "percentage": 96.13, "elapsed_time": "1:33:58", "remaining_time": "0:03:46", "throughput": 4243.47, "total_tokens": 23928128} {"current_steps": 36690, "total_steps": 38160, "loss": 0.427, "lr": 4.519682947544679e-06, "epoch": 19.229559748427672, "percentage": 96.15, "elapsed_time": "1:33:59", "remaining_time": "0:03:45", "throughput": 4243.52, "total_tokens": 23931712} {"current_steps": 36695, "total_steps": 38160, "loss": 0.4843, "lr": 4.489055905404715e-06, "epoch": 19.23218029350105, "percentage": 96.16, "elapsed_time": "1:34:00", "remaining_time": "0:03:45", "throughput": 4243.53, "total_tokens": 23934912} {"current_steps": 36700, "total_steps": 38160, "loss": 0.507, "lr": 4.4585325185012014e-06, "epoch": 19.234800838574422, "percentage": 96.17, "elapsed_time": "1:34:01", "remaining_time": "0:03:44", "throughput": 4243.58, "total_tokens": 23938560} {"current_steps": 36705, "total_steps": 38160, "loss": 0.4427, "lr": 4.428112793219197e-06, "epoch": 19.2374213836478, "percentage": 96.19, "elapsed_time": "1:34:01", "remaining_time": "0:03:43", "throughput": 4243.58, "total_tokens": 23941440} {"current_steps": 36710, "total_steps": 38160, "loss": 0.4182, "lr": 4.397796735922277e-06, "epoch": 19.240041928721173, "percentage": 96.2, "elapsed_time": "1:34:02", "remaining_time": "0:03:42", "throughput": 4243.6, "total_tokens": 23944736} {"current_steps": 36715, "total_steps": 38160, "loss": 0.6641, "lr": 4.367584352952092e-06, "epoch": 19.24266247379455, "percentage": 96.21, "elapsed_time": "1:34:03", "remaining_time": "0:03:42", "throughput": 4243.74, "total_tokens": 23949376} {"current_steps": 36720, "total_steps": 38160, "loss": 0.4654, "lr": 4.337475650628808e-06, "epoch": 19.245283018867923, "percentage": 96.23, "elapsed_time": "1:34:04", "remaining_time": "0:03:41", "throughput": 4243.77, "total_tokens": 23952640} {"current_steps": 36725, "total_steps": 38160, "loss": 0.4095, "lr": 4.307470635250832e-06, "epoch": 19.2479035639413, "percentage": 96.24, "elapsed_time": "1:34:05", "remaining_time": "0:03:40", "throughput": 4243.88, "total_tokens": 23956992} {"current_steps": 36730, "total_steps": 38160, "loss": 0.3438, "lr": 4.277569313094809e-06, "epoch": 19.250524109014677, "percentage": 96.25, "elapsed_time": "1:34:05", "remaining_time": "0:03:39", "throughput": 4243.89, "total_tokens": 23960192} {"current_steps": 36735, "total_steps": 38160, "loss": 0.2995, "lr": 4.247771690415791e-06, "epoch": 19.25314465408805, "percentage": 96.27, "elapsed_time": "1:34:06", "remaining_time": "0:03:39", "throughput": 4243.89, "total_tokens": 23963040} {"current_steps": 36740, "total_steps": 38160, "loss": 0.4326, "lr": 4.218077773447071e-06, "epoch": 19.255765199161427, "percentage": 96.28, "elapsed_time": "1:34:07", "remaining_time": "0:03:38", "throughput": 4243.86, "total_tokens": 23965664} {"current_steps": 36745, "total_steps": 38160, "loss": 0.4281, "lr": 4.1884875684003455e-06, "epoch": 19.2583857442348, "percentage": 96.29, "elapsed_time": "1:34:07", "remaining_time": "0:03:37", "throughput": 4243.89, "total_tokens": 23968992} {"current_steps": 36750, "total_steps": 38160, "loss": 0.767, "lr": 4.159001081465497e-06, "epoch": 19.261006289308177, "percentage": 96.31, "elapsed_time": "1:34:08", "remaining_time": "0:03:36", "throughput": 4243.9, "total_tokens": 23972032} {"current_steps": 36755, "total_steps": 38160, "loss": 0.536, "lr": 4.129618318810702e-06, "epoch": 19.26362683438155, "percentage": 96.32, "elapsed_time": "1:34:09", "remaining_time": "0:03:35", "throughput": 4243.91, "total_tokens": 23975040} {"current_steps": 36760, "total_steps": 38160, "loss": 0.4195, "lr": 4.100339286582655e-06, "epoch": 19.266247379454928, "percentage": 96.33, "elapsed_time": "1:34:09", "remaining_time": "0:03:35", "throughput": 4243.87, "total_tokens": 23977408} {"current_steps": 36765, "total_steps": 38160, "loss": 0.4315, "lr": 4.071163990906068e-06, "epoch": 19.2688679245283, "percentage": 96.34, "elapsed_time": "1:34:10", "remaining_time": "0:03:34", "throughput": 4243.84, "total_tokens": 23980032} {"current_steps": 36770, "total_steps": 38160, "loss": 0.377, "lr": 4.042092437884115e-06, "epoch": 19.271488469601678, "percentage": 96.36, "elapsed_time": "1:34:11", "remaining_time": "0:03:33", "throughput": 4243.83, "total_tokens": 23982720} {"current_steps": 36775, "total_steps": 38160, "loss": 0.4636, "lr": 4.013124633598264e-06, "epoch": 19.27410901467505, "percentage": 96.37, "elapsed_time": "1:34:11", "remaining_time": "0:03:32", "throughput": 4243.86, "total_tokens": 23985984} {"current_steps": 36780, "total_steps": 38160, "loss": 0.5292, "lr": 3.984260584108168e-06, "epoch": 19.27672955974843, "percentage": 96.38, "elapsed_time": "1:34:12", "remaining_time": "0:03:32", "throughput": 4243.9, "total_tokens": 23989504} {"current_steps": 36785, "total_steps": 38160, "loss": 0.4322, "lr": 3.955500295451942e-06, "epoch": 19.279350104821802, "percentage": 96.4, "elapsed_time": "1:34:13", "remaining_time": "0:03:31", "throughput": 4243.89, "total_tokens": 23992160} {"current_steps": 36790, "total_steps": 38160, "loss": 0.5027, "lr": 3.926843773645883e-06, "epoch": 19.28197064989518, "percentage": 96.41, "elapsed_time": "1:34:14", "remaining_time": "0:03:30", "throughput": 4244.15, "total_tokens": 23998816} {"current_steps": 36795, "total_steps": 38160, "loss": 0.4209, "lr": 3.8982910246846415e-06, "epoch": 19.284591194968552, "percentage": 96.42, "elapsed_time": "1:34:15", "remaining_time": "0:03:29", "throughput": 4244.25, "total_tokens": 24003040} {"current_steps": 36800, "total_steps": 38160, "loss": 0.459, "lr": 3.869842054541051e-06, "epoch": 19.28721174004193, "percentage": 96.44, "elapsed_time": "1:34:16", "remaining_time": "0:03:29", "throughput": 4244.28, "total_tokens": 24006272} {"current_steps": 36805, "total_steps": 38160, "loss": 0.3771, "lr": 3.84149686916635e-06, "epoch": 19.289832285115303, "percentage": 96.45, "elapsed_time": "1:34:16", "remaining_time": "0:03:28", "throughput": 4244.33, "total_tokens": 24009792} {"current_steps": 36810, "total_steps": 38160, "loss": 0.3331, "lr": 3.8132554744900183e-06, "epoch": 19.29245283018868, "percentage": 96.46, "elapsed_time": "1:34:17", "remaining_time": "0:03:27", "throughput": 4244.35, "total_tokens": 24012960} {"current_steps": 36815, "total_steps": 38160, "loss": 0.5595, "lr": 3.7851178764198302e-06, "epoch": 19.295073375262053, "percentage": 96.48, "elapsed_time": "1:34:18", "remaining_time": "0:03:26", "throughput": 4244.4, "total_tokens": 24016416} {"current_steps": 36820, "total_steps": 38160, "loss": 0.3412, "lr": 3.7570840808419104e-06, "epoch": 19.29769392033543, "percentage": 96.49, "elapsed_time": "1:34:19", "remaining_time": "0:03:25", "throughput": 4244.42, "total_tokens": 24019520} {"current_steps": 36825, "total_steps": 38160, "loss": 0.4084, "lr": 3.729154093620568e-06, "epoch": 19.300314465408803, "percentage": 96.5, "elapsed_time": "1:34:19", "remaining_time": "0:03:25", "throughput": 4244.48, "total_tokens": 24023168} {"current_steps": 36830, "total_steps": 38160, "loss": 0.4144, "lr": 3.7013279205984073e-06, "epoch": 19.30293501048218, "percentage": 96.51, "elapsed_time": "1:34:20", "remaining_time": "0:03:24", "throughput": 4244.5, "total_tokens": 24026368} {"current_steps": 36835, "total_steps": 38160, "loss": 0.3441, "lr": 3.6736055675963275e-06, "epoch": 19.305555555555557, "percentage": 96.53, "elapsed_time": "1:34:21", "remaining_time": "0:03:23", "throughput": 4244.47, "total_tokens": 24028960} {"current_steps": 36840, "total_steps": 38160, "loss": 0.4784, "lr": 3.645987040413634e-06, "epoch": 19.30817610062893, "percentage": 96.54, "elapsed_time": "1:34:21", "remaining_time": "0:03:22", "throughput": 4244.43, "total_tokens": 24031392} {"current_steps": 36845, "total_steps": 38160, "loss": 0.4131, "lr": 3.6184723448277056e-06, "epoch": 19.310796645702307, "percentage": 96.55, "elapsed_time": "1:34:22", "remaining_time": "0:03:22", "throughput": 4244.43, "total_tokens": 24034368} {"current_steps": 36850, "total_steps": 38160, "loss": 0.4571, "lr": 3.5910614865943826e-06, "epoch": 19.31341719077568, "percentage": 96.57, "elapsed_time": "1:34:23", "remaining_time": "0:03:21", "throughput": 4244.45, "total_tokens": 24037472} {"current_steps": 36855, "total_steps": 38160, "loss": 0.4573, "lr": 3.563754471447689e-06, "epoch": 19.316037735849058, "percentage": 96.58, "elapsed_time": "1:34:23", "remaining_time": "0:03:20", "throughput": 4244.48, "total_tokens": 24040672} {"current_steps": 36860, "total_steps": 38160, "loss": 0.4154, "lr": 3.5365513050998334e-06, "epoch": 19.31865828092243, "percentage": 96.59, "elapsed_time": "1:34:24", "remaining_time": "0:03:19", "throughput": 4244.52, "total_tokens": 24044192} {"current_steps": 36865, "total_steps": 38160, "loss": 0.4202, "lr": 3.5094519932415414e-06, "epoch": 19.321278825995808, "percentage": 96.61, "elapsed_time": "1:34:25", "remaining_time": "0:03:19", "throughput": 4244.56, "total_tokens": 24047520} {"current_steps": 36870, "total_steps": 38160, "loss": 0.534, "lr": 3.4824565415416123e-06, "epoch": 19.32389937106918, "percentage": 96.62, "elapsed_time": "1:34:26", "remaining_time": "0:03:18", "throughput": 4244.59, "total_tokens": 24050944} {"current_steps": 36875, "total_steps": 38160, "loss": 0.3959, "lr": 3.4555649556471946e-06, "epoch": 19.32651991614256, "percentage": 96.63, "elapsed_time": "1:34:26", "remaining_time": "0:03:17", "throughput": 4244.56, "total_tokens": 24053440} {"current_steps": 36880, "total_steps": 38160, "loss": 0.4353, "lr": 3.4287772411837338e-06, "epoch": 19.329140461215932, "percentage": 96.65, "elapsed_time": "1:34:27", "remaining_time": "0:03:16", "throughput": 4244.57, "total_tokens": 24056480} {"current_steps": 36885, "total_steps": 38160, "loss": 0.3426, "lr": 3.402093403754858e-06, "epoch": 19.33176100628931, "percentage": 96.66, "elapsed_time": "1:34:28", "remaining_time": "0:03:15", "throughput": 4244.68, "total_tokens": 24060768} {"current_steps": 36890, "total_steps": 38160, "loss": 0.4913, "lr": 3.375513448942602e-06, "epoch": 19.334381551362682, "percentage": 96.67, "elapsed_time": "1:34:29", "remaining_time": "0:03:15", "throughput": 4244.64, "total_tokens": 24063200} {"current_steps": 36895, "total_steps": 38160, "loss": 0.5868, "lr": 3.349037382307074e-06, "epoch": 19.33700209643606, "percentage": 96.69, "elapsed_time": "1:34:29", "remaining_time": "0:03:14", "throughput": 4244.64, "total_tokens": 24066272} {"current_steps": 36900, "total_steps": 38160, "loss": 0.4101, "lr": 3.322665209386899e-06, "epoch": 19.339622641509433, "percentage": 96.7, "elapsed_time": "1:34:30", "remaining_time": "0:03:13", "throughput": 4244.62, "total_tokens": 24068960} {"current_steps": 36905, "total_steps": 38160, "loss": 0.5584, "lr": 3.29639693569872e-06, "epoch": 19.34224318658281, "percentage": 96.71, "elapsed_time": "1:34:31", "remaining_time": "0:03:12", "throughput": 4244.62, "total_tokens": 24071936} {"current_steps": 36910, "total_steps": 38160, "loss": 0.4329, "lr": 3.270232566737641e-06, "epoch": 19.344863731656183, "percentage": 96.72, "elapsed_time": "1:34:31", "remaining_time": "0:03:12", "throughput": 4244.61, "total_tokens": 24074752} {"current_steps": 36915, "total_steps": 38160, "loss": 0.4745, "lr": 3.244172107976895e-06, "epoch": 19.34748427672956, "percentage": 96.74, "elapsed_time": "1:34:32", "remaining_time": "0:03:11", "throughput": 4244.66, "total_tokens": 24078240} {"current_steps": 36920, "total_steps": 38160, "loss": 0.4198, "lr": 3.2182155648680657e-06, "epoch": 19.350104821802937, "percentage": 96.75, "elapsed_time": "1:34:33", "remaining_time": "0:03:10", "throughput": 4244.73, "total_tokens": 24081920} {"current_steps": 36925, "total_steps": 38160, "loss": 0.4922, "lr": 3.1923629428409205e-06, "epoch": 19.35272536687631, "percentage": 96.76, "elapsed_time": "1:34:34", "remaining_time": "0:03:09", "throughput": 4244.82, "total_tokens": 24085952} {"current_steps": 36930, "total_steps": 38160, "loss": 0.4111, "lr": 3.166614247303634e-06, "epoch": 19.355345911949687, "percentage": 96.78, "elapsed_time": "1:34:34", "remaining_time": "0:03:09", "throughput": 4244.81, "total_tokens": 24088672} {"current_steps": 36935, "total_steps": 38160, "loss": 0.4622, "lr": 3.140969483642453e-06, "epoch": 19.35796645702306, "percentage": 96.79, "elapsed_time": "1:34:35", "remaining_time": "0:03:08", "throughput": 4244.86, "total_tokens": 24092064} {"current_steps": 36940, "total_steps": 38160, "loss": 0.4965, "lr": 3.1154286572219747e-06, "epoch": 19.360587002096437, "percentage": 96.8, "elapsed_time": "1:34:36", "remaining_time": "0:03:07", "throughput": 4244.89, "total_tokens": 24095328} {"current_steps": 36945, "total_steps": 38160, "loss": 0.4752, "lr": 3.089991773385037e-06, "epoch": 19.36320754716981, "percentage": 96.82, "elapsed_time": "1:34:37", "remaining_time": "0:03:06", "throughput": 4244.91, "total_tokens": 24098560} {"current_steps": 36950, "total_steps": 38160, "loss": 0.4193, "lr": 3.064658837452772e-06, "epoch": 19.365828092243188, "percentage": 96.83, "elapsed_time": "1:34:37", "remaining_time": "0:03:05", "throughput": 4244.93, "total_tokens": 24101696} {"current_steps": 36955, "total_steps": 38160, "loss": 0.5001, "lr": 3.0394298547246068e-06, "epoch": 19.36844863731656, "percentage": 96.84, "elapsed_time": "1:34:38", "remaining_time": "0:03:05", "throughput": 4244.92, "total_tokens": 24104448} {"current_steps": 36960, "total_steps": 38160, "loss": 0.4235, "lr": 3.0143048304779875e-06, "epoch": 19.371069182389938, "percentage": 96.86, "elapsed_time": "1:34:39", "remaining_time": "0:03:04", "throughput": 4244.93, "total_tokens": 24107520} {"current_steps": 36965, "total_steps": 38160, "loss": 0.372, "lr": 2.989283769968987e-06, "epoch": 19.37368972746331, "percentage": 96.87, "elapsed_time": "1:34:39", "remaining_time": "0:03:03", "throughput": 4244.92, "total_tokens": 24110304} {"current_steps": 36970, "total_steps": 38160, "loss": 0.5129, "lr": 2.964366678431585e-06, "epoch": 19.37631027253669, "percentage": 96.88, "elapsed_time": "1:34:40", "remaining_time": "0:03:02", "throughput": 4244.97, "total_tokens": 24113792} {"current_steps": 36975, "total_steps": 38160, "loss": 0.4426, "lr": 2.9395535610781678e-06, "epoch": 19.378930817610062, "percentage": 96.89, "elapsed_time": "1:34:41", "remaining_time": "0:03:02", "throughput": 4244.94, "total_tokens": 24116224} {"current_steps": 36980, "total_steps": 38160, "loss": 0.3788, "lr": 2.9148444230994166e-06, "epoch": 19.38155136268344, "percentage": 96.91, "elapsed_time": "1:34:42", "remaining_time": "0:03:01", "throughput": 4245.04, "total_tokens": 24120480} {"current_steps": 36985, "total_steps": 38160, "loss": 0.5368, "lr": 2.890239269664141e-06, "epoch": 19.384171907756812, "percentage": 96.92, "elapsed_time": "1:34:42", "remaining_time": "0:03:00", "throughput": 4245.04, "total_tokens": 24123424} {"current_steps": 36990, "total_steps": 38160, "loss": 0.3593, "lr": 2.8657381059194466e-06, "epoch": 19.38679245283019, "percentage": 96.93, "elapsed_time": "1:34:43", "remaining_time": "0:02:59", "throughput": 4245.06, "total_tokens": 24126528} {"current_steps": 36995, "total_steps": 38160, "loss": 0.3643, "lr": 2.8413409369907885e-06, "epoch": 19.389412997903563, "percentage": 96.95, "elapsed_time": "1:34:44", "remaining_time": "0:02:59", "throughput": 4245.21, "total_tokens": 24131360} {"current_steps": 37000, "total_steps": 38160, "loss": 0.4317, "lr": 2.817047767981695e-06, "epoch": 19.39203354297694, "percentage": 96.96, "elapsed_time": "1:34:45", "remaining_time": "0:02:58", "throughput": 4245.19, "total_tokens": 24133920} {"current_steps": 37005, "total_steps": 38160, "loss": 0.3721, "lr": 2.7928586039740466e-06, "epoch": 19.394654088050313, "percentage": 96.97, "elapsed_time": "1:34:45", "remaining_time": "0:02:57", "throughput": 4245.25, "total_tokens": 24137536} {"current_steps": 37010, "total_steps": 38160, "loss": 0.3816, "lr": 2.7687734500279615e-06, "epoch": 19.39727463312369, "percentage": 96.99, "elapsed_time": "1:34:46", "remaining_time": "0:02:56", "throughput": 4245.24, "total_tokens": 24140448} {"current_steps": 37015, "total_steps": 38160, "loss": 0.4815, "lr": 2.744792311181743e-06, "epoch": 19.399895178197063, "percentage": 97.0, "elapsed_time": "1:34:47", "remaining_time": "0:02:55", "throughput": 4245.25, "total_tokens": 24143488} {"current_steps": 37020, "total_steps": 38160, "loss": 0.3899, "lr": 2.720915192451989e-06, "epoch": 19.40251572327044, "percentage": 97.01, "elapsed_time": "1:34:47", "remaining_time": "0:02:55", "throughput": 4245.3, "total_tokens": 24146944} {"current_steps": 37025, "total_steps": 38160, "loss": 0.4235, "lr": 2.697142098833538e-06, "epoch": 19.405136268343817, "percentage": 97.03, "elapsed_time": "1:34:48", "remaining_time": "0:02:54", "throughput": 4245.4, "total_tokens": 24150944} {"current_steps": 37030, "total_steps": 38160, "loss": 0.4184, "lr": 2.6734730352993563e-06, "epoch": 19.40775681341719, "percentage": 97.04, "elapsed_time": "1:34:49", "remaining_time": "0:02:53", "throughput": 4245.37, "total_tokens": 24153504} {"current_steps": 37035, "total_steps": 38160, "loss": 0.4093, "lr": 2.649908006800872e-06, "epoch": 19.410377358490567, "percentage": 97.05, "elapsed_time": "1:34:50", "remaining_time": "0:02:52", "throughput": 4245.37, "total_tokens": 24156480} {"current_steps": 37040, "total_steps": 38160, "loss": 0.5618, "lr": 2.626447018267586e-06, "epoch": 19.41299790356394, "percentage": 97.06, "elapsed_time": "1:34:50", "remaining_time": "0:02:52", "throughput": 4245.44, "total_tokens": 24160192} {"current_steps": 37045, "total_steps": 38160, "loss": 0.4577, "lr": 2.603090074607184e-06, "epoch": 19.415618448637318, "percentage": 97.08, "elapsed_time": "1:34:51", "remaining_time": "0:02:51", "throughput": 4245.4, "total_tokens": 24162560} {"current_steps": 37050, "total_steps": 38160, "loss": 0.4331, "lr": 2.579837180705813e-06, "epoch": 19.41823899371069, "percentage": 97.09, "elapsed_time": "1:34:52", "remaining_time": "0:02:50", "throughput": 4245.4, "total_tokens": 24165568} {"current_steps": 37055, "total_steps": 38160, "loss": 0.3426, "lr": 2.556688341427582e-06, "epoch": 19.420859538784068, "percentage": 97.1, "elapsed_time": "1:34:52", "remaining_time": "0:02:49", "throughput": 4245.42, "total_tokens": 24168608} {"current_steps": 37060, "total_steps": 38160, "loss": 0.5014, "lr": 2.5336435616150066e-06, "epoch": 19.42348008385744, "percentage": 97.12, "elapsed_time": "1:34:53", "remaining_time": "0:02:48", "throughput": 4245.43, "total_tokens": 24171552} {"current_steps": 37065, "total_steps": 38160, "loss": 0.3937, "lr": 2.510702846088786e-06, "epoch": 19.42610062893082, "percentage": 97.13, "elapsed_time": "1:34:54", "remaining_time": "0:02:48", "throughput": 4245.42, "total_tokens": 24174336} {"current_steps": 37070, "total_steps": 38160, "loss": 0.3085, "lr": 2.487866199647915e-06, "epoch": 19.428721174004192, "percentage": 97.14, "elapsed_time": "1:34:55", "remaining_time": "0:02:47", "throughput": 4245.52, "total_tokens": 24178400} {"current_steps": 37075, "total_steps": 38160, "loss": 0.3661, "lr": 2.4651336270695156e-06, "epoch": 19.43134171907757, "percentage": 97.16, "elapsed_time": "1:34:55", "remaining_time": "0:02:46", "throughput": 4245.52, "total_tokens": 24181312} {"current_steps": 37080, "total_steps": 38160, "loss": 0.4408, "lr": 2.442505133108952e-06, "epoch": 19.433962264150942, "percentage": 97.17, "elapsed_time": "1:34:56", "remaining_time": "0:02:45", "throughput": 4245.55, "total_tokens": 24184544} {"current_steps": 37085, "total_steps": 38160, "loss": 0.2861, "lr": 2.419980722499937e-06, "epoch": 19.43658280922432, "percentage": 97.18, "elapsed_time": "1:34:57", "remaining_time": "0:02:45", "throughput": 4245.49, "total_tokens": 24186720} {"current_steps": 37090, "total_steps": 38160, "loss": 0.4594, "lr": 2.397560399954202e-06, "epoch": 19.439203354297693, "percentage": 97.2, "elapsed_time": "1:34:57", "remaining_time": "0:02:44", "throughput": 4245.52, "total_tokens": 24189984} {"current_steps": 37095, "total_steps": 38160, "loss": 0.3654, "lr": 2.3752441701618833e-06, "epoch": 19.44182389937107, "percentage": 97.21, "elapsed_time": "1:34:58", "remaining_time": "0:02:43", "throughput": 4245.49, "total_tokens": 24192448} {"current_steps": 37100, "total_steps": 38160, "loss": 0.3748, "lr": 2.3530320377913027e-06, "epoch": 19.444444444444443, "percentage": 97.22, "elapsed_time": "1:34:59", "remaining_time": "0:02:42", "throughput": 4245.55, "total_tokens": 24196128} {"current_steps": 37105, "total_steps": 38160, "loss": 0.3611, "lr": 2.3309240074890213e-06, "epoch": 19.44706498951782, "percentage": 97.24, "elapsed_time": "1:34:59", "remaining_time": "0:02:42", "throughput": 4245.56, "total_tokens": 24199104} {"current_steps": 37110, "total_steps": 38160, "loss": 0.54, "lr": 2.3089200838796176e-06, "epoch": 19.449685534591197, "percentage": 97.25, "elapsed_time": "1:35:00", "remaining_time": "0:02:41", "throughput": 4245.57, "total_tokens": 24202176} {"current_steps": 37115, "total_steps": 38160, "loss": 0.4897, "lr": 2.2870202715662426e-06, "epoch": 19.45230607966457, "percentage": 97.26, "elapsed_time": "1:35:01", "remaining_time": "0:02:40", "throughput": 4245.62, "total_tokens": 24205824} {"current_steps": 37120, "total_steps": 38160, "loss": 0.5309, "lr": 2.265224575130009e-06, "epoch": 19.454926624737947, "percentage": 97.27, "elapsed_time": "1:35:02", "remaining_time": "0:02:39", "throughput": 4245.61, "total_tokens": 24208640} {"current_steps": 37125, "total_steps": 38160, "loss": 0.2571, "lr": 2.2435329991303268e-06, "epoch": 19.45754716981132, "percentage": 97.29, "elapsed_time": "1:35:03", "remaining_time": "0:02:39", "throughput": 4245.89, "total_tokens": 24215456} {"current_steps": 37130, "total_steps": 38160, "loss": 0.4262, "lr": 2.2219455481047868e-06, "epoch": 19.460167714884697, "percentage": 97.3, "elapsed_time": "1:35:03", "remaining_time": "0:02:38", "throughput": 4245.93, "total_tokens": 24218752} {"current_steps": 37135, "total_steps": 38160, "loss": 0.3992, "lr": 2.2004622265693886e-06, "epoch": 19.46278825995807, "percentage": 97.31, "elapsed_time": "1:35:04", "remaining_time": "0:02:37", "throughput": 4245.92, "total_tokens": 24221632} {"current_steps": 37140, "total_steps": 38160, "loss": 0.4954, "lr": 2.179083039018037e-06, "epoch": 19.465408805031448, "percentage": 97.33, "elapsed_time": "1:35:05", "remaining_time": "0:02:36", "throughput": 4246.03, "total_tokens": 24225824} {"current_steps": 37145, "total_steps": 38160, "loss": 0.4513, "lr": 2.157807989923044e-06, "epoch": 19.46802935010482, "percentage": 97.34, "elapsed_time": "1:35:06", "remaining_time": "0:02:35", "throughput": 4246.05, "total_tokens": 24228960} {"current_steps": 37150, "total_steps": 38160, "loss": 0.374, "lr": 2.1366370837349603e-06, "epoch": 19.470649895178198, "percentage": 97.35, "elapsed_time": "1:35:06", "remaining_time": "0:02:35", "throughput": 4246.1, "total_tokens": 24232352} {"current_steps": 37155, "total_steps": 38160, "loss": 0.3531, "lr": 2.1155703248825207e-06, "epoch": 19.47327044025157, "percentage": 97.37, "elapsed_time": "1:35:07", "remaining_time": "0:02:34", "throughput": 4246.12, "total_tokens": 24235456} {"current_steps": 37160, "total_steps": 38160, "loss": 0.4298, "lr": 2.094607717772534e-06, "epoch": 19.47589098532495, "percentage": 97.38, "elapsed_time": "1:35:08", "remaining_time": "0:02:33", "throughput": 4246.09, "total_tokens": 24238016} {"current_steps": 37165, "total_steps": 38160, "loss": 0.3859, "lr": 2.0737492667902702e-06, "epoch": 19.478511530398322, "percentage": 97.39, "elapsed_time": "1:35:08", "remaining_time": "0:02:32", "throughput": 4246.07, "total_tokens": 24240672} {"current_steps": 37170, "total_steps": 38160, "loss": 0.3173, "lr": 2.0529949762989608e-06, "epoch": 19.4811320754717, "percentage": 97.41, "elapsed_time": "1:35:09", "remaining_time": "0:02:32", "throughput": 4246.06, "total_tokens": 24243520} {"current_steps": 37175, "total_steps": 38160, "loss": 0.4524, "lr": 2.032344850640244e-06, "epoch": 19.483752620545072, "percentage": 97.42, "elapsed_time": "1:35:10", "remaining_time": "0:02:31", "throughput": 4246.08, "total_tokens": 24246784} {"current_steps": 37180, "total_steps": 38160, "loss": 0.6324, "lr": 2.011798894133887e-06, "epoch": 19.48637316561845, "percentage": 97.43, "elapsed_time": "1:35:11", "remaining_time": "0:02:30", "throughput": 4246.17, "total_tokens": 24250848} {"current_steps": 37185, "total_steps": 38160, "loss": 0.4488, "lr": 1.9913571110777852e-06, "epoch": 19.488993710691823, "percentage": 97.44, "elapsed_time": "1:35:11", "remaining_time": "0:02:29", "throughput": 4246.21, "total_tokens": 24254208} {"current_steps": 37190, "total_steps": 38160, "loss": 0.4439, "lr": 1.971019505748295e-06, "epoch": 19.4916142557652, "percentage": 97.46, "elapsed_time": "1:35:13", "remaining_time": "0:02:29", "throughput": 4246.47, "total_tokens": 24260896} {"current_steps": 37195, "total_steps": 38160, "loss": 0.4328, "lr": 1.9507860823996803e-06, "epoch": 19.494234800838573, "percentage": 97.47, "elapsed_time": "1:35:13", "remaining_time": "0:02:28", "throughput": 4246.43, "total_tokens": 24263232} {"current_steps": 37200, "total_steps": 38160, "loss": 0.4888, "lr": 1.9306568452645e-06, "epoch": 19.49685534591195, "percentage": 97.48, "elapsed_time": "1:35:14", "remaining_time": "0:02:27", "throughput": 4246.48, "total_tokens": 24266784} {"current_steps": 37205, "total_steps": 38160, "loss": 0.357, "lr": 1.910631798553664e-06, "epoch": 19.499475890985323, "percentage": 97.5, "elapsed_time": "1:35:15", "remaining_time": "0:02:26", "throughput": 4246.52, "total_tokens": 24270112} {"current_steps": 37210, "total_steps": 38160, "loss": 0.4867, "lr": 1.8907109464562088e-06, "epoch": 19.5020964360587, "percentage": 97.51, "elapsed_time": "1:35:16", "remaining_time": "0:02:25", "throughput": 4246.53, "total_tokens": 24273184} {"current_steps": 37215, "total_steps": 38160, "loss": 0.4502, "lr": 1.870894293139247e-06, "epoch": 19.504716981132077, "percentage": 97.52, "elapsed_time": "1:35:16", "remaining_time": "0:02:25", "throughput": 4246.55, "total_tokens": 24276224} {"current_steps": 37220, "total_steps": 38160, "loss": 0.3666, "lr": 1.8511818427482396e-06, "epoch": 19.50733752620545, "percentage": 97.54, "elapsed_time": "1:35:17", "remaining_time": "0:02:24", "throughput": 4246.7, "total_tokens": 24281024} {"current_steps": 37225, "total_steps": 38160, "loss": 0.5454, "lr": 1.8315735994068327e-06, "epoch": 19.509958071278827, "percentage": 97.55, "elapsed_time": "1:35:18", "remaining_time": "0:02:23", "throughput": 4246.69, "total_tokens": 24283840} {"current_steps": 37230, "total_steps": 38160, "loss": 0.248, "lr": 1.8120695672168009e-06, "epoch": 19.5125786163522, "percentage": 97.56, "elapsed_time": "1:35:18", "remaining_time": "0:02:22", "throughput": 4246.65, "total_tokens": 24286240} {"current_steps": 37235, "total_steps": 38160, "loss": 0.3818, "lr": 1.792669750258158e-06, "epoch": 19.515199161425578, "percentage": 97.58, "elapsed_time": "1:35:19", "remaining_time": "0:02:22", "throughput": 4246.64, "total_tokens": 24288992} {"current_steps": 37240, "total_steps": 38160, "loss": 0.4034, "lr": 1.7733741525892134e-06, "epoch": 19.51781970649895, "percentage": 97.59, "elapsed_time": "1:35:20", "remaining_time": "0:02:21", "throughput": 4246.67, "total_tokens": 24292288} {"current_steps": 37245, "total_steps": 38160, "loss": 0.4658, "lr": 1.7541827782462937e-06, "epoch": 19.520440251572328, "percentage": 97.6, "elapsed_time": "1:35:21", "remaining_time": "0:02:20", "throughput": 4246.7, "total_tokens": 24295584} {"current_steps": 37250, "total_steps": 38160, "loss": 0.3764, "lr": 1.7350956312440768e-06, "epoch": 19.5230607966457, "percentage": 97.62, "elapsed_time": "1:35:21", "remaining_time": "0:02:19", "throughput": 4246.7, "total_tokens": 24298400} {"current_steps": 37255, "total_steps": 38160, "loss": 0.3428, "lr": 1.716112715575313e-06, "epoch": 19.52568134171908, "percentage": 97.63, "elapsed_time": "1:35:22", "remaining_time": "0:02:19", "throughput": 4246.69, "total_tokens": 24301280} {"current_steps": 37260, "total_steps": 38160, "loss": 0.4553, "lr": 1.6972340352110481e-06, "epoch": 19.528301886792452, "percentage": 97.64, "elapsed_time": "1:35:23", "remaining_time": "0:02:18", "throughput": 4246.68, "total_tokens": 24303968} {"current_steps": 37265, "total_steps": 38160, "loss": 0.4346, "lr": 1.6784595941004565e-06, "epoch": 19.53092243186583, "percentage": 97.65, "elapsed_time": "1:35:23", "remaining_time": "0:02:17", "throughput": 4246.72, "total_tokens": 24307456} {"current_steps": 37270, "total_steps": 38160, "loss": 0.3948, "lr": 1.659789396171063e-06, "epoch": 19.533542976939202, "percentage": 97.67, "elapsed_time": "1:35:24", "remaining_time": "0:02:16", "throughput": 4246.78, "total_tokens": 24310912} {"current_steps": 37275, "total_steps": 38160, "loss": 0.4151, "lr": 1.6412234453282993e-06, "epoch": 19.53616352201258, "percentage": 97.68, "elapsed_time": "1:35:25", "remaining_time": "0:02:15", "throughput": 4246.77, "total_tokens": 24313728} {"current_steps": 37280, "total_steps": 38160, "loss": 0.4073, "lr": 1.622761745456003e-06, "epoch": 19.538784067085953, "percentage": 97.69, "elapsed_time": "1:35:25", "remaining_time": "0:02:15", "throughput": 4246.8, "total_tokens": 24316928} {"current_steps": 37285, "total_steps": 38160, "loss": 0.366, "lr": 1.6044043004161958e-06, "epoch": 19.54140461215933, "percentage": 97.71, "elapsed_time": "1:35:26", "remaining_time": "0:02:14", "throughput": 4246.78, "total_tokens": 24319552} {"current_steps": 37290, "total_steps": 38160, "loss": 0.4135, "lr": 1.5861511140489725e-06, "epoch": 19.544025157232703, "percentage": 97.72, "elapsed_time": "1:35:27", "remaining_time": "0:02:13", "throughput": 4246.74, "total_tokens": 24321984} {"current_steps": 37295, "total_steps": 38160, "loss": 0.4859, "lr": 1.5680021901727237e-06, "epoch": 19.54664570230608, "percentage": 97.73, "elapsed_time": "1:35:27", "remaining_time": "0:02:12", "throughput": 4246.73, "total_tokens": 24324928} {"current_steps": 37300, "total_steps": 38160, "loss": 0.3087, "lr": 1.5499575325840232e-06, "epoch": 19.549266247379457, "percentage": 97.75, "elapsed_time": "1:35:28", "remaining_time": "0:02:12", "throughput": 4246.76, "total_tokens": 24328064} {"current_steps": 37305, "total_steps": 38160, "loss": 0.5207, "lr": 1.5320171450576293e-06, "epoch": 19.55188679245283, "percentage": 97.76, "elapsed_time": "1:35:29", "remaining_time": "0:02:11", "throughput": 4246.77, "total_tokens": 24331136} {"current_steps": 37310, "total_steps": 38160, "loss": 0.4399, "lr": 1.5141810313463733e-06, "epoch": 19.554507337526207, "percentage": 97.77, "elapsed_time": "1:35:30", "remaining_time": "0:02:10", "throughput": 4246.77, "total_tokens": 24334112} {"current_steps": 37315, "total_steps": 38160, "loss": 0.3635, "lr": 1.4964491951814374e-06, "epoch": 19.55712788259958, "percentage": 97.79, "elapsed_time": "1:35:30", "remaining_time": "0:02:09", "throughput": 4246.85, "total_tokens": 24338048} {"current_steps": 37320, "total_steps": 38160, "loss": 0.5321, "lr": 1.4788216402720766e-06, "epoch": 19.559748427672957, "percentage": 97.8, "elapsed_time": "1:35:31", "remaining_time": "0:02:09", "throughput": 4246.9, "total_tokens": 24341632} {"current_steps": 37325, "total_steps": 38160, "loss": 0.4173, "lr": 1.4612983703058413e-06, "epoch": 19.56236897274633, "percentage": 97.81, "elapsed_time": "1:35:32", "remaining_time": "0:02:08", "throughput": 4246.96, "total_tokens": 24345088} {"current_steps": 37330, "total_steps": 38160, "loss": 0.4175, "lr": 1.4438793889483549e-06, "epoch": 19.564989517819708, "percentage": 97.82, "elapsed_time": "1:35:33", "remaining_time": "0:02:07", "throughput": 4247.02, "total_tokens": 24348736} {"current_steps": 37335, "total_steps": 38160, "loss": 0.3316, "lr": 1.4265646998434246e-06, "epoch": 19.56761006289308, "percentage": 97.84, "elapsed_time": "1:35:33", "remaining_time": "0:02:06", "throughput": 4247.04, "total_tokens": 24351776} {"current_steps": 37340, "total_steps": 38160, "loss": 0.3668, "lr": 1.409354306613153e-06, "epoch": 19.570230607966458, "percentage": 97.85, "elapsed_time": "1:35:34", "remaining_time": "0:02:05", "throughput": 4247.09, "total_tokens": 24355296} {"current_steps": 37345, "total_steps": 38160, "loss": 0.4171, "lr": 1.3922482128577718e-06, "epoch": 19.57285115303983, "percentage": 97.86, "elapsed_time": "1:35:35", "remaining_time": "0:02:05", "throughput": 4247.17, "total_tokens": 24359168} {"current_steps": 37350, "total_steps": 38160, "loss": 0.4846, "lr": 1.3752464221556404e-06, "epoch": 19.57547169811321, "percentage": 97.88, "elapsed_time": "1:35:36", "remaining_time": "0:02:04", "throughput": 4247.23, "total_tokens": 24362720} {"current_steps": 37355, "total_steps": 38160, "loss": 0.382, "lr": 1.358348938063303e-06, "epoch": 19.578092243186582, "percentage": 97.89, "elapsed_time": "1:35:36", "remaining_time": "0:02:03", "throughput": 4247.24, "total_tokens": 24365824} {"current_steps": 37360, "total_steps": 38160, "loss": 0.35, "lr": 1.341555764115543e-06, "epoch": 19.58071278825996, "percentage": 97.9, "elapsed_time": "1:35:37", "remaining_time": "0:02:02", "throughput": 4247.26, "total_tokens": 24368928} {"current_steps": 37365, "total_steps": 38160, "loss": 0.3859, "lr": 1.3248669038253835e-06, "epoch": 19.583333333333332, "percentage": 97.92, "elapsed_time": "1:35:38", "remaining_time": "0:02:02", "throughput": 4247.3, "total_tokens": 24372192} {"current_steps": 37370, "total_steps": 38160, "loss": 0.4425, "lr": 1.3082823606838656e-06, "epoch": 19.58595387840671, "percentage": 97.93, "elapsed_time": "1:35:38", "remaining_time": "0:02:01", "throughput": 4247.28, "total_tokens": 24374912} {"current_steps": 37375, "total_steps": 38160, "loss": 0.3914, "lr": 1.2918021381603251e-06, "epoch": 19.588574423480082, "percentage": 97.94, "elapsed_time": "1:35:39", "remaining_time": "0:02:00", "throughput": 4247.31, "total_tokens": 24378176} {"current_steps": 37380, "total_steps": 38160, "loss": 0.3741, "lr": 1.275426239702171e-06, "epoch": 19.59119496855346, "percentage": 97.96, "elapsed_time": "1:35:40", "remaining_time": "0:01:59", "throughput": 4247.37, "total_tokens": 24381760} {"current_steps": 37385, "total_steps": 38160, "loss": 0.3935, "lr": 1.2591546687351073e-06, "epoch": 19.593815513626833, "percentage": 97.97, "elapsed_time": "1:35:41", "remaining_time": "0:01:59", "throughput": 4247.48, "total_tokens": 24386144} {"current_steps": 37390, "total_steps": 38160, "loss": 0.4078, "lr": 1.2429874286629673e-06, "epoch": 19.59643605870021, "percentage": 97.98, "elapsed_time": "1:35:42", "remaining_time": "0:01:58", "throughput": 4247.53, "total_tokens": 24389600} {"current_steps": 37395, "total_steps": 38160, "loss": 0.4075, "lr": 1.2269245228677116e-06, "epoch": 19.599056603773583, "percentage": 98.0, "elapsed_time": "1:35:42", "remaining_time": "0:01:57", "throughput": 4247.49, "total_tokens": 24392160} {"current_steps": 37400, "total_steps": 38160, "loss": 0.4063, "lr": 1.210965954709542e-06, "epoch": 19.60167714884696, "percentage": 98.01, "elapsed_time": "1:35:43", "remaining_time": "0:01:56", "throughput": 4247.54, "total_tokens": 24395584} {"current_steps": 37405, "total_steps": 38160, "loss": 0.3625, "lr": 1.1951117275268431e-06, "epoch": 19.604297693920337, "percentage": 98.02, "elapsed_time": "1:35:44", "remaining_time": "0:01:55", "throughput": 4247.47, "total_tokens": 24397696} {"current_steps": 37410, "total_steps": 38160, "loss": 0.4169, "lr": 1.1793618446360732e-06, "epoch": 19.60691823899371, "percentage": 98.03, "elapsed_time": "1:35:44", "remaining_time": "0:01:55", "throughput": 4247.55, "total_tokens": 24401696} {"current_steps": 37415, "total_steps": 38160, "loss": 0.4148, "lr": 1.1637163093319303e-06, "epoch": 19.609538784067087, "percentage": 98.05, "elapsed_time": "1:35:45", "remaining_time": "0:01:54", "throughput": 4247.53, "total_tokens": 24404416} {"current_steps": 37420, "total_steps": 38160, "loss": 0.37, "lr": 1.1481751248874072e-06, "epoch": 19.61215932914046, "percentage": 98.06, "elapsed_time": "1:35:46", "remaining_time": "0:01:53", "throughput": 4247.51, "total_tokens": 24407008} {"current_steps": 37425, "total_steps": 38160, "loss": 0.3025, "lr": 1.1327382945533482e-06, "epoch": 19.614779874213838, "percentage": 98.07, "elapsed_time": "1:35:46", "remaining_time": "0:01:52", "throughput": 4247.54, "total_tokens": 24410208} {"current_steps": 37430, "total_steps": 38160, "loss": 0.3042, "lr": 1.1174058215591143e-06, "epoch": 19.61740041928721, "percentage": 98.09, "elapsed_time": "1:35:47", "remaining_time": "0:01:52", "throughput": 4247.69, "total_tokens": 24415168} {"current_steps": 37435, "total_steps": 38160, "loss": 0.3679, "lr": 1.1021777091119732e-06, "epoch": 19.620020964360588, "percentage": 98.1, "elapsed_time": "1:35:48", "remaining_time": "0:01:51", "throughput": 4247.68, "total_tokens": 24417984} {"current_steps": 37440, "total_steps": 38160, "loss": 0.4822, "lr": 1.0870539603975994e-06, "epoch": 19.62264150943396, "percentage": 98.11, "elapsed_time": "1:35:49", "remaining_time": "0:01:50", "throughput": 4247.72, "total_tokens": 24421376} {"current_steps": 37445, "total_steps": 38160, "loss": 0.2813, "lr": 1.0720345785795727e-06, "epoch": 19.62526205450734, "percentage": 98.13, "elapsed_time": "1:35:50", "remaining_time": "0:01:49", "throughput": 4247.74, "total_tokens": 24424544} {"current_steps": 37450, "total_steps": 38160, "loss": 0.3549, "lr": 1.0571195667998802e-06, "epoch": 19.627882599580712, "percentage": 98.14, "elapsed_time": "1:35:50", "remaining_time": "0:01:49", "throughput": 4247.73, "total_tokens": 24427488} {"current_steps": 37455, "total_steps": 38160, "loss": 0.4368, "lr": 1.042308928178526e-06, "epoch": 19.63050314465409, "percentage": 98.15, "elapsed_time": "1:35:51", "remaining_time": "0:01:48", "throughput": 4247.73, "total_tokens": 24430336} {"current_steps": 37460, "total_steps": 38160, "loss": 0.4106, "lr": 1.0276026658137538e-06, "epoch": 19.633123689727462, "percentage": 98.17, "elapsed_time": "1:35:52", "remaining_time": "0:01:47", "throughput": 4247.87, "total_tokens": 24435136} {"current_steps": 37465, "total_steps": 38160, "loss": 0.4952, "lr": 1.013000782781881e-06, "epoch": 19.63574423480084, "percentage": 98.18, "elapsed_time": "1:35:53", "remaining_time": "0:01:46", "throughput": 4247.93, "total_tokens": 24438848} {"current_steps": 37470, "total_steps": 38160, "loss": 0.4517, "lr": 9.985032821375195e-07, "epoch": 19.638364779874212, "percentage": 98.19, "elapsed_time": "1:35:53", "remaining_time": "0:01:45", "throughput": 4247.89, "total_tokens": 24441248} {"current_steps": 37475, "total_steps": 38160, "loss": 0.3931, "lr": 9.841101669134101e-07, "epoch": 19.64098532494759, "percentage": 98.2, "elapsed_time": "1:35:54", "remaining_time": "0:01:45", "throughput": 4247.86, "total_tokens": 24443840} {"current_steps": 37480, "total_steps": 38160, "loss": 0.4657, "lr": 9.69821440120311e-07, "epoch": 19.643605870020963, "percentage": 98.22, "elapsed_time": "1:35:55", "remaining_time": "0:01:44", "throughput": 4247.9, "total_tokens": 24447200} {"current_steps": 37485, "total_steps": 38160, "loss": 0.5455, "lr": 9.556371047473866e-07, "epoch": 19.64622641509434, "percentage": 98.23, "elapsed_time": "1:35:55", "remaining_time": "0:01:43", "throughput": 4247.91, "total_tokens": 24450368} {"current_steps": 37490, "total_steps": 38160, "loss": 0.3123, "lr": 9.415571637617082e-07, "epoch": 19.648846960167717, "percentage": 98.24, "elapsed_time": "1:35:56", "remaining_time": "0:01:42", "throughput": 4247.89, "total_tokens": 24452992} {"current_steps": 37495, "total_steps": 38160, "loss": 0.477, "lr": 9.275816201087528e-07, "epoch": 19.65146750524109, "percentage": 98.26, "elapsed_time": "1:35:57", "remaining_time": "0:01:42", "throughput": 4247.84, "total_tokens": 24455264} {"current_steps": 37500, "total_steps": 38160, "loss": 0.4983, "lr": 9.137104767120153e-07, "epoch": 19.654088050314467, "percentage": 98.27, "elapsed_time": "1:35:57", "remaining_time": "0:01:41", "throughput": 4247.84, "total_tokens": 24458304} {"current_steps": 37505, "total_steps": 38160, "loss": 0.486, "lr": 8.999437364731189e-07, "epoch": 19.65670859538784, "percentage": 98.28, "elapsed_time": "1:35:58", "remaining_time": "0:01:40", "throughput": 4247.89, "total_tokens": 24461824} {"current_steps": 37510, "total_steps": 38160, "loss": 0.3793, "lr": 8.862814022720378e-07, "epoch": 19.659329140461217, "percentage": 98.3, "elapsed_time": "1:35:59", "remaining_time": "0:01:39", "throughput": 4247.89, "total_tokens": 24464736} {"current_steps": 37515, "total_steps": 38160, "loss": 0.3724, "lr": 8.727234769666526e-07, "epoch": 19.66194968553459, "percentage": 98.31, "elapsed_time": "1:35:59", "remaining_time": "0:01:39", "throughput": 4247.86, "total_tokens": 24467264} {"current_steps": 37520, "total_steps": 38160, "loss": 0.4585, "lr": 8.592699633931389e-07, "epoch": 19.664570230607968, "percentage": 98.32, "elapsed_time": "1:36:00", "remaining_time": "0:01:38", "throughput": 4247.92, "total_tokens": 24470912} {"current_steps": 37525, "total_steps": 38160, "loss": 0.4497, "lr": 8.459208643659122e-07, "epoch": 19.66719077568134, "percentage": 98.34, "elapsed_time": "1:36:01", "remaining_time": "0:01:37", "throughput": 4247.97, "total_tokens": 24474304} {"current_steps": 37530, "total_steps": 38160, "loss": 0.3752, "lr": 8.326761826773499e-07, "epoch": 19.669811320754718, "percentage": 98.35, "elapsed_time": "1:36:02", "remaining_time": "0:01:36", "throughput": 4247.98, "total_tokens": 24477280} {"current_steps": 37535, "total_steps": 38160, "loss": 0.4012, "lr": 8.195359210981246e-07, "epoch": 19.67243186582809, "percentage": 98.36, "elapsed_time": "1:36:02", "remaining_time": "0:01:35", "throughput": 4247.91, "total_tokens": 24479456} {"current_steps": 37540, "total_steps": 38160, "loss": 0.4812, "lr": 8.065000823770929e-07, "epoch": 19.67505241090147, "percentage": 98.38, "elapsed_time": "1:36:03", "remaining_time": "0:01:35", "throughput": 4247.94, "total_tokens": 24482624} {"current_steps": 37545, "total_steps": 38160, "loss": 0.3898, "lr": 7.935686692410737e-07, "epoch": 19.677672955974842, "percentage": 98.39, "elapsed_time": "1:36:04", "remaining_time": "0:01:34", "throughput": 4247.96, "total_tokens": 24485792} {"current_steps": 37550, "total_steps": 38160, "loss": 0.3794, "lr": 7.807416843952364e-07, "epoch": 19.68029350104822, "percentage": 98.4, "elapsed_time": "1:36:04", "remaining_time": "0:01:33", "throughput": 4247.95, "total_tokens": 24488576} {"current_steps": 37555, "total_steps": 38160, "loss": 0.5857, "lr": 7.68019130522879e-07, "epoch": 19.682914046121592, "percentage": 98.41, "elapsed_time": "1:36:05", "remaining_time": "0:01:32", "throughput": 4247.92, "total_tokens": 24491136} {"current_steps": 37560, "total_steps": 38160, "loss": 0.6165, "lr": 7.554010102853726e-07, "epoch": 19.68553459119497, "percentage": 98.43, "elapsed_time": "1:36:06", "remaining_time": "0:01:32", "throughput": 4247.96, "total_tokens": 24494528} {"current_steps": 37565, "total_steps": 38160, "loss": 0.5233, "lr": 7.428873263223279e-07, "epoch": 19.688155136268342, "percentage": 98.44, "elapsed_time": "1:36:07", "remaining_time": "0:01:31", "throughput": 4248.06, "total_tokens": 24498816} {"current_steps": 37570, "total_steps": 38160, "loss": 0.3905, "lr": 7.304780812513734e-07, "epoch": 19.69077568134172, "percentage": 98.45, "elapsed_time": "1:36:07", "remaining_time": "0:01:30", "throughput": 4248.12, "total_tokens": 24502368} {"current_steps": 37575, "total_steps": 38160, "loss": 0.4011, "lr": 7.181732776684325e-07, "epoch": 19.693396226415093, "percentage": 98.47, "elapsed_time": "1:36:08", "remaining_time": "0:01:29", "throughput": 4248.14, "total_tokens": 24505440} {"current_steps": 37580, "total_steps": 38160, "loss": 0.4615, "lr": 7.059729181475572e-07, "epoch": 19.69601677148847, "percentage": 98.48, "elapsed_time": "1:36:09", "remaining_time": "0:01:29", "throughput": 4248.16, "total_tokens": 24508512} {"current_steps": 37585, "total_steps": 38160, "loss": 0.3764, "lr": 6.938770052409282e-07, "epoch": 19.698637316561843, "percentage": 98.49, "elapsed_time": "1:36:09", "remaining_time": "0:01:28", "throughput": 4248.16, "total_tokens": 24511360} {"current_steps": 37590, "total_steps": 38160, "loss": 0.4547, "lr": 6.81885541478855e-07, "epoch": 19.70125786163522, "percentage": 98.51, "elapsed_time": "1:36:10", "remaining_time": "0:01:27", "throughput": 4248.14, "total_tokens": 24514048} {"current_steps": 37595, "total_steps": 38160, "loss": 0.3693, "lr": 6.699985293697197e-07, "epoch": 19.703878406708597, "percentage": 98.52, "elapsed_time": "1:36:11", "remaining_time": "0:01:26", "throughput": 4248.14, "total_tokens": 24517088} {"current_steps": 37600, "total_steps": 38160, "loss": 0.4787, "lr": 6.582159714003111e-07, "epoch": 19.70649895178197, "percentage": 98.53, "elapsed_time": "1:36:11", "remaining_time": "0:01:25", "throughput": 4248.12, "total_tokens": 24519808} {"current_steps": 37605, "total_steps": 38160, "loss": 0.4893, "lr": 6.465378700352687e-07, "epoch": 19.709119496855347, "percentage": 98.55, "elapsed_time": "1:36:12", "remaining_time": "0:01:25", "throughput": 4248.26, "total_tokens": 24524320} {"current_steps": 37610, "total_steps": 38160, "loss": 0.4393, "lr": 6.349642277176382e-07, "epoch": 19.71174004192872, "percentage": 98.56, "elapsed_time": "1:36:13", "remaining_time": "0:01:24", "throughput": 4248.34, "total_tokens": 24528192} {"current_steps": 37615, "total_steps": 38160, "loss": 0.4694, "lr": 6.23495046868372e-07, "epoch": 19.714360587002098, "percentage": 98.57, "elapsed_time": "1:36:14", "remaining_time": "0:01:23", "throughput": 4248.32, "total_tokens": 24530880} {"current_steps": 37620, "total_steps": 38160, "loss": 0.4592, "lr": 6.121303298868286e-07, "epoch": 19.71698113207547, "percentage": 98.58, "elapsed_time": "1:36:14", "remaining_time": "0:01:22", "throughput": 4248.34, "total_tokens": 24533952} {"current_steps": 37625, "total_steps": 38160, "loss": 0.4091, "lr": 6.008700791502175e-07, "epoch": 19.719601677148848, "percentage": 98.6, "elapsed_time": "1:36:15", "remaining_time": "0:01:22", "throughput": 4248.37, "total_tokens": 24537152} {"current_steps": 37630, "total_steps": 38160, "loss": 0.2973, "lr": 5.8971429701421e-07, "epoch": 19.72222222222222, "percentage": 98.61, "elapsed_time": "1:36:16", "remaining_time": "0:01:21", "throughput": 4248.34, "total_tokens": 24539776} {"current_steps": 37635, "total_steps": 38160, "loss": 0.4464, "lr": 5.786629858123283e-07, "epoch": 19.7248427672956, "percentage": 98.62, "elapsed_time": "1:36:17", "remaining_time": "0:01:20", "throughput": 4248.36, "total_tokens": 24542944} {"current_steps": 37640, "total_steps": 38160, "loss": 0.3889, "lr": 5.677161478565008e-07, "epoch": 19.72746331236897, "percentage": 98.64, "elapsed_time": "1:36:17", "remaining_time": "0:01:19", "throughput": 4248.33, "total_tokens": 24545504} {"current_steps": 37645, "total_steps": 38160, "loss": 0.4629, "lr": 5.56873785436618e-07, "epoch": 19.73008385744235, "percentage": 98.65, "elapsed_time": "1:36:18", "remaining_time": "0:01:19", "throughput": 4248.35, "total_tokens": 24548736} {"current_steps": 37650, "total_steps": 38160, "loss": 0.6219, "lr": 5.4613590082081e-07, "epoch": 19.732704402515722, "percentage": 98.66, "elapsed_time": "1:36:19", "remaining_time": "0:01:18", "throughput": 4248.39, "total_tokens": 24552000} {"current_steps": 37655, "total_steps": 38160, "loss": 0.376, "lr": 5.355024962552801e-07, "epoch": 19.7353249475891, "percentage": 98.68, "elapsed_time": "1:36:19", "remaining_time": "0:01:17", "throughput": 4248.47, "total_tokens": 24555968} {"current_steps": 37660, "total_steps": 38160, "loss": 0.4779, "lr": 5.249735739644157e-07, "epoch": 19.737945492662472, "percentage": 98.69, "elapsed_time": "1:36:20", "remaining_time": "0:01:16", "throughput": 4248.5, "total_tokens": 24559104} {"current_steps": 37665, "total_steps": 38160, "loss": 0.4605, "lr": 5.145491361508436e-07, "epoch": 19.74056603773585, "percentage": 98.7, "elapsed_time": "1:36:21", "remaining_time": "0:01:15", "throughput": 4248.49, "total_tokens": 24561824} {"current_steps": 37670, "total_steps": 38160, "loss": 0.3957, "lr": 5.042291849950975e-07, "epoch": 19.743186582809223, "percentage": 98.72, "elapsed_time": "1:36:22", "remaining_time": "0:01:15", "throughput": 4248.5, "total_tokens": 24564864} {"current_steps": 37675, "total_steps": 38160, "loss": 0.3753, "lr": 4.940137226560615e-07, "epoch": 19.7458071278826, "percentage": 98.73, "elapsed_time": "1:36:22", "remaining_time": "0:01:14", "throughput": 4248.54, "total_tokens": 24568224} {"current_steps": 37680, "total_steps": 38160, "loss": 0.4078, "lr": 4.839027512706928e-07, "epoch": 19.748427672955973, "percentage": 98.74, "elapsed_time": "1:36:23", "remaining_time": "0:01:13", "throughput": 4248.72, "total_tokens": 24573312} {"current_steps": 37685, "total_steps": 38160, "loss": 0.3993, "lr": 4.7389627295407743e-07, "epoch": 19.75104821802935, "percentage": 98.76, "elapsed_time": "1:36:24", "remaining_time": "0:01:12", "throughput": 4248.8, "total_tokens": 24577248} {"current_steps": 37690, "total_steps": 38160, "loss": 0.3869, "lr": 4.6399428979948534e-07, "epoch": 19.753668763102727, "percentage": 98.77, "elapsed_time": "1:36:25", "remaining_time": "0:01:12", "throughput": 4248.83, "total_tokens": 24580544} {"current_steps": 37695, "total_steps": 38160, "loss": 0.4324, "lr": 4.541968038782596e-07, "epoch": 19.7562893081761, "percentage": 98.78, "elapsed_time": "1:36:25", "remaining_time": "0:01:11", "throughput": 4248.79, "total_tokens": 24582944} {"current_steps": 37700, "total_steps": 38160, "loss": 0.5885, "lr": 4.445038172399829e-07, "epoch": 19.758909853249477, "percentage": 98.79, "elapsed_time": "1:36:26", "remaining_time": "0:01:10", "throughput": 4248.78, "total_tokens": 24585728} {"current_steps": 37705, "total_steps": 38160, "loss": 0.4863, "lr": 4.3491533191225563e-07, "epoch": 19.76153039832285, "percentage": 98.81, "elapsed_time": "1:36:27", "remaining_time": "0:01:09", "throughput": 4248.78, "total_tokens": 24588640} {"current_steps": 37710, "total_steps": 38160, "loss": 0.4548, "lr": 4.254313499009177e-07, "epoch": 19.764150943396228, "percentage": 98.82, "elapsed_time": "1:36:27", "remaining_time": "0:01:09", "throughput": 4248.82, "total_tokens": 24592064} {"current_steps": 37715, "total_steps": 38160, "loss": 0.3957, "lr": 4.1605187318982664e-07, "epoch": 19.7667714884696, "percentage": 98.83, "elapsed_time": "1:36:29", "remaining_time": "0:01:08", "throughput": 4249.08, "total_tokens": 24598944} {"current_steps": 37720, "total_steps": 38160, "loss": 0.3797, "lr": 4.067769037411906e-07, "epoch": 19.769392033542978, "percentage": 98.85, "elapsed_time": "1:36:29", "remaining_time": "0:01:07", "throughput": 4249.02, "total_tokens": 24601152} {"current_steps": 37725, "total_steps": 38160, "loss": 0.4028, "lr": 3.9760644349517984e-07, "epoch": 19.77201257861635, "percentage": 98.86, "elapsed_time": "1:36:30", "remaining_time": "0:01:06", "throughput": 4249.01, "total_tokens": 24603904} {"current_steps": 37730, "total_steps": 38160, "loss": 0.3788, "lr": 3.885404943700932e-07, "epoch": 19.77463312368973, "percentage": 98.87, "elapsed_time": "1:36:31", "remaining_time": "0:01:05", "throughput": 4248.97, "total_tokens": 24606240} {"current_steps": 37735, "total_steps": 38160, "loss": 0.445, "lr": 3.795790582624692e-07, "epoch": 19.7772536687631, "percentage": 98.89, "elapsed_time": "1:36:31", "remaining_time": "0:01:05", "throughput": 4248.97, "total_tokens": 24609088} {"current_steps": 37740, "total_steps": 38160, "loss": 0.3871, "lr": 3.707221370469749e-07, "epoch": 19.77987421383648, "percentage": 98.9, "elapsed_time": "1:36:32", "remaining_time": "0:01:04", "throughput": 4249.0, "total_tokens": 24612320} {"current_steps": 37745, "total_steps": 38160, "loss": 0.4046, "lr": 3.6196973257629494e-07, "epoch": 19.782494758909852, "percentage": 98.91, "elapsed_time": "1:36:33", "remaining_time": "0:01:03", "throughput": 4249.19, "total_tokens": 24617664} {"current_steps": 37750, "total_steps": 38160, "loss": 0.3933, "lr": 3.533218466813537e-07, "epoch": 19.78511530398323, "percentage": 98.93, "elapsed_time": "1:36:34", "remaining_time": "0:01:02", "throughput": 4249.34, "total_tokens": 24622304} {"current_steps": 37755, "total_steps": 38160, "loss": 0.3953, "lr": 3.447784811712595e-07, "epoch": 19.787735849056602, "percentage": 98.94, "elapsed_time": "1:36:35", "remaining_time": "0:01:02", "throughput": 4249.33, "total_tokens": 24625088} {"current_steps": 37760, "total_steps": 38160, "loss": 0.4197, "lr": 3.363396378331385e-07, "epoch": 19.79035639412998, "percentage": 98.95, "elapsed_time": "1:36:35", "remaining_time": "0:01:01", "throughput": 4249.36, "total_tokens": 24628544} {"current_steps": 37765, "total_steps": 38160, "loss": 0.5636, "lr": 3.280053184323006e-07, "epoch": 19.792976939203353, "percentage": 98.96, "elapsed_time": "1:36:36", "remaining_time": "0:01:00", "throughput": 4249.4, "total_tokens": 24631776} {"current_steps": 37770, "total_steps": 38160, "loss": 0.4295, "lr": 3.1977552471218476e-07, "epoch": 19.79559748427673, "percentage": 98.98, "elapsed_time": "1:36:37", "remaining_time": "0:00:59", "throughput": 4249.43, "total_tokens": 24634976} {"current_steps": 37775, "total_steps": 38160, "loss": 0.49, "lr": 3.116502583943581e-07, "epoch": 19.798218029350103, "percentage": 98.99, "elapsed_time": "1:36:37", "remaining_time": "0:00:59", "throughput": 4249.42, "total_tokens": 24637696} {"current_steps": 37780, "total_steps": 38160, "loss": 0.3671, "lr": 3.036295211785722e-07, "epoch": 19.80083857442348, "percentage": 99.0, "elapsed_time": "1:36:38", "remaining_time": "0:00:58", "throughput": 4249.44, "total_tokens": 24640864} {"current_steps": 37785, "total_steps": 38160, "loss": 0.2871, "lr": 2.957133147425961e-07, "epoch": 19.803459119496857, "percentage": 99.02, "elapsed_time": "1:36:39", "remaining_time": "0:00:57", "throughput": 4249.65, "total_tokens": 24646784} {"current_steps": 37790, "total_steps": 38160, "loss": 0.3882, "lr": 2.879016407425494e-07, "epoch": 19.80607966457023, "percentage": 99.03, "elapsed_time": "1:36:40", "remaining_time": "0:00:56", "throughput": 4249.68, "total_tokens": 24650048} {"current_steps": 37795, "total_steps": 38160, "loss": 0.3888, "lr": 2.8019450081240295e-07, "epoch": 19.808700209643607, "percentage": 99.04, "elapsed_time": "1:36:41", "remaining_time": "0:00:56", "throughput": 4249.74, "total_tokens": 24653728} {"current_steps": 37800, "total_steps": 38160, "loss": 0.3346, "lr": 2.7259189656447803e-07, "epoch": 19.81132075471698, "percentage": 99.06, "elapsed_time": "1:36:41", "remaining_time": "0:00:55", "throughput": 4249.71, "total_tokens": 24656288} {"current_steps": 37805, "total_steps": 38160, "loss": 0.3878, "lr": 2.650938295891692e-07, "epoch": 19.813941299790358, "percentage": 99.07, "elapsed_time": "1:36:42", "remaining_time": "0:00:54", "throughput": 4249.75, "total_tokens": 24659744} {"current_steps": 37810, "total_steps": 38160, "loss": 0.5245, "lr": 2.5770030145494395e-07, "epoch": 19.81656184486373, "percentage": 99.08, "elapsed_time": "1:36:43", "remaining_time": "0:00:53", "throughput": 4249.8, "total_tokens": 24663488} {"current_steps": 37815, "total_steps": 38160, "loss": 0.3635, "lr": 2.504113137083985e-07, "epoch": 19.819182389937108, "percentage": 99.1, "elapsed_time": "1:36:44", "remaining_time": "0:00:52", "throughput": 4249.8, "total_tokens": 24666272} {"current_steps": 37820, "total_steps": 38160, "loss": 0.2474, "lr": 2.4322686787442425e-07, "epoch": 19.82180293501048, "percentage": 99.11, "elapsed_time": "1:36:44", "remaining_time": "0:00:52", "throughput": 4249.89, "total_tokens": 24670400} {"current_steps": 37825, "total_steps": 38160, "loss": 0.3938, "lr": 2.3614696545581904e-07, "epoch": 19.82442348008386, "percentage": 99.12, "elapsed_time": "1:36:45", "remaining_time": "0:00:51", "throughput": 4249.88, "total_tokens": 24673280} {"current_steps": 37830, "total_steps": 38160, "loss": 0.4644, "lr": 2.2917160793367585e-07, "epoch": 19.82704402515723, "percentage": 99.14, "elapsed_time": "1:36:46", "remaining_time": "0:00:50", "throughput": 4249.9, "total_tokens": 24676320} {"current_steps": 37835, "total_steps": 38160, "loss": 0.3086, "lr": 2.2230079676716086e-07, "epoch": 19.82966457023061, "percentage": 99.15, "elapsed_time": "1:36:47", "remaining_time": "0:00:49", "throughput": 4250.02, "total_tokens": 24680960} {"current_steps": 37840, "total_steps": 38160, "loss": 0.4518, "lr": 2.1553453339356875e-07, "epoch": 19.832285115303982, "percentage": 99.16, "elapsed_time": "1:36:48", "remaining_time": "0:00:49", "throughput": 4250.17, "total_tokens": 24685792} {"current_steps": 37845, "total_steps": 38160, "loss": 0.3705, "lr": 2.0887281922826738e-07, "epoch": 19.83490566037736, "percentage": 99.17, "elapsed_time": "1:36:48", "remaining_time": "0:00:48", "throughput": 4250.15, "total_tokens": 24688448} {"current_steps": 37850, "total_steps": 38160, "loss": 0.3311, "lr": 2.023156556648642e-07, "epoch": 19.837526205450732, "percentage": 99.19, "elapsed_time": "1:36:49", "remaining_time": "0:00:47", "throughput": 4250.17, "total_tokens": 24691552} {"current_steps": 37855, "total_steps": 38160, "loss": 0.3933, "lr": 1.9586304407503975e-07, "epoch": 19.84014675052411, "percentage": 99.2, "elapsed_time": "1:36:50", "remaining_time": "0:00:46", "throughput": 4250.17, "total_tokens": 24694368} {"current_steps": 37860, "total_steps": 38160, "loss": 0.4543, "lr": 1.8951498580860315e-07, "epoch": 19.842767295597483, "percentage": 99.21, "elapsed_time": "1:36:50", "remaining_time": "0:00:46", "throughput": 4250.11, "total_tokens": 24696608} {"current_steps": 37865, "total_steps": 38160, "loss": 0.3981, "lr": 1.832714821934922e-07, "epoch": 19.84538784067086, "percentage": 99.23, "elapsed_time": "1:36:51", "remaining_time": "0:00:45", "throughput": 4250.14, "total_tokens": 24699872} {"current_steps": 37870, "total_steps": 38160, "loss": 0.3778, "lr": 1.7713253453577328e-07, "epoch": 19.848008385744233, "percentage": 99.24, "elapsed_time": "1:36:52", "remaining_time": "0:00:44", "throughput": 4250.3, "total_tokens": 24704608} {"current_steps": 37875, "total_steps": 38160, "loss": 0.4473, "lr": 1.7109814411964132e-07, "epoch": 19.85062893081761, "percentage": 99.25, "elapsed_time": "1:36:53", "remaining_time": "0:00:43", "throughput": 4250.38, "total_tokens": 24708544} {"current_steps": 37880, "total_steps": 38160, "loss": 0.4523, "lr": 1.651683122074754e-07, "epoch": 19.853249475890987, "percentage": 99.27, "elapsed_time": "1:36:53", "remaining_time": "0:00:42", "throughput": 4250.34, "total_tokens": 24710880} {"current_steps": 37885, "total_steps": 38160, "loss": 0.3786, "lr": 1.5934304003961675e-07, "epoch": 19.85587002096436, "percentage": 99.28, "elapsed_time": "1:36:54", "remaining_time": "0:00:42", "throughput": 4250.44, "total_tokens": 24715008} {"current_steps": 37890, "total_steps": 38160, "loss": 0.4264, "lr": 1.5362232883475713e-07, "epoch": 19.858490566037737, "percentage": 99.29, "elapsed_time": "1:36:55", "remaining_time": "0:00:41", "throughput": 4250.46, "total_tokens": 24718240} {"current_steps": 37895, "total_steps": 38160, "loss": 0.3491, "lr": 1.4800617978949492e-07, "epoch": 19.86111111111111, "percentage": 99.31, "elapsed_time": "1:36:56", "remaining_time": "0:00:40", "throughput": 4250.43, "total_tokens": 24720800} {"current_steps": 37900, "total_steps": 38160, "loss": 0.4266, "lr": 1.424945940787792e-07, "epoch": 19.863731656184488, "percentage": 99.32, "elapsed_time": "1:36:56", "remaining_time": "0:00:39", "throughput": 4250.4, "total_tokens": 24723392} {"current_steps": 37905, "total_steps": 38160, "loss": 0.4186, "lr": 1.3708757285552098e-07, "epoch": 19.86635220125786, "percentage": 99.33, "elapsed_time": "1:36:57", "remaining_time": "0:00:39", "throughput": 4250.37, "total_tokens": 24725792} {"current_steps": 37910, "total_steps": 38160, "loss": 0.3973, "lr": 1.3178511725076004e-07, "epoch": 19.868972746331238, "percentage": 99.34, "elapsed_time": "1:36:58", "remaining_time": "0:00:38", "throughput": 4250.37, "total_tokens": 24728672} {"current_steps": 37915, "total_steps": 38160, "loss": 0.4687, "lr": 1.265872283738312e-07, "epoch": 19.87159329140461, "percentage": 99.36, "elapsed_time": "1:36:58", "remaining_time": "0:00:37", "throughput": 4250.43, "total_tokens": 24732384} {"current_steps": 37920, "total_steps": 38160, "loss": 0.389, "lr": 1.2149390731192033e-07, "epoch": 19.87421383647799, "percentage": 99.37, "elapsed_time": "1:36:59", "remaining_time": "0:00:36", "throughput": 4250.47, "total_tokens": 24735744} {"current_steps": 37925, "total_steps": 38160, "loss": 0.4022, "lr": 1.1650515513061955e-07, "epoch": 19.87683438155136, "percentage": 99.38, "elapsed_time": "1:37:00", "remaining_time": "0:00:36", "throughput": 4250.45, "total_tokens": 24738496} {"current_steps": 37930, "total_steps": 38160, "loss": 0.3821, "lr": 1.1162097287342743e-07, "epoch": 19.87945492662474, "percentage": 99.4, "elapsed_time": "1:37:00", "remaining_time": "0:00:35", "throughput": 4250.51, "total_tokens": 24742080} {"current_steps": 37935, "total_steps": 38160, "loss": 0.3836, "lr": 1.0684136156213775e-07, "epoch": 19.882075471698112, "percentage": 99.41, "elapsed_time": "1:37:01", "remaining_time": "0:00:34", "throughput": 4250.48, "total_tokens": 24744512} {"current_steps": 37940, "total_steps": 38160, "loss": 0.3552, "lr": 1.0216632219650634e-07, "epoch": 19.88469601677149, "percentage": 99.42, "elapsed_time": "1:37:02", "remaining_time": "0:00:33", "throughput": 4250.55, "total_tokens": 24748224} {"current_steps": 37945, "total_steps": 38160, "loss": 0.5227, "lr": 9.759585575458418e-08, "epoch": 19.887316561844862, "percentage": 99.44, "elapsed_time": "1:37:03", "remaining_time": "0:00:32", "throughput": 4250.56, "total_tokens": 24751232} {"current_steps": 37950, "total_steps": 38160, "loss": 0.3906, "lr": 9.312996319238432e-08, "epoch": 19.88993710691824, "percentage": 99.45, "elapsed_time": "1:37:03", "remaining_time": "0:00:32", "throughput": 4250.57, "total_tokens": 24754208} {"current_steps": 37955, "total_steps": 38160, "loss": 0.414, "lr": 8.876864544421493e-08, "epoch": 19.892557651991613, "percentage": 99.46, "elapsed_time": "1:37:04", "remaining_time": "0:00:31", "throughput": 4250.6, "total_tokens": 24757440} {"current_steps": 37960, "total_steps": 38160, "loss": 0.4331, "lr": 8.451190342229077e-08, "epoch": 19.89517819706499, "percentage": 99.48, "elapsed_time": "1:37:05", "remaining_time": "0:00:30", "throughput": 4250.56, "total_tokens": 24759808} {"current_steps": 37965, "total_steps": 38160, "loss": 0.3844, "lr": 8.035973801717722e-08, "epoch": 19.897798742138363, "percentage": 99.49, "elapsed_time": "1:37:05", "remaining_time": "0:00:29", "throughput": 4250.5, "total_tokens": 24761952} {"current_steps": 37970, "total_steps": 38160, "loss": 0.5027, "lr": 7.631215009740178e-08, "epoch": 19.90041928721174, "percentage": 99.5, "elapsed_time": "1:37:06", "remaining_time": "0:00:29", "throughput": 4250.54, "total_tokens": 24765280} {"current_steps": 37975, "total_steps": 38160, "loss": 0.4227, "lr": 7.236914050973153e-08, "epoch": 19.903039832285117, "percentage": 99.52, "elapsed_time": "1:37:07", "remaining_time": "0:00:28", "throughput": 4250.55, "total_tokens": 24768320} {"current_steps": 37980, "total_steps": 38160, "loss": 0.4272, "lr": 6.853071007895117e-08, "epoch": 19.90566037735849, "percentage": 99.53, "elapsed_time": "1:37:07", "remaining_time": "0:00:27", "throughput": 4250.53, "total_tokens": 24770912} {"current_steps": 37985, "total_steps": 38160, "loss": 0.5197, "lr": 6.479685960797399e-08, "epoch": 19.908280922431867, "percentage": 99.54, "elapsed_time": "1:37:08", "remaining_time": "0:00:26", "throughput": 4250.56, "total_tokens": 24774176} {"current_steps": 37990, "total_steps": 38160, "loss": 0.4546, "lr": 6.116758987800841e-08, "epoch": 19.91090146750524, "percentage": 99.55, "elapsed_time": "1:37:09", "remaining_time": "0:00:26", "throughput": 4250.56, "total_tokens": 24777120} {"current_steps": 37995, "total_steps": 38160, "loss": 0.3814, "lr": 5.7642901648113924e-08, "epoch": 19.913522012578618, "percentage": 99.57, "elapsed_time": "1:37:09", "remaining_time": "0:00:25", "throughput": 4250.54, "total_tokens": 24779712} {"current_steps": 38000, "total_steps": 38160, "loss": 0.4565, "lr": 5.422279565570065e-08, "epoch": 19.91614255765199, "percentage": 99.58, "elapsed_time": "1:37:10", "remaining_time": "0:00:24", "throughput": 4250.59, "total_tokens": 24783200} {"current_steps": 38005, "total_steps": 38160, "loss": 0.533, "lr": 5.090727261619632e-08, "epoch": 19.918763102725368, "percentage": 99.59, "elapsed_time": "1:37:11", "remaining_time": "0:00:23", "throughput": 4250.63, "total_tokens": 24786592} {"current_steps": 38010, "total_steps": 38160, "loss": 0.3519, "lr": 4.7696333223212765e-08, "epoch": 19.92138364779874, "percentage": 99.61, "elapsed_time": "1:37:11", "remaining_time": "0:00:23", "throughput": 4250.64, "total_tokens": 24789664} {"current_steps": 38015, "total_steps": 38160, "loss": 0.4375, "lr": 4.4589978148323884e-08, "epoch": 19.92400419287212, "percentage": 99.62, "elapsed_time": "1:37:12", "remaining_time": "0:00:22", "throughput": 4250.62, "total_tokens": 24792288} {"current_steps": 38020, "total_steps": 38160, "loss": 0.3561, "lr": 4.1588208041454244e-08, "epoch": 19.92662473794549, "percentage": 99.63, "elapsed_time": "1:37:13", "remaining_time": "0:00:21", "throughput": 4250.68, "total_tokens": 24796000} {"current_steps": 38025, "total_steps": 38160, "loss": 0.3805, "lr": 3.8691023530545985e-08, "epoch": 19.92924528301887, "percentage": 99.65, "elapsed_time": "1:37:14", "remaining_time": "0:00:20", "throughput": 4250.69, "total_tokens": 24798976} {"current_steps": 38030, "total_steps": 38160, "loss": 0.3813, "lr": 3.589842522155884e-08, "epoch": 19.931865828092242, "percentage": 99.66, "elapsed_time": "1:37:14", "remaining_time": "0:00:19", "throughput": 4250.68, "total_tokens": 24801760} {"current_steps": 38035, "total_steps": 38160, "loss": 0.4208, "lr": 3.321041369874767e-08, "epoch": 19.93448637316562, "percentage": 99.67, "elapsed_time": "1:37:15", "remaining_time": "0:00:19", "throughput": 4250.74, "total_tokens": 24805376} {"current_steps": 38040, "total_steps": 38160, "loss": 0.4813, "lr": 3.0626989524384916e-08, "epoch": 19.937106918238992, "percentage": 99.69, "elapsed_time": "1:37:16", "remaining_time": "0:00:18", "throughput": 4250.82, "total_tokens": 24809440} {"current_steps": 38045, "total_steps": 38160, "loss": 0.4518, "lr": 2.8148153238927167e-08, "epoch": 19.93972746331237, "percentage": 99.7, "elapsed_time": "1:37:17", "remaining_time": "0:00:17", "throughput": 4250.91, "total_tokens": 24813472} {"current_steps": 38050, "total_steps": 38160, "loss": 0.4683, "lr": 2.5773905360904072e-08, "epoch": 19.942348008385743, "percentage": 99.71, "elapsed_time": "1:37:17", "remaining_time": "0:00:16", "throughput": 4250.93, "total_tokens": 24816608} {"current_steps": 38055, "total_steps": 38160, "loss": 0.4927, "lr": 2.3504246386918392e-08, "epoch": 19.94496855345912, "percentage": 99.72, "elapsed_time": "1:37:18", "remaining_time": "0:00:16", "throughput": 4250.95, "total_tokens": 24819776} {"current_steps": 38060, "total_steps": 38160, "loss": 0.3691, "lr": 2.133917679186803e-08, "epoch": 19.947589098532493, "percentage": 99.74, "elapsed_time": "1:37:19", "remaining_time": "0:00:15", "throughput": 4250.94, "total_tokens": 24822560} {"current_steps": 38065, "total_steps": 38160, "loss": 0.3015, "lr": 1.9278697028557447e-08, "epoch": 19.95020964360587, "percentage": 99.75, "elapsed_time": "1:37:20", "remaining_time": "0:00:14", "throughput": 4250.94, "total_tokens": 24825600} {"current_steps": 38070, "total_steps": 38160, "loss": 0.4665, "lr": 1.7322807528086238e-08, "epoch": 19.952830188679247, "percentage": 99.76, "elapsed_time": "1:37:20", "remaining_time": "0:00:13", "throughput": 4250.92, "total_tokens": 24828224} {"current_steps": 38075, "total_steps": 38160, "loss": 0.3996, "lr": 1.547150869957159e-08, "epoch": 19.95545073375262, "percentage": 99.78, "elapsed_time": "1:37:21", "remaining_time": "0:00:13", "throughput": 4250.9, "total_tokens": 24830848} {"current_steps": 38080, "total_steps": 38160, "loss": 0.4331, "lr": 1.3724800930314806e-08, "epoch": 19.958071278825997, "percentage": 99.79, "elapsed_time": "1:37:22", "remaining_time": "0:00:12", "throughput": 4250.94, "total_tokens": 24834304} {"current_steps": 38085, "total_steps": 38160, "loss": 0.3117, "lr": 1.2082684585634773e-08, "epoch": 19.96069182389937, "percentage": 99.8, "elapsed_time": "1:37:22", "remaining_time": "0:00:11", "throughput": 4251.02, "total_tokens": 24838112} {"current_steps": 38090, "total_steps": 38160, "loss": 0.3964, "lr": 1.0545160009145516e-08, "epoch": 19.963312368972748, "percentage": 99.82, "elapsed_time": "1:37:23", "remaining_time": "0:00:10", "throughput": 4251.12, "total_tokens": 24842240} {"current_steps": 38095, "total_steps": 38160, "loss": 0.3396, "lr": 9.112227522423133e-09, "epoch": 19.96593291404612, "percentage": 99.83, "elapsed_time": "1:37:24", "remaining_time": "0:00:09", "throughput": 4251.17, "total_tokens": 24845824} {"current_steps": 38100, "total_steps": 38160, "loss": 0.5092, "lr": 7.783887425172331e-09, "epoch": 19.968553459119498, "percentage": 99.84, "elapsed_time": "1:37:25", "remaining_time": "0:00:09", "throughput": 4251.18, "total_tokens": 24848704} {"current_steps": 38105, "total_steps": 38160, "loss": 0.2943, "lr": 6.560139995392955e-09, "epoch": 19.97117400419287, "percentage": 99.86, "elapsed_time": "1:37:26", "remaining_time": "0:00:08", "throughput": 4251.29, "total_tokens": 24853120} {"current_steps": 38110, "total_steps": 38160, "loss": 0.5035, "lr": 5.440985488935901e-09, "epoch": 19.97379454926625, "percentage": 99.87, "elapsed_time": "1:37:26", "remaining_time": "0:00:07", "throughput": 4251.34, "total_tokens": 24856800} {"current_steps": 38115, "total_steps": 38160, "loss": 0.4863, "lr": 4.426424140058227e-09, "epoch": 19.97641509433962, "percentage": 99.88, "elapsed_time": "1:37:27", "remaining_time": "0:00:06", "throughput": 4251.31, "total_tokens": 24859392} {"current_steps": 38120, "total_steps": 38160, "loss": 0.4299, "lr": 3.5164561608680424e-09, "epoch": 19.979035639413, "percentage": 99.9, "elapsed_time": "1:37:28", "remaining_time": "0:00:06", "throughput": 4251.4, "total_tokens": 24863328} {"current_steps": 38125, "total_steps": 38160, "loss": 0.3743, "lr": 2.7110817417685953e-09, "epoch": 19.981656184486372, "percentage": 99.91, "elapsed_time": "1:37:28", "remaining_time": "0:00:05", "throughput": 4251.42, "total_tokens": 24866496} {"current_steps": 38130, "total_steps": 38160, "loss": 0.3776, "lr": 2.010301051291741e-09, "epoch": 19.98427672955975, "percentage": 99.92, "elapsed_time": "1:37:29", "remaining_time": "0:00:04", "throughput": 4251.57, "total_tokens": 24871328} {"current_steps": 38135, "total_steps": 38160, "loss": 0.3589, "lr": 1.4141142359314074e-09, "epoch": 19.986897274633122, "percentage": 99.93, "elapsed_time": "1:37:30", "remaining_time": "0:00:03", "throughput": 4251.57, "total_tokens": 24874336} {"current_steps": 38140, "total_steps": 38160, "loss": 0.3865, "lr": 9.22521420476663e-10, "epoch": 19.9895178197065, "percentage": 99.95, "elapsed_time": "1:37:31", "remaining_time": "0:00:03", "throughput": 4251.55, "total_tokens": 24877024} {"current_steps": 38145, "total_steps": 38160, "loss": 0.4515, "lr": 5.355227077341596e-10, "epoch": 19.992138364779873, "percentage": 99.96, "elapsed_time": "1:37:31", "remaining_time": "0:00:02", "throughput": 4251.56, "total_tokens": 24880096} {"current_steps": 38150, "total_steps": 38160, "loss": 0.4372, "lr": 2.5311817863915566e-10, "epoch": 19.99475890985325, "percentage": 99.97, "elapsed_time": "1:37:32", "remaining_time": "0:00:01", "throughput": 4251.57, "total_tokens": 24883200} {"current_steps": 38155, "total_steps": 38160, "loss": 0.4077, "lr": 7.53078923110273e-11, "epoch": 19.997379454926623, "percentage": 99.99, "elapsed_time": "1:37:33", "remaining_time": "0:00:00", "throughput": 4251.54, "total_tokens": 24885664} {"current_steps": 38160, "total_steps": 38160, "loss": 0.301, "lr": 2.0918859422458526e-12, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "1:37:34", "remaining_time": "0:00:00", "throughput": 4251.37, "total_tokens": 24887720} {"current_steps": 38160, "total_steps": 38160, "eval_loss": 0.4668559730052948, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "1:37:47", "remaining_time": "0:00:00", "throughput": 4241.53, "total_tokens": 24887720} {"current_steps": 38160, "total_steps": 38160, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "1:37:49", "remaining_time": "0:00:00", "throughput": 4240.4, "total_tokens": 24887720}